latest/html/TritonData_8h_source.html

 #ifndef NuSonic_Triton_TritonData
 #define NuSonic_Triton_TritonData

 #include "cetlib_except/exception.h"
 #include "larrecodnn/ImagePatternAlgs/NuSonic/Triton/Span.h"
 #include "larrecodnn/ImagePatternAlgs/NuSonic/Triton/triton_utils.h"

 #include <algorithm>
 #include <any>
 #include <cstdint>
 #include <functional>
 #include <memory>
 #include <numeric>
 #include <string>
 #include <unordered_map>
 #include <utility>
 #include <vector>

 #include "grpc_client.h"
 #include "triton/common/model_config.h"

 //short alias for the Triton client namespace; used below for the client types
 //(nic::InferResult, nic::InferInput, nic::InferRequestedOutput)
 namespace nic = triton::client;

 namespace lartriton {

   //forward declaration: TritonClient is only named in this header (as a friend
   //of TritonData), so its full definition is not needed here
   class TritonClient;

   //aliases for local input and output types
   //input: outer vector is indexed by batch entry (TritonData::toServer() checks
   //its size against the batch size); each inner vector holds that entry's values
   template <typename DT>
   using TritonInput = std::vector<std::vector<DT>>;
   //output: a vector of spans delimited by const DT* pointers
   //(presumably one span per batch entry - confirm against fromServer())
   template <typename DT>
   using TritonOutput = std::vector<triton_span::Span<const DT*>>;

   //store all the info needed for triton input and output
   //IO is the client-side object type owned through data_; this header
   //instantiates the class for nic::InferInput and nic::InferRequestedOutput
   template <typename IO>
   class TritonData {
   public:
     using Result = nic::InferResult;
     using TensorMetadata = inference::ModelMetadataResponse_TensorMetadata;
     using ShapeType = std::vector<int64_t>;
     //non-owning view delimited by a pair of ShapeType const_iterators
     using ShapeView = triton_span::Span<ShapeType::const_iterator>;

     //constructor (defined out of line)
     TritonData(const std::string& name, const TensorMetadata& model_info, bool noBatch);

     //some members can be modified
     //both public overloads forward to the private versions with canThrow = true
     bool setShape(const ShapeType& newShape) { return setShape(newShape, true); }
     bool setShape(unsigned loc, int64_t val) { return setShape(loc, val, true); }

     //io accessors

     //hand a batch of input data to the client object and keep it alive
     //  ptr: shared pointer to one std::vector<DT> per batch entry; must not be null
     //throws cet::exception("TritonDataError") if ptr is null, if the number of
     //entries differs from batchSize_, or if sizeof(DT) differs from byteSize_;
     //errors returned by SetShape()/AppendRaw() are passed to triton_utils::throwIfError
     template <typename DT>
     void toServer(std::shared_ptr<TritonInput<DT>> ptr)
     {
       //dereferencing an empty shared_ptr would be undefined behavior
       if (!ptr) {
         throw cet::exception("TritonDataError") << name_ << " input(): null input pointer";
       }

       const auto& data_in = *ptr;

       //check batch size
       if (data_in.size() != batchSize_) {
         throw cet::exception("TritonDataError")
           << name_ << " input(): input vector has size " << data_in.size()
           << " but specified batch size is " << batchSize_;
       }

       //shape must be specified for variable dims or if batch size changes
       //(the returned status is checked rather than silently dropped)
       triton_utils::throwIfError(data_->SetShape(fullShape_),
                                  name_ + " input(): unable to set input shape");

       //the element type supplied by the caller must match the expected byte size
       if (byteSize_ != static_cast<int64_t>(sizeof(DT)))
         throw cet::exception("TritonDataError")
           << name_ << " input(): inconsistent byte size " << sizeof(DT) << " (should be "
           << byteSize_ << " for " << dname_ << ")";

       //append each batch entry as raw bytes
       for (unsigned i0 = 0; i0 < batchSize_; ++i0) {
         const DT* arr = data_in[i0].data();
         triton_utils::throwIfError(
           data_->AppendRaw(reinterpret_cast<const uint8_t*>(arr), data_in[i0].size() * byteSize_),
           name_ + " input(): unable to set data for batch entry " + std::to_string(i0));
       }

       //keep input data in scope
       holder_ = std::move(ptr);
     }

     //retrieve the output as spans of DT (defined out of line)
     template <typename DT>
     TritonOutput<DT> fromServer() const;

     //const accessors
     const ShapeView& shape() const { return shape_; }
     int64_t byteSize() const { return byteSize_; }
     const std::string& dname() const { return dname_; }
     unsigned batchSize() const { return batchSize_; }

     //utilities
     bool variableDims() const { return variableDims_; }
     int64_t sizeDims() const { return productDims_; }
     //default to dims if shape isn't filled
     int64_t sizeShape() const { return variableDims_ ? dimProduct(shape_) : sizeDims(); }

   private:
     friend class TritonClient;

     //private accessors only used by client
     bool setShape(const ShapeType& newShape, bool canThrow);
     bool setShape(unsigned loc, int64_t val, bool canThrow);
     void setBatchSize(unsigned bsize);
     void reset();
     //takes shared ownership of the result; the by-value argument is moved into place
     void setResult(std::shared_ptr<Result> result) { result_ = std::move(result); }
     IO* data() { return data_.get(); }

     //helpers
     //true if any entry of the view is negative
     bool anyNeg(const ShapeView& vec) const
     {
       return std::any_of(vec.begin(), vec.end(), [](int64_t i) { return i < 0; });
     }
     //product of all entries of the view (1 for an empty view)
     int64_t dimProduct(const ShapeView& vec) const
     {
       //the initial value fixes the accumulator type: it must be int64_t, since
       //a plain int literal would narrow every partial product back to int
       return std::accumulate(vec.begin(), vec.end(), int64_t{1}, std::multiplies<int64_t>());
     }
     void createObject(IO** ioptr) const;

     //members
     std::string name_;
     std::shared_ptr<IO> data_;
     const ShapeType dims_;
     bool noBatch_;
     unsigned batchSize_;
     ShapeType fullShape_; //shape passed to the client object in toServer()
     ShapeView shape_;
     bool variableDims_;
     int64_t productDims_;
     std::string dname_;
     inference::DataType dtype_;
     int64_t byteSize_; //expected size in bytes of one element (checked against sizeof(DT))
     std::any holder_;  //type-erased owner of the input data passed to toServer()
     std::shared_ptr<Result> result_;
   };

   //concrete instantiations for the two client-side object types,
   //and hash maps of each keyed by a string
   //(presumably the tensor name - confirm against the code that fills them)
   using TritonInputData = TritonData<nic::InferInput>;
   using TritonInputMap = std::unordered_map<std::string, TritonInputData>;
   using TritonOutputData = TritonData<nic::InferRequestedOutput>;
   using TritonOutputMap = std::unordered_map<std::string, TritonOutputData>;

   //declarations of explicit specializations: reset() and createObject() are
   //specialized separately for the input and output types; the definitions
   //are not in this header
   template <>
   void TritonInputData::reset();
   template <>
   void TritonOutputData::reset();
   template <>
   void TritonInputData::createObject(nic::InferInput** ioptr) const;
   template <>
   void TritonOutputData::createObject(nic::InferRequestedOutput** ioptr) const;

   //explicit template instantiation declarations
   //(suppress implicit instantiation of these two class specializations in
   //translation units that include this header)
   extern template class TritonData<nic::InferInput>;
   extern template class TritonData<nic::InferRequestedOutput>;

 }
 #endif
lartriton::TritonData::data
IO * data()
Definition: TritonData.h:104

lartriton::TritonData::name_
std::string name_
Definition: TritonData.h:118

lartriton::TritonOutputMap
std::unordered_map< std::string, TritonOutputData > TritonOutputMap
Definition: TritonData.h:137

lartriton
Definition: TritonClient.cc:23

lartriton::TritonData::setBatchSize
void setBatchSize(unsigned bsize)
Definition: TritonData.cc:100

lartriton::TritonData::setShape
bool setShape(const ShapeType &newShape)
Definition: TritonData.h:45

lartriton::TritonData::TritonData
TritonData(const std::string &name, const TensorMetadata &model_info, bool noBatch)
Definition: TritonData.cc:17

lartriton::TritonData::dims_
const ShapeType dims_
Definition: TritonData.h:120

lartriton::TritonData::holder_
std::any holder_
Definition: TritonData.h:130

lartriton::TritonData::anyNeg
bool anyNeg(const ShapeView &vec) const
Definition: TritonData.h:107

Span.h

lartriton::TritonData::sizeDims
int64_t sizeDims() const
Definition: TritonData.h:91

lartriton::TritonData::variableDims
bool variableDims() const
Definition: TritonData.h:90

lartriton::TritonData::shape
const ShapeView & shape() const
Definition: TritonData.h:84

lartriton::TritonData
Definition: TritonData.h:34

lartriton::TritonData::fullShape_
ShapeType fullShape_
Definition: TritonData.h:123

lartriton::TritonData::ShapeType
std::vector< int64_t > ShapeType
Definition: TritonData.h:38

triton_span::Span::begin
T begin() const
Definition: Span.h:20

lartriton::TritonData::dtype_
inference::DataType dtype_
Definition: TritonData.h:128

triton_span::Span< ShapeType::const_iterator >

triton_utils::throwIfError
void throwIfError(const Error &err, std::string_view msg)
Definition: triton_utils.cc:26

lartriton::TritonClient
Definition: TritonClient.h:20

lartriton::TritonData::setResult
void setResult(std::shared_ptr< Result > result)
Definition: TritonData.h:103

lartriton::TritonData::toServer
void toServer(std::shared_ptr< TritonInput< DT >> ptr)
Definition: TritonData.h:50

triton_span::Span::end
T end() const
Definition: Span.h:21

lartriton::TritonData::byteSize_
int64_t byteSize_
Definition: TritonData.h:129

util::to_string
decltype(auto) constexpr to_string(T &&obj)
ADL-aware version of std::to_string.

lartriton::TritonInput
std::vector< std::vector< DT >> TritonInput
Definition: TritonData.h:28

lartriton::TritonData::noBatch_
bool noBatch_
Definition: TritonData.h:121

lartriton::TritonData::reset
void reset()
Definition: TritonData.cc:146

lartriton::TritonData::variableDims_
bool variableDims_
Definition: TritonData.h:125

lartriton::TritonData::batchSize
unsigned batchSize() const
Definition: TritonData.h:87

lartriton::TritonData::sizeShape
int64_t sizeShape() const
Definition: TritonData.h:93

nutools::dbi::DataType
DataType
Definition: DataType.h:6

lartriton::TritonData::createObject
void createObject(IO **ioptr) const

lartriton::TritonData::setShape
bool setShape(unsigned loc, int64_t val)
Definition: TritonData.h:46

triton_utils.h

lartriton::TritonData::shape_
ShapeView shape_
Definition: TritonData.h:124

lartriton::TritonData::batchSize_
unsigned batchSize_
Definition: TritonData.h:122

lartriton::TritonData::result_
std::shared_ptr< Result > result_
Definition: TritonData.h:131

lartriton::TritonOutput
std::vector< triton_span::Span< const DT * >> TritonOutput
Definition: TritonData.h:30

lartriton::TritonData::data_
std::shared_ptr< IO > data_
Definition: TritonData.h:119

lartriton::TritonData::dimProduct
int64_t dimProduct(const ShapeView &vec) const
Definition: TritonData.h:111

lartriton::TritonData::dname
const std::string & dname() const
Definition: TritonData.h:86

lartriton::TritonInputMap
std::unordered_map< std::string, TritonInputData > TritonInputMap
Definition: TritonData.h:135

lartriton::TritonData::byteSize
int64_t byteSize() const
Definition: TritonData.h:85

lartriton::TritonData::TensorMetadata
inference::ModelMetadataResponse_TensorMetadata TensorMetadata
Definition: TritonData.h:37

lartriton::TritonData::dname_
std::string dname_
Definition: TritonData.h:127

lartriton::TritonData::fromServer
TritonOutput< DT > fromServer() const
Definition: TritonData.cc:110

lartriton::TritonData::Result
nic::InferResult Result
Definition: TritonData.h:36

lartriton::TritonData::productDims_
int64_t productDims_
Definition: TritonData.h:126

fhicl::exception
cet::coded_exception< error, detail::translate > exception
Definition: exception.h:33