sopt/ort__session_8h_source.html

 #ifndef SOPT_ORT_SESSION_H

 #define SOPT_ORT_SESSION_H


 #include "onnxruntime_cxx_api.h"

 #include "sopt/logging.h"

 #include "sopt/utilities.h"

 #include "sopt/types.h"


 #include <cstddef>

 #include <cstdint>

 #include <cstdlib>

 #include <memory>

 #include <sstream>

 #include <stdexcept>

 #include <string>

 #include <type_traits>

 #include <vector>


 namespace sopt {


 class ORTsession {


   public:


   ORTsession() = delete;


   ORTsession(const std::string& filename, const std::string& runname = "soptONNXrt") {


     // Set-up ONNXrt session

     _env = std::make_unique<Ort::Env>(ORT_LOGGING_LEVEL_WARNING, runname.c_str());


     // Load the model

     Ort::SessionOptions sessionopts;


     // Allow the number of threads used by the ONNX runtime to be set by an

     // environment variable. If unset it will use all available threads by default

     char* env_num_threads = std::getenv("ORT_NUM_THREADS");

     if(env_num_threads) {

       const int num_threads = std::stoi(env_num_threads);

       sessionopts.SetIntraOpNumThreads(num_threads);

       SOPT_INFO("ONNXRT using {} IntraOpThreads", num_threads);

     }


     _session = std::make_unique<Ort::Session>(*_env, filename.c_str(), sessionopts);


     // Store model hyperparameters (input/output shape etc.)

     _retrieveNetworkInfo();

   }


   std::vector<float> compute(std::vector<float>& inputs, const std::vector<int64_t>& inDims) const {


     if (inputs.empty()) {

       throw std::length_error("Input vector is empty!");

     }

     if (inDims.size() != _inShape) {

       throw std::length_error("Input tensor has incorrect shape! Expected "+std::to_string(_inShape)+" dimensions.");

     }


     // reshape flat input vector as tensor and run the model

     auto memory_info = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);

     auto input_tensor = Ort::Value::CreateTensor<float>(memory_info, inputs.data(), inputs.size(),

                                                         inDims.data(), inDims.size());

     auto output_tensors = _session->Run(Ort::RunOptions{nullptr}, _inNames.data(),

                                         &input_tensor, _inNames.size(),

                                         _outNames.data(), _outNames.size());


     // retrieve the ouput tensor and return flattened version

     auto outputInfo = output_tensors[0].GetTensorTypeAndShapeInfo();

     // Fix negative shape values - this appears to be an artefact of batch size issues

     int64_t outLen = 1;

     for (auto& dim : outputInfo.GetShape()) {

       if (dim < 0)  dim = abs(dim);

       outLen *= dim;

     }

     if (outLen == 0) {

       throw std::length_error("Invalid network structure: Output node with 0-length tensor encountered!");

     }

     float* floatarr = output_tensors.front().GetTensorMutableData<float>();

     std::vector<float> outputs;

     outputs.assign(floatarr, floatarr + outLen);

     return outputs;

   }


   template<typename T = t_real>

   Vector<T> compute(const Vector<T>& input, const std::vector<int64_t>& inDims) const {

     // ONNXrt requires floats as input

     std::vector<float> flat_input(input.size());

     for (size_t i = 0; i < input.size(); ++i) {

       if constexpr(std::is_same<T, t_complex>::value) {

         flat_input[i] = input[i].real();

       } else {

         flat_input[i] = input[i];

       }

     }

     std::vector<float> flat_output = compute(flat_input, inDims);

     Vector<T> rtn(flat_output.size());

     for (size_t i = 0; i < flat_output.size(); ++i) {

       if constexpr(std::is_same<T, t_complex>::value)

       {

         rtn[i] = t_complex(flat_output[i], 0);

       }

       else

       {

         rtn[i] = flat_output[i];

       }

     }

     return rtn;

   }


   template<typename T = t_real>

   Image<T> compute(const Image<T>& input, std::vector<int64_t> inDims = {}) const {


     // require an output node of the form {1, nRows, nCols}

     // in order to be able to map this onto a 2D tensor

     if (inDims.size() && inDims.size() != _inShape) {

       throw std::length_error("Input tensor has incorrect shape! Expected "+std::to_string(_inShape)+" dimensions.");

     }


     // ONNXrt requires floats as input

     const int nrows = input.rows();

     const int ncols = input.cols();

     std::vector<float> flat_input(nrows*ncols);

     for (int i = 0; i < nrows; ++i) {

       for (int j = 0; j < ncols; ++j) {

         flat_input[j*ncols+i] = input(i,j);

       }

     }

     if (inDims.empty()) {

       while (inDims.size() < _inShape-2)  inDims.push_back(1);

       inDims.push_back(nrows);

       inDims.push_back(ncols);

     }

     std::vector<float> flat_output = compute(flat_input, inDims);


     std::vector<T> tResults(flat_output.begin(), flat_output.end());

     Eigen::Map<Eigen::Array<T, Eigen::Dynamic, Eigen::Dynamic>> rtn(tResults.data(), nrows, ncols);

     return rtn;

   }


   const bool hasKey(const std::string& key) const {

     Ort::AllocatorWithDefaultOptions allocator;

     return  (bool)_metadata->LookupCustomMetadataMapAllocated(key.c_str(), allocator);

   }


   template <typename T>

   const T retrieve(const std::string& key) const {

     Ort::AllocatorWithDefaultOptions allocator;

     Ort::AllocatedStringPtr res = _metadata->LookupCustomMetadataMapAllocated(key.c_str(), allocator);

     if (!res) {

       throw std::runtime_error("Key '"+key+"' not found in network metadata!");

     }

     if constexpr (std::is_same<T, std::string>::value) {

       return res.get();

     }

     else {

       return utilities::lexical_cast<T>(res.get());

     }

   }


   template <typename T>

   const T retrieve(const std::string& key, const T& defaultreturn) const {

     try {

       return retrieve<T>(key);

     } catch (std::exception& e) {

       return defaultreturn;

     }

   }


   private:


   void _retrieveNetworkInfo() {


     Ort::AllocatorWithDefaultOptions allocator;


     // Retrieve network metadata

     _metadata = std::make_unique<Ort::ModelMetadata>(_session->GetModelMetadata());


     // find out how many input nodes the model expects

     const size_t num_input_nodes = _session->GetInputCount();

     if (num_input_nodes == 0) {

       throw std::length_error("Invalid network structure! Expected at least one input node.");

     }

     _inShape = _session->GetInputTypeInfo(0).GetTensorTypeAndShapeInfo().GetShape().size();

     _inNames.reserve(num_input_nodes);

     _inNamesPtr.reserve(num_input_nodes);

     SOPT_DEBUG("ORT input nodes = {}", num_input_nodes);

     for (size_t i = 0; i < num_input_nodes; ++i) {

       // query input node names

       auto input_name = _session->GetInputNameAllocated(i, allocator);

       _inNames.push_back(input_name.get());

       _inNamesPtr.push_back(std::move(input_name));

       SOPT_DEBUG("ORT input node {} is called {}", i, _inNames[_inNames.size()-1]);

     }


     // find out how many output nodes the model provides

     const size_t num_output_nodes = _session->GetOutputCount();

     if (num_output_nodes == 0) {

       throw std::length_error("Invalid network structure! Expected at least one output node.");

     }

     _outNames.reserve(num_output_nodes);

     _outNamesPtr.reserve(num_output_nodes);

     SOPT_DEBUG("ORT output nodes = {}", num_output_nodes);

     for (size_t i = 0; i < num_output_nodes; ++i) {

       // query input node names

       auto output_name = _session->GetOutputNameAllocated(i, allocator);

       _outNames.push_back(output_name.get());

       _outNamesPtr.push_back(std::move(output_name));

       SOPT_DEBUG("ORT output node {} is called {}", i, _outNames[_outNames.size()-1]);


     }

   }


   private:


   std::unique_ptr<Ort::Env> _env;


   std::unique_ptr<Ort::Session> _session;


   std::unique_ptr<Ort::ModelMetadata> _metadata;


   std::vector<Ort::AllocatedStringPtr> _inNamesPtr, _outNamesPtr;


   std::vector<const char*> _inNames, _outNames;


   size_t _inShape;


 };


 } // end of namespace sopt


 #endif

sopt::ORTsession
Sopt interface class to hold an ONNXrt session.
Definition: ort_session.h:18

sopt::ORTsession::ORTsession
ORTsession(const std::string &filename, const std::string &runname="soptONNXrt")
Constructor.
Definition: ort_session.h:25

sopt::ORTsession::ORTsession
ORTsession()=delete

sopt::ORTsession::retrieve
const T retrieve(const std::string &key) const
Definition: ort_session.h:151

sopt::ORTsession::compute
std::vector< float > compute(std::vector< float > &inputs, const std::vector< int64_t > &inDims) const
Definition: ort_session.h:50

sopt::ORTsession::compute
Vector< T > compute(const Vector< T > &input, const std::vector< int64_t > &inDims) const
Variant of compute() using input/output Eigen arrays.
Definition: ort_session.h:86

sopt::ORTsession::retrieve
const T retrieve(const std::string &key, const T &defaultreturn) const
Definition: ort_session.h:169

sopt::ORTsession::hasKey
const bool hasKey(const std::string &key) const
Method to check if key exists in network metadata.
Definition: ort_session.h:143

sopt::ORTsession::compute
Image< T > compute(const Image< T > &input, std::vector< int64_t > inDims={}) const
Variant of compute() using input/output Image.
Definition: ort_session.h:113

logging.h

SOPT_INFO
#define SOPT_INFO(...)
Macro: verbose informational message about a normal condition.
Definition: logging.h:215

SOPT_DEBUG
#define SOPT_DEBUG(...)
Macro: output some debugging information.
Definition: logging.h:217

sopt
Definition: bisection_method.h:10

sopt::Image
Eigen::Array< T, Eigen::Dynamic, Eigen::Dynamic > Image
A 2-dimensional list of elements of given type.
Definition: types.h:39

sopt::Vector
Eigen::Matrix< T, Eigen::Dynamic, 1 > Vector
A vector of a given type.
Definition: types.h:24

sopt::t_complex
std::complex< t_real > t_complex
Root of the type hierarchy for (real) complex numbers.
Definition: types.h:19

types.h

utilities.h