code/dev/RivetONNXrt_8hh_source.html

// -*- C++ -*-

#ifndef RIVET_RivetONNXrt_HH

#define RIVET_RivetONNXrt_HH


#include <iostream>

#include <functional>

#include <numeric>


#include "Rivet/Tools/RivetPaths.hh"

#include "Rivet/Tools/Utils.hh"

#include "onnxruntime/onnxruntime_cxx_api.h"


namespace Rivet {


  class RivetONNXrt {


  public:


    // Suppress default constructor

    RivetONNXrt() = delete;


    RivetONNXrt(const string& filename, const string& runname = "RivetONNXrt") {


      // Set some ORT variables that need to be kept in memory

      _env = std::make_unique<Ort::Env>(ORT_LOGGING_LEVEL_WARNING, runname.c_str());


      // Load the model

      Ort::SessionOptions sessionopts;

      _session = std::make_unique<Ort::Session> (*_env, filename.c_str(), sessionopts);


      // Store network hyperparameters (input/output shape, etc.)

      getNetworkInfo();


      MSG_DEBUG(*this);

    }


    vector<vector<float>> compute(vector<vector<float>>& inputs) const {


      if (inputs.size() != _inDims.size()) {

        throw("Expected " + to_string(_inDims.size())

              + " input nodes, received " + to_string(inputs.size()));

      }


      // Create input tensor objects from input data

      vector<Ort::Value> ort_input;

      ort_input.reserve(_inDims.size());

      auto memory_info = Ort::MemoryInfo::CreateCpu(OrtArenaAllocator, OrtMemTypeDefault);

      for (size_t i=0; i < _inDims.size(); ++i) {


        // Check that input data matches expected input node dimension

        if (inputs[i].size() != _inDimsFlat[i]) {

          throw("Expected flattened input node dimension " + to_string(_inDimsFlat[i])

                 + ", received " + to_string(inputs[i].size()));

        }


        ort_input.emplace_back(Ort::Value::CreateTensor<float>(memory_info,

                                                               inputs[i].data(), inputs[i].size(),

                                                               _inDims[i].data(), _inDims[i].size()));

      }


      // retrieve output tensors

      auto ort_output = _session->Run(Ort::RunOptions{nullptr}, _inNames.data(),

                                      ort_input.data(), ort_input.size(),

                                      _outNames.data(), _outNames.size());


      // construct flattened values and return

      vector<vector<float>> outputs; outputs.resize(_outDims.size());

      for (size_t i = 0; i < _outDims.size(); ++i) {

        float* floatarr = ort_output[i].GetTensorMutableData<float>();

        outputs[i].assign(floatarr, floatarr + _outDimsFlat[i]);

      }

      return outputs;

    }


    vector<float> compute(const vector<float>& inputs) const {

      if (_inDims.size() != 1 || _outDims.size() != 1) {

        throw("This method assumes a single input/output node!");

      }

      vector<vector<float>> wrapped_inputs = { inputs };

      vector<vector<float>> outputs = compute(wrapped_inputs);

      return outputs[0];

    }


    bool hasKey(const std::string& key) const {

      Ort::AllocatorWithDefaultOptions allocator;

      return (bool)_metadata->LookupCustomMetadataMapAllocated(key.c_str(), allocator);

    }


    template <typename T,

      typename std::enable_if_t<!is_iterable_v<T> | is_cstring_v<T> >>


    T retrieve(const std::string& key) const {

      Ort::AllocatorWithDefaultOptions allocator;

      Ort::AllocatedStringPtr res = _metadata->LookupCustomMetadataMapAllocated(key.c_str(), allocator);

      if (!res) {

        throw("Key '"+key+"' not found in network metadata!");

      }

      /*if constexpr (std::is_same<T, std::string>::value) {

        return res.get();

      }*/

      return lexical_cast<T>(res.get());

    }


    std::string retrieve(const std::string& key) const {

      Ort::AllocatorWithDefaultOptions allocator;

      Ort::AllocatedStringPtr res = _metadata->LookupCustomMetadataMapAllocated(key.c_str(), allocator);

      if (!res) {

        throw("Key '"+key+"' not found in network metadata!");

      }

      return res.get();

    }


    template <typename T>


    vector<T> retrieve(const std::string & key) const {

      const vector<string> stringvec = split(retrieve(key), ",");

      vector<T> returnvec = {};

      for (const string & s : stringvec){

        returnvec.push_back(lexical_cast<T>(s));

      }

      return returnvec;

    }


    template <typename T>


    vector<T> retrieve(const std::string & key, const vector<T> & defaultreturn) const {

      try {

        return retrieve<T>(key);

      } catch (...) {

        return defaultreturn;

      }

    }


    std::string retrieve(const std::string& key, const std::string& defaultreturn) const {

      try {

        return retrieve(key);

      } catch (...) {

        return defaultreturn;

      }

    }


    template <typename T,

      typename std::enable_if_t<!is_iterable_v<T> | is_cstring_v<T> >>


    T retrieve(const std::string& key, const T& defaultreturn) const {

      try {

        return retrieve<T>(key);

      } catch (...) {

        return defaultreturn;

      }

    }


    friend std::ostream& operator <<(std::ostream& os, const RivetONNXrt& rort){

      os << "RivetONNXrt Network Summary: \n";

      for (size_t i=0; i < rort._inNames.size(); ++i) {

        os << "- Input node " << i << " name: " << rort._inNames[i];

        os << ", dimensions: (";

        for (size_t j=0; j < rort._inDims[i].size(); ++j){

          if (j)  os << ", ";

          os << rort._inDims[i][j];

        }

        os << "), type (as ONNX enums): " << rort._inTypes[i] << "\n";

      }

      for (size_t i=0; i < rort._outNames.size(); ++i) {

        os << "- Output node " << i << " name: " << rort._outNames[i];

        os << ", dimensions: (";

        for (size_t j=0; j < rort._outDims[i].size(); ++j){

          if (j)  os << ", ";

          os << rort._outDims[i][j];

        }

        os << "), type (as ONNX enums): (" << rort._outTypes[i] << "\n";

      }

      return os;

    }


    Log& getLog() const {

      string logname = "Rivet.RivetONNXrt";

      return Log::getLog(logname);

    }


  private:


    void getNetworkInfo() {


      Ort::AllocatorWithDefaultOptions allocator;


      // Retrieve network metadat

      _metadata = std::make_unique<Ort::ModelMetadata>(_session->GetModelMetadata());


      // find out how many input nodes the model expects

      const size_t num_input_nodes = _session->GetInputCount();

      _inDimsFlat.reserve(num_input_nodes);

      _inTypes.reserve(num_input_nodes);

      _inDims.reserve(num_input_nodes);

      _inNames.reserve(num_input_nodes);

      _inNamesPtr.reserve(num_input_nodes);

      for (size_t i = 0; i < num_input_nodes; ++i) {

        // retrieve input node name

        auto input_name = _session->GetInputNameAllocated(i, allocator);

        _inNames.push_back(input_name.get());

        _inNamesPtr.push_back(std::move(input_name));


        // retrieve input node type

        auto in_type_info = _session->GetInputTypeInfo(i);

        auto in_tensor_info = in_type_info.GetTensorTypeAndShapeInfo();

        _inTypes.push_back(in_tensor_info.GetElementType());

        _inDims.push_back(in_tensor_info.GetShape());

      }


      // Fix negative shape values - appears to be an artefact of batch size issues.

      for (auto& dims : _inDims) {

        int64_t n = 1;

        for (auto& dim : dims) {

          if (dim < 0)  dim = abs(dim);

          n *= dim;

        }

        _inDimsFlat.push_back(n);

      }


      // find out how many output nodes the model expects

      const size_t num_output_nodes = _session->GetOutputCount();

      _outDimsFlat.reserve(num_output_nodes);

      _outTypes.reserve(num_output_nodes);

      _outDims.reserve(num_output_nodes);

      _outNames.reserve(num_output_nodes);

      _outNamesPtr.reserve(num_output_nodes);

      for (size_t i = 0; i < num_output_nodes; ++i) {

        // retrieve output node name

        auto output_name = _session->GetOutputNameAllocated(i, allocator);

        _outNames.push_back(output_name.get());

        _outNamesPtr.push_back(std::move(output_name));


        // retrieve input node type

        auto out_type_info = _session->GetOutputTypeInfo(i);

        auto out_tensor_info = out_type_info.GetTensorTypeAndShapeInfo();

        _outTypes.push_back(out_tensor_info.GetElementType());

        _outDims.push_back(out_tensor_info.GetShape());

      }


      // Fix negative shape values - appears to be an artefact of batch size issues.

      for (auto& dims : _outDims) {

        int64_t n = 1;

        for (auto& dim : dims) {

          if (dim < 0)  dim = abs(dim);

          n *= dim;

        }

        _outDimsFlat.push_back(n);

      }

    }


  private:


    std::unique_ptr<Ort::Env> _env;


    std::unique_ptr<Ort::Session> _session;


    std::unique_ptr<Ort::ModelMetadata> _metadata;


    vector<vector<int64_t>> _inDims, _outDims;


    vector<int64_t> _inDimsFlat, _outDimsFlat;


    vector<ONNXTensorElementDataType> _inTypes, _outTypes;


    vector<Ort::AllocatedStringPtr> _inNamesPtr, _outNamesPtr;


    vector<const char*> _inNames, _outNames;

  };


  /// @brief Useful function for getting ONNX file paths
  ///
  /// @param filename  Name of the ONNX file to look for.
  /// @return The path returned by findAnalysisDataFile() when it is non-empty.
  /// @throws Rivet::Error if findAnalysisDataFile() returns an empty string.
  inline string getONNXFilePath(const string& filename) {
    const string located = findAnalysisDataFile(filename);
    if (located.empty()) {
      // Nothing found: report the file name together with the data path
      throw Rivet::Error("Couldn't find an ONNX data file for '" + filename + "' " +
                         "in the path " + toString(getRivetDataPath()));
    }
    return located;
  }


  /// @brief Build a RivetONNXrt from the ONNX file belonging to an analysis
  ///
  /// @param analysisname  Stem of the file name to look up.
  /// @param suffix        Appended to @a analysisname to form the file name.
  /// @return Owning pointer to the newly constructed network wrapper.
  /// @throws Rivet::Error (from getONNXFilePath) if the file cannot be found.
  inline unique_ptr<RivetONNXrt> getONNX(const string& analysisname, const string& suffix = ".onnx"){
    const string onnxpath = getONNXFilePath(analysisname + suffix);
    return make_unique<RivetONNXrt>(onnxpath);
  }


}


#endif

Rivet::Log
Logging system for controlled & formatted writing to stdout.
Definition Logging.hh:10

Rivet::Log::getLog
static Log & getLog(const std::string &name)

Rivet::RivetONNXrt
Simple interface class to take care of basic ONNX networks.
Definition RivetONNXrt.hh:21

Rivet::RivetONNXrt::getLog
Log & getLog() const
Logger.
Definition RivetONNXrt.hh:192

Rivet::RivetONNXrt::retrieve
T retrieve(const std::string &key, const T &defaultreturn) const
Definition RivetONNXrt.hh:159

Rivet::RivetONNXrt::retrieve
std::string retrieve(const std::string &key) const
Template specialisation of retrieve for std::string.
Definition RivetONNXrt.hh:117

Rivet::RivetONNXrt::operator<<
friend std::ostream & operator<<(std::ostream &os, const RivetONNXrt &rort)
Printing function for debugging.
Definition RivetONNXrt.hh:168

Rivet::RivetONNXrt::retrieve
vector< T > retrieve(const std::string &key, const vector< T > &defaultreturn) const
Overload of retrieve for vector<T>, with a default return.
Definition RivetONNXrt.hh:139

Rivet::RivetONNXrt::compute
vector< float > compute(const vector< float > &inputs) const
Given a single-node input vector, populate and return the single-node output vector.
Definition RivetONNXrt.hh:85

Rivet::RivetONNXrt::RivetONNXrt
RivetONNXrt(const string &filename, const string &runname="RivetONNXrt")
Constructor.
Definition RivetONNXrt.hh:29

Rivet::RivetONNXrt::compute
vector< vector< float > > compute(vector< vector< float > > &inputs) const
Given a multi-node input vector, populate and return the multi-node output vector.
Definition RivetONNXrt.hh:45

Rivet::RivetONNXrt::hasKey
bool hasKey(const std::string &key) const
Method to check if key exists in network metadata.
Definition RivetONNXrt.hh:95

Rivet::RivetONNXrt::retrieve
T retrieve(const std::string &key) const
Definition RivetONNXrt.hh:104

Rivet::RivetONNXrt::retrieve
vector< T > retrieve(const std::string &key) const
Overload of retrieve for vector<T>
Definition RivetONNXrt.hh:128

MSG_DEBUG
#define MSG_DEBUG(x)
Debug messaging, not enabled by default, using MSG_LVL.
Definition Logging.hh:182

Rivet::findAnalysisDataFile
std::string findAnalysisDataFile(const std::string &filename, const std::vector< std::string > &pathprepend=std::vector< std::string >(), const std::vector< std::string > &pathappend=std::vector< std::string >())
Find the first file of the given name in the general data file search dirs.

Rivet::getRivetDataPath
std::string getRivetDataPath()
Get Rivet data install path.

Rivet::split
vector< string > split(const string &s, const string &sep)
Split a string on a specified separator string.
Definition Utils.hh:214

Rivet
Definition MC_CENT_PPB_Projections.hh:10

Rivet::getONNXFilePath
string getONNXFilePath(const string &filename)
Useful function for getting ONNX file paths.
Definition RivetONNXrt.hh:301

Rivet::getONNX
unique_ptr< RivetONNXrt > getONNX(const string &analysisname, const string &suffix=".onnx")
Definition RivetONNXrt.hh:315

Rivet::toString
std::string toString(const AnalysisInfo &ai)
String representation.

Rivet::Error
Generic runtime Rivet error.
Definition Exceptions.hh:12