// ONNX.cc — Belle II Software (development): implementation of the MVA ONNX method.
/**************************************************************************
 * basf2 (Belle II Analysis Software Framework)                           *
 * Author: The Belle II Collaboration                                     *
 *                                                                        *
 * See git log for contributors and copyright holders.                    *
 * This file is licensed under LGPL-3.0, see LICENSE.md.                  *
 **************************************************************************/
8
#include <mva/methods/ONNX.h>

#include <framework/logging/Logger.h>
#include <iostream>
#include <vector>

using namespace Belle2::MVA;
using namespace Belle2::MVA::ONNX;
17
18Session::Session(const std::string filename)
19{
20 // Ensure single-threaded execution, see
21 // https://onnxruntime.ai/docs/performance/tune-performance/threading.html
22 //
23 // InterOpNumThreads is probably optional (not used in ORT_SEQUENTIAL mode)
24 // Also, with batch size 1 and ORT_SEQUENTIAL mode, MLP-like models will
25 // always run single threaded, but maybe not e.g. graph networks which can
26 // run in parallel on nodes. Here, setting IntraOpNumThreads to 1 is
27 // important to ensure single-threaded execution.
28 m_sessionOptions.SetIntraOpNumThreads(1);
29 m_sessionOptions.SetInterOpNumThreads(1);
30 m_sessionOptions.SetExecutionMode(ORT_SEQUENTIAL); // default, but make it explicit
31
32 m_session = std::make_unique<Ort::Session>(m_env, filename.c_str(), m_sessionOptions);
33}
34
35void Session::run(const std::map<std::string, std::shared_ptr<BaseTensor>>& inputMap,
36 const std::map<std::string, std::shared_ptr<BaseTensor>>& outputMap)
37{
38 std::vector<Ort::Value> inputs;
39 std::vector<Ort::Value> outputs;
40 std::vector<const char*> inputNames;
41 std::vector<const char*> outputNames;
42 for (auto& x : inputMap) {
43 inputNames.push_back(x.first.c_str());
44 inputs.push_back(x.second->createOrtTensor());
45 }
46 for (auto& x : outputMap) {
47 outputNames.push_back(x.first.c_str());
48 outputs.push_back(x.second->createOrtTensor());
49 }
50 run(inputNames, inputs, outputNames, outputs);
51}
52
53void Session::run(const std::vector<const char*>& inputNames,
54 std::vector<Ort::Value>& inputs,
55 const std::vector<const char*>& outputNames,
56 std::vector<Ort::Value>& outputs)
57{
58 m_session->Run(m_runOptions, inputNames.data(), inputs.data(), inputs.size(),
59 outputNames.data(), outputs.data(), outputs.size());
60}
61
62void ONNXOptions::load(const boost::property_tree::ptree& pt)
63{
64 m_outputName = pt.get<std::string>("ONNX_outputName", "output");
65}
66
67void ONNXOptions::save(boost::property_tree::ptree& pt) const
68{
69 pt.put("ONNX_outputName", m_outputName);
70}
71
{
  // NOTE(review): the signature line of this function is missing from this
  // extract (internal numbering jumps straight to the opening brace). Per
  // the cross-references it is `void ONNXExpert::configureInputOutputNames()`
  // — confirm against the original file.
  //
  // Determines m_inputName and m_outputName from the loaded ONNX model and
  // the configured options, aborting via B2FATAL on unsupported setups.
  // NOTE(review): std::stringstream / std::find are used below but <sstream>
  // and <algorithm> are not included here — presumably pulled in via
  // mva/methods/ONNX.h; verify.
  const auto& inputNames = m_session->getOrtSession().GetInputNames();
  const auto& outputNames = m_session->getOrtSession().GetOutputNames();

  // Check if we have a single input model and set the input name to that
  if (inputNames.size() != 1) {
    std::stringstream msg;
    msg << "Model has multiple inputs: ";
    // (by-value loop copies each name; harmless on this fatal-error path)
    for (auto name : inputNames)
      msg << "\"" << name << "\" ";
    msg << "- only single-input models are supported.";
    B2FATAL(msg.str());
  }
  m_inputName = inputNames[0];

  // Start from the user-configured output name; may be empty.
  m_outputName = m_specific_options.m_outputName;

  // For single-output models we just take the name of that single output
  if (outputNames.size() == 1) {
    // Inform (not fail) if the configuration disagrees with the model.
    if (!m_outputName.empty() && m_outputName != outputNames[0]) {
      B2INFO("Output name of the model is "
             << outputNames[0]
             << " - will use that despite the configured name being \""
             << m_outputName << "\"");
    }
    m_outputName = outputNames[0];
    return;
  }

  // Otherwise we have a multiple-output model and need to check if the
  // configured output name, or the fallback value "output", exists
  if (m_outputName.empty()) {
    m_outputName = "output";
  }
  auto outputFound = std::find(outputNames.begin(), outputNames.end(),
                               m_outputName) != outputNames.end();
  if (!outputFound) {
    std::stringstream msg;
    msg << "No output named \"" << m_outputName << "\" found. Instead got ";
    for (auto name : outputNames)
      msg << "\"" << name << "\" ";
    msg << "- either change your model to contain one named \"" << m_outputName
        << "\" or set `m_outputName` in the specific options to one of the available names.";
    B2FATAL(msg.str());
  }
}
119
{
  // NOTE(review): the signature line (`void ONNXExpert::load(Weightfile&
  // weightfile)` per the cross-references) is missing from this extract, and
  // the internal numbering jumps from 126 to 128 — one statement was lost.
  // Given that apply()/applyMulticlass() rely on m_inputName/m_outputName
  // being set, the missing line 127 presumably called
  // configureInputOutputNames(); verify against the original file.
  //
  // Extract the ONNX model from the weightfile into a temporary file and
  // read back both the general and the ONNX-specific options.
  std::string onnxModelFileName = weightfile.generateFileName();
  weightfile.getFile("ONNX_Modelfile", onnxModelFileName);
  weightfile.getOptions(m_general_options);
  weightfile.getOptions(m_specific_options);
  // NOTE(review): c_str() forces an extra std::string construction (Session
  // takes std::string by value) — passing onnxModelFileName directly would do.
  m_session = std::make_unique<Session>(onnxModelFileName.c_str());
}
129
130std::vector<float> ONNXExpert::apply(Dataset& testData) const
131{
132 auto nFeatures = testData.getNumberOfFeatures();
133 auto nEvents = testData.getNumberOfEvents();
134 auto input = Tensor<float>::make_shared({1, nFeatures});
135 auto output = Tensor<float>::make_shared({1, 1});
136 std::vector<float> result;
137 result.reserve(nEvents);
138 for (unsigned int iEvent = 0; iEvent < nEvents; ++iEvent) {
139 testData.loadEvent(iEvent);
140 input->setValues(testData.m_input);
141 m_session->run({{m_inputName, input}}, {{m_outputName, output}});
142 result.push_back(output->at(0));
143 }
144 return result;
145}
146
147std::vector<std::vector<float>> ONNXExpert::applyMulticlass(Dataset& testData) const
148{
149 unsigned int nClasses = m_general_options.m_nClasses;
150 auto nFeatures = testData.getNumberOfFeatures();
151 auto nEvents = testData.getNumberOfEvents();
152 auto input = Tensor<float>::make_shared({1, nFeatures});
153 auto output = Tensor<float>::make_shared({1, nClasses});
154 std::vector<std::vector<float>> result(nEvents, std::vector<float>(nClasses));
155 for (unsigned int iEvent = 0; iEvent < nEvents; ++iEvent) {
156 testData.loadEvent(iEvent);
157 input->setValues(testData.m_input);
158 m_session->run({{m_inputName, input}}, {{m_outputName, output}});
159 for (unsigned int iClass = 0; iClass < nClasses; ++iClass) {
160 result[iEvent][iClass] = output->at(iClass);
161 }
162 }
163 return result;
164}
/* ---------------------------------------------------------------------------
 * NOTE(review): the text below is Doxygen cross-reference/tooltip residue
 * that was appended to this file during extraction — it is not C++ code.
 * It is preserved as a comment so the file stays well-formed; remove it once
 * checked against the original ONNX.cc / ONNX.h.
 *
 * Abstract base class of all Datasets given to the MVA interface. The current
 * event can always be accessed. (Definition Dataset.h:33)
 * virtual unsigned int getNumberOfEvents() const = 0
 *   Returns the number of events in this dataset.
 * virtual unsigned int getNumberOfFeatures() const = 0
 *   Returns the number of features in this dataset.
 * virtual void loadEvent(unsigned int iEvent) = 0
 *   Load the event number iEvent.
 * std::vector<float> m_input
 *   Contains all feature values of the currently loaded event. (Dataset.h:123)
 * GeneralOptions m_general_options
 *   General options loaded from the weightfile. (Expert.h:70)
 * void configureInputOutputNames()
 *   Set up input and output names and perform consistency checks. (ONNX.cc:72)
 * ONNXOptions m_specific_options
 *   ONNX specific options loaded from weightfile. (ONNX.h:471)
 * std::unique_ptr<ONNX::Session> m_session
 *   The ONNX inference session wrapper. (ONNX.h:466)
 * std::string m_outputName
 *   Name of the output tensor (will either be determined automatically or
 *   loaded from specific options). (ONNX.h:482)
 * virtual void load(Weightfile& weightfile) override
 *   Load the expert from a Weightfile. (ONNX.cc:120)
 * std::string m_inputName
 *   Name of the input tensor (will be determined automatically). (ONNX.h:476)
 * virtual std::vector<float> apply(Dataset& testData) const override
 *   Apply this expert onto a dataset. (ONNX.cc:130)
 * virtual std::vector<std::vector<float>> applyMulticlass(Dataset& test_data) const override
 *   Apply this expert onto a dataset and return multiple outputs. (ONNX.cc:147)
 * std::string m_outputName
 *   Name of the output Tensor that is used to make predictions. (ONNX.h:407)
 * virtual void load(const boost::property_tree::ptree&) override
 *   Load mechanism to load Options from a xml tree. (ONNX.cc:62)
 * virtual void save(boost::property_tree::ptree&) const override
 *   Save mechanism to store Options in a xml tree. (ONNX.cc:67)
 * Ort::RunOptions m_runOptions
 *   Options to be passed to Ort::Session::Run. (ONNX.h:367)
 * Ort::Env m_env
 *   Environment object for ONNX session. (ONNX.h:352)
 * Session(const std::string filename)
 *   Constructs a new ONNX Runtime Session using the specified model file. (ONNX.cc:18)
 * std::unique_ptr<Ort::Session> m_session
 *   The ONNX inference session. (ONNX.h:362)
 * Ort::SessionOptions m_sessionOptions
 *   ONNX session configuration. (ONNX.h:357)
 * void run(const std::map<std::string, std::shared_ptr<BaseTensor>>& inputMap,
 *          const std::map<std::string, std::shared_ptr<BaseTensor>>& outputMap)
 *   Runs inference on the model using named Tensor maps. (ONNX.cc:35)
 * static auto make_shared(std::vector<int64_t> shape)
 *   Convenience method to create a shared pointer to a Tensor from shape. (ONNX.h:145)
 * The Weightfile class serializes all information about a training into an
 * xml tree. (Weightfile.h:38)
 * void getOptions(Options& options) const
 *   Fills an Option object from the xml tree. (Weightfile.cc:67)
 * std::string generateFileName(const std::string& suffix = "")
 *   Returns a temporary filename with the given suffix.
 * void getFile(const std::string& identifier, const std::string& custom_weightfile)
 *   Creates a file from our weightfile (mostly this will be a weightfile of
 *   an MVA library).
 * ------------------------------------------------------------------------ */