d1/d46/ExampleMLInferenceWithTriton_8h_source.html

// Copyright (C) 2002-2025 CERN for the benefit of the ATLAS collaboration


#pragma once


// Framework include(s).

#include "AthenaBaseComps/AthReentrantAlgorithm.h"

#include "AthOnnxInterfaces/IAthInferenceTool.h"


// System include(s).

#include <string>

#include <vector>


namespace AthInfer {


   /// Algorithm demonstrating the usage of the Triton Client API.
   ///
   /// Derives from AthReentrantAlgorithm, so execute() is a const member that
   /// receives the event context explicitly.
   class ExampleMLInferenceWithTriton : public AthReentrantAlgorithm {
   public:
      /// Inherit the base-class constructors unchanged.
      using AthReentrantAlgorithm::AthReentrantAlgorithm;

      /// Function initialising the algorithm.
      virtual StatusCode initialize() override;

      /// Function executing the algorithm for a single event.
      /// @param ctx Context of the event being processed.
      virtual StatusCode execute(const EventContext& ctx) const override;

   private:
      /// Name of the input pixel file to load (job property "InputDataPixel").
      Gaudi::Property<std::string> m_pixelFileName{
         this,
         "InputDataPixel",
         "dev/MLTest/2020-03-31/t10k-images-idx3-ubyte",
         "Name of the input pixel file to load"};

      /// Number of elements/examples in a batch (job property "BatchSize").
      Gaudi::Property<int> m_batchSize{
         this, "BatchSize", 1, "No. of elements/example in a batch"};

      /// Tool handle for the Triton client (job property "InferenceTool").
      ToolHandle<AthInfer::IAthInferenceTool> m_tritonTool{
         this, "InferenceTool", "AthInfer::TritonTool", "Triton client tool"};

      /// Input tensor values kept in nested (non-flattened) form.
      /// NOTE(review): presumably filled once in initialize() from the file
      /// named by m_pixelFileName; execute() is const and cannot modify it.
      /// Confirm against the .cxx implementation.
      std::vector<std::vector<std::vector<float>>> m_input_tensor_values_notFlat;

      /// Read pixel data from the file at @p full_path.
      /// @param full_path Path of the file to read.
      /// @return Three-level nested vector of floats.
      /// NOTE(review): the name suggests one 2D image per outer element in
      /// MNIST idx3 format -- confirm against the .cxx implementation.
      std::vector<std::vector<std::vector<float>>>
      read_mnist_pixel_notFlat(const std::string& full_path) const;

      /// Collapse a two-level nested vector into a single flat vector.
      /// @param nestedVector Nested vector to flatten.
      /// @return Flat vector of floats.
      /// NOTE(review): element ordering is defined by the .cxx implementation,
      /// presumably row by row -- confirm.
      std::vector<float>
      flattenNestedVectors(const std::vector<std::vector<float>>& nestedVector) const;
   };


} // namespace AthInfer

AthReentrantAlgorithm.h

IAthInferenceTool.h

AthInfer::ExampleMLInferenceWithTriton
Algorithm demonstrating the usage of the Triton Client API.
Definition ExampleMLInferenceWithTriton.h:20

AthInfer::ExampleMLInferenceWithTriton::flattenNestedVectors
std::vector< float > flattenNestedVectors(const std::vector< std::vector< float > > &nestedVector) const

AthInfer::ExampleMLInferenceWithTriton::execute
virtual StatusCode execute(const EventContext &ctx) const override
Function executing the algorithm for a single event.
Definition ExampleMLInferenceWithTriton.cxx:32

AthInfer::ExampleMLInferenceWithTriton::initialize
virtual StatusCode initialize() override
Function initialising the algorithm.
Definition ExampleMLInferenceWithTriton.cxx:14

AthInfer::ExampleMLInferenceWithTriton::m_batchSize
Gaudi::Property< int > m_batchSize
The following properties need to be considered if the .onnx model is evaluated in batch mode.
Definition ExampleMLInferenceWithTriton.h:46

AthInfer::ExampleMLInferenceWithTriton::m_input_tensor_values_notFlat
std::vector< std::vector< std::vector< float > > > m_input_tensor_values_notFlat
Definition ExampleMLInferenceWithTriton.h:53

AthInfer::ExampleMLInferenceWithTriton::read_mnist_pixel_notFlat
std::vector< std::vector< std::vector< float > > > read_mnist_pixel_notFlat(const std::string &full_path) const
Definition ExampleMLInferenceWithTriton.cxx:89

AthInfer::ExampleMLInferenceWithTriton::m_pixelFileName
Gaudi::Property< std::string > m_pixelFileName
Name of the input pixel file to load.
Definition ExampleMLInferenceWithTriton.h:41

AthInfer::ExampleMLInferenceWithTriton::m_tritonTool
ToolHandle< AthInfer::IAthInferenceTool > m_tritonTool
Tool handle for the Triton client.
Definition ExampleMLInferenceWithTriton.h:49

AthReentrantAlgorithm
An algorithm that can be simultaneously executed in multiple threads.
Definition AthReentrantAlgorithm.h:74

AthInfer
Definition ExampleMLInferenceWithTriton.cxx:12