da/d8a/SPInferenceToolBase_8cxx_source.html

/*

    Copyright (C) 2002-2025 CERN for the benefit of the ATLAS collaboration

*/

#include "SPInferenceToolBase.h"


#include "AthenaBaseComps/AthMsgStreamMacros.h"

#include "MuonInferenceInterfaces/GraphData.h"

#include "MuonInferenceInterfaces/NodeFeatureList.h"

#include "PathResolver/PathResolver.h"

#include "Acts/Utilities/MathHelpers.hpp"

#include <span>


namespace {

    /// Streams the elements of a vector as "[v0, v1, ..., vN]".
    /// The separator is only written between two elements, i.e. an empty vector
    /// is printed as "[]" and no dangling ", " follows the last element.
    /// @param ostr: Stream to write to
    /// @param vec: Vector whose elements are printed with their own operator<<
    /// @return The stream that was passed in
    template <typename T>
        std::ostream& operator<<(std::ostream& ostr, const std::vector<T>& vec) {
            ostr << "[";
            bool firstElement{true};
            for (const T& val : vec) {
                // Prepend the separator to every element except the first one
                if (!firstElement) {
                    ostr << ", ";
                }
                ostr << val;
                firstElement = false;
            }
            ostr << "]";
            return ostr;
        }

    /// Streams a pair as "(first, second)", using the stream operators of both members.
    /// @param ostr: Stream to write to
    /// @param pair: Pair to print
    /// @return The stream that was passed in
    template <typename T1 , typename T2>
        std::ostream& operator<<(std::ostream& ostr, const std::pair<T1, T2>& pair) {
            const auto& [lhs, rhs] = pair;
            return ostr << "(" << lhs << ", " << rhs << ")";
        }


    /// Converts a flat edge list laid out as [src_0, ..., src_{E-1}, dst_0, ..., dst_{E-1}]
    /// into E (src, dst) pairs. E is half of the input size rounded down, so a trailing
    /// element of an odd-sized input is ignored.
    /// @param edges: Flat edge list, first half sources, second half destinations
    /// @return Vector of (source, destination) pairs in input order
    std::vector<std::pair<int64_t, int64_t>> makeIndexPairs(const std::vector<int64_t>& edges) {
        using Diff_t = std::vector<int64_t>::difference_type;
        const size_t half = edges.size() / 2;

        std::vector<std::pair<int64_t, int64_t>> paired;
        paired.reserve(half);

        // Walk the source and the destination halves in lock-step
        auto src = edges.cbegin();
        auto dst = src + static_cast<Diff_t>(half);
        for (const auto srcEnd = dst; src != srcEnd; ++src, ++dst) {
            paired.emplace_back(*src, *dst);
        }
        return paired;
    }


    /// Sorts a flat edge list laid out as [src_0, ..., src_{E-1}, dst_0, ..., dst_{E-1}]
    /// by source index and, for equal sources, by destination index.
    /// E is half of the input size rounded down.
    /// @param edges: Flat edge list, first half sources, second half destinations
    /// @return Flat edge list of size 2*E in the same layout, with the edges sorted
    std::vector<int64_t> makeSortedEdges(const std::vector<int64_t>& edges) {
        using Edge_t = std::pair<int64_t, int64_t>;
        const size_t half = edges.size() / 2;

        // Pair up the source with its destination
        std::vector<Edge_t> ordered;
        ordered.reserve(half);
        for (size_t e = 0; e < half; ++e) {
            ordered.emplace_back(edges[e], edges[half + e]);
        }

        // The lexicographic operator< of std::pair orders by src first, then by dst
        std::sort(ordered.begin(), ordered.end());

        // Unzip the pairs back into the flat [sorted_src..., sorted_dst...] layout
        std::vector<int64_t> flat(2 * half);
        for (size_t e = 0; e < half; ++e) {
            flat[e] = ordered[e].first;
            flat[half + e] = ordered[e].second;
        }
        return flat;
    }


    /// Formats a flat, node-major feature vector into a human readable multi-line string.
    /// The first two lines state the number of nodes and the number of features per node,
    /// followed by one "Node[i]: [f0, f1, ...]" line per node.
    /// @param featureLeaves: Flat feature vector; node i occupies the elements
    ///                       [i * numFeaturesPerNode, (i + 1) * numFeaturesPerNode)
    /// @param numFeaturesPerNode: Number of features stored per node. If it is zero,
    ///                            no node is printed.
    /// @return The formatted string
    std::string formatNodeFeatures(const std::vector<float>& featureLeaves, size_t numFeaturesPerNode) {
        std::ostringstream oss;

        // Guard the integer division: without any feature per node there is nothing to print
        const size_t numNodes = numFeaturesPerNode > 0 ? featureLeaves.size() / numFeaturesPerNode : 0;
        oss << "Number of nodes: " << numNodes << "\n";
        oss << "Features per node: " << numFeaturesPerNode << "\n";

        for (size_t nodeIdx = 0; nodeIdx < numNodes; ++nodeIdx) {
            oss << "Node[" << nodeIdx << "]: [";
            for (size_t f = 0; f < numFeaturesPerNode; ++f) {
                // Separator only between two features
                if (f > 0) oss << ", ";
                oss << featureLeaves[nodeIdx * numFeaturesPerNode + f];
            }
            oss << "]\n";
        }

        return oss.str();
    }

}

namespace MuonML{


    /// Returns the ONNX runtime session exposed by the session tool handle.
    Ort::Session& SPInferenceToolBase::model() const {
        Ort::Session& session = m_onnxSessionTool->session();
        return session;
    }


    /// Retrieves the ONNX session tool, initializes the space point read key and
    /// configures the node feature list from the "feature_names" entry of the
    /// model's custom metadata, which is decoded as JSON with one string per feature.
    /// The node connector is set to "fullyConnected".
    /// @return StatusCode::FAILURE if a tool / key cannot be set up, if the metadata
    ///         cannot be decoded, or if the resulting feature list is not valid.
    StatusCode SPInferenceToolBase::setupModel() {
        ATH_CHECK(m_onnxSessionTool.retrieve());
        ATH_CHECK(m_readKey.initialize());

        Ort::ModelMetadata metadata = model().GetModelMetadata();
        Ort::AllocatorWithDefaultOptions allocator;
        Ort::AllocatedStringPtr feature_json_ptr = metadata.LookupCustomMetadataMapAllocated("feature_names", allocator);

        if (feature_json_ptr) {
            const std::string feature_json = feature_json_ptr.get();
            // Malformed JSON or non-string entries make nlohmann::json throw. Translate
            // that into a regular failure instead of letting the exception escape.
            try {
                const nlohmann::json json_obj = nlohmann::json::parse(feature_json);
                for (const auto& feature : json_obj) {
                    m_graphFeatures.addFeature(feature.get<std::string>(), msgStream());
                }
            } catch (const nlohmann::json::exception& err) {
                ATH_MSG_FATAL("Failed to decode the 'feature_names' metadata of the model: "<<err.what());
                return StatusCode::FAILURE;
            }
        }
        m_graphFeatures.setConnector("fullyConnected", msgStream());

        if (!m_graphFeatures.isValid()) {
            ATH_MSG_FATAL("No graph features have been parsed. Please check the model: "<<m_graphFeatures.featureNames());
            return StatusCode::FAILURE;
        }
        return StatusCode::SUCCESS;
    }


    /// Fills the GraphRawData from the space point buckets read via m_readKey and
    /// constructs the two input tensors for the ONNX inference: the node features
    /// of shape (N, nFeatures) followed by the edge indices of shape (2, E).
    /// If the graph already exists and was built with the same feature list,
    /// the call returns immediately.
    ///
    /// The tensors wrap graphData.featureLeaves and graphData.srcEdges without copying
    /// them (ONNX Runtime tensors created from a user supplied buffer do not own it).
    /// Both vectors therefore stay populated after the call and must not be modified
    /// as long as graphData.graph is alive.
    /// @param ctx: Event context used to read the space point container
    /// @param graphData: Raw data cache that receives the graph
    /// @return StatusCode::FAILURE if the feature list is not valid or the
    ///         space point container is not present
    StatusCode SPInferenceToolBase::buildGraph(  const EventContext& ctx,
                                                    GraphRawData& graphData) const {

        // A graph built from a different feature list cannot be recycled
        if (graphData.previousList && (*graphData.previousList) != m_graphFeatures) {
            graphData.graph.reset();
        }
        if (graphData.graph) {
            return StatusCode::SUCCESS;
        }
        if (!m_graphFeatures.isValid()) {
            ATH_MSG_ERROR("The feature list is in complete. Either it has no features or no node connector set");
            return StatusCode::FAILURE;
        }

        SG::ReadHandle spacePoints{m_readKey, ctx};
        ATH_CHECK(spacePoints.isPresent());

        // Allocate the graph only once the input is known to be available. Otherwise a
        // failed call would leave an empty graph behind which the next call would
        // mistake for an already built one.
        graphData.graph = std::make_unique<InferenceGraph>();

        // Start from empty buffers. They are reset here and not after the tensor creation,
        // because the tensors keep pointing to the memory of featureLeaves & srcEdges.
        graphData.srcEdges.clear();
        graphData.desEdges.clear();
        graphData.featureLeaves.clear();

        // First pass: count the nodes & the possible connections to size the buffers
        int64_t nNodes{0}, possConn{0};
        graphData.spacePointsInBucket.clear();
        graphData.spacePointsInBucket.reserve(spacePoints->size());

        for (const MuonR4::SpacePointBucket* bucket : *spacePoints) {
            nNodes += graphData.spacePointsInBucket.emplace_back(bucket->size());
            possConn += Acts::sumUpToN(graphData.spacePointsInBucket.back());
        }

        graphData.nodeIndex = 0;
        graphData.featureLeaves.resize(nNodes * m_graphFeatures.numFeatures());
        graphData.currLeave = graphData.featureLeaves.begin();

        graphData.srcEdges.reserve(possConn);
        graphData.desEdges.reserve(possConn);

        // Second pass: let the feature list fill the raw data bucket by bucket
        for (const MuonR4::SpacePointBucket* bucket : *spacePoints) {
            const LayerSpBucket mlBucket{*bucket};
            m_graphFeatures.fillInData(mlBucket, graphData);
        }

        // Flatten the edges into a single buffer: [src_0, ..., src_E, dst_0, ..., dst_E]
        graphData.srcEdges.insert(graphData.srcEdges.end(), std::make_move_iterator(graphData.desEdges.begin()),
                                    std::make_move_iterator(graphData.desEdges.end()));

        ATH_MSG_DEBUG("Features:"<<m_graphFeatures.featureNames());
        ATH_MSG_DEBUG(formatNodeFeatures(graphData.featureLeaves, m_graphFeatures.numFeatures()));
        ATH_MSG_DEBUG("Edge indices:"<<makeIndexPairs(makeSortedEdges(graphData.srcEdges)));

        std::vector<int64_t> featShape{nNodes, static_cast<int64_t>(m_graphFeatures.numFeatures())};    // (N, nFeatures)
        std::vector<int64_t> edgeShape{2, static_cast<int64_t>(graphData.srcEdges.size() / 2)};         // (2, E)

        Ort::MemoryInfo memInfo = Ort::MemoryInfo::CreateCpu(OrtDeviceAllocator, OrtMemTypeCPU);
        graphData.graph->dataTensor.emplace_back(Ort::Value::CreateTensor<float>(memInfo,
                                                    graphData.featureLeaves.data(), graphData.featureLeaves.size(),
                                                    featShape.data(), featShape.size()));

        Ort::Value edge_tensor = Ort::Value::CreateTensor<int64_t>(memInfo, graphData.srcEdges.data(),
            graphData.srcEdges.size(), edgeShape.data(), edgeShape.size());

        graphData.graph->dataTensor.emplace_back(std::move(edge_tensor));

        graphData.previousList = &m_graphFeatures;

        // The destination edges were copied into srcEdges and are not referenced by any tensor.
        // featureLeaves & srcEdges are deliberately left untouched (see above).
        graphData.desEdges.clear();
        ATH_MSG_DEBUG("Graph data built successfully.");
        return StatusCode::SUCCESS;
    }


    /// Runs the ONNX model on the graph stored in graphData. The first two tensors of
    /// graphData.graph->dataTensor are passed as the inputs "features" and "edge_index".
    /// The tensor of the model output "output" is appended to the same vector, after
    /// every non-finite prediction has been replaced by -100.
    /// @param graphData: Raw data holding the graph built beforehand
    /// @return StatusCode::FAILURE if the feature list is not valid, the graph is missing,
    ///         fewer than two input tensors are available or the inference returns nothing
    StatusCode SPInferenceToolBase::runInference(GraphRawData& graphData) const {
        if (!m_graphFeatures.isValid()) {
            ATH_MSG_ERROR("ONNX model is not loaded. Please call setupModel()");
            return StatusCode::FAILURE;
        }
        if (!graphData.graph) {
            ATH_MSG_ERROR("Graph data is not built.");
            return StatusCode::FAILURE;
        }

        if (graphData.graph->dataTensor.size() < 2) {
            ATH_MSG_ERROR("Data tensor does not contain both feature and edge tensors.");
            return StatusCode::FAILURE;
        }

        std::vector<const char*> inputNames  = {"features", "edge_index"};
        std::vector<const char*> outputNames = {"output"};

        Ort::RunOptions run_options;
        run_options.SetRunLogSeverityLevel(ORT_LOGGING_LEVEL_WARNING);

        // The number of inputs is given by the number of input names. The tensor vector may
        // hold more entries, e.g. the output appended by a previous call, and using its size
        // would make the session read beyond the end of inputNames.
        std::vector<Ort::Value> outputTensors = model().Run(run_options,
                                                inputNames.data(),                    // input tensor names
                                                graphData.graph->dataTensor.data(),  // pointer to the tensor vector
                                                inputNames.size(),                    // number of input tensors
                                                outputNames.data(),                  // output tensor names
                                                outputNames.size());                 // number of output tensors

        if (outputTensors.empty()) {
            ATH_MSG_ERROR("Inference returned empty output.");
            return StatusCode::FAILURE;
        }

        float* output_data = outputTensors[0].GetTensorMutableData<float>();
        size_t output_size = outputTensors[0].GetTensorTypeAndShapeInfo().GetElementCount();

        std::span<float> predictions(output_data, output_data + output_size);

        // Sanitize the predictions in place before they are handed to the caller
        for (float& prediction : predictions) {
            if (!std::isfinite(prediction)) {
                ATH_MSG_WARNING("Non-finite prediction detected! Setting to -100..");
                prediction = -100.0f;
            }
        }

        graphData.graph->dataTensor.emplace_back(std::move(outputTensors[0]));

        return StatusCode::SUCCESS;
    }


}


ATH_CHECK
#define ATH_CHECK
Evaluate an expression and check for errors.
Definition AthCheckMacros.h:40

AthMsgStreamMacros.h

ATH_MSG_ERROR
#define ATH_MSG_ERROR(x)
Definition AthMsgStreamMacros.h:33

ATH_MSG_FATAL
#define ATH_MSG_FATAL(x)
Definition AthMsgStreamMacros.h:34

ATH_MSG_WARNING
#define ATH_MSG_WARNING(x)
Definition AthMsgStreamMacros.h:32

ATH_MSG_DEBUG
#define ATH_MSG_DEBUG(x)
Definition AthMsgStreamMacros.h:29

vec
std::vector< size_t > vec
Definition CombinationsGeneratorTest.cxx:9

GraphData.h

a
static Double_t a
Definition LArPhysWaveHECTool.cxx:38

NodeFeatureList.h

PathResolver.h

SPInferenceToolBase.h

operator<<
std::ostream & operator<<(std::ostream &lhs, const TestGaudiProperty &rhs)
Definition TestGaudiProperty.cxx:69

MuonML::LayerSpBucket
The LayerSpBucket is a space point bucket where the points are internally sorted by their layer number...
Definition LayerBucket.h:14

MuonML::SPInferenceToolBase::m_graphFeatures
NodeFeatureList m_graphFeatures
List of features to be used for the inference.
Definition SPInferenceToolBase.h:44

MuonML::SPInferenceToolBase::runInference
StatusCode runInference(GraphRawData &graphData) const
Definition SPInferenceToolBase.cxx:188

MuonML::SPInferenceToolBase::m_onnxSessionTool
ToolHandle< AthOnnx::IOnnxRuntimeSessionTool > m_onnxSessionTool
Definition SPInferenceToolBase.h:45

MuonML::SPInferenceToolBase::model
Ort::Session & model() const
Definition SPInferenceToolBase.cxx:87

MuonML::SPInferenceToolBase::buildGraph
StatusCode buildGraph(const EventContext &ctx, GraphRawData &graphData) const
Fill up the GraphRawData and construct the graph for the ML inference with ONNX.
Definition SPInferenceToolBase.cxx:114

MuonML::SPInferenceToolBase::m_readKey
SG::ReadHandleKey< MuonR4::SpacePointContainer > m_readKey
Input space points to filter.
Definition SPInferenceToolBase.h:41

MuonML::SPInferenceToolBase::setupModel
StatusCode setupModel()
Definition SPInferenceToolBase.cxx:90

MuonR4::SpacePointBucket
: The muon space point bucket represents a collection of points that will be processed together in t...
Definition MuonSpectrometer/MuonPhaseII/Event/MuonSpacePoint/MuonSpacePoint/SpacePointContainer.h:21

SG::ReadHandle
Definition StoreGate/StoreGate/ReadHandle.h:67

pair
STL class.

MuonML
Definition BucketGraphUtils.h:19

Pythia8_RapidityOrderMPI.val
val
Definition Pythia8_RapidityOrderMPI.py:14

hist_file_dump.f
f
Definition hist_file_dump.py:140

lumiFormat.i
int i
Definition lumiFormat.py:85

std::sort
void sort(typename DataModel_detail::iterator< DVL > beg, typename DataModel_detail::iterator< DVL > end)
Specialization of sort for DataVector/List.
Definition DVL_algorithms.h:554

MuonML::GraphRawData
Helper struct to ship the Graph from the space point buckets to ONNX.
Definition GraphData.h:25

MuonML::GraphRawData::featureLeaves
FeatureVec_t featureLeaves
Vector containing all features.
Definition GraphData.h:30

MuonML::GraphRawData::graph
std::unique_ptr< InferenceGraph > graph
Pointer to the graph to be parsed to ONNX.
Definition GraphData.h:46

MuonML::GraphRawData::nodeIndex
unsigned int nodeIndex
Number of the already filled nodes.
Definition GraphData.h:52

MuonML::GraphRawData::previousList
const NodeFeatureList * previousList
Pointer to the latest parsed NodeFeatureList.
Definition GraphData.h:44

MuonML::GraphRawData::currLeave
std::vector< float >::iterator currLeave
The following variables are needed to consistently fill the raw data for the Graph Building.
Definition GraphData.h:50

MuonML::GraphRawData::srcEdges
EdgeCounterVec_t srcEdges
Vector encoding the source index of the.
Definition GraphData.h:32

MuonML::GraphRawData::desEdges
EdgeCounterVec_t desEdges
Vect.
Definition GraphData.h:34

MuonML::GraphRawData::spacePointsInBucket
NodeConnectVec_t spacePointsInBucket
Vector keeping track of how many space points are in each parsed bucket.
Definition GraphData.h:36