ATLAS Offline Software
Loading...
Searching...
No Matches
MVAUtils::ForestXGBoost Class Reference final abstract

Implement XGBoost with nan support. More...

#include <ForestXGBoost.h>

Inheritance diagram for MVAUtils::ForestXGBoost:
Collaboration diagram for MVAUtils::ForestXGBoost:

Public Member Functions

 ForestXGBoost (TTree *tree)
 ForestXGBoost ()=default
 ForestXGBoost (const ForestXGBoost &)=default
ForestXGBoost & operator= (const ForestXGBoost &)=default
 ForestXGBoost (ForestXGBoost &&)=default
ForestXGBoost & operator= (ForestXGBoost &&)=default
 ~ForestXGBoost ()=default
virtual TTree * WriteTree (TString name) const override
 Return a TTree representing the BDT.
virtual void PrintForest () const override
virtual int GetNVars () const override
 Get the number of input variables to be passed with std::vector to Get* methods.
virtual float GetClassification (const std::vector< float > &values) const final
 Compute the prediction of a classification.
virtual float GetClassification (const std::vector< float * > &pointers) const=0
virtual float GetTreeResponse (const std::vector< float > &values, unsigned int itree) const override final
 Return the response of one tree. Must pass the features in a std::vector<float> values and the index of the tree.
virtual float GetTreeResponse (const std::vector< float * > &pointers, unsigned int itree) const =0
virtual float GetOffset () const override
 Return the offset of the forest.
virtual float GetRawResponse (const std::vector< float > &values) const override final
 Return the response of the whole Forest.
virtual float GetRawResponse (const std::vector< float * > &pointers) const =0
virtual float GetResponse (const std::vector< float > &values) const override
 Compute the prediction for regression.
virtual float GetResponse (const std::vector< float * > &pointers) const =0
virtual std::vector< float > GetMultiResponse (const std::vector< float > &values, unsigned int numClasses) const override
 Compute the prediction for multiclassification (a score for each class).
virtual std::vector< float > GetMultiResponse (const std::vector< float * > &pointers, unsigned int numClasses) const =0
virtual unsigned int GetNTrees () const override final
virtual void PrintTree (unsigned int itree) const override
std::vector< NodeXGBoost > GetTree (unsigned int itree) const
 Return the vector of nodes for the tree itree.

Protected Member Functions

float GetTreeResponseFromNode (const std::vector< float > &values, index_t index) const
 Get the response of a tree.
void newTree (const std::vector< NodeXGBoost > &nodes)
 append a new tree (defined by a vector of nodes serialized in preorder) to the forest

Private Attributes

int m_max_var =0
std::vector< index_t > m_forest
 indices of the top-level nodes of each tree
std::vector< NodeXGBoost > m_nodes
 where the nodes of the forest are stored

Detailed Description

Implement XGBoost with nan support.

Definition at line 44 of file ForestXGBoost.h.

Constructor & Destructor Documentation

◆ ForestXGBoost() [1/4]

ForestXGBoost::ForestXGBoost ( TTree * tree)
explicit

Definition at line 12 of file ForestXGBoost.cxx.

13 : ForestXGBoostBase<NodeXGBoost>()
14 , m_max_var(0)
15{
16
17
18 // variables read from the TTree
19 std::vector<int> *vars = nullptr;
20 std::vector<float> *values = nullptr;
21 std::vector<bool> *default_left = nullptr;
22
23 std::vector<NodeXGBoost> nodes;
24
25 tree->SetBranchAddress("vars", &vars);
26 tree->SetBranchAddress("values", &values);
27 tree->SetBranchAddress("default_left", &default_left);
28
29 for (int i = 0; i < tree->GetEntries(); ++i)
30 {
31 // each entry in the TTree is a decision tree
32 tree->GetEntry(i);
33 if (!vars) { throw std::runtime_error("vars pointer is null in ForestXGBoost constructor"); }
34 if (!values) { throw std::runtime_error("values pointers is null in ForestXGBoost constructor"); }
35 if (!default_left) { throw std::runtime_error("default_left pointers is null in ForestXGBoost constructor"); }
36 if (vars->size() != values->size()) { throw std::runtime_error("inconsistent size for vars and values in ForestXGBoost constructor"); }
37 if (default_left->size() != values->size()) { throw std::runtime_error("inconsistent size for default_left and values in ForestXGBoost constructor"); }
38
39 nodes.clear();
40
41 std::vector<MVAUtils::index_t> right = detail::computeRight(*vars);
42
43 for (size_t i = 0; i < vars->size(); ++i) {
44 nodes.emplace_back(vars->at(i), values->at(i), right[i], default_left->at(i));
45 if (vars->at(i) > m_max_var) { m_max_var = vars->at(i); }
46 }
47 newTree(nodes);
48 } // end loop on TTree, all decision tree loaded
49 delete vars;
50 delete values;
51 delete default_left;
52}
void newTree(const std::vector< NodeXGBoost > &nodes)
std::vector< index_t > computeRight(const std::vector< int > &vars)
Compute the offsets between the nodes to their right children from a serialized representation of the...
TChain * tree

◆ ForestXGBoost() [2/4]

MVAUtils::ForestXGBoost::ForestXGBoost ( )
default

◆ ForestXGBoost() [3/4]

MVAUtils::ForestXGBoost::ForestXGBoost ( const ForestXGBoost & )
default

◆ ForestXGBoost() [4/4]

MVAUtils::ForestXGBoost::ForestXGBoost ( ForestXGBoost && )
default

◆ ~ForestXGBoost()

MVAUtils::ForestXGBoost::~ForestXGBoost ( )
default

Member Function Documentation

◆ GetClassification() [1/2]

virtual float MVAUtils::IForest::GetClassification ( const std::vector< float * > & pointers) const
pure virtual inherited

◆ GetClassification() [2/2]

virtual float MVAUtils::ForestXGBoostBase< NodeXGBoost >::GetClassification ( const std::vector< float > & values) const
inline final virtual inherited

Compute the prediction of a classification.

Implements MVAUtils::IForest.

Definition at line 33 of file ForestXGBoost.h.

34 {
36 }
virtual float GetResponse(const std::vector< float > &values) const override
T sigmoid(T x)
Definition Forest.h:21

◆ GetMultiResponse() [1/2]

virtual std::vector< float > MVAUtils::Forest< NodeXGBoost >::GetMultiResponse ( const std::vector< float > & values,
unsigned int numClasses ) const
override virtual inherited

Compute the prediction for multiclassification (a score for each class).

In addition to the input values, the number of classes must be passed.

Implements MVAUtils::IForest.

◆ GetMultiResponse() [2/2]

virtual std::vector< float > MVAUtils::IForest::GetMultiResponse ( const std::vector< float * > & pointers,
unsigned int numClasses ) const
pure virtual inherited

Implemented in MVAUtils::Forest< Node_t >.

◆ GetNTrees()

virtual unsigned int MVAUtils::Forest< NodeXGBoost >::GetNTrees ( ) const
inline final override virtual inherited

Implements MVAUtils::IForest.

Definition at line 94 of file Forest.h.

95 {
96 return m_forest.size();
97 }
Generic Forest base class.
Definition Forest.h:54

◆ GetNVars()

virtual int MVAUtils::ForestXGBoost::GetNVars ( ) const
inline override virtual

Get the number of input variables to be passed with std::vector to Get* methods.

Implements MVAUtils::IForest.

Definition at line 57 of file ForestXGBoost.h.

57{ return m_max_var + 1; }

◆ GetOffset()

virtual float MVAUtils::Forest< NodeXGBoost >::GetOffset ( ) const
inline override virtual inherited

Return the offset of the forest.

Since by default there is no offset, return 0

Implements MVAUtils::IForest.

Definition at line 63 of file Forest.h.

63{ return 0.; }

◆ GetRawResponse() [1/2]

virtual float MVAUtils::Forest< NodeXGBoost >::GetRawResponse ( const std::vector< float > & values) const
final override virtual inherited

Return the response of the whole Forest.

The raw response is just the sum of all the trees.

Implements MVAUtils::IForest.

◆ GetRawResponse() [2/2]

virtual float MVAUtils::IForest::GetRawResponse ( const std::vector< float * > & pointers) const
pure virtual inherited

Implemented in MVAUtils::Forest< Node_t >.

◆ GetResponse() [1/2]

virtual float MVAUtils::Forest< NodeXGBoost >::GetResponse ( const std::vector< float > & values) const
override virtual inherited

Compute the prediction for regression.

Implements MVAUtils::IForest.

◆ GetResponse() [2/2]

virtual float MVAUtils::IForest::GetResponse ( const std::vector< float * > & pointers) const
pure virtual inherited

◆ GetTree()

std::vector< NodeXGBoost > MVAUtils::Forest< NodeXGBoost >::GetTree ( unsigned int itree) const
inherited

Return the vector of nodes for the tree itree.

◆ GetTreeResponse() [1/2]

virtual float MVAUtils::Forest< NodeXGBoost >::GetTreeResponse ( const std::vector< float > & values,
unsigned int itree ) const
final override virtual inherited

Return the response of one tree. Must pass the features in a std::vector<float> values and the index of the tree.

Implements MVAUtils::IForest.

◆ GetTreeResponse() [2/2]

virtual float MVAUtils::IForest::GetTreeResponse ( const std::vector< float * > & pointers,
unsigned int itree ) const
pure virtual inherited

Implemented in MVAUtils::Forest< Node_t >.

◆ GetTreeResponseFromNode()

float MVAUtils::Forest< NodeXGBoost >::GetTreeResponseFromNode ( const std::vector< float > & values,
index_t index ) const
protected inherited

Get the response of a tree.

Instead of specifying the index of the tree (as in GetTreeResponse), the index of the top node of the tree should be specified.

◆ newTree()

void MVAUtils::Forest< NodeXGBoost >::newTree ( const std::vector< NodeXGBoost > & nodes)
protected inherited

append a new tree (defined by a vector of nodes serialized in preorder) to the forest

◆ operator=() [1/2]

ForestXGBoost & MVAUtils::ForestXGBoost::operator= ( const ForestXGBoost & )
default

◆ operator=() [2/2]

ForestXGBoost & MVAUtils::ForestXGBoost::operator= ( ForestXGBoost && )
default

◆ PrintForest()

void ForestXGBoost::PrintForest ( ) const
override virtual

Reimplemented from MVAUtils::Forest< NodeXGBoost >.

Definition at line 81 of file ForestXGBoost.cxx.

82{
83 std::cout << "***BDT XGBoost: Printing entire forest***" << std::endl;
85}
virtual void PrintForest() const override

◆ PrintTree()

virtual void MVAUtils::Forest< NodeXGBoost >::PrintTree ( unsigned int itree) const
override virtual inherited

Implements MVAUtils::IForest.

◆ WriteTree()

TTree * ForestXGBoost::WriteTree ( TString ) const
override virtual

Return a TTree representing the BDT.

The caller is the owner of the returned TTree.

Implements MVAUtils::IForest.

Definition at line 55 of file ForestXGBoost.cxx.

56{
57 TTree *tree = new TTree(name.Data(), "creator=xgboost");
58
59 std::vector<int> vars;
60 std::vector<float> values;
61 std::vector<bool> default_left;
62
63 tree->Branch("vars", &vars);
64 tree->Branch("values", &values);
65 tree->Branch("default_left", &default_left);
66
67 for (size_t itree = 0; itree < GetNTrees(); ++itree) {
68 vars.clear();
69 values.clear();
70 default_left.clear();
71 for(const auto& node : GetTree(itree)) {
72 vars.push_back(node.GetVar());
73 values.push_back(node.GetVal());
74 default_left.push_back(node.GetDefaultLeft());
75 }
76 tree->Fill();
77 }
78 return tree;
79}
std::vector< NodeXGBoost > GetTree(unsigned int itree) const
virtual unsigned int GetNTrees() const override final
Definition Forest.h:94

Member Data Documentation

◆ m_forest

std::vector<index_t> MVAUtils::Forest< NodeXGBoost >::m_forest
private inherited

indices of the top-level nodes of each tree

Definition at line 117 of file Forest.h.

◆ m_max_var

int MVAUtils::ForestXGBoost::m_max_var =0
private

Definition at line 59 of file ForestXGBoost.h.

◆ m_nodes

std::vector<NodeXGBoost> MVAUtils::Forest< NodeXGBoost >::m_nodes
private inherited

where the nodes of the forest are stored

Definition at line 118 of file Forest.h.


The documentation for this class was generated from the following files: