Skip to content
Snippets Groups Projects
Commit 04b359fa authored by Christos Anastopoulos's avatar Christos Anastopoulos
Browse files

MVAUtils, move small methods to .icc, use final, remove virtual when seem it is not needed

parent 16dcd668
6 merge requests!58791DataQualityConfigurations: Modify L1Calo config for web display,!46784MuonCondInterface: Enable thread-safety checking.,!46776Updated LArMonitoring config file for WD to match new files produced using MT,!45405updated ART test cron job,!42417Draft: DIRE and VINCIA Base Fragments for Pythia 8.3,!38072MVAUtils, move small methods to .icc, use final, remove virtual when seem it is not needed
...@@ -106,33 +106,7 @@ namespace MVAUtils ...@@ -106,33 +106,7 @@ namespace MVAUtils
std::unique_ptr<IForest> m_forest; //!< the implementation of the forest, doing the hard work std::unique_ptr<IForest> m_forest; //!< the implementation of the forest, doing the hard work
std::vector<float*> m_pointers; //!< where vars to cut on can be set (but can also be passed) std::vector<float*> m_pointers; //!< where vars to cut on can be set (but can also be passed)
}; };
inline float BDT::GetResponse() const {
return (!m_pointers.empty() ? GetResponse(m_pointers) : -9999.);
}
inline float BDT::GetClassification() const {
return (!m_pointers.empty() ? GetClassification(m_pointers) : -9999.);
}
inline std::vector<float> BDT::GetMultiResponse(unsigned int numClasses) const {
return (!m_pointers.empty() ? GetMultiResponse(m_pointers, numClasses) : std::vector<float>());
}
inline std::vector<float> BDT::GetValues() const {
std::vector<float> result;
for (float* ptr : m_pointers)
{
assert (ptr);
result.push_back(*ptr);
}
return result;
}
inline const std::vector<float*>& BDT::GetPointers() const { return m_pointers; }
inline void BDT::SetPointers(const std::vector<float*>& pointers) { m_pointers = pointers; }
} }
#include "MVAUtils/BDT.icc"
#endif #endif
/*
Copyright (C) 2002-2020 CERN for the benefit of the ATLAS collaboration
*/
namespace MVAUtils {
inline float
BDT::GetResponse() const
{
return (!m_pointers.empty() ? GetResponse(m_pointers) : -9999.);
}
inline float
BDT::GetClassification() const
{
return (!m_pointers.empty() ? GetClassification(m_pointers) : -9999.);
}
inline std::vector<float>
BDT::GetMultiResponse(unsigned int numClasses) const
{
return (!m_pointers.empty() ? GetMultiResponse(m_pointers, numClasses)
: std::vector<float>());
}
inline std::vector<float>
BDT::GetValues() const
{
std::vector<float> result;
for (float* ptr : m_pointers) {
assert(ptr);
result.push_back(*ptr);
}
return result;
}
inline const std::vector<float*>&
BDT::GetPointers() const
{
return m_pointers;
}
inline void
BDT::SetPointers(const std::vector<float*>& pointers)
{
m_pointers = pointers;
}
inline unsigned int
BDT::GetNTrees() const
{
return m_forest->GetNTrees();
}
inline int
BDT::GetNVars() const
{
return m_forest->GetNVars();
}
inline float
BDT::GetOffset() const
{
return m_forest->GetOffset();
}
/** Return offset + the sum of the response of each tree **/
inline float
BDT::GetResponse(const std::vector<float>& values) const
{
return m_forest->GetResponse(values);
}
/** Return offset + the sum of the response of each tree **/
inline float
BDT::GetResponse(const std::vector<float*>& pointers) const
{
return m_forest->GetResponse(pointers);
}
inline float
BDT::GetClassification(const std::vector<float>& values) const
{
return m_forest->GetClassification(values);
}
inline float
BDT::GetClassification(const std::vector<float*>& pointers) const
{
return m_forest->GetClassification(pointers);
}
inline float
BDT::GetGradBoostMVA(const std::vector<float>& values) const
{
const float sum = m_forest->GetRawResponse(values); // ignores the offset
return 2. / (1 + std::exp(-2 * sum)) -
1; // output shaping for gradient boosted decision tree (-1,1)
}
inline float
BDT::GetGradBoostMVA(const std::vector<float*>& pointers) const
{
const float sum = m_forest->GetRawResponse(pointers); // ignores the offset
// output shaping for gradient boosted decision tree (-1,1)
return 2. / (1 + std::exp(-2 * sum)) - 1;
}
inline std::vector<float>
BDT::GetMultiResponse(const std::vector<float>& values,
unsigned int numClasses) const
{
return m_forest->GetMultiResponse(values, numClasses);
}
inline std::vector<float>
BDT::GetMultiResponse(const std::vector<float*>& pointers,
unsigned int numClasses) const
{
return m_forest->GetMultiResponse(pointers, numClasses);
}
inline float
BDT::GetTreeResponse(const std::vector<float>& values,
MVAUtils::index_t index) const
{
return m_forest->GetTreeResponse(values, index);
}
inline float
BDT::GetTreeResponse(const std::vector<float*>& pointers,
MVAUtils::index_t index) const
{
return m_forest->GetTreeResponse(pointers, index);
}
}
...@@ -53,43 +53,55 @@ namespace MVAUtils ...@@ -53,43 +53,55 @@ namespace MVAUtils
class Forest : public IForest class Forest : public IForest
{ {
public: public:
virtual float GetTreeResponse(const std::vector<float>& values,
virtual float GetTreeResponse(const std::vector<float>& values, unsigned int itree) const override; unsigned int itree) const override final;
virtual float GetTreeResponse(const std::vector<float*>& pointers, unsigned int itree) const override; virtual float GetTreeResponse(const std::vector<float*>& pointers,
unsigned int itree) const override final;
/** Return the offset of the forest. Since by default there is no offset, return 0 */
virtual float GetOffset() const override { return 0.; } /** Return the offset of the forest. Since by default there is no offset,
* return 0 */
/** Return the response of the whole Forest. Raw is just the sum of all the trees **/ virtual float GetOffset() const override { return 0.; }
// The method is not `final`, but it is very unlikely the derived class
// will redefine this (since it is "raw") /** Return the response of the whole Forest. Raw is just the sum of all
virtual float GetRawResponse(const std::vector<float>& values) const override; * the trees **/
virtual float GetRawResponse(const std::vector<float*>& pointers) const override; virtual float GetRawResponse(
const std::vector<float>& values) const override final;
/** Compute the prediction for regression **/ virtual float GetRawResponse(
// In this class it is equal to the raw-reponse. Derived class should const std::vector<float*>& pointers) const override final;
// override this.
virtual float GetResponse(const std::vector<float>& values) const override; /** Compute the prediction for regression **/
virtual float GetResponse(const std::vector<float*>& pointers) const override; // In this class it is equal to the raw-reponse. Derived class should
// override this.
/** Compute the prediction for multiclassification (a score for each class). virtual float GetResponse(
* In addition to the input values need to pass the number of classes const std::vector<float>& values) const override;
**/ virtual float GetResponse(
// Since TMVA and lgbm are identical the common implementation is here: const std::vector<float*>& pointers) const override;
// Return the softmax of the sub-forest raw-response
virtual std::vector<float> GetMultiResponse(const std::vector<float>& values, /** Compute the prediction for multiclassification (a score for each
unsigned int numClasses) const override; *class). In addition to the input values need to pass the number of
virtual std::vector<float> GetMultiResponse(const std::vector<float*>& pointers, *classes
unsigned int numClasses) const override; **/
// Since TMVA and lgbm are identical the common implementation is here:
virtual unsigned int GetNTrees() const final { return m_forest.size(); } // Return the softmax of the sub-forest raw-response
virtual std::vector<float> GetMultiResponse(
virtual void PrintForest() const override; const std::vector<float>& values,
unsigned int numClasses) const override;
virtual void PrintTree(unsigned int itree) const override;
virtual std::vector<float> GetMultiResponse(
/** Return the vector of nodes for the tree itree **/ const std::vector<float*>& pointers,
virtual std::vector<Node_t> GetTree(unsigned int itree) const final; unsigned int numClasses) const override;
virtual unsigned int GetNTrees() const override final
{
return m_forest.size();
}
virtual void PrintForest() const override;
virtual void PrintTree(unsigned int itree) const override;
/** Return the vector of nodes for the tree itree **/
std::vector<Node_t> GetTree(unsigned int itree) const;
protected: protected:
/** Get the response of a tree. Instead of specifying the index of the tree /** Get the response of a tree. Instead of specifying the index of the tree
......
...@@ -49,7 +49,6 @@ namespace MVAUtils ...@@ -49,7 +49,6 @@ namespace MVAUtils
ForestLGBMSimple (ForestLGBMSimple&&) = default; ForestLGBMSimple (ForestLGBMSimple&&) = default;
ForestLGBMSimple& operator=(ForestLGBMSimple&&) = default; ForestLGBMSimple& operator=(ForestLGBMSimple&&) = default;
~ForestLGBMSimple()=default; ~ForestLGBMSimple()=default;
virtual TTree* WriteTree(TString name) const override; virtual TTree* WriteTree(TString name) const override;
virtual void PrintForest() const override; virtual void PrintForest() const override;
virtual int GetNVars() const override { return m_max_var + 1; } virtual int GetNVars() const override { return m_max_var + 1; }
...@@ -69,7 +68,6 @@ namespace MVAUtils ...@@ -69,7 +68,6 @@ namespace MVAUtils
ForestLGBM (ForestLGBM&&) = default; ForestLGBM (ForestLGBM&&) = default;
ForestLGBM& operator=(ForestLGBM&&) = default; ForestLGBM& operator=(ForestLGBM&&) = default;
~ForestLGBM()=default; ~ForestLGBM()=default;
virtual TTree* WriteTree(TString name) const override; virtual TTree* WriteTree(TString name) const override;
virtual void PrintForest() const override; virtual void PrintForest() const override;
virtual int GetNVars() const override { return m_max_var + 1; } virtual int GetNVars() const override { return m_max_var + 1; }
......
...@@ -25,22 +25,16 @@ namespace MVAUtils ...@@ -25,22 +25,16 @@ namespace MVAUtils
public: public:
ForestWeighted() : m_sumWeights(0.) { } ForestWeighted() : m_sumWeights(0.) { }
float GetTreeResponseWeighted(const std::vector<float>& values, unsigned int itree) const using Forest<Node_t>::GetNTrees;
{
return Forest<Node_t>::GetTreeResponse(values, itree) * m_weights[itree];
}
float GetTreeResponseWeighted(const std::vector<float*>& pointers, unsigned int itree) const
{
return Forest<Node_t>::GetTreeResponse(pointers, itree) * m_weights[itree];
}
using Forest<Node_t>::GetNTrees; // lookup is deferred until template paramers are known, force it
using Forest<Node_t>::newTree; using Forest<Node_t>::newTree;
float GetTreeResponseWeighted(const std::vector<float>& values, unsigned int itree) const;
float GetTreeResponseWeighted(const std::vector<float*>& pointers, unsigned int itree) const;
float GetWeightedResponse(const std::vector<float>& values) const; float GetWeightedResponse(const std::vector<float>& values) const;
float GetWeightedResponse(const std::vector<float*>& pointers) const; float GetWeightedResponse(const std::vector<float*>& pointers) const;
virtual void newTree(const std::vector<Node_t>& nodes, float weight);
void newTree(const std::vector<Node_t>& nodes, float weight);
float GetTreeWeight(unsigned int itree) const { return m_weights[itree]; } float GetTreeWeight(unsigned int itree) const { return m_weights[itree]; }
float GetSumWeights() const { return m_sumWeights; } float GetSumWeights() const { return m_sumWeights; }
...@@ -57,33 +51,6 @@ namespace MVAUtils ...@@ -57,33 +51,6 @@ namespace MVAUtils
}; };
template<typename Node_t>
float ForestWeighted<Node_t>::GetWeightedResponse(const std::vector<float>& values) const {
float result = 0.;
for (unsigned int itree = 0; itree != GetNTrees(); ++itree)
{
result += GetTreeResponseWeighted(values, itree);
}
return result;
}
template<typename Node_t>
float ForestWeighted<Node_t>::GetWeightedResponse(const std::vector<float*>& pointers) const {
float result = 0.;
for (unsigned int itree = 0; itree != GetNTrees(); ++itree)
{
result += GetTreeResponseWeighted(pointers, itree);
}
return result;
}
template<typename Node_t>
void ForestWeighted<Node_t>::newTree(const std::vector<Node_t>& nodes, float weight) {
newTree(nodes);
m_weights.push_back(weight);
m_sumWeights += weight;
}
/* /*
* Support TMVA processing * Support TMVA processing
* *
...@@ -118,5 +85,5 @@ namespace MVAUtils ...@@ -118,5 +85,5 @@ namespace MVAUtils
}; };
} }
#include "MVAUtils/ForestTMVA.icc"
#endif #endif
/*
Copyright (C) 2002-2019 CERN for the benefit of the ATLAS collaboration
*/
namespace MVAUtils {
template<typename Node_t>
float
ForestWeighted<Node_t>::GetTreeResponseWeighted(
const std::vector<float>& values,
unsigned int itree) const
{
return Forest<Node_t>::GetTreeResponse(values, itree) * m_weights[itree];
}
template<typename Node_t>
float
ForestWeighted<Node_t>::GetTreeResponseWeighted(
const std::vector<float*>& pointers,
unsigned int itree) const
{
return Forest<Node_t>::GetTreeResponse(pointers, itree) * m_weights[itree];
}
template<typename Node_t>
float
ForestWeighted<Node_t>::GetWeightedResponse(
const std::vector<float>& values) const
{
float result = 0.;
for (unsigned int itree = 0; itree != GetNTrees(); ++itree) {
result += GetTreeResponseWeighted(values, itree);
}
return result;
}
template<typename Node_t>
float
ForestWeighted<Node_t>::GetWeightedResponse(
const std::vector<float*>& pointers) const
{
float result = 0.;
for (unsigned int itree = 0; itree != GetNTrees(); ++itree) {
result += GetTreeResponseWeighted(pointers, itree);
}
return result;
}
template<typename Node_t>
void
ForestWeighted<Node_t>::newTree(const std::vector<Node_t>& nodes, float weight)
{
newTree(nodes);
m_weights.push_back(weight);
m_sumWeights += weight;
}
inline float
ForestTMVA::GetResponse(const std::vector<float>& values) const
{
return GetRawResponse(values) + GetOffset();
}
inline float
ForestTMVA::GetResponse(const std::vector<float*>& pointers) const
{
return GetRawResponse(pointers) + GetOffset();
}
inline float
ForestTMVA::GetClassification(const std::vector<float>& values) const
{
float result = GetWeightedResponse(values);
return result / GetSumWeights();
}
inline float
ForestTMVA::GetClassification(const std::vector<float*>& pointers) const
{
float result = GetWeightedResponse(pointers);
return result / GetSumWeights();
}
}
...@@ -30,7 +30,7 @@ std::string get_default_string_map(const std::map <std::string, std::string> & m ...@@ -30,7 +30,7 @@ std::string get_default_string_map(const std::map <std::string, std::string> & m
{ {
std::map<std::string, std::string>::const_iterator it = m.find(key); std::map<std::string, std::string>::const_iterator it = m.find(key);
if (it == m.end()) { return defval; } if (it == m.end()) { return defval; }
return it->second; return it->second;
} }
std::map<std::string, std::string> parseOptions(const std::string& raw_options) std::map<std::string, std::string> parseOptions(const std::string& raw_options)
...@@ -44,7 +44,8 @@ std::map<std::string, std::string> parseOptions(const std::string& raw_options) ...@@ -44,7 +44,8 @@ std::map<std::string, std::string> parseOptions(const std::string& raw_options)
const auto left = item.substr(0, pos); const auto left = item.substr(0, pos);
if (!options.insert(std::make_pair(left, right)).second) if (!options.insert(std::make_pair(left, right)).second)
{ {
throw std::runtime_error(std::string("option ") + left + " duplicated in title of TTree used as input"); throw std::runtime_error(std::string("option ") + left +
" duplicated in title of TTree used as input");
} }
} }
...@@ -64,95 +65,24 @@ BDT::BDT(::TTree *tree) ...@@ -64,95 +65,24 @@ BDT::BDT(::TTree *tree)
std::string node_type = get_default_string_map (options, std::string("node_type")); std::string node_type = get_default_string_map (options, std::string("node_type"));
if (node_type == "lgbm") { if (node_type == "lgbm") {
m_forest = std::make_unique<ForestLGBM>(tree); m_forest = std::make_unique<ForestLGBM>(tree);
} else if (node_type == "lgbm_simple") {
m_forest = std::make_unique<ForestLGBMSimple>(
tree); // this do not support nan as inputs
} else {
throw std::runtime_error(
"the title of the input tree is misformatted: cannot understand which "
"BDT implementation to use");
} }
else if (node_type == "lgbm_simple") { } else if (creator == "xgboost") {
m_forest = std::make_unique<ForestLGBMSimple>(tree); // this do not support nan as inputs // this do support nan as inputs
}
else
{
throw std::runtime_error("the title of the input tree is misformatted: cannot understand which BDT implementation to use");
}
}
else if (creator == "xgboost")
{
//this do support nan as inputs
m_forest = std::make_unique<ForestXGBoost>(tree); m_forest = std::make_unique<ForestXGBoost>(tree);
} } else {
else {
// default for compatibility: old TTree (based on TMVA) don't have a special title // default for compatibility: old TTree (based on TMVA) don't have a special title
m_forest = std::make_unique<ForestTMVA>(tree); m_forest = std::make_unique<ForestTMVA>(tree);
} }
} }
unsigned int BDT::GetNTrees() const { return m_forest->GetNTrees(); }
int BDT::GetNVars() const { return m_forest->GetNVars(); }
float BDT::GetOffset() const { return m_forest->GetOffset(); }
/** Return offset + the sum of the response of each tree **/
float BDT::GetResponse(const std::vector<float>& values) const
{
return m_forest->GetResponse(values);
}
/** Return offset + the sum of the response of each tree **/
float BDT::GetResponse(const std::vector<float*>& pointers) const
{
return m_forest->GetResponse(pointers);
}
float BDT::GetClassification(const std::vector<float>& values) const
{
return m_forest->GetClassification(values);
}
float BDT::GetClassification(const std::vector<float*>& pointers) const
{
return m_forest->GetClassification(pointers);
}
float BDT::GetGradBoostMVA(const std::vector<float>& values) const
{
const float sum = m_forest->GetRawResponse(values); // ignores the offset
return 2. / (1 + std::exp(-2 * sum)) - 1; //output shaping for gradient boosted decision tree (-1,1)
}
float BDT::GetGradBoostMVA(const std::vector<float*>& pointers) const
{
const float sum = m_forest->GetRawResponse(pointers); // ignores the offset
return 2. / (1 + std::exp(-2 * sum)) - 1; //output shaping for gradient boosted decision tree (-1,1)
}
std::vector<float> BDT::GetMultiResponse(const std::vector<float>& values,
unsigned int numClasses) const
{
return m_forest->GetMultiResponse(values, numClasses);
}
std::vector<float> BDT::GetMultiResponse(const std::vector<float*>& pointers,
unsigned int numClasses) const
{
return m_forest->GetMultiResponse(pointers, numClasses);
}
float BDT::GetTreeResponse(const std::vector<float>& values, MVAUtils::index_t index) const
{
return m_forest->GetTreeResponse(values, index);
}
float BDT::GetTreeResponse(const std::vector<float*>& pointers, MVAUtils::index_t index) const
{
return m_forest->GetTreeResponse(pointers, index);
}
TTree* BDT::WriteTree(TString name) const { return m_forest->WriteTree(std::move(name)); } TTree* BDT::WriteTree(TString name) const { return m_forest->WriteTree(std::move(name)); }
void BDT::PrintForest() const { m_forest->PrintForest(); } void BDT::PrintForest() const { m_forest->PrintForest(); }
void BDT::PrintTree(unsigned int itree) const { m_forest->PrintTree(itree); } void BDT::PrintTree(unsigned int itree) const { m_forest->PrintTree(itree); }
...@@ -74,26 +74,6 @@ TTree* ForestTMVA::WriteTree(TString name) const ...@@ -74,26 +74,6 @@ TTree* ForestTMVA::WriteTree(TString name) const
return tree; return tree;
} }
float ForestTMVA::GetResponse(const std::vector<float>& values) const {
return GetRawResponse(values) + GetOffset();
}
float ForestTMVA::GetResponse(const std::vector<float*>& pointers) const {
return GetRawResponse(pointers) + GetOffset();
}
float ForestTMVA::GetClassification(const std::vector<float>& values) const
{
float result = GetWeightedResponse(values);
return result / GetSumWeights();
}
float ForestTMVA::GetClassification(const std::vector<float*>& pointers) const
{
float result = GetWeightedResponse(pointers);
return result / GetSumWeights();
}
void ForestTMVA::PrintForest() const void ForestTMVA::PrintForest() const
{ {
std::cout << "***BDT TMVA: Printing entire forest***" << std::endl; std::cout << "***BDT TMVA: Printing entire forest***" << std::endl;
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment