d3/de7/EgammaDNNHelper_8cc_source.html

 #include "RecoEgamma/EgammaTools/interface/EgammaDNNHelper.h"
 #include "FWCore/MessageLogger/interface/MessageLogger.h"
 #include "FWCore/Utilities/interface/FileInPath.h"
 #include <algorithm>
 #include <fstream>
 #include <iostream>
 #include <utility>
 using namespace egammaTools;

 // Build the helper from a DNN configuration.
 //
 // The configuration and the model selector are copied into the object, one
 // graph-definition slot is reserved per entry of cfg.modelsFiles, then the
 // graphs are loaded and the scaler files are parsed.
 //
 // cfg            configuration (model files, scaler files, tensor names, output dimensions)
 // modelSelector  callable mapping a candidate's variables to the index of the model to use
 // availableVars  names of the variables the caller is able to provide; every
 //                variable listed in a scaler file must appear here
 //
 // Throws cms::Exception if fewer scaler files than model files are configured,
 // plus whatever initTensorFlowGraphs() / initScalerFiles() throw.
 EgammaDNNHelper::EgammaDNNHelper(const DNNConfiguration& cfg,
                                  const ModelSelector& modelSelector,
                                  const std::vector<std::string>& availableVars)
     : cfg_(cfg), modelSelector_(modelSelector), nModels_(cfg_.modelsFiles.size()), graphDefs_(cfg_.modelsFiles.size()) {
   // evaluate() reads nInputs_[m] for every model m < nModels_, and nInputs_ gets
   // one entry per scaler file: a shorter scaler list would be read out of bounds.
   if (cfg_.scalersFiles.size() < cfg_.modelsFiles.size()) {
     throw cms::Exception("Configuration")
         << "EgammaDNNHelper: " << cfg_.modelsFiles.size() << " model files configured but only "
         << cfg_.scalersFiles.size() << " scaler files; one scaler file per model is required";
   }
   initTensorFlowGraphs();
   initScalerFiles(availableVars);
 }

 // Load the graph definition of every configured model file.
 // The graph read from cfg_.modelsFiles[n] is stored in graphDefs_[n]
 // (graphDefs_ was sized to the number of model files by the constructor).
 void EgammaDNNHelper::initTensorFlowGraphs() {
   LogDebug("EgammaDNNHelper") << "Loading " << nModels_ << " graphs";
   const size_t nFiles = cfg_.modelsFiles.size();
   for (size_t idx = 0; idx < nFiles; ++idx) {
     // Resolve the configured (relative) name to a full path before loading
     const std::string graphPath = edm::FileInPath(cfg_.modelsFiles[idx]).fullPath();
     graphDefs_[idx] = std::unique_ptr<tensorflow::GraphDef>(tensorflow::loadGraphDef(graphPath));
   }
 }

 // Create one TensorFlow session per loaded graph definition.
 // The returned vector is ordered like graphDefs_, i.e. entry n is the session
 // for model n.
 // NOTE(review): raw pointers are returned and nothing in this file closes the
 // sessions -- presumably the caller is responsible for that; confirm.
 std::vector<tensorflow::Session*> EgammaDNNHelper::getSessions() const {
   LogDebug("EgammaDNNHelper") << "Starting " << nModels_ << " TF sessions";
   const size_t nGraphs = graphDefs_.size();
   std::vector<tensorflow::Session*> sessions;
   sessions.reserve(nGraphs);
   for (size_t idx = 0; idx < nGraphs; ++idx) {
     sessions.push_back(tensorflow::createSession(graphDefs_[idx].get()));
   }
   LogDebug("EgammaDNNHelper") << "TF sessions started";
   return sessions;
 }

 void EgammaDNNHelper::initScalerFiles(const std::vector<std::string>& availableVars) {
   for (const auto& scaler_file : cfg_.scalersFiles) {
     // Parse scaler configuration
     std::vector<ScalerConfiguration> features;
     std::ifstream inputfile_scaler{edm::FileInPath(scaler_file).fullPath()};
     int ninputs = 0;
     if (inputfile_scaler.fail()) {
       throw cms::Exception("MissingFile") << "Scaler file for PFid DNN not found";
     } else {
       // Now read mean, scale factors for each variable
       float par1, par2;
       std::string varName, type_str;
       uint type;
       while (inputfile_scaler >> varName >> type_str >> par1 >> par2) {
         if (type_str == "stdscale")
           type = 1;
         else if (type_str == "minmax")
           type = 2;
         else if (type_str == "custom1")  // 2*((X_train - minValues)/(MaxMinusMin)) -1.0
           type = 3;
         else
           type = 0;
         features.push_back(ScalerConfiguration{.varName = varName, .type = type, .par1 = par1, .par2 = par2});
         // Protection for mismatch between requested variables and the available ones
         auto match = std::find(availableVars.begin(), availableVars.end(), varName);
         if (match == std::end(availableVars)) {
           throw cms::Exception("MissingVariable")
               << "Requested variable (" << varName << ") not available between DNN inputs";
         }
         ninputs += 1;
       }
     }
     inputfile_scaler.close();
     featuresMap_.push_back(features);
     nInputs_.push_back(ninputs);
   }
 }

 std::pair<uint, std::vector<float>> EgammaDNNHelper::getScaledInputs(
     const std::map<std::string, float>& variables) const {
   // Call the modelSelector function passing the variables map to return
   // the modelIndex to be used for the current candidate
   const auto modelIndex = modelSelector_(variables);
   std::vector<float> inputs;
   // Loop on the list of requested variables and scaling values for the specific modelIndex
   // Different type of scaling are available: 0=no scaling, 1=standard scaler, 2=minmax
   for (auto& [varName, type, par1, par2] : featuresMap_[modelIndex]) {
     if (type == 1)  // Standard scaling
       inputs.push_back((variables.at(varName) - par1) / par2);
     else if (type == 2)  // MinMax
       inputs.push_back((variables.at(varName) - par1) / (par2 - par1));
     else if (type == 3)  //2*((X_train - minValues)/(MaxMinusMin)) -1.0
       inputs.push_back(2 * (variables.at(varName) - par1) / (par2 - par1) - 1.);
     else {
       inputs.push_back(variables.at(varName));  // Do nothing on the variable
     }
     //Protection for mismatch between requested variables and the available ones
     // have been added when the scaler config are loaded --> here we know that the variables are available
   }
   return std::make_pair(modelIndex, inputs);
 }

 std::vector<std::pair<uint, std::vector<float>>> EgammaDNNHelper::evaluate(
     const std::vector<std::map<std::string, float>>& candidates,
     const std::vector<tensorflow::Session*>& sessions) const {
   /*
     Evaluate the PFID DNN for all the electrons/photons.
     nModels_ are defined depending on modelIndex  --> we need to build N input tensors to evaluate
     the DNNs with batching.

     1) Get all the variable for each candidate  vector<map<string:float>>
     2) Scale the input and select the variables for each model
     2) Prepare the input tensors for the  models
     3) Run the models and get the output for each candidate
     4) Sort the output by candidate index
     5) Return the DNN outputs along with the model index used on it

     */
   size_t nCandidates = candidates.size();
   std::vector<std::vector<uint>> indexMap(nModels_);  // for each model; the list of candidate index is saved
   std::vector<std::vector<float>> inputsVectors(nCandidates);
   std::vector<uint> counts(nModels_);

   LogDebug("EgammaDNNHelper") << "Working on " << nCandidates << " candidates";

   uint icand = 0;
   for (auto& candidate : candidates) {
     LogDebug("EgammaDNNHelper") << "Working on candidate: " << icand;
     const auto& [model_index, inputs] = getScaledInputs(candidate);
     counts[model_index] += 1;
     indexMap[model_index].push_back(icand);
     inputsVectors[icand] = inputs;
     icand++;
   }

   // Prepare one input tensors for each model
   std::vector<tensorflow::Tensor> input_tensors(nModels_);
   // Pointers for filling efficiently the input tensors
   std::vector<float*> input_tensors_pointer(nModels_);
   for (size_t i = 0; i < nModels_; i++) {
     LogDebug("EgammaDNNHelper") << "Initializing TF input " << i << " with rows:" << counts[i]
                                 << " and cols:" << nInputs_[i];
     input_tensors[i] = tensorflow::Tensor{tensorflow::DT_FLOAT, {counts[i], nInputs_[i]}};
     input_tensors_pointer[i] = input_tensors[i].flat<float>().data();
   }

   // Filling the input tensors
   for (size_t m = 0; m < nModels_; m++) {
     LogDebug("EgammaDNNHelper") << "Loading TF input tensor for model: " << m;
     float* T = input_tensors_pointer[m];
     for (size_t cand_index : indexMap[m]) {
       for (size_t k = 0; k < nInputs_[m]; k++, T++) {  //Note the input tensor pointer incremented
         *T = inputsVectors[cand_index][k];
       }
     }
   }

   // Define the output and run
   // The initial output is [(cand_index,(model_index, outputs)),.. ]
   std::vector<std::pair<uint, std::pair<uint, std::vector<float>>>> outputs;
   // Run all the models
   for (size_t m = 0; m < nModels_; m++) {
     if (counts[m] == 0)
       continue;  //Skip model witout inputs
     std::vector<tensorflow::Tensor> output;
     LogDebug("EgammaDNNHelper") << "Run model: " << m << " with " << counts[m] << "objects";
     tensorflow::run(sessions[m], {{cfg_.inputTensorName, input_tensors[m]}}, {cfg_.outputTensorName}, &output);
     // Get the output and save the ElectronDNNEstimator::outputDim numbers along with the ele index
     const auto& r = output[0].tensor<float, 2>();
     // Iterate on the list of elements in the batch --> many electrons
     LogDebug("EgammaDNNHelper") << "Model " << m << " has " << cfg_.outputDim[m] << " nodes!";
     for (uint b = 0; b < counts[m]; b++) {
       //auto outputDim=cfg_.outputDim;
       std::vector<float> result(cfg_.outputDim[m]);
       for (size_t k = 0; k < cfg_.outputDim[m]; k++) {
         result[k] = r(b, k);
         LogDebug("EgammaDNNHelper") << "For Object " << b + 1 << " : Node " << k + 1 << " score = " << r(b, k);
       }
       // Get the original index of the electorn in the original order
       const auto cand_index = indexMap[m][b];
       outputs.push_back(std::make_pair(cand_index, std::make_pair(m, result)));
     }
   }
   // Now we have just to re-order the outputs
   std::sort(outputs.begin(), outputs.end());
   std::vector<std::pair<uint, std::vector<float>>> final_outputs(outputs.size());
   std::transform(outputs.begin(), outputs.end(), final_outputs.begin(), [](auto a) { return a.second; });

   return final_outputs;
 }
egammaTools::EgammaDNNHelper::graphDefs_
std::vector< std::unique_ptr< const tensorflow::GraphDef > > graphDefs_
Definition: EgammaDNNHelper.h:67

PixelMapPlotter.inputs
inputs
Definition: PixelMapPlotter.py:490

parallelization.uint
uint
Definition: parallelization.py:124

jetUpdater_cfi.sort
sort
Definition: jetUpdater_cfi.py:30

EgammaDNNHelper.h

egammaTools::EgammaDNNHelper::getScaledInputs
std::pair< uint, std::vector< float > > getScaledInputs(const std::map< std::string, float > &variables) const
Definition: EgammaDNNHelper.cc:77

mps_fire.i
i
Definition: mps_fire.py:429

Exception
Definition: hltDiff.cc:245

MessageLogger.h

mps_fire.result
result
Definition: mps_fire.py:311

edm::FileInPath::fullPath
std::string fullPath() const
Definition: FileInPath.cc:161

egammaTools::EgammaDNNHelper::getSessions
std::vector< tensorflow::Session * > getSessions() const
Definition: EgammaDNNHelper.cc:28

PatBasicFWLiteJetAnalyzer_Selector_cfg.outputs
outputs
Definition: PatBasicFWLiteJetAnalyzer_Selector_cfg.py:48

tensorflow::loadGraphDef
GraphDef * loadGraphDef(const std::string &pbFile)
Definition: TensorFlow.cc:129

egammaTools::DNNConfiguration::outputDim
std::vector< unsigned int > outputDim
Definition: EgammaDNNHelper.h:22

convertSQLitetoXML_cfg.output
output
Definition: convertSQLitetoXML_cfg.py:72

egammaTools::EgammaDNNHelper::EgammaDNNHelper
EgammaDNNHelper(const DNNConfiguration &, const ModelSelector &sel, const std::vector< std::string > &availableVars)
Definition: EgammaDNNHelper.cc:9

egammaTools::DNNConfiguration::modelsFiles
std::vector< std::string > modelsFiles
Definition: EgammaDNNHelper.h:20

egammaTools::EgammaDNNHelper::nInputs_
std::vector< uint > nInputs_
Definition: EgammaDNNHelper.h:65

spr::find
void find(edm::Handle< EcalRecHitCollection > &hits, DetId thisDet, std::vector< EcalRecHitCollection::const_iterator > &hit, bool debug=false)
Definition: FindCaloHit.cc:19

type
type
Definition: SiPixelVCal_PayloadInspector.cc:39

egammaTools::DNNConfiguration::inputTensorName
std::string inputTensorName
Definition: EgammaDNNHelper.h:18

AlCaHLTBitMon_QueryRunRegistry.string
string string
Definition: AlCaHLTBitMon_QueryRunRegistry.py:256

pfMETCorrectionType0_cfi.par1
par1
Definition: pfMETCorrectionType0_cfi.py:48

modelfilter_cfi.modelSelector
modelSelector
Definition: modelfilter_cfi.py:3

egammaTools::DNNConfiguration
Definition: EgammaDNNHelper.h:17

nano_mu_digi_cff.float
float
Definition: nano_mu_digi_cff.py:14

egammaTools
Definition: EcalClusterLocal.h:14

gainCalibHelper::gainCalibPI::type
type
Definition: SiPixelGainCalibHelper.h:40

egammaTools::EgammaDNNHelper::nModels_
uint nModels_
Definition: EgammaDNNHelper.h:63

lowptgsfeleseed::features
std::vector< float > features(const reco::PreId &ecal, const reco::PreId &hcal, double rho, const reco::BeamSpot &spot, noZS::EcalClusterLazyTools &ecalTools)
Definition: LowPtGsfElectronFeatures.cc:17

egammaTools::EgammaDNNHelper::featuresMap_
std::vector< std::vector< ScalerConfiguration > > featuresMap_
Definition: EgammaDNNHelper.h:70

gedGsfElectrons_cfi.modelsFiles
modelsFiles
Definition: gedGsfElectrons_cfi.py:26

visualization-live-secondInstance_cfg.m
m
Definition: visualization-live-secondInstance_cfg.py:84

tensorflow::run
void run(Session *session, const NamedTensorList &inputs, const std::vector< std::string > &outputNames, std::vector< Tensor > *outputs, const thread::ThreadPoolOptions &threadPoolOptions)
Definition: TensorFlow.cc:281

dqmiodumpmetadata.counts
counts
Definition: dqmiodumpmetadata.py:25

egammaTools::ScalerConfiguration::varName
std::string varName
Definition: EgammaDNNHelper.h:31

FileInPath.h

pfMETCorrectionType0_cfi.par2
par2
Definition: pfMETCorrectionType0_cfi.py:49

looper.cfg
cfg
Definition: looper.py:296

tensorflow::createSession
Session * createSession()
Definition: TensorFlow.cc:146

edm::FileInPath
Definition: FileInPath.h:61

egammaTools::ScalerConfiguration
Definition: EgammaDNNHelper.h:25

egammaTools::EgammaDNNHelper::initScalerFiles
void initScalerFiles(const std::vector< std::string > &availableVars)
Definition: EgammaDNNHelper.cc:39

b
double b
Definition: hdecay.h:120

egammaTools::DNNConfiguration::outputTensorName
std::string outputTensorName
Definition: EgammaDNNHelper.h:19

data
char data[epos_bytes_allocation]
Definition: EPOS_Wrapper.h:80

a
double a
Definition: hdecay.h:121

trackerHitRTTI::vector
Definition: trackerHitRTTI.h:21

egammaTools::EgammaDNNHelper::evaluate
std::vector< std::pair< uint, std::vector< float > > > evaluate(const std::vector< std::map< std::string, float >> &candidates, const std::vector< tensorflow::Session *> &sessions) const
Definition: EgammaDNNHelper.cc:101

egammaTools::DNNConfiguration::scalersFiles
std::vector< std::string > scalersFiles
Definition: EgammaDNNHelper.h:21

egammaTools::ModelSelector
std::function< uint(const std::map< std::string, float > &)> ModelSelector
Definition: EgammaDNNHelper.h:39

output
Definition: output.py:1

egammaTools::EgammaDNNHelper::initTensorFlowGraphs
void initTensorFlowGraphs()
Definition: EgammaDNNHelper.cc:17

egammaTools::EgammaDNNHelper::modelSelector_
const ModelSelector modelSelector_
Definition: EgammaDNNHelper.h:61

HLT_2024v13_cff.candidates
candidates
Definition: HLT_2024v13_cff.py:38848

T
long double T
Definition: Basic3DVectorLD.h:48

egammaTools::EgammaDNNHelper::cfg_
const DNNConfiguration cfg_
Definition: EgammaDNNHelper.h:60

hcalRecHitTable_cff.variables
variables
Definition: hcalRecHitTable_cff.py:11

dqmdumpme.k
k
Definition: dqmdumpme.py:60

contentValuesFiles.fullPath
fullPath
Definition: contentValuesFiles.py:64

LogDebug
#define LogDebug(id)
Definition: MessageLogger.h:241

HcalDetIdTransform::transform
unsigned transform(const HcalDetId &id, unsigned transformCode)
Definition: HcalDetIdTransform.cc:7