db/df0/MLPFProducer_8cc_source.html

 #include "FWCore/Framework/interface/Frameworkfwd.h"
 #include "FWCore/Framework/interface/stream/EDProducer.h"
 #include "FWCore/Framework/interface/Event.h"
 #include "FWCore/Framework/interface/MakerMacros.h"

 #include "DataFormats/ParticleFlowCandidate/interface/PFCandidate.h"
 #include "PhysicsTools/TensorFlow/interface/TensorFlow.h"
 #include "RecoParticleFlow/PFProducer/interface/MLPFModel.h"

 #include <utility>


 /**
  * Global cache handed to every MLPFProducer stream instance.
  *
  * It holds the TensorFlow graph definition that MLPFProducer::initializeGlobalCache
  * loads with tensorflow::loadGraphDef and that MLPFProducer::globalEndJob deletes.
  */
 struct MLPFCache {
   // Graph definition owned through this raw pointer. It defaults to nullptr so that a
   // cache which was never filled can still be passed safely to `delete`.
   const tensorflow::GraphDef* graph_def = nullptr;
 };


 /**
  * Stream producer that evaluates the MLPF TensorFlow graph on the elements of a
  * reco::PFBlockCollection and puts a reco::PFCandidateCollection into the event.
  *
  * The graph definition lives in the global MLPFCache; each producer instance opens its
  * own tensorflow::Session on that graph in the constructor and closes it on destruction.
  */
 class MLPFProducer : public edm::stream::EDProducer<edm::GlobalCache<MLPFCache> > {
 public:
   explicit MLPFProducer(const edm::ParameterSet&, const MLPFCache*);

   // Close the session opened in the constructor; without this every instance leaks it.
   // closeSession is given the pointer by reference and tolerates a null session.
   ~MLPFProducer() override { tensorflow::closeSession(session_); }

   // Runs the model for one event and stores the predicted candidates.
   void produce(edm::Event& event, const edm::EventSetup& setup) override;

   // Declares the "src" and "model_path" configuration parameters and their defaults.
   static void fillDescriptions(edm::ConfigurationDescriptions& descriptions);

   // static methods for handling the global cache
   static std::unique_ptr<MLPFCache> initializeGlobalCache(const edm::ParameterSet&);
   static void globalEndJob(MLPFCache*);

 private:
   // Token used to put the output candidate collection into the event.
   const edm::EDPutTokenT<reco::PFCandidateCollection> pfCandidatesPutToken_;
   // Token used to read the input PFBlock collection (configured by "src").
   const edm::EDGetTokenT<reco::PFBlockCollection> inputTagBlocks_;
   // Value of the "model_path" configuration parameter.
   const std::string model_path_;
   // Inference session owned by this instance; nullptr until the constructor creates it.
   tensorflow::Session* session_ = nullptr;
 };


 /**
  * Builds one producer instance.
  *
  * @param cfg    module configuration; supplies the "src" input tag and "model_path" string
  * @param cache  global cache whose graph_def is used to open this instance's session
  *
  * Members are initialized in declaration order, so the session is created last, after the
  * put/get tokens have been registered and the model path has been read.
  */
 MLPFProducer::MLPFProducer(const edm::ParameterSet& cfg, const MLPFCache* cache)
     : pfCandidatesPutToken_{produces<reco::PFCandidateCollection>()},
       inputTagBlocks_(consumes<reco::PFBlockCollection>(cfg.getParameter<edm::InputTag>("src"))),
       model_path_(cfg.getParameter<std::string>("model_path")),
       session_(tensorflow::createSession(cache->graph_def)) {}


 /**
  * Evaluate the MLPF model on all PF elements of the event and store the predicted candidates.
  *
  * Steps: collect the PF elements from the input blocks, pack their normalized features into
  * a zero-padded (BATCH_SIZE, tensor_size, NUM_ELEMENT_FEATURES) float tensor, run the
  * session, then turn every output row whose predicted PDGID is non-zero into a PFCandidate.
  *
  * @param event  event to read the PFBlock collection from and to put the candidates into
  * @param setup  not used by this method
  */
 void MLPFProducer::produce(edm::Event& event, const edm::EventSetup& setup) {
   using namespace reco::mlpf;

   const auto& blocks = event.get(inputTagBlocks_);
   const auto& all_elements = getPFElements(blocks);

   const long long int num_elements_total = all_elements.size();

   //tensor size must be a multiple of the bin size and larger than the number of elements
   const auto tensor_size = LSH_BIN_SIZE * (num_elements_total / LSH_BIN_SIZE + 1);
   //NOTE(review): assert is compiled out when NDEBUG is defined, so this limit is then unchecked
   assert(tensor_size <= NUM_MAX_ELEMENTS_BATCH);

   //Create the input tensor; rows beyond the last element stay zero as padding
   tensorflow::TensorShape shape({BATCH_SIZE, tensor_size, NUM_ELEMENT_FEATURES});
   tensorflow::Tensor input(tensorflow::DT_FLOAT, shape);
   input.flat<float>().setZero();

   //Fill the input tensor.
   //The rank-3 view is built once here instead of once per feature write.
   auto input_arr = input.tensor<float, 3>();
   unsigned int ielem = 0;
   for (const auto* pelem : all_elements) {
     //prepare the input array from the PFElement
     const auto& props = getElementProperties(*pelem);

     //copy features to the input array
     for (unsigned int iprop = 0; iprop < NUM_ELEMENT_FEATURES; iprop++) {
       input_arr(0, ielem, iprop) = normalize(props[iprop]);
     }
     ielem += 1;
   }

   //TF model input and output tensor names
   const tensorflow::NamedTensorList input_list = {{"x:0", input}};
   const std::vector<std::string> output_names = {"Identity:0"};

   //Prepare the output tensor
   std::vector<tensorflow::Tensor> outputs;

   //run the GNN inference, given the inputs and the output.
   //Note that the GNN enables information transfer between the input PFElements,
   //such that the output ML-PFCandidates are in general combinations of the input PFElements, in the form of
   //y_out = Adj.x_in, where x_in is input matrix (num_elem, NUM_ELEMENT_FEATURES), y_out is the output matrix (num_elem, NUM_OUTPUT_FEATURES)
   //and Adj is an adjacency matrix between the elements that is constructed on the fly during model inference.
   tensorflow::run(session_, input_list, output_names, &outputs);

   //process the output tensor to ML-PFCandidates.
   //The output can contain up to num_elem particles, with predicted PDGID=0 corresponding to no particles predicted.
   const auto out_arr = outputs[0].tensor<float, 3>();

   std::vector<reco::PFCandidate> pOutputCandidateCollection;

   //scratch buffer for the class logits, allocated once and reused for every element
   std::vector<float> pred_id_logits;
   pred_id_logits.reserve(NUM_CLASS + 1);

   for (unsigned int iout = 0; iout < all_elements.size(); iout++) {
     //get the coefficients in the output corresponding to the class probabilities (raw logits);
     //the bound is inclusive, so NUM_CLASS + 1 values are read
     pred_id_logits.clear();
     for (unsigned int idx_id = 0; idx_id <= NUM_CLASS; idx_id++) {
       pred_id_logits.push_back(out_arr(0, iout, idx_id));
     }

     //get the most probable class PDGID
     const int pred_pid = pdgid_encoding[argMax(pred_id_logits)];

     //get the predicted momentum components
     const float pred_eta = out_arr(0, iout, IDX_ETA);
     const float pred_phi = out_arr(0, iout, IDX_PHI);
     const float pred_charge = out_arr(0, iout, IDX_CHARGE);
     const float pred_e = out_arr(0, iout, IDX_ENERGY);

     //a particle was predicted for this PFElement, otherwise it was a spectator
     if (pred_pid != 0) {
       //NOTE(review): makeCandidate declares pred_charge as int, so the float is converted implicitly
       auto cand = makeCandidate(pred_pid, pred_charge, pred_e, pred_eta, pred_phi);
       setCandidateRefs(cand, all_elements, iout);
       pOutputCandidateCollection.push_back(std::move(cand));
     }
   }  //loop over PFElements

   //hand the collection over to the event without copying it
   event.emplace(pfCandidatesPutToken_, std::move(pOutputCandidateCollection));
 }


 /**
  * Creates the global cache and loads the frozen TF graph of the GNN model into it.
  *
  * @param params  module configuration; "model_path" is resolved through edm::FileInPath
  * @return        a new MLPFCache whose graph_def points at the loaded graph definition
  */
 std::unique_ptr<MLPFCache> MLPFProducer::initializeGlobalCache(const edm::ParameterSet& params) {
   auto globalCache = std::make_unique<MLPFCache>();

   // turn the configured path into a full path on disk
   const edm::FileInPath modelFile(params.getParameter<std::string>("model_path"));
   const std::string resolvedPath = modelFile.fullPath();
   LogDebug("MLPFProducer") << "Initializing MLPF model from " << resolvedPath;

   // the cache keeps the raw pointer returned by the loader; globalEndJob deletes it
   globalCache->graph_def = tensorflow::loadGraphDef(resolvedPath);
   return globalCache;
 }


 /**
  * Releases the graph definition held by the global cache.
  *
  * @param cache  the global cache; only its graph_def is deleted here, not the cache itself
  */
 void MLPFProducer::globalEndJob(MLPFCache* cache) {
   const tensorflow::GraphDef* const loadedGraph = cache->graph_def;
   delete loadedGraph;
 }


 /**
  * Declares the configuration parameters of this module together with their defaults:
  * "src" (input tag of the block collection) and "model_path" (location of the model file).
  *
  * @param descriptions  receives the parameter set description under the default label
  */
 void MLPFProducer::fillDescriptions(edm::ConfigurationDescriptions& descriptions) {
   const edm::InputTag defaultBlocks("particleFlowBlock");

   edm::ParameterSetDescription psd;
   psd.add<edm::InputTag>("src", defaultBlocks);
   psd.add<std::string>("model_path", "RecoParticleFlow/PFProducer/data/mlpf/mlpf_2020_11_04.pb");

   descriptions.addWithDefaultLabel(psd);
 }


 // Declare MLPFProducer as a framework module through the DEFINE_FWK_MODULE macro (MakerMacros.h).
 DEFINE_FWK_MODULE(MLPFProducer);

tensorflow::createSession
Session * createSession(SessionOptions &sessionOptions)
Definition: TensorFlow.cc:85

edm::ConfigurationDescriptions::addWithDefaultLabel
void addWithDefaultLabel(ParameterSetDescription const &psetDescription)
Definition: ConfigurationDescriptions.cc:87

tensorflow::NamedTensorList
std::vector< NamedTensor > NamedTensorList
Definition: TensorFlow.h:30

reco::mlpf::IDX_ETA
static constexpr unsigned int IDX_ETA
Definition: MLPFModel.h:27

looper.cfg
tuple cfg
Definition: looper.py:296

edmPickEvents.event
tuple event
Definition: edmPickEvents.py:273

reco::mlpf::NUM_CLASS
static constexpr unsigned int NUM_CLASS
Definition: MLPFModel.h:26

reco::mlpf::getElementProperties
std::array< float, NUM_ELEMENT_FEATURES > getElementProperties(const reco::PFBlockElement &orig)
Definition: MLPFModel.cc:15

reco::mlpf::argMax
int argMax(std::vector< float > const &vec)
Definition: MLPFModel.cc:158

DEFINE_FWK_MODULE
#define DEFINE_FWK_MODULE(type)
Definition: MakerMacros.h:16

tensorflow::loadGraphDef
GraphDef * loadGraphDef(const std::string &pbFile)
Definition: TensorFlow.cc:68

reco::mlpf::NUM_ELEMENT_FEATURES
static constexpr unsigned int NUM_ELEMENT_FEATURES
Definition: MLPFModel.h:10

Event.h

contentValuesFiles.fullPath
fullPath
Definition: contentValuesFiles.py:64

MakerMacros.h

MLPFProducer::globalEndJob
static void globalEndJob(MLPFCache *)
Definition: MLPFProducer.cc:130

submitPVValidationJobs.params
list params
Definition: submitPVValidationJobs.py:487

gather_cfg.blocks
tuple blocks
Definition: gather_cfg.py:90

reco::mlpf::IDX_ENERGY
static constexpr unsigned int IDX_ENERGY
Definition: MLPFModel.h:29

reco::mlpf::BATCH_SIZE
static constexpr int BATCH_SIZE
Definition: MLPFModel.h:17

cms::cuda::assert
assert(be >=bs)

MLPFProducer::produce
void produce(edm::Event &event, const edm::EventSetup &setup) override
Definition: MLPFProducer.cc:38

edm::EDGetTokenT< reco::PFBlockCollection >

Frameworkfwd.h

edm::EDPutTokenT< reco::PFCandidateCollection >

AlCaHLTBitMon_QueryRunRegistry.string
string string
Definition: AlCaHLTBitMon_QueryRunRegistry.py:256

reco::mlpf::getPFElements
const std::vector< const reco::PFBlockElement * > getPFElements(const reco::PFBlockCollection &blocks)
Definition: MLPFModel.cc:185

edm::ParameterSetDescription
Definition: ParameterSetDescription.h:52

input
static std::string const input
Definition: EdmProvDump.cc:47

MLPFCache
Definition: MLPFProducer.cc:10

MLPFCache::graph_def
const tensorflow::GraphDef * graph_def
Definition: MLPFProducer.cc:11

EDProducer.h

MLPFProducer::initializeGlobalCache
static std::unique_ptr< MLPFCache > initializeGlobalCache(const edm::ParameterSet &)
Definition: MLPFProducer.cc:116

MLPFProducer::pfCandidatesPutToken_
const edm::EDPutTokenT< reco::PFCandidateCollection > pfCandidatesPutToken_
Definition: MLPFProducer.cc:25

submitPVResolutionJobs.desc
string desc
Definition: submitPVResolutionJobs.py:251

tensorflow::run
void run(Session *session, const NamedTensorList &inputs, const std::vector< std::string > &outputNames, std::vector< Tensor > *outputs, const thread::ThreadPoolOptions &threadPoolOptions)
Definition: TensorFlow.cc:213

reco::mlpf::IDX_PHI
static constexpr unsigned int IDX_PHI
Definition: MLPFModel.h:28

TensorFlow.h

MLPFProducer::session_
tensorflow::Session * session_
Definition: MLPFProducer.cc:28

edm::EventSetup
Definition: EventSetup.h:59

reco::mlpf::IDX_CHARGE
static constexpr unsigned int IDX_CHARGE
Definition: MLPFModel.h:30

edm::ParameterSetDescription::add
ParameterDescriptionBase * add(U const &iLabel, T const &value)
Definition: ParameterSetDescription.h:95

MLPFModel.h

GeneralSetup.setup
def setup
Definition: GeneralSetup.py:2

edm::FileInPath
Definition: FileInPath.h:61

mlpf_cff.mlpf
tuple mlpf
Definition: mlpf_cff.py:4

edm::stream::EDProducer
Definition: EDProducer.h:36

fed_dqm_sourceclient-live_cfg.path
string path
Definition: fed_dqm_sourceclient-live_cfg.py:46

reco::mlpf::setCandidateRefs
void setCandidateRefs(reco::PFCandidate &cand, const std::vector< const reco::PFBlockElement * > elems, size_t ielem_originator)
Definition: MLPFModel.cc:204

edm::ParameterSet::getParameter
T getParameter(std::string const &) const
Definition: ParameterSet.h:303

reco::mlpf::normalize
float normalize(float in)
Definition: MLPFModel.cc:149

HLT_FULL_cff.InputTag
tuple InputTag
Definition: HLT_FULL_cff.py:86956

MLPFProducer::inputTagBlocks_
const edm::EDGetTokenT< reco::PFBlockCollection > inputTagBlocks_
Definition: MLPFProducer.cc:26

MLPFProducer
Definition: MLPFProducer.cc:14

edm::InputTag
Definition: InputTag.h:15

MLPFProducer::fillDescriptions
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
Definition: MLPFProducer.cc:132

edm::FileInPath::fullPath
std::string fullPath() const
Definition: FileInPath.cc:161

edm::ParameterSet
Definition: ParameterSet.h:47

reco::mlpf::pdgid_encoding
static const std::vector< int > pdgid_encoding
Definition: MLPFModel.h:34

edm::Event
Definition: Event.h:73

MLPFProducer::model_path_
const std::string model_path_
Definition: MLPFProducer.cc:27

PFCandidate.h

reco::mlpf::makeCandidate
reco::PFCandidate makeCandidate(int pred_pid, int pred_charge, float pred_e, float pred_eta, float pred_phi)
Definition: MLPFModel.cc:162

reco::mlpf::LSH_BIN_SIZE
static constexpr int LSH_BIN_SIZE
Definition: MLPFModel.h:14

edm::ConfigurationDescriptions
Definition: ConfigurationDescriptions.h:28

utilities.cache
def cache
Definition: utilities.py:3

MLPFProducer::MLPFProducer
MLPFProducer(const edm::ParameterSet &, const MLPFCache *)
Definition: MLPFProducer.cc:31

LogDebug
#define LogDebug(id)
Definition: MessageLogger.h:233

reco::mlpf::NUM_MAX_ELEMENTS_BATCH
static constexpr int NUM_MAX_ELEMENTS_BATCH
Definition: MLPFModel.h:13