CMS 3D CMS Logo

MillePedeFileExtractor.cc
Go to the documentation of this file.
1 // Original Author: Broen van Besien
2 // Created: Mon, 23 Mar 2015 14:56:15 GMT
3 
6 
7 #include <zlib.h>
8 
13 
15  : outputDir_(iConfig.getParameter<std::string>("fileDir")),
16  outputFileName_(iConfig.getParameter<std::string>("outputBinaryFile")),
17  maxNumberOfBinaries_(iConfig.getParameter<int>("maxNumberOfBinaries")) {
18  auto fileBlobInputTag = iConfig.getParameter<edm::InputTag>("fileBlobInputTag");
19  fileBlobToken_ = consumes<FileBlobCollection, edm::BranchType::InLumi>(fileBlobInputTag);
20  if (hasBinaryNumberLimit()) {
21  edm::LogInfo("MillePedeFileActions") << "Limiting the number of extracted binary files to " << maxNumberOfBinaries_;
22  }
23 }
24 
26 
28  if (enoughBinaries())
29  return;
30 
31  // Getting our hands on the vector of FileBlobs
32  edm::Handle<FileBlobCollection> fileBlobCollection;
33  iLumi.getByToken(fileBlobToken_, fileBlobCollection);
34  if (fileBlobCollection.isValid()) {
35  // Logging the amount of FileBlobs in the vector
36  edm::LogInfo("MillePedeFileActions") << "Root file contains " << fileBlobCollection->size() << " FileBlob(s).";
37  // Loop over the FileBlobs in the vector, and write them to files:
38  for (const auto& blob : *fileBlobCollection) {
39  if (enoughBinaries())
40  break;
41  // We format the filename with a number, starting from 0 to the size of
42  // our vector.
43  // For this to work, the outputBinaryFile config parameter must contain a
44  // formatting directive for a number, like %04d.
45  char theNumberedOutputFileName[200];
46  sprintf(theNumberedOutputFileName, outputFileName_.c_str(), nBinaries_);
47 
48  // Log the filename to which we will write...
49  edm::LogInfo("MillePedeFileActions")
50  << "Writing FileBlob file to file " << outputDir_ + theNumberedOutputFileName << ".";
51 
52  // ...and perform the writing operation.
53  writeGzipped(blob, outputDir_ + theNumberedOutputFileName);
54 
55  ++nBinaries_;
56  }
57  } else {
58  edm::LogError("MillePedeFileActions") << "Error: The root file does not contain any vector of FileBlob.";
59  }
60 }
61 
63  // - use zlib directly to avoid boost dependencies for this simple task
64  // - zlib and gzip compression differ -> get uncompressed blob first
65  auto uncompressedBlob = blob.getUncompressedBlob();
66  gzFile fp = gzopen(fileName.c_str(), "wb");
67  if (fp == nullptr) {
68  edm::LogError("MillePedeFileActions") << "Problem while opening gzipped file '" << fileName << "'.";
69  }
70  auto nBytes = gzwrite(fp, &uncompressedBlob->front(), uncompressedBlob->size());
71  if (nBytes == 0 || nBytes != static_cast<decltype(nBytes)>(uncompressedBlob->size())) {
72  edm::LogError("MillePedeFileActions") << "Problem while writing FileBlob to gzipped file '" << fileName << "'.";
73  }
74  auto zerr = gzclose(fp);
75  if (zerr != 0) {
76  edm::LogError("MillePedeFileActions") << "Problem while closing gzipped file '" << fileName << "'.";
77  }
78 }
79 
80 // Manage the parameters for the module:
81 // (Note that this will autogenerate the _cfi.py file.)
84 
85  desc.add<std::string>("fileDir", "")
86  ->setComment(
87  "Keep the fileDir empty if you want to write to the current "
88  "directory.");
89 
90  desc.add<std::string>("outputBinaryFile", "milleBinary%04d.dat")
91  ->setComment(
92  "Base filename of the files that will be created. This must "
93  "contain "
94  "a placeholder for an index number in the standard C formatting "
95  "style, like %04d.");
96 
97  desc.add<edm::InputTag>("fileBlobInputTag", edm::InputTag("millePedeFileConverter", ""))
98  ->setComment(
99  "Name of the module that should have generated the blob in the "
100  "root file. Make sure you overwrite this, if you have changed "
101  "this is the configuration of the MillePedeFileConverter.");
102 
103  desc.add<int>("maxNumberOfBinaries", 1000)
104  ->setComment(
105  "Number of binaries to be extracted from the input files. "
106  "Use a negative value to apply no limit.");
107 
108  descriptions.add("millePedeFileExtractor", desc);
109  descriptions.setComment(
110  "This is the generic cfi file for the "
111  "MillePedeFileExtractor");
112 }
MessageLogger.h
edm::LuminosityBlock
Definition: LuminosityBlock.h:50
MillePedeFileExtractor_cfg.fileBlobInputTag
fileBlobInputTag
Definition: MillePedeFileExtractor_cfg.py:36
LuminosityBlock.h
MillePedeFileExtractor::endLuminosityBlock
void endLuminosityBlock(const edm::LuminosityBlock &, const edm::EventSetup &) override
Definition: MillePedeFileExtractor.cc:27
MillePedeFileExtractor::hasBinaryNumberLimit
bool hasBinaryNumberLimit()
Definition: MillePedeFileExtractor.h:43
HLT_FULL_cff.InputTag
InputTag
Definition: HLT_FULL_cff.py:89301
edm::ParameterSetDescription
Definition: ParameterSetDescription.h:52
MillePedeFileExtractor.h
personalPlayback.fp
fp
Definition: personalPlayback.py:523
MillePedeFileExtractor::writeGzipped
static void writeGzipped(const FileBlob &, const std::string &)
Definition: MillePedeFileExtractor.cc:62
edm::LogInfo
Log< level::Info, false > LogInfo
Definition: MessageLogger.h:125
MillePedeFileConverter_cfg.fileName
fileName
Definition: MillePedeFileConverter_cfg.py:32
edm::Handle
Definition: AssociativeIterator.h:50
FileBlob::getUncompressedBlob
std::unique_ptr< std::vector< unsigned char > > getUncompressedBlob() const
i didn't want to do two copies ... hope this works.
Definition: FileBlob.cc:75
FileBlob.h
edm::LuminosityBlock::getByToken
bool getByToken(EDGetToken token, Handle< PROD > &result) const
Definition: LuminosityBlock.h:321
MillePedeFileExtractor::nBinaries_
int nBinaries_
Definition: MillePedeFileExtractor.h:53
edm::ConfigurationDescriptions::add
void add(std::string const &label, ParameterSetDescription const &psetDescription)
Definition: ConfigurationDescriptions.cc:57
MillePedeFileExtractor::fillDescriptions
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
Definition: MillePedeFileExtractor.cc:82
MillePedeFileExtractor::outputDir_
const std::string outputDir_
Definition: MillePedeFileExtractor.h:47
MillePedeFileExtractor::fileBlobToken_
edm::EDGetTokenT< FileBlobCollection > fileBlobToken_
Definition: MillePedeFileExtractor.h:50
EDGetToken.h
edm::ConfigurationDescriptions
Definition: ConfigurationDescriptions.h:28
MillePedeFileExtractor::~MillePedeFileExtractor
~MillePedeFileExtractor() override
Definition: MillePedeFileExtractor.cc:25
MillePedeFileExtractor::MillePedeFileExtractor
MillePedeFileExtractor(const edm::ParameterSet &)
Definition: MillePedeFileExtractor.cc:14
MillePedeFileExtractor::maxNumberOfBinaries_
const int maxNumberOfBinaries_
Definition: MillePedeFileExtractor.h:52
MillePedeFileExtractor::enoughBinaries
bool enoughBinaries()
Definition: MillePedeFileExtractor.h:42
edm::ParameterSet
Definition: ParameterSet.h:47
edm::ConfigurationDescriptions::setComment
void setComment(std::string const &value)
Definition: ConfigurationDescriptions.cc:48
createfilelist.int
int
Definition: createfilelist.py:10
edm::EventSetup
Definition: EventSetup.h:58
edm::LogError
Log< level::Error, false > LogError
Definition: MessageLogger.h:123
AlCaHLTBitMon_QueryRunRegistry.string
string string
Definition: AlCaHLTBitMon_QueryRunRegistry.py:256
InputTag.h
submitPVResolutionJobs.desc
string desc
Definition: submitPVResolutionJobs.py:251
std
Definition: JetResolutionObject.h:76
edm::ParameterSet::getParameter
T getParameter(std::string const &) const
Definition: ParameterSet.h:303
edm::HandleBase::isValid
bool isValid() const
Definition: HandleBase.h:70
spu::zerr
void zerr(int)
Definition: SherpackUtilities.cc:129
edm::InputTag
Definition: InputTag.h:15
FileBlobCollection::size
int size() const
Definition: FileBlobCollection.cc:5
FileBlob
Definition: FileBlob.h:11
MillePedeFileExtractor::outputFileName_
const std::string outputFileName_
Definition: MillePedeFileExtractor.h:48