CMS 3D CMS Logo

MillePedeFileExtractor.cc
Go to the documentation of this file.
1 // Original Author: Broen van Besien
2 // Created: Mon, 23 Mar 2015 14:56:15 GMT
3 
6 
7 #include <zlib.h>
8 
13 
15  : outputDir_(iConfig.getParameter<std::string>("fileDir")),
16  outputFileName_(iConfig.getParameter<std::string>("outputBinaryFile")),
17  maxNumberOfBinaries_(iConfig.getParameter<int>("maxNumberOfBinaries")) {
18 
19  auto fileBlobInputTag = iConfig.getParameter<edm::InputTag>("fileBlobInputTag");
20  fileBlobToken_ = consumes<FileBlobCollection, edm::BranchType::InLumi>(fileBlobInputTag);
21  if (hasBinaryNumberLimit()) {
22  edm::LogInfo("MillePedeFileActions")
23  << "Limiting the number of extracted binary files to "
25  }
26 }
27 
29 
31  const edm::EventSetup&)
32 {
33  if (enoughBinaries()) return;
34 
35  // Getting our hands on the vector of FileBlobs
36  edm::Handle<FileBlobCollection> fileBlobCollection;
37  iLumi.getByToken(fileBlobToken_, fileBlobCollection);
38  if (fileBlobCollection.isValid()) {
39  // Logging the amount of FileBlobs in the vector
40  edm::LogInfo("MillePedeFileActions")
41  << "Root file contains " << fileBlobCollection->size() << " FileBlob(s).";
42  // Loop over the FileBlobs in the vector, and write them to files:
43  for (const auto& blob: *fileBlobCollection) {
44  if (enoughBinaries()) break;
45  // We format the filename with a number, starting from 0 to the size of
46  // our vector.
47  // For this to work, the outputBinaryFile config parameter must contain a
48  // formatting directive for a number, like %04d.
49  char theNumberedOutputFileName[200];
50  sprintf(theNumberedOutputFileName, outputFileName_.c_str(), nBinaries_);
51 
52  // Log the filename to which we will write...
53  edm::LogInfo("MillePedeFileActions")
54  << "Writing FileBlob file to file "
55  << outputDir_ + theNumberedOutputFileName << ".";
56 
57  // ...and perform the writing operation.
58  writeGzipped(blob, outputDir_ + theNumberedOutputFileName);
59 
60  ++nBinaries_;
61  }
62  } else {
63  edm::LogError("MillePedeFileActions")
64  << "Error: The root file does not contain any vector of FileBlob.";
65  }
66 }
67 
68 
70  const std::string& fileName) {
71  // - use zlib directly to avoid boost dependencies for this simple task
72  // - zlib and gzip compression differ -> get uncompressed blob first
73  auto uncompressedBlob = blob.getUncompressedBlob();
74  gzFile fp = gzopen(fileName.c_str(), "wb");
75  if (fp == nullptr) {
76  edm::LogError("MillePedeFileActions")
77  << "Problem while opening gzipped file '" << fileName << "'.";
78  }
79  auto nBytes = gzwrite(fp, &uncompressedBlob->front(), uncompressedBlob->size());
80  if (nBytes == 0 ||
81  nBytes != static_cast<decltype(nBytes)>(uncompressedBlob->size())) {
82  edm::LogError("MillePedeFileActions")
83  << "Problem while writing FileBlob to gzipped file '" << fileName << "'.";
84  }
85  auto zerr = gzclose(fp);
86  if (zerr != 0) {
87  edm::LogError("MillePedeFileActions")
88  << "Problem while closing gzipped file '" << fileName << "'.";
89  }
90 }
91 
92 
93 // Manage the parameters for the module:
94 // (Note that this will autogenerate the _cfi.py file.)
96  edm::ConfigurationDescriptions& descriptions) {
98 
99  desc.add<std::string>("fileDir", "")->setComment(
100  "Keep the fileDir empty if you want to write to the current "
101  "directory.");
102 
103  desc.add<std::string>("outputBinaryFile", "milleBinary%04d.dat")->setComment(
104  "Base filename of the files that will be created. This must "
105  "contain "
106  "a placeholder for an index number in the standard C formatting "
107  "style, like %04d.");
108 
109  desc.add<edm::InputTag>("fileBlobInputTag", edm::InputTag("millePedeFileConverter",""))->setComment(
110  "Name of the module that should have generated the blob in the "
111  "root file. Make sure you overwrite this, if you have changed "
112  "this is the configuration of the MillePedeFileConverter.");
113 
114  desc.add<int>("maxNumberOfBinaries", 1000)->setComment(
115  "Number of binaries to be extracted from the input files. "
116  "Use a negative value to apply no limit.");
117 
118  descriptions.add("millePedeFileExtractor", desc);
119  descriptions.setComment(
120  "This is the generic cfi file for the "
121  "MillePedeFileExtractor");
122 }
T getParameter(std::string const &) const
edm::EDGetTokenT< FileBlobCollection > fileBlobToken_
const std::string outputFileName_
bool getByToken(EDGetToken token, Handle< PROD > &result) const
void zerr(int)
MillePedeFileExtractor(const edm::ParameterSet &)
void endLuminosityBlock(const edm::LuminosityBlock &, const edm::EventSetup &) override
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
ParameterDescriptionBase * add(U const &iLabel, T const &value)
bool isValid() const
Definition: HandleBase.h:74
void setComment(std::string const &value)
void add(std::string const &label, ParameterSetDescription const &psetDescription)
std::unique_ptr< std::vector< unsigned char > > getUncompressedBlob() const
I didn't want to do two copies ... hope this works.
Definition: FileBlob.cc:74
static void writeGzipped(const FileBlob &, const std::string &)