CMS 3D CMS Logo

MillePedeFileExtractor.cc
Go to the documentation of this file.
1 // Original Author: Broen van Besien
2 // Created: Mon, 23 Mar 2015 14:56:15 GMT
3 
6 
7 #include <zlib.h>
8 
13 
14 #include <TSystem.h>
15 
17  : outputDir_(iConfig.getParameter<std::string>("fileDir")),
18  outputFileName_(iConfig.getParameter<std::string>("outputBinaryFile")),
19  maxNumberOfBinaries_(iConfig.getParameter<int>("maxNumberOfBinaries")) {
20  fileBlobInputTag_ = iConfig.getParameter<edm::InputTag>("fileBlobInputTag");
21  fileBlobToken_ = consumes<FileBlobCollection, edm::BranchType::InLumi>(fileBlobInputTag_);
22  if (hasBinaryNumberLimit()) {
23  edm::LogInfo("MillePedeFileActions") << "Limiting the number of extracted binary files to " << maxNumberOfBinaries_;
24  }
25 }
26 
28  if (enoughBinaries())
29  return;
30 
31  // Create output directory if not available
32  if (!outputDir_.empty()) {
33  std::string command = "mkdir -p " + outputDir_;
34  int shellReturn = gSystem->Exec(command.c_str());
35  edm::LogInfo("MillePedeFileActions") << "@SUB=MillePedeFileExtractor::endLuminosityBlock"
36  << "Command returns " << shellReturn;
37  }
38 
39  // Getting our hands on the vector of FileBlobs
40  edm::Handle<FileBlobCollection> fileBlobCollection;
41  iLumi.getByToken(fileBlobToken_, fileBlobCollection);
42 
43  if (fileBlobCollection.failedToGet()) {
44  edm::LogError("MillePedeFileActions") << "Failed to get collection from input tag: " << fileBlobInputTag_.encode();
45  return;
46  }
47 
48  if (fileBlobCollection.isValid()) {
49  // Logging the amount of FileBlobs in the vector
50  edm::LogInfo("MillePedeFileActions") << "Root file contains " << fileBlobCollection->size() << " FileBlob(s).";
51  // Loop over the FileBlobs in the vector, and write them to files:
52  for (const auto& blob : *fileBlobCollection) {
53  if (enoughBinaries())
54  break;
55  // We format the filename with a number, starting from 0 to the size of
56  // our vector.
57  // For this to work, the outputBinaryFile config parameter must contain a
58  // formatting directive for a number, like %04d.
59  char theNumberedOutputFileName[200];
60  sprintf(theNumberedOutputFileName, outputFileName_.c_str(), nBinaries_);
61 
62  // Log the filename to which we will write...
63  edm::LogInfo("MillePedeFileActions")
64  << "Writing FileBlob file to file " << outputDir_ + theNumberedOutputFileName << ".";
65 
66  // ...and perform the writing operation.
67  writeGzipped(blob, outputDir_ + theNumberedOutputFileName);
68 
69  ++nBinaries_;
70  }
71  } else {
72  edm::LogError("MillePedeFileActions")
73  << "Error: The root file does not contain any vector of FileBlob under the label " << fileBlobInputTag_.encode()
74  << ".";
75  }
76 }
77 
79  // - use zlib directly to avoid boost dependencies for this simple task
80  // - zlib and gzip compression differ -> get uncompressed blob first
81  auto uncompressedBlob = blob.getUncompressedBlob();
82  gzFile fp = gzopen(fileName.c_str(), "wb");
83  if (fp == nullptr) {
84  edm::LogError("MillePedeFileActions") << "Problem while opening gzipped file '" << fileName << "'.";
85  }
86  auto nBytes = gzwrite(fp, &uncompressedBlob->front(), uncompressedBlob->size());
87  if (nBytes == 0 || nBytes != static_cast<decltype(nBytes)>(uncompressedBlob->size())) {
88  edm::LogError("MillePedeFileActions") << "Problem while writing FileBlob to gzipped file '" << fileName << "'.";
89  }
90  auto zerr = gzclose(fp);
91  if (zerr != 0) {
92  edm::LogError("MillePedeFileActions") << "Problem while closing gzipped file '" << fileName << "'.";
93  }
94 }
95 
96 // Manage the parameters for the module:
97 // (Note that this will autogenerate the _cfi.py file.)
100 
101  desc.add<std::string>("fileDir", "")
102  ->setComment(
103  "Keep the fileDir empty if you want to write to the current "
104  "directory.");
105 
106  desc.add<std::string>("outputBinaryFile", "milleBinary%04d.dat")
107  ->setComment(
108  "Base filename of the files that will be created. This must "
109  "contain "
110  "a placeholder for an index number in the standard C formatting "
111  "style, like %04d.");
112 
113  desc.add<edm::InputTag>("fileBlobInputTag", edm::InputTag("millePedeFileConverter", ""))
114  ->setComment(
115  "Name of the module that should have generated the blob in the "
116  "root file. Make sure you overwrite this, if you have changed "
117  "this is the configuration of the MillePedeFileConverter.");
118 
119  desc.add<int>("maxNumberOfBinaries", 1000)
120  ->setComment(
121  "Number of binaries to be extracted from the input files. "
122  "Use a negative value to apply no limit.");
123 
124  descriptions.add("millePedeFileExtractor", desc);
125  descriptions.setComment(
126  "This is the generic cfi file for the "
127  "MillePedeFileExtractor");
128 }
T getParameter(std::string const &) const
Definition: ParameterSet.h:307
edm::EDGetTokenT< FileBlobCollection > fileBlobToken_
const std::string outputFileName_
std::string encode() const
Definition: InputTag.cc:159
void zerr(int)
MillePedeFileExtractor(const edm::ParameterSet &)
Log< level::Error, false > LogError
bool failedToGet() const
Definition: HandleBase.h:72
void endLuminosityBlock(const edm::LuminosityBlock &, const edm::EventSetup &) override
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
Log< level::Info, false > LogInfo
void setComment(std::string const &value)
bool getByToken(EDGetToken token, Handle< PROD > &result) const
void add(std::string const &label, ParameterSetDescription const &psetDescription)
bool isValid() const
Definition: HandleBase.h:70
list command
Definition: mps_check.py:25
std::unique_ptr< std::vector< unsigned char > > getUncompressedBlob() const
I didn't want to do two copies ... hope this works.
Definition: FileBlob.cc:75
static void writeGzipped(const FileBlob &, const std::string &)