CMS 3D CMS Logo

 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Properties Friends Macros Pages
EvFDaqDirector.cc
Go to the documentation of this file.
10 
16 
17 #include <iostream>
18 #include <sstream>
19 #include <sys/time.h>
20 #include <unistd.h>
21 #include <stdio.h>
22 #include <sys/file.h>
23 #include <boost/lexical_cast.hpp>
24 #include <boost/filesystem/fstream.hpp>
25 
26 //#define DEBUG
27 
28 namespace evf {
29 
30  namespace {
/// Build a `struct flock` record for use with fcntl(F_SETLK / F_SETLKW).
///
/// @param type    lock type (F_RDLCK, F_WRLCK or F_UNLCK)
/// @param whence  how @p start is interpreted (SEEK_SET, SEEK_CUR or SEEK_END)
/// @param start   starting offset of the locked region
/// @param len     length of the locked region (0 means "until end of file")
/// @param pid     value stored in l_pid
/// @return the populated record; members not listed above are zero-initialised
///
/// Members are assigned by name because POSIX fixes only the member names of
/// struct flock, not their order, so positional aggregate initialisation needs
/// a per-platform #ifdef and silently breaks on layouts it does not know about.
struct flock make_flock(short type, short whence, off_t start, off_t len, pid_t pid)
{
  struct flock fl = {};
  fl.l_type = type;
  fl.l_whence = whence;
  fl.l_start = start;
  fl.l_len = len;
  fl.l_pid = pid;
  return fl;
}
39  }
40 
42  edm::ActivityRegistry& reg) :
43  base_dir_(pset.getUntrackedParameter<std::string> ("baseDir", ".")),
44  bu_base_dir_(pset.getUntrackedParameter<std::string> ("buBaseDir", ".")),
45  directorBu_(pset.getUntrackedParameter<bool> ("directorIsBu", false)),
46  run_(pset.getUntrackedParameter<unsigned int> ("runNumber",0)),
47  outputAdler32Recheck_(pset.getUntrackedParameter<bool>("outputAdler32Recheck",false)),
48  requireTSPSet_(pset.getUntrackedParameter<bool>("requireTransfersPSet",false)),
49  selectedTransferMode_(pset.getUntrackedParameter<std::string>("selectedTransferMode","")),
50  hltSourceDirectory_(pset.getUntrackedParameter<std::string>("hltSourceDirectory","")),
51  fuLockPollInterval_(pset.getUntrackedParameter<unsigned int>("fuLockPollInterval",2000)),
52  emptyLumisectionMode_(pset.getUntrackedParameter<bool>("emptyLumisectionMode",false)),
53  hostname_(""),
54  bu_readlock_fd_(-1),
55  bu_writelock_fd_(-1),
56  fu_readwritelock_fd_(-1),
57  data_readwrite_fd_(-1),
58  fulocal_rwlock_fd_(-1),
59  fulocal_rwlock_fd2_(-1),
60 
61  bu_w_lock_stream(0),
62  bu_r_lock_stream(0),
63  fu_rw_lock_stream(0),
64  //bu_w_monitor_stream(0),
65  //bu_t_monitor_stream(0),
66  data_rw_stream(0),
67 
68  dirManager_(base_dir_),
69 
70  previousFileSize_(0),
71 
72  bu_w_flk( make_flock( F_WRLCK, SEEK_SET, 0, 0, 0 )),
73  bu_r_flk( make_flock( F_RDLCK, SEEK_SET, 0, 0, 0 )),
74  bu_w_fulk( make_flock( F_UNLCK, SEEK_SET, 0, 0, 0 )),
75  bu_r_fulk( make_flock( F_UNLCK, SEEK_SET, 0, 0, 0 )),
76  fu_rw_flk( make_flock ( F_WRLCK, SEEK_SET, 0, 0, getpid() )),
77  fu_rw_fulk( make_flock( F_UNLCK, SEEK_SET, 0, 0, getpid() )),
78  data_rw_flk( make_flock ( F_WRLCK, SEEK_SET, 0, 0, getpid() )),
79  data_rw_fulk( make_flock( F_UNLCK, SEEK_SET, 0, 0, getpid() ))
80  //fulocal_rw_flk( make_flock( F_WRLCK, SEEK_SET, 0, 0, getpid() )),
81  //fulocal_rw_fulk( make_flock( F_UNLCK, SEEK_SET, 0, 0, getpid() )),
82  //fulocal_rw_flk2( make_flock( F_WRLCK, SEEK_SET, 0, 0, getpid() )),
83  //fulocal_rw_fulk2( make_flock( F_UNLCK, SEEK_SET, 0, 0, getpid() ))
84  {
85 
91 
92  std::stringstream ss;
93  ss << "run" << std::setfill('0') << std::setw(6) << run_;
94  run_string_ = ss.str();
96 
97  //save hostname for later
98  char hostname[33];
99  gethostname(hostname,32);
100  hostname_ = hostname;
101 
102  char * fuLockPollIntervalPtr = getenv("FFF_LOCKPOLLINTERVAL");
103  if (fuLockPollIntervalPtr) {
104  try {
105  fuLockPollInterval_=boost::lexical_cast<unsigned int>(std::string(fuLockPollIntervalPtr));
106  edm::LogInfo("Setting fu lock poll interval by environment string: ") << fuLockPollInterval_ << " us";
107  }
108  catch (...) {edm::LogWarning("Unable to parse environment string: ") << std::string(fuLockPollIntervalPtr);}
109  }
110 
111  char * emptyLumiModePtr = getenv("FFF_EMPTYLSMODE");
112  if (emptyLumiModePtr) {
113  emptyLumisectionMode_ = true;
114  edm::LogInfo("Setting empty lumisection mode");
115  }
116 
117  // check if base dir exists or create it accordingly
118  int retval = mkdir(base_dir_.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
119  if (retval != 0 && errno != EEXIST) {
120  throw cms::Exception("DaqDirector") << " Error checking for base dir -: "
121  << base_dir_ << " mkdir error:" << strerror(errno);
122  }
123 
124  //create run dir in base dir
125  umask(0);
126  retval = mkdir(run_dir_.c_str(),
127  S_IRWXU | S_IRWXG | S_IROTH | S_IRWXO | S_IXOTH);
128  if (retval != 0 && errno != EEXIST) {
129  throw cms::Exception("DaqDirector") << " Error creating run dir -: "
130  << run_dir_ << " mkdir error:" << strerror(errno);
131  }
132 
133  //create fu-local.lock in run open dir
134  if (!directorBu_) {
135 
137  std::string fulocal_lock_ = getRunOpenDirPath() +"/fu-local.lock";
138  fulocal_rwlock_fd_ = open(fulocal_lock_.c_str(), O_RDWR | O_CREAT, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);//O_RDWR?
139  if (fulocal_rwlock_fd_==-1)
140  throw cms::Exception("DaqDirector") << " Error creating/opening a local lock file -: " << fulocal_lock_.c_str() << " : " << strerror(errno);
141  chmod(fulocal_lock_.c_str(),0777);
142  fsync(fulocal_rwlock_fd_);
143  //open second fd for another input source thread
144  fulocal_rwlock_fd2_ = open(fulocal_lock_.c_str(), O_RDWR, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);//O_RDWR?
145  if (fulocal_rwlock_fd2_==-1)
146  throw cms::Exception("DaqDirector") << " Error opening a local lock file -: " << fulocal_lock_.c_str() << " : " << strerror(errno);
147  }
148 
149  //bu_run_dir: for FU, for which the base dir is local and the BU is remote, it is expected to be there
150  //for BU, it is created at this point
151  if (directorBu_)
152  {
154  std::string bulockfile = bu_run_dir_ + "/bu.lock";
155  std::string fulockfile = bu_run_dir_ + "/fu.lock";
156 
157  //make or find bu run dir
158  retval = mkdir(bu_run_dir_.c_str(),
159  S_IRWXU | S_IRWXG | S_IRWXO);
160  if (retval != 0 && errno != EEXIST) {
161  throw cms::Exception("DaqDirector")
162  << " Error creating bu run dir -: " << bu_run_dir_
163  << " mkdir error:" << strerror(errno) << "\n";
164  }
165  bu_run_open_dir_ = bu_run_dir_ + "/open";
166  retval = mkdir(bu_run_open_dir_.c_str(),
167  S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
168  if (retval != 0 && errno != EEXIST) {
169  throw cms::Exception("DaqDirector") << " Error creating bu run open dir -: "
170  << bu_run_open_dir_ << " mkdir error:" << strerror(errno)
171  << "\n";
172  }
173 
174  // the BU director does not need to know about the fu lock
175  bu_writelock_fd_ = open(bulockfile.c_str(),
176  O_WRONLY | O_CREAT | O_TRUNC, S_IRWXU);
177  if (bu_writelock_fd_ == -1)
178  edm::LogWarning("EvFDaqDirector") << "problem with creating filedesc for buwritelock -: "
179  << strerror(errno);
180  else
181  edm::LogInfo("EvFDaqDirector") << "creating filedesc for buwritelock -: "
182  << bu_writelock_fd_;
183  bu_w_lock_stream = fdopen(bu_writelock_fd_, "w");
184  if (bu_w_lock_stream == 0)
185  edm::LogWarning("EvFDaqDirector")<< "Error creating write lock stream -: " << strerror(errno);
186 
187  // BU INITIALIZES LOCK FILE
188  // FU LOCK FILE OPEN
189  openFULockfileStream(fulockfile, true);
191  fflush(fu_rw_lock_stream);
192  close(fu_readwritelock_fd_);
193 
194  if (hltSourceDirectory_.size())
195  {
196  struct stat buf;
197  if (stat(hltSourceDirectory_.c_str(),&buf)==0) {
198  std::string hltdir=bu_run_dir_+"/hlt";
199  std::string tmphltdir=bu_run_open_dir_+"/hlt";
200  retval = mkdir(tmphltdir.c_str(),S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
201 
202  boost::filesystem::copy_file(hltSourceDirectory_+"/HltConfig.py",tmphltdir+"/HltConfig.py");
203  try {
204  boost::filesystem::copy_file(hltSourceDirectory_+"/CMSSW_VERSION",tmphltdir+"/CMSSW_VERSION");
205  boost::filesystem::copy_file(hltSourceDirectory_+"/SCRAM_ARCH",tmphltdir+"/SCRAM_ARCH");
206  } catch (...) {}
207 
208  boost::filesystem::copy_file(hltSourceDirectory_+"/fffParameters.jsn",tmphltdir+"/fffParameters.jsn");
209 
210  boost::filesystem::rename(tmphltdir,hltdir);
211  }
212  else
213  throw cms::Exception("DaqDirector") << " Error looking for HLT configuration -: " << hltSourceDirectory_;
214  }
215  //else{}//no configuration specified
216  }
217  else
218  {
219  // for FU, check if bu base dir exists
220 
221  retval = mkdir(bu_base_dir_.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
222  if (retval != 0 && errno != EEXIST) {
223  throw cms::Exception("DaqDirector") << " Error checking for bu base dir -: "
224  << bu_base_dir_ << " mkdir error:" << strerror(errno) << "\n";
225  }
226 
228  std::string fulockfile = bu_run_dir_ + "/fu.lock";
229  openFULockfileStream(fulockfile, false);
230  }
231 
232  pthread_mutex_init(&init_lock_,NULL);
233 
234  stopFilePath_ = run_dir_+"/CMSSW_STOP";
235  }
236 
238  {
239  if (fulocal_rwlock_fd_!=-1) {
240  unlockFULocal();
241  close(fulocal_rwlock_fd_);
242  }
243 
244  if (fulocal_rwlock_fd2_!=-1) {
245  unlockFULocal2();
246  close(fulocal_rwlock_fd2_);
247  }
248 
249  }
250 
252  {
254  desc.setComment("Service used for file locking arbitration and for propagating information between other EvF components");
255  desc.addUntracked<std::string> ("baseDir", ".")->setComment("Local base directory for run output");
256  desc.addUntracked<std::string> ("buBaseDir", ".")->setComment("BU base ramdisk directory ");
257  desc.addUntracked<unsigned int> ("runNumber",0)->setComment("Run Number in ramdisk to open");
258  desc.addUntracked<bool>("outputAdler32Recheck",false)->setComment("Check Adler32 of per-process output files while micro-merging");
259  desc.addUntracked<bool>("requireTransfersPSet",false)->setComment("Require complete transferSystem PSet in the process configuration");
260  desc.addUntracked<std::string>("selectedTransferMode","")->setComment("Selected transfer mode (choice in Lvl0 propagated as Python parameter");
261  desc.addUntracked<unsigned int>("fuLockPollInterval",2000)->setComment("Lock polling interval in microseconds for the input directory file lock");
262  desc.addUntracked<bool>("emptyLumisectionMode",false)->setComment("Enables writing stream output metadata even when no events are processed in a lumisection");
263  desc.setAllowAnything();
264  descriptions.add("EvFDaqDirector", desc);
265  }
266 
267  void EvFDaqDirector::postEndRun(edm::GlobalContext const& globalContext) {
268  close(bu_readlock_fd_);
269  close(bu_writelock_fd_);
270  if (directorBu_) {
271  std::string filename = bu_run_dir_ + "/bu.lock";
272  removeFile(filename);
273  }
274  }
275 
277 
278  for (unsigned int i=0;i<bounds.maxNumberOfStreams();i++){
279  streamFileTracker_.push_back(-1);
280  }
281  nThreads_=bounds.maxNumberOfStreams();
282  nStreams_=bounds.maxNumberOfThreads();
283 
285  }
286 
287  void EvFDaqDirector::preBeginRun(edm::GlobalContext const& globalContext) {
288 
289  //assert(run_ == id.run());
290 
291  // check if the requested run is the latest one - issue a warning if it isn't
293  edm::LogWarning("EvFDaqDirector") << "WARNING - checking run dir -: "
294  << run_dir_ << ". This is not the highest run "
296  }
297  }
298 
300  {
301  //delete all files belonging to just closed lumi
302  unsigned int ls = globalContext.luminosityBlockID().luminosityBlock();
304  edm::LogWarning("EvFDaqDirector") << " Handles to check for files to delete were not set by the input source...";
305  return;
306  }
307 
308  std::unique_lock<std::mutex> lkw(*fileDeleteLockPtr_);
309  auto it = filesToDeletePtr_->begin();
310  while (it!=filesToDeletePtr_->end()) {
311  if (it->second->lumi_ == ls) {
312  const boost::filesystem::path filePath(it->second->fileName_);
313  LogDebug("EvFDaqDirector") << "Deleting input file -:" << it->second->fileName_;
314  try {
315  //rarely this fails but file gets deleted
316  boost::filesystem::remove(filePath);
317  }
318  catch (const boost::filesystem::filesystem_error& ex)
319  {
320  edm::LogError("EvFDaqDirector") << " - deleteFile BOOST FILESYSTEM ERROR CAUGHT -: " << ex.what() << ". Trying again.";
321  usleep(10000);
322  try {
323  boost::filesystem::remove(filePath);
324  }
325  catch (...) {/*file gets deleted first time but exception is still thrown*/}
326  }
327  catch (std::exception& ex)
328  {
329  edm::LogError("EvFDaqDirector") << " - deleteFile std::exception CAUGHT -: " << ex.what() << ". Trying again.";
330  usleep(10000);
331  try {
332  boost::filesystem::remove(filePath);
333  } catch (...) {/*file gets deleted first time but exception is still thrown*/}
334  }
335 
336  delete it->second;
337  it = filesToDeletePtr_->erase(it);
338  }
339  else it++;
340  }
341  }
342 
343  inline void EvFDaqDirector::preSourceEvent(edm::StreamID const& streamID) {
345  }
346 
347 
348  std::string EvFDaqDirector::getInputJsonFilePath(const unsigned int ls, const unsigned int index) const {
349  return bu_run_dir_ + "/" + fffnaming::inputJsonFileName(run_,ls,index);
350  }
351 
352 
353  std::string EvFDaqDirector::getRawFilePath(const unsigned int ls, const unsigned int index) const {
354  return bu_run_dir_ + "/" + fffnaming::inputRawFileName(run_,ls,index);
355  }
356 
357  std::string EvFDaqDirector::getOpenRawFilePath(const unsigned int ls, const unsigned int index) const {
358  return bu_run_dir_ + "/open/" + fffnaming::inputRawFileName(run_,ls,index);
359  }
360 
361  std::string EvFDaqDirector::getOpenInputJsonFilePath(const unsigned int ls, const unsigned int index) const {
362  return bu_run_dir_ + "/open/" + fffnaming::inputJsonFileName(run_,ls,index);
363  }
364 
365  std::string EvFDaqDirector::getOpenDatFilePath(const unsigned int ls, std::string const& stream) const {
366  return run_dir_ + "/open/" + fffnaming::streamerDataFileNameWithPid(run_,ls,stream);
367  }
368 
369  std::string EvFDaqDirector::getOpenOutputJsonFilePath(const unsigned int ls, std::string const& stream) const {
370  return run_dir_ + "/open/" + fffnaming::streamerJsonFileNameWithPid(run_,ls,stream);
371  }
372 
373  std::string EvFDaqDirector::getOutputJsonFilePath(const unsigned int ls, std::string const& stream) const {
374  return run_dir_ + "/" + fffnaming::streamerJsonFileNameWithPid(run_,ls,stream);
375  }
376 
377  std::string EvFDaqDirector::getMergedDatFilePath(const unsigned int ls, std::string const& stream) const {
379  }
380 
381  std::string EvFDaqDirector::getMergedDatChecksumFilePath(const unsigned int ls, std::string const& stream) const {
383  }
384 
386  return run_dir_ + "/open/" + fffnaming::initFileNameWithPid(run_,0,stream);
387  }
388 
390  return run_dir_ + "/" + fffnaming::initFileNameWithPid(run_,0,stream);
391  }
392 
394  return run_dir_ + "/open/" + fffnaming::protocolBufferHistogramFileNameWithPid(run_,ls,stream);
395  }
396 
399  }
400 
403  }
404 
405  std::string EvFDaqDirector::getOpenRootHistogramFilePath(const unsigned int ls, std::string const& stream) const {
406  return run_dir_ + "/open/" + fffnaming::rootHistogramFileNameWithPid(run_,ls,stream);
407  }
408 
409  std::string EvFDaqDirector::getRootHistogramFilePath(const unsigned int ls, std::string const& stream) const {
410  return run_dir_ + "/" + fffnaming::rootHistogramFileNameWithPid(run_,ls,stream);
411  }
412 
415  }
416 
418  return bu_run_dir_ + "/" + fffnaming::eolsFileName(run_,ls);
419  }
420 
422  return run_dir_ + "/" + fffnaming::eolsFileName(run_,ls);
423  }
424 
426  return run_dir_ + "/" + fffnaming::bolsFileName(run_,ls);
427  }
428 
430  return bu_run_dir_ + "/" + fffnaming::eorFileName(run_);
431  }
432 
433 
435  return run_dir_ + "/" + fffnaming::eorFileName(run_);
436  }
437 
439  int retval = remove(filename.c_str());
440  if (retval != 0)
441  edm::LogError("EvFDaqDirector") << "Could not remove used file -: " << filename << ". error = "
442  << strerror(errno);
443  }
444 
445  void EvFDaqDirector::removeFile(unsigned int ls, unsigned int index) {
446  removeFile(getRawFilePath(ls,index));
447  }
448 
449  EvFDaqDirector::FileStatus EvFDaqDirector::updateFuLock(unsigned int& ls, std::string& nextFile, uint32_t& fsize, uint64_t& lockWaitTime) {
450  EvFDaqDirector::FileStatus fileStatus = noFile;
451 
452  int retval = -1;
453  int lock_attempts = 0;
454 
455  struct stat buf;
456  int stopFileLS = -1;
457  if (stat(stopFilePath_.c_str(),&buf)==0) {
458  stopFileLS = readLastLSEntry(stopFilePath_);
459  edm::LogWarning("EvFDaqDirector") << "Detected stop request from hltd. Ending run for this process after LS -: " << stopFileLS;
460  //return runEnded;
461  }
462 
463  timeval ts_lockbegin;
464  gettimeofday(&ts_lockbegin,0);
465 
466  while (retval==-1) {
467  retval = fcntl(fu_readwritelock_fd_, F_SETLK, &fu_rw_flk);
468  if (retval==-1) usleep(fuLockPollInterval_);
469  else continue;
470 
471  lock_attempts+=fuLockPollInterval_;
472  if (lock_attempts>5000000 || errno==116) {
473  if (errno==116)
474  edm::LogWarning("EvFDaqDirector") << "Stale lock file handle. Checking if run directory and fu.lock file are present" << std::endl;
475  else
476  edm::LogWarning("EvFDaqDirector") << "Unable to obtain a lock for 5 seconds. Checking if run directory and fu.lock file are present -: errno "
477  << errno <<":"<< strerror(errno) << std::endl;
478 
479 
480  if (stat(getEoLSFilePathOnFU(ls).c_str(),&buf)==0) {
481  edm::LogWarning("EvFDaqDirector") << "Detected local EoLS for lumisection "<< ls ;
482  ls++;
483  return noFile;
484  }
485 
486  if (stat(bu_run_dir_.c_str(), &buf)!=0) return runEnded;
487  if (stat((bu_run_dir_+"/fu.lock").c_str(), &buf)!=0) return runEnded;
488  lock_attempts=0;
489  }
490  }
491 
492  timeval ts_lockend;
493  gettimeofday(&ts_lockend,0);
494  long deltat = (ts_lockend.tv_usec-ts_lockbegin.tv_usec) + (ts_lockend.tv_sec-ts_lockbegin.tv_sec)*1000000;
495  if (deltat>0.) lockWaitTime=deltat;
496 
497 
498 
499  if(retval!=0) return fileStatus;
500 
501 #ifdef DEBUG
502  timeval ts_lockend;
503  gettimeofday(&ts_lockend,0);
504 #endif
505 
506  // if the stream is readable
507  if (fu_rw_lock_stream != 0) {
508  unsigned int readLs, readIndex;
509  int check = 0;
510  // rewind the stream
511  check = fseek(fu_rw_lock_stream, 0, SEEK_SET);
512  // if rewinded ok
513  if (check == 0) {
514  // read its' values
515  fscanf(fu_rw_lock_stream, "%u %u", &readLs, &readIndex);
516  edm::LogInfo("EvFDaqDirector") << "Read fu.lock file file -: " << readLs << ":" << readIndex;
517 
518  unsigned int currentLs = readLs;
519  bool bumpedOk = false;
520  //if next lumisection in a lock file is not +1 wrt. source, cycle through the next empty one, unless initial lumi not yet set
521  //no lock file write in this case
522  if (ls && ls+1 < currentLs) ls++;
523  else {
524  // try to bump (look for new index or EoLS file)
525  bumpedOk = bumpFile(readLs, readIndex, nextFile, fsize, stopFileLS);
526  //avoid 2 lumisections jump
527  if (ls && readLs>currentLs && currentLs > ls) {
528  ls++;
529  readLs=currentLs=ls;
530  readIndex=0;
531  bumpedOk=false;
532  //no write to lock file
533  }
534  else {
535  if (ls==0 && readLs>currentLs) {
536  //make sure to intialize always with LS found in the lock file, with possibility of grabbing index file immediately
537  //in this case there is no new file in the same LS
538  readLs=currentLs;
539  readIndex=0;
540  bumpedOk=false;
541  //no write to lock file
542  }
543  //update return LS value
544  ls = readLs;
545  }
546  }
547  if (bumpedOk) {
548  // there is a new index file to grab, lock file needs to be updated
549  check = fseek(fu_rw_lock_stream, 0, SEEK_SET);
550  if (check == 0) {
551  ftruncate(fu_readwritelock_fd_, 0);
552  // write next index in the file, which is the file the next process should take
553  fprintf(fu_rw_lock_stream, "%u %u", readLs, readIndex + 1);
554  fflush(fu_rw_lock_stream);
555  fsync(fu_readwritelock_fd_);
556  fileStatus = newFile;
557  LogDebug("EvFDaqDirector") << "Written to file -: " << readLs << ":" << readIndex + 1;
558  }
559  else {
560  throw cms::Exception("EvFDaqDirector") << "seek on fu read/write lock for updating failed with error " << strerror(errno);
561  }
562  }
563  else if (currentLs < readLs) {
564  //there is no new file in next LS (yet), but lock file can be updated to the next LS
565  check = fseek(fu_rw_lock_stream, 0, SEEK_SET);
566  if (check == 0) {
567  ftruncate(fu_readwritelock_fd_, 0);
568  // in this case LS was bumped, but no new file. Thus readIndex is 0 (set by bumpFile)
569  fprintf(fu_rw_lock_stream, "%u %u", readLs, readIndex);
570  fflush(fu_rw_lock_stream);
571  fsync(fu_readwritelock_fd_);
572  LogDebug("EvFDaqDirector") << "Written to file -: " << readLs << ":" << readIndex;
573  }
574  else {
575  throw cms::Exception("EvFDaqDirector") << "seek on fu read/write lock for updating failed with error " << strerror(errno);
576  }
577  }
578  } else {
579  edm::LogError("EvFDaqDirector") << "seek on fu read/write lock for reading failed with error " << strerror(errno);
580  }
581  } else {
582  edm::LogError("EvFDaqDirector") << "fu read/write lock stream is invalid " << strerror(errno);
583  }
584 
585 #ifdef DEBUG
586  timeval ts_preunlock;
587  gettimeofday(&ts_preunlock,0);
588  int locked_period_int = ts_preunlock.tv_sec - ts_lockend.tv_sec;
589  double locked_period=locked_period_int+double(ts_preunlock.tv_usec - ts_lockend.tv_usec)/1000000;
590 #endif
591 
592  //if new json is present, lock file which FedRawDataInputSource will later unlock
593  if (fileStatus==newFile) lockFULocal();
594 
595  //release lock at this point
596  int retvalu=-1;
597  retvalu=fcntl(fu_readwritelock_fd_, F_SETLKW, &fu_rw_fulk);
598  if (retvalu==-1) edm::LogError("EvFDaqDirector") << "Error unlocking the fu.lock " << strerror(errno);
599 
600 #ifdef DEBUG
601  edm::LogDebug("EvFDaqDirector") << "Waited during lock -: " << locked_period << " seconds";
602 #endif
603 
604  if ( fileStatus == noFile ) {
605  struct stat buf;
606  //edm::LogInfo("EvFDaqDirector") << " looking for EoR file: " << getEoRFilePath().c_str();
607  if ( stat(getEoRFilePath().c_str(), &buf) == 0 || stat(bu_run_dir_.c_str(), &buf)!=0)
608  fileStatus = runEnded;
609  if (stopFileLS>=0 && (int)ls > stopFileLS) {
610  edm::LogInfo("EvFDaqDirector") << "Reached maximum lumisection set by hltd";
611  fileStatus = runEnded;
612  }
613  }
614  return fileStatus;
615  }
616 
618 
619  boost::filesystem::ifstream ij(BUEoLSFile);
620  Json::Value deserializeRoot;
622 
623  if (!reader.parse(ij, deserializeRoot)) {
624  edm::LogError("EvFDaqDirector") << "Cannot deserialize input JSON file -:" << BUEoLSFile;
625  return -1;
626  }
627 
629  DataPoint dp;
630  dp.deserialize(deserializeRoot);
631 
632  //read definition
633  if (readEolsDefinition_) {
634  //std::string def = boost::algorithm::trim(dp.getDefinition());
636  if (!def.size()) readEolsDefinition_=false;
637  while (def.size()) {
638  std::string fullpath;
639  if (def.find('/')==0)
640  fullpath = def;
641  else
642  fullpath = bu_run_dir_+'/'+def;
643  struct stat buf;
644  if (stat(fullpath.c_str(), &buf) == 0) {
645  DataPointDefinition eolsDpd;
646  std::string defLabel = "legend";
647  DataPointDefinition::getDataPointDefinitionFor(fullpath, &eolsDpd,&defLabel);
648  if (eolsDpd.getNames().size()==0) {
649  //try with "data" label if "legend" format is not used
650  eolsDpd = DataPointDefinition();
651  defLabel="data";
652  DataPointDefinition::getDataPointDefinitionFor(fullpath, &eolsDpd,&defLabel);
653  }
654  for (unsigned int i=0;i<eolsDpd.getNames().size();i++)
655  if (eolsDpd.getNames().at(i)=="NFiles")
657  readEolsDefinition_=false;
658  break;
659  }
660  //check if we can still find definition
661  if (def.size()<=1 || def.find('/')==std::string::npos) {
662  readEolsDefinition_=false;
663  break;
664  }
665  def = def.substr(def.find('/')+1);
666  }
667  }
668 
669  if (dp.getData().size()>eolsNFilesIndex_)
670  data = dp.getData()[eolsNFilesIndex_];
671  else {
672  edm::LogError("EvFDaqDirector") << " error reading number of files from BU JSON -: " << BUEoLSFile;
673  return -1;
674  }
675  return boost::lexical_cast<int>(data);
676  }
677 
678  bool EvFDaqDirector::bumpFile(unsigned int& ls, unsigned int& index, std::string& nextFile, uint32_t& fsize, int maxLS) {
679 
680  if (previousFileSize_ != 0) {
681  if (!fms_) {
682  try {
684  } catch (...) {
685  edm::LogError("EvFDaqDirector") <<" FastMonitoringService not found";
686  }
687  }
689  previousFileSize_ = 0;
690  }
691 
692  //reached limit
693  if (maxLS>=0 && ls > (unsigned int)maxLS) return false;
694 
695  struct stat buf;
696  std::stringstream ss;
697  unsigned int nextIndex = index;
698  nextIndex++;
699 
700  // 1. Check suggested file
701  nextFile = getInputJsonFilePath(ls,index);
702  if (stat(nextFile.c_str(), &buf) == 0) {
703 
704  previousFileSize_ = buf.st_size;
705  fsize = buf.st_size;
706  return true;
707  }
708  // 2. No file -> lumi ended? (and how many?)
709  else {
710  std::string BUEoLSFile = getEoLSFilePathOnBU(ls);
711  bool eolFound = (stat(BUEoLSFile.c_str(), &buf) == 0);
712  while (eolFound) {
713 
714  // recheck that no raw file appeared in the meantime
715  if (stat(nextFile.c_str(), &buf) == 0) {
716  previousFileSize_ = buf.st_size;
717  fsize = buf.st_size;
718  return true;
719  }
720 
721  int indexFilesInLS = getNFilesFromEoLS(BUEoLSFile);
722  if (indexFilesInLS < 0)
723  //parsing failed
724  return false;
725  else {
726  //check index
727  if ((int)index<indexFilesInLS) {
728  //we have 2 files, and check for 1 failed... retry (2 will never be here)
729  edm::LogError("EvFDaqDirector") << "Potential miss of index file in LS -: " << ls << ". Missing "
730  << nextFile << " because " << indexFilesInLS-1 << " is the highest index expected. Will not update fu.lock file";
731  return false;
732  }
733  }
734  // this lumi ended, check for files
735  ++ls;
736  index = 0;
737 
738  //reached limit
739  if (maxLS>=0 && ls > (unsigned int)maxLS) return false;
740 
741  nextFile = getInputJsonFilePath(ls,0);
742  if (stat(nextFile.c_str(), &buf) == 0) {
743  // a new file was found at new lumisection, index 0
744  previousFileSize_ = buf.st_size;
745  fsize = buf.st_size;
746  return true;
747  }
748  else {
749  //change of policy: we need to cycle through each LS
750  return false;
751  }
752  BUEoLSFile = getEoLSFilePathOnBU(ls);
753  eolFound = (stat(BUEoLSFile.c_str(), &buf) == 0);
754  }
755  }
756  // no new file found
757  return false;
758  }
759 
761  if (fu_rw_lock_stream == 0)
762  edm::LogError("EvFDaqDirector") << "Error creating fu read/write lock stream "
763  << strerror(errno);
764  else {
765  edm::LogInfo("EvFDaqDirector") << "Initializing FU LOCK FILE";
766  unsigned int readLs = 1, readIndex = 0;
767  fprintf(fu_rw_lock_stream, "%u %u", readLs, readIndex);
768  }
769  }
770 
772  if (create) {
773  fu_readwritelock_fd_ = open(fulockfile.c_str(), O_RDWR | O_CREAT,
774  S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);
775  chmod(fulockfile.c_str(),0766);
776  } else {
777  fu_readwritelock_fd_ = open(fulockfile.c_str(), O_RDWR, S_IRWXU);
778  }
779  if (fu_readwritelock_fd_ == -1)
780  edm::LogError("EvFDaqDirector") << "problem with creating filedesc for fuwritelock -: " << fulockfile.c_str()
781  << " create:" << create << " error:" << strerror(errno);
782  else
783  LogDebug("EvFDaqDirector") << "creating filedesc for fureadwritelock -: "
785 
786  fu_rw_lock_stream = fdopen(fu_readwritelock_fd_, "r+");
787  }
788 
789  //create if does not exist then lock the merge destination file
791  data_rw_stream = fopen(getMergedDatFilePath(ls,stream).c_str(), "a"); //open stream for appending
793  if (data_readwrite_fd_ == -1)
794  edm::LogError("EvFDaqDirector") << "problem with creating filedesc for datamerge "
795  << strerror(errno);
796  else
797  LogDebug("EvFDaqDirector") << "creating filedesc for datamerge -: "
799  fcntl(data_readwrite_fd_, F_SETLKW, &data_rw_flk);
800 
801  return data_rw_stream;
802  }
803 
805  fflush(data_rw_stream);
806  fcntl(data_readwrite_fd_, F_SETLKW, &data_rw_fulk);
807  fclose(data_rw_stream);
808  }
809 
811  pthread_mutex_lock(&init_lock_);
812  }
813 
815  pthread_mutex_unlock(&init_lock_);
816  }
817 
819  //fcntl(fulocal_rwlock_fd_, F_SETLKW, &fulocal_rw_flk);
820  flock(fulocal_rwlock_fd_,LOCK_SH);
821  }
822 
824  //fcntl(fulocal_rwlock_fd_, F_SETLKW, &fulocal_rw_fulk);
825  flock(fulocal_rwlock_fd_,LOCK_UN);
826  }
827 
828 
830  //fcntl(fulocal_rwlock_fd2_, F_SETLKW, &fulocal_rw_flk2);
831  flock(fulocal_rwlock_fd2_,LOCK_EX);
832  }
833 
835  //fcntl(fulocal_rwlock_fd2_, F_SETLKW, &fulocal_rw_fulk2);
836  flock(fulocal_rwlock_fd2_,LOCK_UN);
837  }
838 
839 
841  // create open dir if not already there
842 
844  if (!boost::filesystem::is_directory(openPath)) {
845  LogDebug("EvFDaqDirector") << "<open> FU dir not found. Creating... -:" << openPath.string();
846  boost::filesystem::create_directories(openPath);
847  }
848  }
849 
850 
852 
853  boost::filesystem::ifstream ij(file);
854  Json::Value deserializeRoot;
856 
857  if (!reader.parse(ij, deserializeRoot)) {
858  edm::LogError("EvFDaqDirector") << "Cannot deserialize input JSON file -:" << file;
859  return -1;
860  }
861 
862  int ret = deserializeRoot.get("lastLS","").asInt();
863  return ret;
864 
865  }
866 
867  //if transferSystem PSet is present in the menu, we require it to be complete and consistent for all specified streams
869  {
870  transferSystemJson_.reset(new Json::Value);
871  if (edm::getProcessParameterSet().existsAs<edm::ParameterSet>("transferSystem",true))
872  {
873  const edm::ParameterSet& tsPset(edm::getProcessParameterSet().getParameterSet("transferSystem"));
874 
875  Json::Value destinationsVal(Json::arrayValue);
876  std::vector<std::string> destinations = tsPset.getParameter<std::vector<std::string>>("destinations");
877  for (auto & dest: destinations) destinationsVal.append(dest);
878  (*transferSystemJson_)["destinations"]=destinationsVal;
879 
880  Json::Value modesVal(Json::arrayValue);
881  std::vector<std::string> modes = tsPset.getParameter< std::vector<std::string> >("transferModes");
882  for (auto & mode: modes) modesVal.append(mode);
883  (*transferSystemJson_)["transferModes"]=modesVal;
884 
885  for (auto psKeyItr =tsPset.psetTable().begin();psKeyItr!=tsPset.psetTable().end(); ++ psKeyItr) {
886  if (psKeyItr->first!="destinations" && psKeyItr->first!="transferModes") {
887  const edm::ParameterSet & streamDef = tsPset.getParameterSet(psKeyItr->first);
888  Json::Value streamVal;
889  for (auto & mode : modes) {
890  //validation
891  if (!streamDef.existsAs<std::vector<std::string>>(mode,true))
892  throw cms::Exception("EvFDaqDirector") << " Missing transfer system specification for -:" << psKeyItr->first << " (transferMode " << mode << ")";
893  std::vector<std::string> streamDestinations = streamDef.getParameter<std::vector<std::string>>(mode);
894 
895  Json::Value sDestsValue(Json::arrayValue);
896 
897  if (!streamDestinations.size())
898  throw cms::Exception("EvFDaqDirector") << " Missing transter system destination(s) for -: "<< psKeyItr->first << ", mode:" << mode;
899 
900  for (auto & sdest:streamDestinations) {
901  bool sDestValid=false;
902  sDestsValue.append(sdest);
903  for (auto & dest: destinations) {
904  if (dest==sdest) sDestValid=true;
905  }
906  if (!sDestValid)
907  throw cms::Exception("EvFDaqDirector") << " Invalid transter system destination specified for -: "<< psKeyItr->first << ", mode:" << mode << ", dest:"<<sdest;
908  }
909  streamVal[mode]=sDestsValue;
910  }
911  (*transferSystemJson_)[psKeyItr->first] = streamVal;
912  }
913  }
914  }
915  else {
916  if (requireTSPSet_)
917  throw cms::Exception("EvFDaqDirector") << "transferSystem PSet not found";
918  }
919  }
920 
922  {
923  std::string streamRequestName;
924  if (transferSystemJson_->isMember(stream.c_str()))
925  streamRequestName = stream;
926  else {
927  std::stringstream msg;
928  msg << "Transfer system mode definitions missing for -: " << stream;
929  if (requireTSPSet_)
930  throw cms::Exception("EvFDaqDirector") << msg.str();
931  else {
932  edm::LogWarning("EvFDaqDirector") << msg.str() << " (permissive mode)";
933  return std::string("Failsafe");
934  }
935  }
936  //return empty if strict check parameter is not on
938  edm::LogWarning("EvFDaqDirector") << "Selected mode string is not provided as DaqDirector parameter."
939  << "Switch on requireTSPSet parameter to enforce this requirement. Setting mode to empty string.";
940  return std::string("Failsafe");
941  }
943  throw cms::Exception("EvFDaqDirector") << "Selected mode string is not provided as DaqDirector parameter.";
944  }
945  //check if stream has properly listed transfer stream
946  if (!transferSystemJson_->get(streamRequestName, "").isMember(selectedTransferMode_.c_str()))
947  {
948  std::stringstream msg;
949  msg << "Selected transfer mode " << selectedTransferMode_ << " is not specified for stream " << streamRequestName;
950  if (requireTSPSet_)
951  throw cms::Exception("EvFDaqDirector") << msg.str();
952  else
953  edm::LogWarning("EvFDaqDirector") << msg.str() << " (permissive mode)";
954  return std::string("Failsafe");
955  }
956  Json::Value destsVec = transferSystemJson_->get(streamRequestName, "").get(selectedTransferMode_,"");
957 
958  //flatten string json::Array into CSV std::string
960  for (Json::Value::iterator it = destsVec.begin(); it!=destsVec.end(); it++)
961  {
962  if (ret!="") ret +=",";
963  ret+=(*it).asString();
964  }
965  return ret;
966  }
967 
969  std::string proc_flag = run_dir_ + "/processing";
970  int proc_flag_fd = open(proc_flag.c_str(), O_RDWR | O_CREAT, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);
971  close(proc_flag_fd);
972  }
973 
974 }
#define LogDebug(id)
unsigned int nThreads_
type
Definition: HCALResponse.h:21
unsigned int maxNumberOfThreads() const
Definition: SystemBounds.h:46
T getParameter(std::string const &) const
std::string getStreamDestinations(std::string const &stream) const
Value get(UInt index, const Value &defaultValue) const
std::vector< std::string > & getData()
Definition: DataPoint.h:58
int i
Definition: DBlmapReader.cc:9
struct flock fu_rw_flk
std::string run_string_
std::string protocolBufferHistogramFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
tuple start
Check for commandline option errors.
Definition: dqm_diff.py:58
std::string bolsFileName(const unsigned int run, const unsigned int ls)
std::string streamerDataChecksumFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
std::string getMergedProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
void watchPreallocate(Preallocate::slot_type const &iSlot)
std::vector< int > streamFileTracker_
const_iterator begin() const
bool existsAs(std::string const &parameterName, bool trackiness=true) const
checks if a parameter exists as a given type
Definition: ParameterSet.h:186
std::list< std::pair< int, InputFile * > > * filesToDeletePtr_
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
ParameterDescriptionBase * addUntracked(U const &iLabel, T const &value)
std::string getMergedDatChecksumFilePath(const unsigned int ls, std::string const &stream) const
std::shared_ptr< Json::Value > transferSystemJson_
void setAllowAnything()
allow any parameter label/value pairs
void openFULockfileStream(std::string &fuLockFilePath, bool create)
void accumulateFileSize(unsigned int lumi, unsigned long fileSize)
void watchPreGlobalEndLumi(PreGlobalEndLumi::slot_type const &iSlot)
std::string getInitFilePath(std::string const &stream) const
std::string getMergedRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string inputRawFileName(const unsigned int run, const unsigned int ls, const unsigned int index)
ParameterSet const & getParameterSet(ParameterSetID const &id)
pthread_mutex_t init_lock_
LuminosityBlockID const & luminosityBlockID() const
Definition: GlobalContext.h:52
std::string getProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string getRawFilePath(const unsigned int ls, const unsigned int index) const
std::string getOpenInitFilePath(std::string const &stream) const
std::string getOpenRawFilePath(const unsigned int ls, const unsigned int index) const
Value & append(const Value &value)
Append value to array at the end.
#define NULL
Definition: scimark2.h:8
struct flock data_rw_flk
void createProcessingNotificationMaybe() const
bool parse(const std::string &document, Value &root, bool collectComments=true)
Read a Value from a JSON document.
Represents a JSON value.
Definition: value.h:111
std::string getEoLSFilePathOnBU(const unsigned int ls) const
std::string getEoRFilePath() const
unsigned long previousFileSize_
struct flock fu_rw_fulk
unsigned int maxNumberOfStreams() const
Definition: SystemBounds.h:43
std::string hltSourceDirectory_
std::string getOpenProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
void setComment(std::string const &value)
std::mutex * fileDeleteLockPtr_
std::string streamerDataFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
EvFDaqDirector(const edm::ParameterSet &pset, edm::ActivityRegistry &reg)
std::string getMergedDatFilePath(const unsigned int ls, std::string const &stream) const
bool check(const std::string &)
FileStatus updateFuLock(unsigned int &ls, std::string &nextFile, uint32_t &fsize, uint64_t &lockWaitTime)
std::string getOpenOutputJsonFilePath(const unsigned int ls, std::string const &stream) const
std::string getOpenRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string getRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string getOpenDatFilePath(const unsigned int ls, std::string const &stream) const
std::string inputJsonFileName(const unsigned int run, const unsigned int ls, const unsigned int index)
std::string stopFilePath_
FILE * maybeCreateAndLockFileHeadForStream(unsigned int ls, std::string &stream)
std::string bu_base_dir_
void removeFile(unsigned int ls, unsigned int index)
std::string selectedTransferMode_
std::string streamerJsonFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
std::string getOpenInputJsonFilePath(const unsigned int ls, const unsigned int index) const
std::string eorFileName(const unsigned int run)
int readLastLSEntry(std::string const &file)
virtual void deserialize(Json::Value &root)
Definition: DataPoint.cc:56
unsigned int eolsNFilesIndex_
void watchPreGlobalBeginRun(PreGlobalBeginRun::slot_type const &iSlot)
std::string getOutputJsonFilePath(const unsigned int ls, std::string const &stream) const
int getNFilesFromEoLS(std::string BUEoLSFile)
void preBeginRun(edm::GlobalContext const &globalContext)
std::string rootHistogramFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
psettable const & psetTable() const
Definition: ParameterSet.h:257
Int asInt() const
void preSourceEvent(edm::StreamID const &streamID)
std::string initFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
unsigned long long uint64_t
Definition: Time.h:15
ParameterSet const & getProcessParameterSet()
Definition: Registry.cc:85
ParameterSet const & getParameterSet(std::string const &) const
void preGlobalEndLumi(edm::GlobalContext const &globalContext)
tuple pid
Definition: sysUtil.py:22
void watchPostGlobalEndRun(PostGlobalEndRun::slot_type const &iSlot)
LuminosityBlockNumber_t luminosityBlock() const
void add(std::string const &label, ParameterSetDescription const &psetDescription)
std::string & getDefinition()
Definition: DataPoint.h:59
evf::FastMonitoringService * fms_
std::string bu_run_dir_
std::string rootHistogramFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
std::string findHighestRunDir()
Definition: DirManager.cc:20
std::string getBoLSFilePathOnFU(const unsigned int ls) const
char data[epos_bytes_allocation]
Definition: EPOS_Wrapper.h:82
void postEndRun(edm::GlobalContext const &globalContext)
tuple filename
Definition: lut2db_cfg.py:20
Unserialize a JSON document into a Value.
Definition: reader.h:16
tuple destinations
Definition: gather_cfg.py:120
const_iterator end() const
std::vector< std::string > const & getNames()
std::string getEoLSFilePathOnFU(const unsigned int ls) const
void watchPreSourceEvent(PreSourceEvent::slot_type const &iSlot)
bool bumpFile(unsigned int &ls, unsigned int &index, std::string &nextFile, uint32_t &fsize, int maxLS)
volatile std::atomic< bool > shutdown_flag false
void preallocate(edm::service::SystemBounds const &bounds)
struct flock data_rw_fulk
Iterator for object and array value.
Definition: value.h:1007
std::string getInputJsonFilePath(const unsigned int ls, const unsigned int index) const
std::string getRunOpenDirPath() const
JetCorrectorParameters::Definitions def
Definition: classes.h:6
std::string protocolBufferHistogramFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
unsigned int fuLockPollInterval_
SurfaceDeformation * create(int type, const std::vector< double > &params)
std::string eolsFileName(const unsigned int run, const unsigned int ls)
unsigned int nStreams_
std::string streamerDataFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
std::string getEoRFilePathOnFU() const
std::string bu_run_open_dir_
array value (ordered list)
Definition: value.h:31