CMS 3D CMS Logo

EvFDaqDirector.cc
Go to the documentation of this file.
11 
19 
20 #include <iostream>
21 #include <fstream>
22 #include <sstream>
23 #include <sys/time.h>
24 #include <unistd.h>
25 #include <cstdio>
26 #include <boost/algorithm/string.hpp>
27 
28 //using boost::asio::ip::tcp;
29 
30 //#define DEBUG
31 
32 using namespace jsoncollector;
33 using namespace edm::streamer;
34 
35 namespace evf {
36 
37  // Display names for enum MergeType; presumably indexed by the enum's numeric value, with the empty string as entry 0 - TODO confirm the ordering against the enum declaration.
38  const std::vector<std::string> EvFDaqDirector::MergeTypeNames_ = {"", "DAT", "PB", "JSNDATA"};
39 
41  : base_dir_(pset.getUntrackedParameter<std::string>("baseDir")),
42  bu_base_dir_(pset.getUntrackedParameter<std::string>("buBaseDir")),
43  bu_base_dirs_all_(pset.getUntrackedParameter<std::vector<std::string>>("buBaseDirsAll")),
44  bu_base_dirs_nSources_(pset.getUntrackedParameter<std::vector<int>>("buBaseDirsNumStreams")),
45  run_(pset.getUntrackedParameter<unsigned int>("runNumber")),
46  useFileBroker_(pset.getUntrackedParameter<bool>("useFileBroker")),
47  fileBrokerHostFromCfg_(pset.getUntrackedParameter<bool>("fileBrokerHostFromCfg", false)),
48  fileBrokerHost_(pset.getUntrackedParameter<std::string>("fileBrokerHost", "InValid")),
49  fileBrokerPort_(pset.getUntrackedParameter<std::string>("fileBrokerPort", "8080")),
50  fileBrokerKeepAlive_(pset.getUntrackedParameter<bool>("fileBrokerKeepAlive", true)),
51  fileBrokerUseLocalLock_(pset.getUntrackedParameter<bool>("fileBrokerUseLocalLock", true)),
52  fuLockPollInterval_(pset.getUntrackedParameter<unsigned int>("fuLockPollInterval", 2000)),
53  outputAdler32Recheck_(pset.getUntrackedParameter<bool>("outputAdler32Recheck", false)),
54  directorBU_(pset.getUntrackedParameter<bool>("directorIsBU", false)),
55  hltSourceDirectory_(pset.getUntrackedParameter<std::string>("hltSourceDirectory", "")),
56  hostname_(""),
57  bu_readlock_fd_(-1),
58  bu_writelock_fd_(-1),
59  fu_readwritelock_fd_(-1),
60  fulocal_rwlock_fd_(-1),
61  fulocal_rwlock_fd2_(-1),
62  bu_w_lock_stream(nullptr),
63  bu_r_lock_stream(nullptr),
64  fu_rw_lock_stream(nullptr),
65  dirManager_(base_dir_),
66  previousFileSize_(0),
67  bu_w_flk(make_flock(F_WRLCK, SEEK_SET, 0, 0, 0)),
68  bu_r_flk(make_flock(F_RDLCK, SEEK_SET, 0, 0, 0)),
69  bu_w_fulk(make_flock(F_UNLCK, SEEK_SET, 0, 0, 0)),
70  bu_r_fulk(make_flock(F_UNLCK, SEEK_SET, 0, 0, 0)),
71  fu_rw_flk(make_flock(F_WRLCK, SEEK_SET, 0, 0, getpid())),
72  fu_rw_fulk(make_flock(F_UNLCK, SEEK_SET, 0, 0, getpid())) {
77 
78  //save hostname for later
79  char hostname[33];
80  gethostname(hostname, 32);
81  hostname_ = hostname;
82 
83  char* fuLockPollIntervalPtr = std::getenv("FFF_LOCKPOLLINTERVAL");
84  if (fuLockPollIntervalPtr) {
85  try {
86  fuLockPollInterval_ = std::stoul(std::string(fuLockPollIntervalPtr));
87  edm::LogInfo("EvFDaqDirector") << "Setting fu lock poll interval by environment string: " << fuLockPollInterval_
88  << " us";
89  } catch (const std::exception&) {
90  edm::LogWarning("EvFDaqDirector") << "Bad lexical cast in parsing: " << std::string(fuLockPollIntervalPtr);
91  }
92  }
93 
94  //override file service parameter if specified by environment
95  char* fileBrokerParamPtr = std::getenv("FFF_USEFILEBROKER");
96  if (fileBrokerParamPtr) {
97  try {
98  useFileBroker_ = (std::stoul(std::string(fileBrokerParamPtr))) > 0;
99  edm::LogInfo("EvFDaqDirector") << "Setting useFileBroker parameter by environment string: " << useFileBroker_;
100  } catch (const std::exception&) {
101  edm::LogWarning("EvFDaqDirector") << "Bad lexical cast in parsing: " << std::string(fileBrokerParamPtr);
102  }
103  }
104  if (useFileBroker_) {
106  //find BU data address from hltd configuration
108  struct stat buf;
109  if (stat("/etc/appliance/bus.config", &buf) == 0) {
110  std::ifstream busconfig("/etc/appliance/bus.config", std::ifstream::in);
111  std::getline(busconfig, fileBrokerHost_);
112  }
113  if (fileBrokerHost_.empty())
114  throw cms::Exception("EvFDaqDirector") << "No file service or BU data address information";
115  } else if (fileBrokerHost_.empty() || fileBrokerHost_ == "InValid")
116  throw cms::Exception("EvFDaqDirector")
117  << "fileBrokerHostFromCfg must be set to true if fileBrokerHost parameter is not valid or empty";
118 
119  resolver_ = std::make_unique<boost::asio::ip::tcp::resolver>(io_service_);
120  query_ = std::make_unique<boost::asio::ip::tcp::resolver::query>(fileBrokerHost_, fileBrokerPort_);
121  endpoint_iterator_ = std::make_unique<boost::asio::ip::tcp::resolver::iterator>(resolver_->resolve(*query_));
122  socket_ = std::make_unique<boost::asio::ip::tcp::socket>(io_service_);
123  }
124 
125  char* startFromLSPtr = std::getenv("FFF_START_LUMISECTION");
126  if (startFromLSPtr) {
127  try {
128  startFromLS_ = std::stoul(std::string(startFromLSPtr));
129  edm::LogInfo("EvFDaqDirector") << "Setting start from LS by environment string: " << startFromLS_;
130  } catch (const std::exception&) {
131  edm::LogWarning("EvFDaqDirector") << "Bad lexical cast in parsing: " << std::string(startFromLSPtr);
132  }
133  }
134 
135  //override file service parameter if specified by environment
136  char* fileBrokerUseLockParamPtr = std::getenv("FFF_FILEBROKERUSELOCALLOCK");
137  if (fileBrokerUseLockParamPtr) {
138  try {
139  fileBrokerUseLocalLock_ = (std::stoul(std::string(fileBrokerUseLockParamPtr))) > 0;
140  edm::LogInfo("EvFDaqDirector") << "Setting fileBrokerUseLocalLock parameter by environment string: "
142  } catch (const std::exception&) {
143  edm::LogWarning("EvFDaqDirector") << "Bad lexical cast in parsing: " << std::string(fileBrokerUseLockParamPtr);
144  }
145  }
146 
147  // set number of streams in each BU's ramdisk
148  if (bu_base_dirs_nSources_.empty()) {
149  // default is 1 stream per ramdisk
150  for (unsigned int i = 0; i < bu_base_dirs_all_.size(); i++) {
151  bu_base_dirs_nSources_.push_back(1);
152  }
153  } else if (bu_base_dirs_nSources_.size() != bu_base_dirs_all_.size()) {
154  throw cms::Exception("DaqDirector")
155  << " Error while setting number of sources: size mismatch with BU base directory vector";
156  } else {
157  for (unsigned int i = 0; i < bu_base_dirs_all_.size(); i++) {
159  edm::LogInfo("EvFDaqDirector") << "Setting " << bu_base_dirs_nSources_[i] << " sources"
160  << " for ramdisk " << bu_base_dirs_all_[i];
161  }
162  }
163 
164  std::stringstream ss;
165  ss << "run" << std::setfill('0') << std::setw(6) << run_;
166  run_string_ = ss.str();
167  ss = std::stringstream();
168  ss << run_;
169  run_nstring_ = ss.str();
170  run_dir_ = base_dir_ + "/" + run_string_;
171  input_throttled_file_ = run_dir_ + "/input_throttle";
172  discard_ls_filestem_ = run_dir_ + "/discard_ls";
173  ss = std::stringstream();
174  ss << getpid();
175  pid_ = ss.str();
176  }
177 
179  // check if base dir exists or create it accordingly
180  int retval = mkdir(base_dir_.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
181  if (retval != 0 && errno != EEXIST) {
182  throw cms::Exception("DaqDirector")
183  << " Error checking for base dir -: " << base_dir_ << " mkdir error:" << strerror(errno);
184  }
185 
186  //create run dir in base dir
187  umask(0);
188  retval = mkdir(run_dir_.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IRWXO | S_IXOTH);
189  if (retval != 0 && errno != EEXIST) {
190  throw cms::Exception("DaqDirector")
191  << " Error creating run dir -: " << run_dir_ << " mkdir error:" << strerror(errno);
192  }
193 
194  //create fu-local.lock in run open dir
195  if (!directorBU_) {
197  std::string fulocal_lock_ = getRunOpenDirPath() + "/fu-local.lock";
199  open(fulocal_lock_.c_str(), O_RDWR | O_CREAT, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH); //O_RDWR?
200  if (fulocal_rwlock_fd_ == -1)
201  throw cms::Exception("DaqDirector")
202  << " Error creating/opening a local lock file -: " << fulocal_lock_.c_str() << " : " << strerror(errno);
203  chmod(fulocal_lock_.c_str(), 0777);
204  fsync(fulocal_rwlock_fd_);
205  //open second fd for another input source thread
207  open(fulocal_lock_.c_str(), O_RDWR, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH); //O_RDWR?
208  if (fulocal_rwlock_fd2_ == -1)
209  throw cms::Exception("DaqDirector")
210  << " Error opening a local lock file -: " << fulocal_lock_.c_str() << " : " << strerror(errno);
211  }
212 
213  //bu_run_dir: for FU, for which the base dir is local and the BU is remote, it is expected to be there
214  //for BU, it is created at this point
215  if (directorBU_) {
217  std::string bulockfile = bu_run_dir_ + "/bu.lock";
218  fulockfile_ = bu_run_dir_ + "/fu.lock";
219 
220  //make or find bu run dir
221  retval = mkdir(bu_run_dir_.c_str(), S_IRWXU | S_IRWXG | S_IRWXO);
222  if (retval != 0 && errno != EEXIST) {
223  throw cms::Exception("DaqDirector")
224  << " Error creating bu run dir -: " << bu_run_dir_ << " mkdir error:" << strerror(errno);
225  }
226  bu_run_open_dir_ = bu_run_dir_ + "/open";
227  retval = mkdir(bu_run_open_dir_.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
228  if (retval != 0 && errno != EEXIST) {
229  throw cms::Exception("DaqDirector")
230  << " Error creating bu run open dir -: " << bu_run_open_dir_ << " mkdir error:" << strerror(errno);
231  }
232 
233  // the BU director does not need to know about the fu lock
234  bu_writelock_fd_ = open(bulockfile.c_str(), O_WRONLY | O_CREAT | O_TRUNC, S_IRWXU);
235  if (bu_writelock_fd_ == -1)
236  edm::LogWarning("EvFDaqDirector") << "problem with creating filedesc for buwritelock -: " << strerror(errno);
237  else
238  edm::LogInfo("EvFDaqDirector") << "creating filedesc for buwritelock -: " << bu_writelock_fd_;
239  bu_w_lock_stream = fdopen(bu_writelock_fd_, "w");
240  if (bu_w_lock_stream == nullptr)
241  edm::LogWarning("EvFDaqDirector") << "Error creating write lock stream -: " << strerror(errno);
242 
243  // BU INITIALIZES LOCK FILE
244  // FU LOCK FILE OPEN
245  openFULockfileStream(true);
247  fflush(fu_rw_lock_stream);
248  close(fu_readwritelock_fd_);
249 
250  if (!hltSourceDirectory_.empty()) {
251  struct stat buf;
252  if (stat(hltSourceDirectory_.c_str(), &buf) == 0) {
253  std::string hltdir = bu_run_dir_ + "/hlt";
254  std::string tmphltdir = bu_run_open_dir_ + "/hlt";
255  retval = mkdir(tmphltdir.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
256  if (retval != 0 && errno != EEXIST)
257  throw cms::Exception("DaqDirector")
258  << " Error creating bu run dir -: " << hltdir << " mkdir error:" << strerror(errno);
259 
260  std::filesystem::copy_file(hltSourceDirectory_ + "/HltConfig.py", tmphltdir + "/HltConfig.py");
261  std::filesystem::copy_file(hltSourceDirectory_ + "/fffParameters.jsn", tmphltdir + "/fffParameters.jsn");
262 
263  std::string optfiles[3] = {"hltinfo", "blacklist", "whitelist"};
264  for (auto& optfile : optfiles) {
265  try {
266  std::filesystem::copy_file(hltSourceDirectory_ + "/" + optfile, tmphltdir + "/" + optfile);
267  } catch (...) {
268  }
269  }
270 
271  std::filesystem::rename(tmphltdir, hltdir);
272  } else
273  throw cms::Exception("DaqDirector") << " Error looking for HLT configuration -: " << hltSourceDirectory_;
274  }
275  //else{}//no configuration specified
276  } else {
277  // for FU, check if bu base dir exists
278 
279  auto checkExists = [=](std::string const& bu_base_dir) -> void {
280  int retval = mkdir(bu_base_dir.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
281  if (retval != 0 && errno != EEXIST) {
282  throw cms::Exception("DaqDirector")
283  << " Error checking for bu base dir -: " << bu_base_dir << " mkdir error:" << strerror(errno);
284  }
285  };
286 
287  auto waitForDir = [=](std::string const& bu_base_dir) -> void {
288  int cnt = 0;
289  while (!edm::shutdown_flag.load(std::memory_order_relaxed)) {
290  //stat should trigger autofs mount (mkdir could fail with access denied first time)
291  struct stat statbuf;
292  stat(bu_base_dir.c_str(), &statbuf);
293  int retval = mkdir(bu_base_dir.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
294  if (retval != 0 && errno != EEXIST) {
295  usleep(500000);
296  cnt++;
297  if (cnt % 20 == 0)
298  edm::LogWarning("DaqDirector") << "waiting for " << bu_base_dir;
299  if (cnt > 120)
300  throw cms::Exception("DaqDirector") << " Error checking for bu base dir after 1 minute -: " << bu_base_dir
301  << " mkdir error:" << strerror(errno);
302  continue;
303  }
304  break;
305  }
306  };
307 
308  if (!bu_base_dirs_all_.empty()) {
309  std::string check_dir = bu_base_dir_.empty() ? bu_base_dirs_all_[0] : bu_base_dir_;
310  checkExists(check_dir);
311  bu_run_dir_ = check_dir + "/" + run_string_;
312  for (unsigned int i = 0; i < bu_base_dirs_all_.size(); i++)
313  waitForDir(bu_base_dirs_all_[i]);
314  } else {
315  checkExists(bu_base_dir_);
317  }
318 
319  fulockfile_ = bu_run_dir_ + "/fu.lock";
320  if (!useFileBroker_)
321  openFULockfileStream(false);
322  }
323 
324  pthread_mutex_init(&init_lock_, nullptr);
325 
326  stopFilePath_ = run_dir_ + "/CMSSW_STOP";
327  std::stringstream sstp;
328  sstp << stopFilePath_ << "_pid" << pid_;
329  stopFilePathPid_ = sstp.str();
330 
331  if (!directorBU_) {
332  std::string defPath = bu_run_dir_ + "/jsd/rawData.jsd";
333  struct stat statbuf;
334  if (!stat(defPath.c_str(), &statbuf))
335  edm::LogInfo("EvFDaqDirector") << "found JSD file in ramdisk -: " << defPath;
336  else {
337  //look in source directory if not present in ramdisk
338  std::string defPathSuffix = "src/EventFilter/Utilities/plugins/budef.jsd";
339  defPath = std::string(std::getenv("CMSSW_BASE")) + "/" + defPathSuffix;
340  if (stat(defPath.c_str(), &statbuf)) {
341  defPath = std::string(std::getenv("CMSSW_RELEASE_BASE")) + "/" + defPathSuffix;
342  if (stat(defPath.c_str(), &statbuf)) {
343  defPath = defPathSuffix;
344  }
345  }
346  }
347  dpd_ = new DataPointDefinition();
348  std::string defLabel = "data";
349  DataPointDefinition::getDataPointDefinitionFor(defPath, dpd_, &defLabel);
350  }
351  }
352 
354  //close server connection
355  if (socket_.get() && socket_->is_open()) {
356  boost::system::error_code ec;
357  socket_->shutdown(boost::asio::ip::tcp::socket::shutdown_both, ec);
358  socket_->close(ec);
359  }
360 
361  if (fulocal_rwlock_fd_ != -1) {
362  unlockFULocal();
363  close(fulocal_rwlock_fd_);
364  }
365 
366  if (fulocal_rwlock_fd2_ != -1) {
367  unlockFULocal2();
368  close(fulocal_rwlock_fd2_);
369  }
370  }
371 
373  initRun();
374 
375  nThreads_ = bounds.maxNumberOfStreams();
376  nStreams_ = bounds.maxNumberOfThreads();
377  nConcurrentLumis_ = bounds.maxNumberOfConcurrentLuminosityBlocks();
378  }
379 
382  desc.setComment(
383  "Service used for file locking arbitration and for propagating information between other EvF components");
384  desc.addUntracked<std::string>("baseDir", ".")->setComment("Local base directory for run output");
385  desc.addUntracked<std::string>("buBaseDir", ".")->setComment("BU base ramdisk directory ");
386  desc.addUntracked<std::vector<std::string>>("buBaseDirsAll", std::vector<std::string>())
387  ->setComment("BU base ramdisk directories for multi-file DAQSource models");
388  desc.addUntracked<std::vector<int>>("buBaseDirsNumStreams", std::vector<int>())
389  ->setComment("Number of streams for each BU base ramdisk directories for multi-file DAQSource models");
390  desc.addUntracked<unsigned int>("runNumber", 0)->setComment("Run Number in ramdisk to open");
391  desc.addUntracked<bool>("useFileBroker", false)
392  ->setComment("Use BU file service to grab input data instead of NFS file locking");
393  desc.addUntracked<bool>("fileBrokerHostFromCfg", true)
394  ->setComment("Allow service to discover BU address from hltd configuration");
395  desc.addUntracked<std::string>("fileBrokerHost", "InValid")->setComment("BU file service host.");
396  desc.addUntracked<std::string>("fileBrokerPort", "8080")->setComment("BU file service port");
397  desc.addUntracked<bool>("fileBrokerKeepAlive", true)
398  ->setComment("Use keep alive to avoid using large number of sockets");
399  desc.addUntracked<bool>("fileBrokerUseLocalLock", true)
400  ->setComment("Use local lock file to synchronize appearance of index and EoLS file markers for hltd");
401  desc.addUntracked<unsigned int>("fuLockPollInterval", 2000)
402  ->setComment("Lock polling interval in microseconds for the input directory file lock");
403  desc.addUntracked<bool>("outputAdler32Recheck", false)
404  ->setComment("Check Adler32 of per-process output files while micro-merging");
405  desc.addUntracked<bool>("directorIsBU", false)->setComment("BU director mode used for testing");
406  desc.addUntracked<std::string>("hltSourceDirectory", "")->setComment("BU director mode source directory");
407  desc.addUntracked<std::string>("mergingPset", "")
408  ->setComment("Name of merging PSet to look for merging type definitions for streams");
409  descriptions.add("EvFDaqDirector", desc);
410  }
411 
// Presumably invoked before a run begins (per its name). In the visible code it only emits a warning
// that run_dir_ is not the highest run directory reported by dirManager_.findHighestRunDir();
// globalContext is not referenced in the visible lines.
// NOTE(review): the condition guarding the warning (listing line 416) is missing from this extract,
// so the exact test cannot be confirmed here.
412  void EvFDaqDirector::preBeginRun(edm::GlobalContext const& globalContext) {
413  //assert(run_ == id.run());
414 
415  // check if the requested run is the latest one - issue a warning if it isn't
417  edm::LogWarning("EvFDaqDirector") << "WARNING - checking run dir -: " << run_dir_
418  << ". This is not the highest run " << dirManager_.findHighestRunDir();
419  }
420  }
421 
// Closes the BU read-lock and write-lock descriptors; when directorBU_ is set it also builds the
// path of bu.lock inside bu_run_dir_. globalContext is not referenced in the visible lines.
// NOTE(review): listing line 427 (whatever consumes `filename`) is missing from this extract -
// presumably it removes the lock file; confirm against the full source.
// NOTE(review): both close() calls are unconditional and their return values are ignored. The
// member-initializer list in this file sets both descriptors to -1 and no open() of bu_readlock_fd_
// is visible in this extract, so close(-1) (failing with EBADF) looks possible. The members are also
// not reset to -1 afterwards, so a second call would close stale descriptor numbers.
422  void EvFDaqDirector::postEndRun(edm::GlobalContext const& globalContext) {
423  close(bu_readlock_fd_);
424  close(bu_writelock_fd_);
425  if (directorBU_) {
426  std::string filename = bu_run_dir_ + "/bu.lock";
428  }
429  }
430 
432  //delete all files belonging to just closed lumi
433  unsigned int ls = globalContext.luminosityBlockID().luminosityBlock();
435  edm::LogWarning("EvFDaqDirector") << " Handles to check for files to delete were not set by the input source...";
436  return;
437  }
438 
439  std::unique_lock<std::mutex> lkw(*fileDeleteLockPtr_);
440  auto it = filesToDeletePtr_->begin();
441  while (it != filesToDeletePtr_->end()) {
442  if (it->second->lumi_ == ls && (!fms_ || !fms_->isExceptionOnData(it->second->lumi_))) {
443  it = filesToDeletePtr_->erase(it);
444  } else
445  it++;
446  }
447  }
448 
// Per its name, returns the path of the input JSON file for lumisection `ls`, file number `index`.
// NOTE(review): the function body (listing line 450) is missing from this extract; presumably it
// mirrors getOpenInputJsonFilePath() without the "/open" path component - TODO confirm.
449  std::string EvFDaqDirector::getInputJsonFilePath(const unsigned int ls, const unsigned int index) const {
451  }
452 
// Per its name, returns the path of the raw input file for lumisection `ls`, file number `index`.
// NOTE(review): the function body (listing line 454) is missing from this extract; presumably it
// mirrors getOpenRawFilePath() without the "/open" path component - TODO confirm.
453  std::string EvFDaqDirector::getRawFilePath(const unsigned int ls, const unsigned int index) const {
455  }
456 
457  std::string EvFDaqDirector::getOpenRawFilePath(const unsigned int ls, const unsigned int index) const {
458  return bu_run_dir_ + "/open/" + fffnaming::inputRawFileName(run_, ls, index);
459  }
460 
461  std::string EvFDaqDirector::getOpenInputJsonFilePath(const unsigned int ls, const unsigned int index) const {
462  return bu_run_dir_ + "/open/" + fffnaming::inputJsonFileName(run_, ls, index);
463  }
464 
// Per its name, returns the path of the .dat file for lumisection `ls` and output stream `stream`.
// NOTE(review): the function body (listing line 466) is missing from this extract, so the directory
// and naming scheme it uses cannot be confirmed here.
465  std::string EvFDaqDirector::getDatFilePath(const unsigned int ls, std::string const& stream) const {
467  }
468 
471  }
472 
475  }
476 
479  }
480 
483  }
484 
487  }
488 
490  return run_dir_ + "/open/" + fffnaming::initFileNameWithPid(run_, 0, stream);
491  }
492 
495  }
496 
499  }
500 
502  std::string const& stream) const {
504  }
505 
507  std::string const& stream) const {
509  }
510 
512  std::string const& stream) const {
514  }
515 
518  }
519 
522  }
523 
526  }
527 
529  return bu_run_dir_ + "/" + fffnaming::eolsFileName(run_, ls);
530  }
531 
533  return run_dir_ + "/" + fffnaming::eolsFileName(run_, ls);
534  }
535 
537  return run_dir_ + "/" + fffnaming::bolsFileName(run_, ls);
538  }
539 
541 
543 
545 
546  std::string EvFDaqDirector::getFFFParamsFilePathOnBU() const { return bu_run_dir_ + "/hlt/fffParameters.jsn"; }
547 
549  int retval = remove(filename.c_str());
550  if (retval != 0)
551  edm::LogError("EvFDaqDirector") << "Could not remove used file -: " << filename
552  << ". error = " << strerror(errno);
553  }
554 
556  std::string& nextFile,
557  uint32_t& fsize,
558  uint16_t& rawHeaderSize,
559  uint64_t& lockWaitTime,
560  bool& setExceptionState) {
561  EvFDaqDirector::FileStatus fileStatus = noFile;
562  rawHeaderSize = 0;
563 
564  int retval = -1;
565  int lock_attempts = 0;
566  long total_lock_attempts = 0;
567 
568  struct stat buf;
569  int stopFileLS = -1;
570  int stopFileCheck = stat(stopFilePath_.c_str(), &buf);
571  int stopFilePidCheck = stat(stopFilePathPid_.c_str(), &buf);
572  if (stopFileCheck == 0 || stopFilePidCheck == 0) {
573  if (stopFileCheck == 0)
574  stopFileLS = readLastLSEntry(stopFilePath_);
575  else
576  stopFileLS = 1; //stop without drain if only pid is stopped
577  if (!stop_ls_override_) {
578  //if lumisection is higher than in stop file, should quit at next from current
579  if (stopFileLS >= 0 && (int)ls >= stopFileLS)
580  stopFileLS = stop_ls_override_ = ls;
581  } else
582  stopFileLS = stop_ls_override_;
583  edm::LogWarning("EvFDaqDirector") << "Detected stop request from hltd. Ending run for this process after LS -: "
584  << stopFileLS;
585  //return runEnded;
586  } else //if file was removed before reaching stop condition, reset this
587  stop_ls_override_ = 0;
588 
589  timeval ts_lockbegin;
590  gettimeofday(&ts_lockbegin, nullptr);
591 
592  while (retval == -1) {
593  retval = fcntl(fu_readwritelock_fd_, F_SETLK, &fu_rw_flk);
594  if (retval == -1)
595  usleep(fuLockPollInterval_);
596  else
597  continue;
598 
599  lock_attempts += fuLockPollInterval_;
600  total_lock_attempts += fuLockPollInterval_;
601  if (lock_attempts > 5000000 || errno == 116) {
602  if (errno == 116)
603  edm::LogWarning("EvFDaqDirector")
604  << "Stale lock file handle. Checking if run directory and fu.lock file are present" << std::endl;
605  else
606  edm::LogWarning("EvFDaqDirector") << "Unable to obtain a lock for 5 seconds. Checking if run directory and "
607  "fu.lock file are present -: errno "
608  << errno << ":" << strerror(errno) << std::endl;
609 
610  if (stat(getEoLSFilePathOnFU(ls).c_str(), &buf) == 0) {
611  edm::LogWarning("EvFDaqDirector") << "Detected local EoLS for lumisection " << ls;
612  ls++;
613  return noFile;
614  }
615 
616  if (stat(bu_run_dir_.c_str(), &buf) != 0)
617  return runEnded;
618  if (stat(fulockfile_.c_str(), &buf) != 0)
619  return runEnded;
620 
621  lock_attempts = 0;
622  }
623  if (total_lock_attempts > 5 * 60000000) {
624  edm::LogError("EvFDaqDirector") << "Unable to obtain a lock for 5 minutes. Stopping polling activity.";
625  return runAbort;
626  }
627  }
628 
629  timeval ts_lockend;
630  gettimeofday(&ts_lockend, nullptr);
631  long deltat = (ts_lockend.tv_usec - ts_lockbegin.tv_usec) + (ts_lockend.tv_sec - ts_lockbegin.tv_sec) * 1000000;
632  if (deltat > 0.)
633  lockWaitTime = deltat;
634 
635  if (retval != 0)
636  return fileStatus;
637 
638 #ifdef DEBUG
639  timeval ts_lockend;
640  gettimeofday(&ts_lockend, 0);
641 #endif
642 
643  //open another lock file FD after the lock using main fd has been acquired
644  int fu_readwritelock_fd2 = open(fulockfile_.c_str(), O_RDWR, S_IRWXU);
645  if (fu_readwritelock_fd2 == -1)
646  edm::LogError("EvFDaqDirector") << "problem with creating filedesc for fuwritelock -: " << fulockfile_
647  << " create. error:" << strerror(errno);
648 
649  FILE* fu_rw_lock_stream2 = fdopen(fu_readwritelock_fd2, "r+");
650 
651  // if the stream is readable
652  if (fu_rw_lock_stream2 != nullptr) {
653  unsigned int readLs, readIndex;
654  int check = 0;
655  // rewind the stream
656  check = fseek(fu_rw_lock_stream2, 0, SEEK_SET);
657  // if rewinded ok
658  if (check == 0) {
659  // read its' values
660  fscanf(fu_rw_lock_stream2, "%u %u", &readLs, &readIndex);
661  edm::LogInfo("EvFDaqDirector") << "Read fu.lock file file -: " << readLs << ":" << readIndex;
662 
663  unsigned int currentLs = readLs;
664  bool bumpedOk = false;
665  //if next lumisection in a lock file is not +1 wrt. source, cycle through the next empty one, unless initial lumi not yet set
666  //no lock file write in this case
667  if (ls && ls + 1 < currentLs)
668  ls++;
669  else {
670  // try to bump (look for new index or EoLS file)
671  bumpedOk = bumpFile(readLs, readIndex, nextFile, fsize, rawHeaderSize, stopFileLS, setExceptionState);
672  //avoid 2 lumisections jump
673  if (ls && readLs > currentLs && currentLs > ls) {
674  ls++;
675  readLs = currentLs = ls;
676  readIndex = 0;
677  bumpedOk = false;
678  //no write to lock file
679  } else {
680  if (ls == 0 && readLs > currentLs) {
681  //make sure to intialize always with LS found in the lock file, with possibility of grabbing index file immediately
682  //in this case there is no new file in the same LS
683  //this covers case where run has empty first lumisections and CMSSW are late to the lock file. always one process will start with LS 1,... and create empty files for them
684  readLs = currentLs;
685  readIndex = 0;
686  bumpedOk = false;
687  //no write to lock file
688  }
689  //update return LS value
690  ls = readLs;
691  }
692  }
693  if (bumpedOk) {
694  // there is a new index file to grab, lock file needs to be updated
695  check = fseek(fu_rw_lock_stream2, 0, SEEK_SET);
696  if (check == 0) {
697  ftruncate(fu_readwritelock_fd2, 0);
698  // write next index in the file, which is the file the next process should take
699  fprintf(fu_rw_lock_stream2, "%u %u", readLs, readIndex + 1);
700  fflush(fu_rw_lock_stream2);
701  fsync(fu_readwritelock_fd2);
702  fileStatus = newFile;
703  LogDebug("EvFDaqDirector") << "Written to file -: " << readLs << ":" << readIndex + 1;
704  } else {
705  edm::LogError("EvFDaqDirector")
706  << "seek on fu read/write lock for updating failed with error " << strerror(errno);
707  setExceptionState = true;
708  return noFile;
709  }
710  } else if (currentLs < readLs) {
711  //there is no new file in next LS (yet), but lock file can be updated to the next LS
712  check = fseek(fu_rw_lock_stream2, 0, SEEK_SET);
713  if (check == 0) {
714  ftruncate(fu_readwritelock_fd2, 0);
715  // in this case LS was bumped, but no new file. Thus readIndex is 0 (set by bumpFile)
716  fprintf(fu_rw_lock_stream2, "%u %u", readLs, readIndex);
717  fflush(fu_rw_lock_stream2);
718  fsync(fu_readwritelock_fd2);
719  LogDebug("EvFDaqDirector") << "Written to file -: " << readLs << ":" << readIndex;
720  } else {
721  edm::LogError("EvFDaqDirector")
722  << "seek on fu read/write lock for updating failed with error " << strerror(errno);
723  setExceptionState = true;
724  return noFile;
725  }
726  }
727  } else {
728  edm::LogError("EvFDaqDirector") << "seek on fu read/write lock for reading failed with error "
729  << strerror(errno);
730  }
731  } else {
732  edm::LogError("EvFDaqDirector") << "fu read/write lock stream is invalid " << strerror(errno);
733  }
734  fclose(fu_rw_lock_stream2); // = fdopen(fu_readwritelock_fd2, "r+");
735 
736 #ifdef DEBUG
737  timeval ts_preunlock;
738  gettimeofday(&ts_preunlock, 0);
739  int locked_period_int = ts_preunlock.tv_sec - ts_lockend.tv_sec;
740  double locked_period = locked_period_int + double(ts_preunlock.tv_usec - ts_lockend.tv_usec) / 1000000;
741 #endif
742 
743  //if new json is present, lock file which FedRawDataInputSource will later unlock
744  if (fileStatus == newFile)
745  lockFULocal();
746 
747  //release lock at this point
748  int retvalu = -1;
749  retvalu = fcntl(fu_readwritelock_fd_, F_SETLKW, &fu_rw_fulk);
750  if (retvalu == -1)
751  edm::LogError("EvFDaqDirector") << "Error unlocking the fu.lock " << strerror(errno);
752 
753 #ifdef DEBUG
754  edm::LogDebug("EvFDaqDirector") << "Waited during lock -: " << locked_period << " seconds";
755 #endif
756 
757  if (fileStatus == noFile) {
758  struct stat buf;
759  //edm::LogInfo("EvFDaqDirector") << " looking for EoR file: " << getEoRFilePath().c_str();
760  if (stat(getEoRFilePath().c_str(), &buf) == 0 || stat(bu_run_dir_.c_str(), &buf) != 0)
761  fileStatus = runEnded;
762  if (stopFileLS >= 0 && (int)ls > stopFileLS) {
763  edm::LogInfo("EvFDaqDirector") << "Reached maximum lumisection set by hltd";
764  fileStatus = runEnded;
765  }
766  }
767  return fileStatus;
768  }
769 
771  std::ifstream ij(BUEoLSFile);
772  Json::Value deserializeRoot;
774 
775  if (!reader.parse(ij, deserializeRoot)) {
776  edm::LogError("EvFDaqDirector") << "Cannot deserialize input JSON file -:" << BUEoLSFile;
777  return -1;
778  }
779 
781  DataPoint dp;
782  dp.deserialize(deserializeRoot);
783 
784  //read definition
785  if (readEolsDefinition_) {
786  //std::string def = boost::algorithm::trim(dp.getDefinition());
787  std::string def = dp.getDefinition();
788  if (def.empty())
789  readEolsDefinition_ = false;
790  while (!def.empty()) {
792  if (def.find('/') == 0)
793  fullpath = def;
794  else
795  fullpath = bu_run_dir_ + '/' + def;
796  struct stat buf;
797  if (stat(fullpath.c_str(), &buf) == 0) {
798  DataPointDefinition eolsDpd;
799  std::string defLabel = "legend";
800  DataPointDefinition::getDataPointDefinitionFor(fullpath, &eolsDpd, &defLabel);
801  if (eolsDpd.getNames().empty()) {
802  //try with "data" label if "legend" format is not used
803  eolsDpd = DataPointDefinition();
804  defLabel = "data";
805  DataPointDefinition::getDataPointDefinitionFor(fullpath, &eolsDpd, &defLabel);
806  }
807  for (unsigned int i = 0; i < eolsDpd.getNames().size(); i++)
808  if (eolsDpd.getNames().at(i) == "NFiles")
810  readEolsDefinition_ = false;
811  break;
812  }
813  //check if we can still find definition
814  if (def.size() <= 1 || def.find('/') == std::string::npos) {
815  readEolsDefinition_ = false;
816  break;
817  }
818  def = def.substr(def.find('/') + 1);
819  }
820  }
821 
822  if (dp.getData().size() > eolsNFilesIndex_)
823  data = dp.getData()[eolsNFilesIndex_];
824  else {
825  edm::LogError("EvFDaqDirector") << " error reading number of files from BU JSON -: " << BUEoLSFile;
826  return -1;
827  }
828  return std::stoi(data);
829  }
830 
// Looks for the next input file to hand out, starting from the suggested (ls, index) position.
//
// Search order, as visible below:
//   1. the input JSON file for (ls, index);
//   2. the raw file for (ls, index), accepted only if rawFileHasHeader() returns true;
//   3. if the BU EoLS file for `ls` exists: re-check 1 and 2, read the expected file count with
//      getNFilesFromEoLS(), then advance to lumisection ls+1 / index 0 and check its JSON and raw files.
//
// Parameters:
//   ls                 in/out - lumisection to probe; incremented when the EoLS file shows it has ended.
//   index              in/out - file number to probe; reset to 0 when `ls` is advanced.
//   nextFile           out    - cleared on entry, set to the path of the file that was found.
//   fsize              out    - st_size of the found file (also stored in previousFileSize_).
//   rawHeaderSize      passed by reference to rawFileHasHeader(); not otherwise touched here.
//   maxLS              when >= 0, probing stops (returns false) once ls exceeds it.
//   setExceptionState  out    - set to true when `index` is below the file count read from the EoLS file
//                               although no such file was found.
//
// Returns true if a file was found (nextFile and fsize are then valid), false otherwise.
831  bool EvFDaqDirector::bumpFile(unsigned int& ls,
832  unsigned int& index,
833  std::string& nextFile,
834  uint32_t& fsize,
835  uint16_t& rawHeaderSize,
836  int maxLS,
837  bool& setExceptionState) {
// Bookkeeping for the size of the file returned by the previous call.
// NOTE(review): listing lines 840 and 843 are missing from this extract - presumably 840 obtains fms_
// and 843 is the statement controlled by `if (fms_)`. As printed here, `if (fms_)` appears to guard
// the reset of previousFileSize_, which is probably NOT what the full source does - confirm before editing.
838  if (previousFileSize_ != 0) {
839  if (!fms_) {
841  }
842  if (fms_)
844  previousFileSize_ = 0;
845  }
846  nextFile = "";
847 
848  //reached limit
849  if (maxLS >= 0 && ls > (unsigned int)maxLS)
850  return false;
851 
852  struct stat buf;
// NOTE(review): `ss` is not used anywhere in the visible body.
853  std::stringstream ss;
854 
855  // 1. Check suggested file
856  std::string nextFileJson = getInputJsonFilePath(ls, index);
857  if (stat(nextFileJson.c_str(), &buf) == 0) {
858  fsize = previousFileSize_ = buf.st_size;
859  nextFile = nextFileJson;
860  return true;
861  }
862  // 2. No file -> lumi ended? (and how many?)
863  else {
864  // 3. No file -> check for standalone raw file
865  std::string nextFileRaw = getRawFilePath(ls, index);
866  if (stat(nextFileRaw.c_str(), &buf) == 0 && rawFileHasHeader(nextFileRaw, rawHeaderSize)) {
867  fsize = previousFileSize_ = buf.st_size;
868  nextFile = nextFileRaw;
869  return true;
870  }
871 
872  std::string BUEoLSFile = getEoLSFilePathOnBU(ls);
873 
874  if (stat(BUEoLSFile.c_str(), &buf) == 0) {
875  // recheck that neither a JSON nor a raw file appeared between the checks above and the EoLS check
876  if (stat(nextFileJson.c_str(), &buf) == 0) {
877  fsize = previousFileSize_ = buf.st_size;
878  nextFile = nextFileJson;
879  return true;
880  }
881  if (stat(nextFileRaw.c_str(), &buf) == 0 && rawFileHasHeader(nextFileRaw, rawHeaderSize)) {
882  fsize = previousFileSize_ = buf.st_size;
883  nextFile = nextFileRaw;
884  return true;
885  }
886 
887  int indexFilesInLS = getNFilesFromEoLS(BUEoLSFile);
888  if (indexFilesInLS < 0)
889  //parsing failed
890  return false;
891  else {
892  //check index
893  if ((int)index < indexFilesInLS) {
894  //we have 2 files, and check for 1 failed... retry (2 will never be here)
// NOTE(review): nextFile was cleared at the top of this function and has not been assigned on this
// path, so the "Missing " part of the message prints an empty name; nextFileJson (or nextFileRaw) is
// probably what was intended.
895  edm::LogError("EvFDaqDirector")
896  << "Potential miss of index file in LS -: " << ls << ". Missing " << nextFile << " because "
897  << indexFilesInLS - 1 << " is the highest index expected. Will not update fu.lock file";
898  setExceptionState = true;
899  return false;
900  }
901  }
902  // this lumi ended, check for files
903  ++ls;
904  index = 0;
905 
906  //reached limit
// Note: on this early return the caller's ls has already been incremented and index reset to 0.
907  if (maxLS >= 0 && ls > (unsigned int)maxLS)
908  return false;
909 
910  nextFileJson = getInputJsonFilePath(ls, 0);
911  nextFileRaw = getRawFilePath(ls, 0);
912  if (stat(nextFileJson.c_str(), &buf) == 0) {
913  // a new file was found at new lumisection, index 0
914  fsize = previousFileSize_ = buf.st_size;
915  nextFile = nextFileJson;
916  return true;
917  }
918  if (stat(nextFileRaw.c_str(), &buf) == 0 && rawFileHasHeader(nextFileRaw, rawHeaderSize)) {
919  fsize = previousFileSize_ = buf.st_size;
920  nextFile = nextFileRaw;
921  return true;
922  }
923  return false;
924  }
925  }
926  // no new file found
927  return false;
928  }
929 
// Seeds the FU lock file through fu_rw_lock_stream. A null stream is reported as an error;
// otherwise the initial position "1 0" is written (readLs = 1, readIndex = 0).
931  if (fu_rw_lock_stream == nullptr)
932  edm::LogError("EvFDaqDirector") << "Error creating fu read/write lock stream " << strerror(errno);
933  else {
934  edm::LogInfo("EvFDaqDirector") << "Initializing FU LOCK FILE";
// Written as "%u %u" with no trailing newline; no explicit flush is done here.
935  unsigned int readLs = 1, readIndex = 0;
936  fprintf(fu_rw_lock_stream, "%u %u", readLs, readIndex);
937  }
938  }
939 
// Opens the FU lock file (fulockfile_) and wraps the descriptor in a stdio stream (fu_rw_lock_stream).
// With `create` set the file is opened with O_CREAT and its mode is then set to 0766 with chmod();
// otherwise the existing file is opened read/write.
941  if (create) {
// NOTE(review): the beginning of this statement is on a line not visible here; presumably the
// open() result is assigned to fu_readwritelock_fd_, as in the else-branch — confirm.
943  open(fulockfile_.c_str(), O_RDWR | O_CREAT, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);
944  chmod(fulockfile_.c_str(), 0766);
945  } else {
946  fu_readwritelock_fd_ = open(fulockfile_.c_str(), O_RDWR, S_IRWXU);
947  }
948  if (fu_readwritelock_fd_ == -1)
949  edm::LogError("EvFDaqDirector") << "problem with creating filedesc for fuwritelock -: " << fulockfile_
950  << " create:" << create << " error:" << strerror(errno);
951  else
952  LogDebug("EvFDaqDirector") << "creating filedesc for fureadwritelock -: " << fu_readwritelock_fd_;
953 
// fdopen() is attempted even when the descriptor is -1; in that case a second error is logged below.
954  fu_rw_lock_stream = fdopen(fu_readwritelock_fd_, "r+");
955  if (fu_rw_lock_stream == nullptr)
956  edm::LogError("EvFDaqDirector") << "problem with opening fuwritelock file stream -: " << strerror(errno);
957  }
958 
959  void EvFDaqDirector::lockInitLock() { pthread_mutex_lock(&init_lock_); }
960 
961  void EvFDaqDirector::unlockInitLock() { pthread_mutex_unlock(&init_lock_); }
962 
// Takes a shared advisory lock (LOCK_SH) on fulocal_rwlock_fd_ with flock(); the call waits
// until the lock is granted and its return value is ignored.
// The earlier fcntl(F_SETLKW) variant is kept commented out.
964  //fcntl(fulocal_rwlock_fd_, F_SETLKW, &fulocal_rw_flk);
965  flock(fulocal_rwlock_fd_, LOCK_SH);
966  }
967 
// Releases the flock() lock held on fulocal_rwlock_fd_ (LOCK_UN); the return value is ignored.
// The earlier fcntl(F_SETLKW) variant is kept commented out.
969  //fcntl(fulocal_rwlock_fd_, F_SETLKW, &fulocal_rw_fulk);
970  flock(fulocal_rwlock_fd_, LOCK_UN);
971  }
972 
// Takes an exclusive advisory lock (LOCK_EX) on the second local descriptor, fulocal_rwlock_fd2_,
// with flock(); the call waits until the lock is granted and its return value is ignored.
// The earlier fcntl(F_SETLKW) variant is kept commented out.
974  //fcntl(fulocal_rwlock_fd2_, F_SETLKW, &fulocal_rw_flk2);
975  flock(fulocal_rwlock_fd2_, LOCK_EX);
976  }
977 
// Releases the flock() lock held on fulocal_rwlock_fd2_ (LOCK_UN); the return value is ignored.
// The earlier fcntl(F_SETLKW) variant is kept commented out.
979  //fcntl(fulocal_rwlock_fd2_, F_SETLKW, &fulocal_rw_fulk2);
980  flock(fulocal_rwlock_fd2_, LOCK_UN);
981  }
982 
983  void EvFDaqDirector::createBoLSFile(const uint32_t lumiSection, bool checkIfExists) const {
984  //used for backpressure mechanisms and monitoring
985  const std::string fuBoLS = getBoLSFilePathOnFU(lumiSection);
986  struct stat buf;
987  if (checkIfExists == false || stat(fuBoLS.c_str(), &buf) != 0) {
988  int bol_fd = open(fuBoLS.c_str(), O_RDWR | O_CREAT, S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP | S_IROTH | S_IWOTH);
989  close(bol_fd);
990  }
991  }
992 
993  void EvFDaqDirector::createLumiSectionFiles(const uint32_t lumiSection,
994  const uint32_t currentLumiSection,
995  bool doCreateBoLS,
996  bool doCreateEoLS) {
997  if (currentLumiSection > 0) {
998  const std::string fuEoLS = getEoLSFilePathOnFU(currentLumiSection);
999  struct stat buf;
1000  bool found = (stat(fuEoLS.c_str(), &buf) == 0);
1001  if (!found) {
1002  if (doCreateEoLS) {
1003  int eol_fd =
1004  open(fuEoLS.c_str(), O_RDWR | O_CREAT, S_IRUSR | S_IWUSR | S_IRGRP | S_IWGRP | S_IROTH | S_IWOTH);
1005  close(eol_fd);
1006  }
1007  if (doCreateBoLS)
1008  createBoLSFile(lumiSection, false);
1009  }
1010  } else if (doCreateBoLS) {
1011  createBoLSFile(lumiSection, true); //needed for initial lumisection
1012  }
1013  }
1014 
// parseFRDFileHeader: opens rawSourcePath, detects an optional FRD file header and fills the
// out-parameters from it.
//   rawFd              - receives the open descriptor, or -1 when closeFile is set
//   rawHeaderSize      - header size taken from the header (0 when there is no header)
//   rawDataType        - data type from a v2 header, 0 for v1 (not assigned when there is no header)
//   lsFromHeader, eventsFromHeader, fileSizeFromHeader - values from the header
//                        (0 / -1 / -1 when there is no header and requireHeader is false)
//   requireHeader      - treat a file without a recognised header as an error
//   retry              - on a failed open, log a warning and call this function once more with retry=false
//   closeFile          - close the descriptor before a successful return
// Returns 0 on success, 1 when the final open attempt failed with ENOENT, -1 on any other failure.
1016  int& rawFd,
1017  uint16_t& rawHeaderSize,
1018  uint16_t& rawDataType,
1019  uint32_t& lsFromHeader,
1020  int32_t& eventsFromHeader,
1021  int64_t& fileSizeFromHeader,
1022  bool requireHeader,
1023  bool retry,
1024  bool closeFile) {
1025  int infile;
1026 
1027  if ((infile = ::open(rawSourcePath.c_str(), O_RDONLY)) < 0) {
1028  if (retry) {
1029  edm::LogWarning("EvFDaqDirector")
1030  << "parseFRDFileHeader - failed to open input file -: " << rawSourcePath << " : " << strerror(errno);
// The recursive call repeats the whole procedure with retry disabled and its result is returned as is.
1031  return parseFRDFileHeader(rawSourcePath,
1032  rawFd,
1033  rawHeaderSize,
1034  rawDataType,
1035  lsFromHeader,
1036  eventsFromHeader,
1037  fileSizeFromHeader,
1038  requireHeader,
1039  false,
1040  closeFile);
1041  } else {
// Without retry the open is attempted one more time right here before giving up.
1042  if ((infile = ::open(rawSourcePath.c_str(), O_RDONLY)) < 0) {
1043  edm::LogError("EvFDaqDirector")
1044  << "parseFRDFileHeader - failed to open input file -: " << rawSourcePath << " : " << strerror(errno);
1045  if (errno == ENOENT)
1046  return 1; // error && file not found
1047  else
1048  return -1;
1049  }
1050  }
1051  }
1052 
1053  //v2 is the largest possible read
1054  char hdr[sizeof(FRDFileHeader_v2)];
// checkFileRead() closes infile itself when the read fails or is short, so no close is needed here.
1055  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderIdentifier), rawSourcePath))
1056  return -1;
1057 
// NOTE(review): fileId is declared on a line not visible here; presumably it points at hdr — confirm.
1059  uint16_t frd_version = getFRDFileHeaderVersion(fileId->id_, fileId->version_);
1060 
1061  if (frd_version == 0) {
1062  //no header (specific sequence not detected)
1063  if (requireHeader) {
1064  edm::LogError("EvFDaqDirector") << "no header or invalid version string found in:" << rawSourcePath;
1065  close(infile);
1066  return -1;
1067  } else {
1068  //no header, but valid file
// Rewind so the caller reads the file from the beginning; rawDataType is left untouched on this path.
1069  lseek(infile, 0, SEEK_SET);
1070  rawHeaderSize = 0;
1071  lsFromHeader = 0;
1072  eventsFromHeader = -1;
1073  fileSizeFromHeader = -1;
1074  }
1075  } else if (frd_version == 1) {
1076  //version 1 header
// This read overwrites hdr from its start with the content part that follows the identifier in the file.
1077  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderContent_v1), rawSourcePath))
1078  return -1;
// NOTE(review): fhContent is declared on a line not visible here; presumably a v1 content view of hdr — confirm.
1080  uint32_t headerSizeRaw = fhContent->headerSize_;
1081  if (headerSizeRaw != sizeof(FRDFileHeader_v1)) {
1082  edm::LogError("EvFDaqDirector") << "inconsistent header size: " << rawSourcePath << " size: " << headerSizeRaw
1083  << " v:" << frd_version;
1084  close(infile);
1085  return -1;
1086  }
1087  //allow header size to exceed read size. Future header versions will not break this, but the size can change.
1088  rawDataType = 0;
1089  lsFromHeader = fhContent->lumiSection_;
1090  eventsFromHeader = (int32_t)fhContent->eventCount_;
1091  fileSizeFromHeader = (int64_t)fhContent->fileSize_;
1092  rawHeaderSize = fhContent->headerSize_;
1093 
1094  } else if (frd_version == 2) {
1095  //version 2 header
1096  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderContent_v2), rawSourcePath))
1097  return -1;
// NOTE(review): fhContent is declared on a line not visible here; presumably a v2 content view of hdr — confirm.
1099  uint32_t headerSizeRaw = fhContent->headerSize_;
1100  if (headerSizeRaw != sizeof(FRDFileHeader_v2)) {
1101  edm::LogError("EvFDaqDirector") << "inconsistent header size: " << rawSourcePath << " size: " << headerSizeRaw
1102  << " v:" << frd_version;
1103  close(infile);
1104  return -1;
1105  }
1106  //allow header size to exceed read size. Future header versions will not break this, but the size can change.
1107  rawDataType = fhContent->dataType_;
1108  lsFromHeader = fhContent->lumiSection_;
1109  eventsFromHeader = (int32_t)fhContent->eventCount_;
1110  fileSizeFromHeader = (int64_t)fhContent->fileSize_;
1111  rawHeaderSize = fhContent->headerSize_;
1112  }
// NOTE(review): a version value other than 0, 1 or 2 falls through to here with the out-parameters
// unassigned and 0 is still returned; whether getFRDFileHeaderVersion can return such a value is
// not visible from this block.
1113 
1114  if (closeFile) {
1115  close(infile);
1116  infile = -1;
1117  }
1118 
1119  rawFd = infile;
1120  return 0; //OK
1121  }
1122 
1123  bool EvFDaqDirector::checkFileRead(char* buf, int infile, std::size_t buf_sz, std::string const& path) {
1124  ssize_t sz_read = ::read(infile, buf, buf_sz);
1125  if (sz_read < 0) {
1126  edm::LogError("EvFDaqDirector") << "rawFileHasHeader - unable to read " << path << " : " << strerror(errno);
1127  if (infile != -1)
1128  close(infile);
1129  return false;
1130  }
1131  if ((size_t)sz_read < buf_sz) {
1132  edm::LogError("EvFDaqDirector") << "rawFileHasHeader - file smaller than header: " << path;
1133  if (infile != -1)
1134  close(infile);
1135  return false;
1136  }
1137  return true;
1138  }
1139 
// Checks whether the raw file at rawSourcePath starts with a version 1 or version 2 FRD file header.
//   rawSourcePath - file to inspect; it is opened read-only and always closed before returning
//   rawHeaderSize - set to the headerSize_ field of the header when one is found; set to 0 when the
//                   version is not 1 or 2; left untouched when the open or a read fails
// Returns true only for a version 1 or 2 header.
1140  bool EvFDaqDirector::rawFileHasHeader(std::string const& rawSourcePath, uint16_t& rawHeaderSize) {
1141  int infile;
1142  if ((infile = ::open(rawSourcePath.c_str(), O_RDONLY)) < 0) {
1143  edm::LogWarning("EvFDaqDirector") << "rawFileHasHeader - failed to open input file -: " << rawSourcePath << " : "
1144  << strerror(errno);
1145  return false;
1146  }
1147  //try to read FRD header size (v2 is the biggest, use read buffer of that size)
1148  char hdr[sizeof(FRDFileHeader_v2)];
// checkFileRead() closes infile itself on failure, so the early returns below do not leak it.
1149  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderIdentifier), rawSourcePath))
1150  return false;
// NOTE(review): fileId is declared on a line not visible here; presumably it points at hdr — confirm.
1152  uint16_t frd_version = getFRDFileHeaderVersion(fileId->id_, fileId->version_);
1153 
1154  if (frd_version == 1) {
1155  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderContent_v1), rawSourcePath))
1156  return false;
// NOTE(review): fhContent is declared on a line not visible here — confirm its type.
1158  rawHeaderSize = fhContent->headerSize_;
1159  close(infile);
1160  return true;
1161  } else if (frd_version == 2) {
1162  if (!checkFileRead(hdr, infile, sizeof(FRDFileHeaderContent_v2), rawSourcePath))
1163  return false;
// NOTE(review): fhContent is declared on a line not visible here — confirm its type.
1165  rawHeaderSize = fhContent->headerSize_;
1166  close(infile);
1167  return true;
1168  } else
// Any other version value, including 0, is logged as an error.
1169  edm::LogError("EvFDaqDirector") << "rawFileHasHeader - unknown version: " << frd_version;
1170 
1171  close(infile);
1172  rawHeaderSize = 0;
1173  return false;
1174  }
1175 
// Parses the FRD header of the raw file rawSourcePath and writes a small per-process JSON file
// ("<stem>_pid<pid>.jsn" under baseRunDir()) describing it.
//   rawFd, rawHeaderSize - forwarded to parseFRDFileHeader and filled by it
//   fileSizeFromHeader   - set to the file size from the header, on success only
//   fileFound            - set to false only when parseFRDFileHeader returns 1 (file not found)
//   serverLS             - when non-zero, compared with the LS from the header; a mismatch is only a warning
//   closeFile, requireHeader - forwarded to parseFRDFileHeader
// Returns the event count from the header, or -1 on error.
// NOTE(review): parseFRDFileHeader sets the event count to -1 for a header-less file when
// requireHeader is false, so that case also returns -1 — confirm callers distinguish it.
1177  int& rawFd,
1178  uint16_t& rawHeaderSize,
1179  int64_t& fileSizeFromHeader,
1180  bool& fileFound,
1181  uint32_t serverLS,
1182  bool closeFile,
1183  bool requireHeader) {
1184  fileFound = true;
1185 
1186  //take only first three tokens delimited by "_" in the renamed raw file name
1187  std::string jsonStem = std::filesystem::path(rawSourcePath).stem().string();
// The search starts at index 1; after the loop pos is the third '_' found, or npos when there are
// fewer than three, in which case substr() keeps the whole stem.
1188  size_t pos = 0, n_tokens = 0;
1189  while (n_tokens++ < 3 && (pos = jsonStem.find('_', pos + 1)) != std::string::npos) {
1190  }
1191  std::string reducedJsonStem = jsonStem.substr(0, pos);
1192 
1193  std::ostringstream fileNameWithPID;
1194  //should be ported to use fffnaming
1195  fileNameWithPID << reducedJsonStem << "_pid" << std::setfill('0') << std::setw(5) << pid_ << ".jsn";
1196 
1197  std::string jsonDestPath = baseRunDir() + "/" + fileNameWithPID.str();
1198 
1199  LogDebug("EvFDaqDirector") << "RAW parse -: " << rawSourcePath << " and JSON create " << jsonDestPath;
1200 
1201  //parse RAW file header if it exists
1202  uint32_t lsFromRaw;
1203  int32_t nbEventsWrittenRaw;
1204  int64_t fileSizeFromRaw;
1205  uint16_t rawDataType;
1206  auto ret = parseFRDFileHeader(rawSourcePath,
1207  rawFd,
1208  rawHeaderSize,
1209  rawDataType,
1210  lsFromRaw,
1211  nbEventsWrittenRaw,
1212  fileSizeFromRaw,
1213  requireHeader,
1214  true,
1215  closeFile);
1216  if (ret != 0) {
1217  if (ret == 1)
1218  fileFound = false;
1219  return -1;
1220  }
1221 
// NOTE(review): on the error returns below, rawFd stays open when closeFile is false; presumably
// the caller is responsible for closing it — confirm.
1222  int outfile;
1223  int oflag = O_CREAT | O_WRONLY | O_TRUNC | O_EXCL; //file should not exist
1224  int omode = S_IWUSR | S_IRUSR | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH;
1225  if ((outfile = ::open(jsonDestPath.c_str(), oflag, omode)) < 0) {
1226  if (errno == EEXIST) {
1227  edm::LogError("EvFDaqDirector") << "grabNextJsonFromRaw - destination file already exists -: " << jsonDestPath
1228  << " : ";
1229  return -1;
1230  }
1231  edm::LogError("EvFDaqDirector") << "grabNextJsonFromRaw - failed to open output file -: " << jsonDestPath << " : "
1232  << strerror(errno);
// For any failure other than EEXIST: remove a possibly half-created file and try the open once more.
1233  struct stat out_stat;
1234  if (stat(jsonDestPath.c_str(), &out_stat) == 0) {
1235  edm::LogWarning("EvFDaqDirector")
1236  << "grabNextJsonFromRaw - output file possibly got created with error, deleting and retry -: "
1237  << jsonDestPath;
1238  if (unlink(jsonDestPath.c_str()) == -1) {
1239  edm::LogWarning("EvFDaqDirector")
1240  << "grabNextJsonFromRaw - failed to remove -: " << jsonDestPath << " : " << strerror(errno);
1241  }
1242  }
1243  if ((outfile = ::open(jsonDestPath.c_str(), oflag, omode)) < 0) {
1244  edm::LogError("EvFDaqDirector") << "grabNextJsonFromRaw - failed to open output file (on retry) -: "
1245  << jsonDestPath << " : " << strerror(errno);
1246  return -1;
1247  }
1248  }
1249  //write JSON file (TODO: use jsoncpp)
// The document has the form {"data":[<events>,<file size>,"<raw path>"]}; the path is inserted unescaped.
1250  std::stringstream ss;
1251  ss << "{\"data\":[" << nbEventsWrittenRaw << "," << fileSizeFromRaw << ",\"" << rawSourcePath << "\"]}";
1252  std::string sstr = ss.str();
1253 
// NOTE(review): the error return below leaves outfile open (close() is only reached on success),
// and a short write is not detected.
1254  if (::write(outfile, sstr.c_str(), sstr.size()) < 0) {
1255  edm::LogError("EvFDaqDirector") << "grabNextJsonFromRaw - failed to write to output file file -: " << jsonDestPath
1256  << " : " << strerror(errno);
1257  return -1;
1258  }
1259  close(outfile);
1260  if (serverLS && serverLS != lsFromRaw)
1261  edm::LogWarning("EvFDaqDirector") << "grabNextJsonFromRaw - mismatch in expected (server) LS " << serverLS
1262  << " and raw file header LS " << lsFromRaw;
1263 
1264  fileSizeFromHeader = fileSizeFromRaw;
1265  return nbEventsWrittenRaw;
1266  }
1267 
// Copies the JSON file jsonSourcePath to a per-process file ("<raw stem>_pid<pid>.jsn" under
// baseRunDir()), removes the source, and extracts the event count (and optionally the byte count)
// from the JSON content.
//   rawSourcePath    - only its stem is used, to build the destination file name
//   fileSizeFromJson - set to the "NBytes" value when present and parsable, otherwise -1
//                      (assigned only once the JSON has been deserialized)
//   fileFound        - set to false only when the source could not be opened because it does not exist
// Returns the number of events, or -1 on any error.
1269  std::string const& rawSourcePath,
1270  int64_t& fileSizeFromJson,
1271  bool& fileFound) {
1272  fileFound = true;
1273 
1274  //should be ported to use fffnaming
1275  std::ostringstream fileNameWithPID;
1276  fileNameWithPID << std::filesystem::path(rawSourcePath).stem().string() << "_pid" << std::setfill('0')
1277  << std::setw(5) << pid_ << ".jsn";
1278 
1279  // assemble json destination path
1280  std::string jsonDestPath = baseRunDir() + "/" + fileNameWithPID.str();
1281 
1282  LogDebug("EvFDaqDirector") << "JSON rename -: " << jsonSourcePath << " to " << jsonDestPath;
1283 
1284  int infile = -1, outfile = -1;
1285 
// The open of the source is attempted twice: a warning after the first failure, an error after the second.
1286  if ((infile = ::open(jsonSourcePath.c_str(), O_RDONLY)) < 0) {
1287  edm::LogWarning("EvFDaqDirector") << "grabNextJsonFile - failed to open input file -: " << jsonSourcePath << " : "
1288  << strerror(errno);
1289  if ((infile = ::open(jsonSourcePath.c_str(), O_RDONLY)) < 0) {
1290  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - failed to open input file (on retry) -: "
1291  << jsonSourcePath << " : " << strerror(errno);
1292  if (errno == ENOENT)
1293  fileFound = false;
1294  return -1;
1295  }
1296  }
1297 
1298  int oflag = O_CREAT | O_WRONLY | O_TRUNC | O_EXCL; //file should not exist
1299  int omode = S_IWUSR | S_IRUSR | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH;
1300  if ((outfile = ::open(jsonDestPath.c_str(), oflag, omode)) < 0) {
1301  if (errno == EEXIST) {
1302  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - destination file already exists -: " << jsonDestPath
1303  << " : ";
1304  ::close(infile);
1305  return -1;
1306  }
1307  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - failed to open output file -: " << jsonDestPath << " : "
1308  << strerror(errno);
// For any failure other than EEXIST: remove a possibly half-created file and try the open once more.
1309  struct stat out_stat;
1310  if (stat(jsonDestPath.c_str(), &out_stat) == 0) {
1311  edm::LogWarning("EvFDaqDirector")
1312  << "grabNextJsonFile - output file possibly got created with error, deleting and retry -: " << jsonDestPath;
1313  if (unlink(jsonDestPath.c_str()) == -1) {
1314  edm::LogWarning("EvFDaqDirector")
1315  << "grabNextJsonFile - failed to remove -: " << jsonDestPath << " : " << strerror(errno);
1316  }
1317  }
1318  if ((outfile = ::open(jsonDestPath.c_str(), oflag, omode)) < 0) {
1319  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - failed to open output file (on retry) -: "
1320  << jsonDestPath << " : " << strerror(errno);
1321  ::close(infile);
1322  return -1;
1323  }
1324  }
1325  //copy contents
1326  const std::size_t buf_sz = 512;
1327  std::size_t tot_written = 0;
1328  std::unique_ptr<char[]> buf(new char[buf_sz]);
1329 
// Copy in chunks of buf_sz; the inner loop repeats write() until the whole chunk is written.
// A write error makes sz_read negative, which ends both loops; the copy is then incomplete, but
// tot_written may still be > 0 so the code below carries on.
1330  ssize_t sz, sz_read = 1, sz_write;
1331  while (sz_read > 0 && (sz_read = ::read(infile, buf.get(), buf_sz)) > 0) {
1332  sz_write = 0;
1333  do {
1334  assert(sz_read - sz_write > 0);
1335  if ((sz = ::write(outfile, buf.get() + sz_write, sz_read - sz_write)) < 0) {
1336  sz_read = sz; // cause read loop termination
1337  break;
1338  }
1339  assert(sz > 0);
1340  sz_write += sz;
1341  tot_written += sz;
1342  } while (sz_write < sz_read);
1343  }
1344  close(infile);
1345  close(outfile);
1346 
1347  if (tot_written > 0) {
1348  //leave file if it was empty for diagnosis
1349  if (unlink(jsonSourcePath.c_str()) == -1) {
1350  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - failed to remove -: " << jsonSourcePath << " : "
1351  << strerror(errno);
1352  return -1;
1353  }
1354  } else {
1355  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - failed to copy json file or file was empty -: "
1356  << jsonSourcePath;
1357  return -1;
1358  }
1359 
1360  Json::Value deserializeRoot;
// NOTE(review): `reader` is declared on a line not visible here; presumably a Json::Reader — confirm.
1362 
1363  std::string data;
1364  std::stringstream ss;
1365  bool result;
1366  try {
// A file that fits in one buffer is parsed straight from buf; a larger one is re-read from the destination.
// NOTE(review): buf was allocated uninitialized and is never NUL-terminated in this block, yet it
// is handed over as a plain char pointer here and to `ss << buf.get()` below; if the callee treats
// it as a C string it may read beyond the copied bytes — confirm.
1367  if (tot_written <= buf_sz) {
1368  result = reader.parse(buf.get(), deserializeRoot);
1369  } else {
1370  //json will normally not be bigger than buf_sz bytes
1371  try {
1372  std::ifstream ij(jsonDestPath);
1373  ss << ij.rdbuf();
1374  } catch (std::filesystem::filesystem_error const& ex) {
1375  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - FILESYSTEM ERROR CAUGHT -: " << ex.what();
1376  return -1;
1377  }
1378  result = reader.parse(ss.str(), deserializeRoot);
1379  }
1380  if (!result) {
1381  if (tot_written <= buf_sz)
1382  ss << buf.get();
1383  edm::LogError("EvFDaqDirector") << "Failed to deserialize JSON file -: " << jsonDestPath << "\nERROR:\n"
1384  << reader.getFormatedErrorMessages() << "CONTENT:\n"
1385  << ss.str() << ".";
1386  return -1;
1387  }
1388 
1389  //read BU JSON
1390  DataPoint dp;
1391  dp.deserialize(deserializeRoot);
// Take the value at the position of "NEvents" in dpd_->getNames(); when that name is not found
// (or the data array is too short) fall back to the first data element.
1392  bool success = false;
1393  for (unsigned int i = 0; i < dpd_->getNames().size(); i++) {
1394  if (dpd_->getNames().at(i) == "NEvents")
1395  if (i < dp.getData().size()) {
1396  data = dp.getData()[i];
1397  success = true;
1398  break;
1399  }
1400  }
1401  if (!success) {
1402  if (!dp.getData().empty())
1403  data = dp.getData()[0];
1404  else {
1405  edm::LogError("EvFDaqDirector::grabNextJsonFile")
1406  << "grabNextJsonFile - "
1407  << " error reading number of events from BU JSON; No input value. data -: " << data;
1408  return -1;
1409  }
1410  }
1411 
1412  //try to read raw file size
1413  fileSizeFromJson = -1;
1414  for (unsigned int i = 0; i < dpd_->getNames().size(); i++) {
1415  if (dpd_->getNames().at(i) == "NBytes") {
1416  if (i < dp.getData().size()) {
1417  std::string dataSize = dp.getData()[i];
1418  try {
1419  fileSizeFromJson = std::stol(dataSize);
1420  } catch (const std::exception&) {
1421  //non-fatal currently, processing can continue without this value
1422  edm::LogWarning("EvFDaqDirector") << "grabNextJsonFile - error parsing number of Bytes from BU JSON. "
1423  << "Input value is -: " << dataSize;
1424  }
1425  break;
1426  }
1427  }
1428  }
// std::stoi may throw std::invalid_argument or std::out_of_range; both are handled below.
1429  return std::stoi(data);
1430  } catch (const std::out_of_range& e) {
1431  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - error parsing number of events from BU JSON. "
1432  << "Input value is -: " << data;
1433  } catch (const std::invalid_argument& e) {
1434  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - argument error parsing events from BU JSON. "
1435  << "Input value is -: " << data;
1436  } catch (std::runtime_error const& e) {
1437  //Can be thrown by Json parser
1438  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - std::runtime_error exception -: " << e.what();
1439  }
1440 
1441  catch (std::exception const& e) {
1442  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - SOME OTHER EXCEPTION OCCURED! -: " << e.what();
1443  } catch (...) {
1444  //unknown exception
1445  edm::LogError("EvFDaqDirector") << "grabNextJsonFile - SOME OTHER EXCEPTION OCCURED!";
1446  }
1447 
// Every handler above falls through to this common error return.
1448  return -1;
1449  }
1450 
// Copies jsonSourcePath to "<stem>_pid<pid>.jsn" under baseRunDir() with std::filesystem, releases
// the local FU lock via unlockFULocal(), removes the source, and returns the event count read
// from the copied JSON. Returns -1 when any exception is caught.
// NOTE(review): this `data` is only read by the out_of_range / invalid_argument handlers at the
// end; the value actually parsed lives in a second `data` declared inside the try block, which
// shadows this one, so those handlers always log an empty string.
1452  std::string data;
1453  try {
1454  // assemble json destination path
1455  std::filesystem::path jsonDestPath(baseRunDir());
1456 
1457  //should be ported to use fffnaming
1458  std::ostringstream fileNameWithPID;
1459  fileNameWithPID << jsonSourcePath.stem().string() << "_pid" << std::setfill('0') << std::setw(5) << getpid()
1460  << ".jsn";
1461  jsonDestPath /= fileNameWithPID.str();
1462 
1463  LogDebug("EvFDaqDirector") << "JSON rename -: " << jsonSourcePath << " to " << jsonDestPath;
// One retry after a one-second sleep; a failure of the second copy propagates to the outer handlers.
1464  try {
1465  std::filesystem::copy(jsonSourcePath, jsonDestPath);
1466  } catch (std::filesystem::filesystem_error const& ex) {
1467  // Input dir gone?
1468  edm::LogError("EvFDaqDirector") << "grabNextFile BOOST FILESYSTEM ERROR CAUGHT -: " << ex.what();
1469  // << " Maybe the file is not yet visible by FU. Trying again in one second";
1470  sleep(1);
1471  std::filesystem::copy(jsonSourcePath, jsonDestPath);
1472  }
// NOTE(review): the lock is released here; exceptions thrown after this point reach handlers that
// call unlockFULocal() a second time.
1473  unlockFULocal();
1474 
1475  try {
1476  //sometimes this fails but file gets deleted
1477  std::filesystem::remove(jsonSourcePath);
1478  } catch (std::filesystem::filesystem_error const& ex) {
1479  // Input dir gone?
1480  edm::LogError("EvFDaqDirector") << "grabNextFile BOOST FILESYSTEM ERROR CAUGHT -: " << ex.what();
1481  } catch (std::exception const& ex) {
1482  // Input dir gone?
1483  edm::LogError("EvFDaqDirector") << "grabNextFile std::exception CAUGHT -: " << ex.what();
1484  }
1485 
1486  std::ifstream ij(jsonDestPath);
1487  Json::Value deserializeRoot;
// NOTE(review): `reader` is declared on a line not visible here; presumably a Json::Reader — confirm.
1489 
1490  std::stringstream ss;
1491  ss << ij.rdbuf();
1492  if (!reader.parse(ss.str(), deserializeRoot)) {
1493  edm::LogError("EvFDaqDirector") << "grabNextFile Failed to deserialize JSON file -: " << jsonDestPath
1494  << "\nERROR:\n"
1495  << reader.getFormatedErrorMessages() << "CONTENT:\n"
1496  << ss.str() << ".";
1497  throw std::runtime_error("Cannot deserialize input JSON file");
1498  }
1499 
1500  //read BU JSON
1501  std::string data;
1502  DataPoint dp;
1503  dp.deserialize(deserializeRoot);
// Take the value at the position of "NEvents" in dpd_->getNames() (the loop does not break, so the
// last match wins); otherwise fall back to the first data element.
1504  bool success = false;
1505  for (unsigned int i = 0; i < dpd_->getNames().size(); i++) {
1506  if (dpd_->getNames().at(i) == "NEvents")
1507  if (i < dp.getData().size()) {
1508  data = dp.getData()[i];
1509  success = true;
1510  }
1511  }
1512  if (!success) {
1513  if (!dp.getData().empty())
1514  data = dp.getData()[0];
1515  else
1516  throw cms::Exception("EvFDaqDirector::grabNextJsonFileUnlock")
1517  << " error reading number of events from BU JSON -: No input value " << data;
1518  }
1519  return std::stoi(data);
1520  } catch (std::filesystem::filesystem_error const& ex) {
1521  // Input dir gone?
1522  unlockFULocal();
1523  edm::LogError("EvFDaqDirector") << "grabNextFile BOOST FILESYSTEM ERROR CAUGHT -: " << ex.what();
1524  } catch (std::runtime_error const& e) {
1525  // Another process grabbed the file and NFS did not register this
1526  unlockFULocal();
1527  edm::LogError("EvFDaqDirector") << "grabNextFile runtime Exception -: " << e.what();
// These two handlers (the std::stoi failures) do not call unlockFULocal(); they can only be
// reached after the unlock above has already happened.
1528  } catch (const std::out_of_range&) {
1529  edm::LogError("EvFDaqDirector") << "grabNextFile error parsing number of events from BU JSON. "
1530  << "Input value is -: " << data;
1531  } catch (const std::invalid_argument&) {
1532  edm::LogError("EvFDaqDirector") << "grabNextFile argument error parsing events from BU JSON. "
1533  << "Input value is -: " << data;
1534  } catch (std::exception const& e) {
1535  // BU run directory disappeared?
1536  unlockFULocal();
1537  edm::LogError("EvFDaqDirector") << "grabNextFile SOME OTHER EXCEPTION OCCURED!!!! -: " << e.what();
1538  }
1539 
1540  return -1;
1541  }
1542 
// Sends one "popfile" HTTP GET request to the file broker over socket_ and interprets the
// key=value lines of the response.
//   serverHttpStatus - HTTP status code read from the response status line
//   serverError      - set to true on any socket, protocol or server-reported error
//   serverLS         - lumisection reported by the server ("lumisection", at least 1), or closedServerLS + 1
//   closedServerLS   - last closed lumisection reported by the server ("lasteols", at least 0)
//   nextFileJson, nextFileRaw, rawHeader - filled only when the server hands out a file
//   maxLS            - when >= 0 it is appended to the request as "&stopls="
// Returns newFile, runEnded or noFile; always noFile when serverError is set.
1544  bool& serverError,
1545  uint32_t& serverLS,
1546  uint32_t& closedServerLS,
1547  std::string& nextFileJson,
1548  std::string& nextFileRaw,
1549  bool& rawHeader,
1550  int maxLS) {
1551  EvFDaqDirector::FileStatus fileStatus = noFile;
1552  serverError = false;
1553 
1554  boost::system::error_code ec;
1555  try {
// The loop body runs once; it is repeated only through the `continue` after a reconnect on connection_reset.
1556  while (true) {
1557  //socket connect
1558  if (!fileBrokerKeepAlive_ || !socket_->is_open()) {
// NOTE(review): the connect call itself is on a line not visible here; it presumably sets `ec` — confirm.
1560 
1561  if (ec) {
1562  edm::LogWarning("EvFDaqDirector") << "boost::asio::connect error -:" << ec;
1563  serverError = true;
1564  break;
1565  }
1566  }
1567 
1568  boost::asio::streambuf request;
1569  std::ostream request_stream(&request);
1570  std::string path = "/popfile?runnumber=" + run_nstring_ + "&pid=" + pid_;
1571  if (maxLS >= 0) {
1572  std::stringstream spath;
1573  spath << path << "&stopls=" << maxLS;
1574  path = spath.str();
1575  edm::LogWarning("EvFDaqDirector") << "Stop LS requested " << maxLS;
1576  }
// "Connection: keep-alive" is sent regardless of fileBrokerKeepAlive_.
1577  request_stream << "GET " << path << " HTTP/1.1\r\n";
1578  request_stream << "Host: " << fileBrokerHost_ << "\r\n";
1579  request_stream << "Accept: */*\r\n";
1580  request_stream << "Connection: keep-alive\r\n\r\n";
1581 
1582  boost::asio::write(*socket_, request, ec);
1583  if (ec) {
1584  if (fileBrokerKeepAlive_ && ec == boost::asio::error::connection_reset) {
1585  edm::LogInfo("EvFDaqDirector") << "reconnecting socket on received connection_reset";
1586  //we got disconnected, try to reconnect to the server before writing the request
// NOTE(review): the reconnect call is on a line not visible here; it presumably sets `ec` — confirm.
1588  if (ec) {
1589  edm::LogWarning("EvFDaqDirector") << "boost::asio::connect error -:" << ec;
1590  serverError = true;
1591  break;
1592  }
1593  continue;
1594  }
1595  edm::LogWarning("EvFDaqDirector") << "boost::asio::write error -:" << ec;
1596  serverError = true;
1597  break;
1598  }
1599 
// Only the status line is explicitly waited for; the headers and body are then parsed from
// whatever read_until has placed in `response`.
1600  boost::asio::streambuf response;
1601  boost::asio::read_until(*socket_, response, "\r\n", ec);
1602  if (ec) {
1603  edm::LogWarning("EvFDaqDirector") << "boost::asio::read_until error -:" << ec;
1604  serverError = true;
1605  break;
1606  }
1607 
1608  std::istream response_stream(&response);
1609 
1610  std::string http_version;
1611  response_stream >> http_version;
1612 
1613  response_stream >> serverHttpStatus;
1614 
1615  std::string status_message;
1616  std::getline(response_stream, status_message);
1617  if (!response_stream || http_version.substr(0, 5) != "HTTP/") {
1618  edm::LogWarning("EvFDaqDirector") << "Invalid server response";
1619  serverError = true;
1620  break;
1621  }
1622  if (serverHttpStatus != 200) {
1623  edm::LogWarning("EvFDaqDirector") << "Response returned with status code " << serverHttpStatus;
1624  serverError = true;
1625  break;
1626  }
1627 
1628  // Process the response headers.
// The header lines are skipped up to the empty "\r" line; `header` is declared on a line not visible here.
1630  while (std::getline(response_stream, header) && header != "\r") {
1631  }
1632 
// The body is read as "key=value" lines; lines without '=' are ignored. Values are stored verbatim
// (getline strips only the '\n').
1633  std::string fileInfo;
1634  std::map<std::string, std::string> serverMap;
1635  while (std::getline(response_stream, fileInfo) && fileInfo != "\r") {
1636  auto pos = fileInfo.find('=');
1637  if (pos == std::string::npos)
1638  continue;
1639  auto stitle = fileInfo.substr(0, pos);
1640  auto svalue = fileInfo.substr(pos + 1);
1641  serverMap[stitle] = svalue;
1642  }
1643 
1644  //check that response run number is correct
// NOTE(review): the mandatory fields are checked with assert(), so a malformed response aborts the
// process when asserts are enabled and is left unchecked when they are compiled out.
1645  auto server_version = serverMap.find("version");
1646  assert(server_version != serverMap.end());
1647 
1648  auto server_run = serverMap.find("runnumber");
1649  assert(server_run != serverMap.end());
1650  assert(run_nstring_ == server_run->second);
1651 
1652  auto server_state = serverMap.find("state");
1653  assert(server_state != serverMap.end());
1654 
1655  auto server_eols = serverMap.find("lasteols");
1656  assert(server_eols != serverMap.end());
1657 
1658  auto server_ls = serverMap.find("lumisection");
1659 
// Parse "major[.minor[.rev]]", optionally preceded by a double quote; the defaults 1.0.0 are kept
// when nothing can be parsed.
1660  int version_maj = 1;
1661  int version_min = 0;
1662  int version_rev = 0;
1663  {
1664  auto* s_ptr = server_version->second.c_str();
1665  if (!server_version->second.empty() && server_version->second[0] == '"')
1666  s_ptr++;
1667  auto res = sscanf(s_ptr, "%d.%d.%d", &version_maj, &version_min, &version_rev);
1668  if (res < 3) {
1669  res = sscanf(s_ptr, "%d.%d", &version_maj, &version_min);
1670  if (res < 2) {
1671  res = sscanf(s_ptr, "%d", &version_maj);
1672  if (res < 1) {
1673  //expecting at least 1 number (major version)
1674  edm::LogWarning("EvFDaqDirector") << "Can not parse server version " << server_version->second;
1675  }
1676  }
1677  }
1678  }
1679 
// atoi() yields 0 for non-numeric text; the values are clamped to >= 0 (lasteols) and >= 1 (lumisection).
1680  closedServerLS = (uint64_t)std::max(0, atoi(server_eols->second.c_str()));
1681  if (server_ls != serverMap.end())
1682  serverLS = (uint64_t)std::max(1, atoi(server_ls->second.c_str()));
1683  else
1684  serverLS = closedServerLS + 1;
1685 
// Dispatch on the server state string.
1686  std::string s_state = server_state->second;
1687  if (s_state == "STARTING") //initial, always empty starting with LS 1
1688  {
1689  auto server_file = serverMap.find("file");
1690  assert(server_file == serverMap.end()); //no file with starting state
1691  fileStatus = noFile;
1692  edm::LogInfo("EvFDaqDirector") << "Got STARTING notification with last EOLS " << closedServerLS;
1693  } else if (s_state == "READY") {
1694  auto server_file = serverMap.find("file");
1695  if (server_file == serverMap.end()) {
1696  //can be returned by server if files from new LS already appeared but LS is not yet closed
1697  if (serverLS <= closedServerLS)
1698  serverLS = closedServerLS + 1;
1699  fileStatus = noFile;
1700  edm::LogInfo("EvFDaqDirector")
1701  << "Got READY notification with last EOLS " << closedServerLS << " and no new file";
1702  } else {
1703  std::string filestem;
1704  std::string fileprefix;
1705  auto server_fileprefix = serverMap.find("fileprefix");
1706 
// "fileprefix" is optional; surrounding double quotes are stripped when present.
1707  if (server_fileprefix != serverMap.end()) {
1708  auto pssize = server_fileprefix->second.size();
1709  if (pssize > 1 && server_fileprefix->second[0] == '"' && server_fileprefix->second[pssize - 1] == '"')
1710  fileprefix = server_fileprefix->second.substr(1, pssize - 2);
1711  else
1712  fileprefix = server_fileprefix->second;
1713  }
1714 
1715  //remove string literals
1716  auto ssize = server_file->second.size();
1717  if (ssize > 1 && server_file->second[0] == '"' && server_file->second[ssize - 1] == '"')
1718  filestem = server_file->second.substr(1, ssize - 2);
1719  else
1720  filestem = server_file->second;
1721  assert(!filestem.empty());
// Server major version > 1: only a raw file path (with prefix) is produced, nextFileJson is cleared
// and rawHeader is set to true. Otherwise: a .jsn path (with prefix) plus a .raw path without the
// prefix, and rawHeader is set to false.
1722  if (version_maj > 1) {
1723  nextFileRaw = bu_run_dir_ + "/" + fileprefix + filestem + ".raw"; //filestem should be raw
1724  filestem = bu_run_dir_ + "/" + fileprefix + filestem;
1725  nextFileJson = "";
1726  rawHeader = true;
1727  } else {
1728  nextFileRaw = bu_run_dir_ + "/" + filestem + ".raw"; //raw files are not moved
1729  filestem = bu_run_dir_ + "/" + fileprefix + filestem;
1730  nextFileJson = filestem + ".jsn";
1731  rawHeader = false;
1732  }
1733  fileStatus = newFile;
1734  edm::LogInfo("EvFDaqDirector") << "Got READY notification with last EOLS " << closedServerLS << " new LS "
1735  << serverLS << " file:" << filestem;
1736  }
1737  } else if (s_state == "EOLS") {
1738  serverLS = closedServerLS + 1;
1739  edm::LogInfo("EvFDaqDirector") << "Got EOLS notification with last EOLS " << closedServerLS;
1740  fileStatus = noFile;
1741  } else if (s_state == "EOR") {
1742  //server_eor = serverMap.find("iseor");
1743  edm::LogInfo("EvFDaqDirector") << "Got EOR notification with last EOLS " << closedServerLS;
1744  fileStatus = runEnded;
1745  } else if (s_state == "NORUN") {
// NORUN is treated like end of run and is not flagged as a server error.
1746  auto err_msg = serverMap.find("errormessage");
1747  if (err_msg != serverMap.end())
1748  edm::LogWarning("EvFDaqDirector") << "Server NORUN -:" << server_state->second << " : " << err_msg->second;
1749  else
1750  edm::LogWarning("EvFDaqDirector") << "Server NORUN ";
1751  edm::LogWarning("EvFDaqDirector") << "executing run end";
1752  fileStatus = runEnded;
1753  } else if (s_state == "ERROR") {
1754  auto err_msg = serverMap.find("errormessage");
1755  if (err_msg != serverMap.end())
1756  edm::LogWarning("EvFDaqDirector") << "Server error -:" << server_state->second << " : " << err_msg->second;
1757  else
1758  edm::LogWarning("EvFDaqDirector") << "Server error -:" << server_state->second;
1759  fileStatus = noFile;
1760  serverError = true;
1761  } else {
1762  edm::LogWarning("EvFDaqDirector") << "Unknown Server state -:" << server_state->second;
1763  fileStatus = noFile;
1764  serverError = true;
1765  }
1766 
1767  // Read until EOF, writing data to output as we go.
// Without keep-alive the rest of the response is drained and discarded; anything but EOF is an error.
1768  if (!fileBrokerKeepAlive_) {
1769  while (boost::asio::read(*socket_, response, boost::asio::transfer_at_least(1), ec)) {
1770  }
1771  if (ec != boost::asio::error::eof) {
1772  edm::LogWarning("EvFDaqDirector") << "boost::asio::read_until error -:" << ec;
1773  serverError = true;
1774  }
1775  }
1776 
1777  break;
1778  }
1779 
1780  } catch (std::exception const& e) {
// The exception text (e.what()) is not included in the message.
1781  edm::LogWarning("EvFDaqDirector") << "Exception in socket handling";
1782  serverError = true;
1783  }
1784 
// Without keep-alive the connection is shut down and closed after every request.
1785  if (!fileBrokerKeepAlive_ && socket_->is_open()) {
1786  socket_->shutdown(boost::asio::ip::tcp::socket::shutdown_both, ec);
1787  if (ec) {
1788  edm::LogWarning("EvFDaqDirector") << "socket shutdown error -:" << ec;
1789  }
1790  socket_->close(ec);
1791  if (ec) {
1792  edm::LogWarning("EvFDaqDirector") << "socket close error -:" << ec;
1793  }
1794  }
1795 
// On any error the socket is closed so that the next call reconnects; the result is forced to noFile.
// NOTE(review): `ec` is tested below even when close() was not called, so it may still hold the
// code of an earlier operation and be reported as a "socket close error".
1796  if (serverError) {
1797  if (socket_->is_open())
1798  socket_->close(ec);
1799  if (ec) {
1800  edm::LogWarning("EvFDaqDirector") << "socket close error -:" << ec;
1801  }
1802  fileStatus = noFile;
1803  sleep(1); //back-off if error detected
1804  }
1805 
1806  return fileStatus;
1807  }
1808 
// Asks the file broker for the next input file, creates the local BoLS/EoLS
// bookkeeping files for any lumisections the server has moved past, and updates
// the caller's lumisection number.
//
// NOTE(review): the first line of this definition (return type, function name and
// the leading parameter) is absent from this listing; the body reads a
// `currentLumiSection` that does not appear in the visible parameter list.
// Listing lines 1862, 1872 and 1907 (directly before the lockFULocal() /
// unlockFULocal() calls) are absent as well -- confirm all of them against the
// original source file before relying on the control flow shown here.
//
// Visible parameters:
//   ls                    in/out: compared against the stop-file LS, and replaced by
//                         the server-reported LS at the end of the function.
//   nextFileRaw           forwarded to contactFileBroker() and the grabNextJson* helpers.
//   rawFd                 forwarded to grabNextJsonFromRaw(); closed and reset to -1 here
//                         when serverEventsInNewFile is negative.
//   rawHeaderSize         forwarded to grabNextJsonFromRaw().
//   serverEventsInNewFile assigned from the grabNextJson* helper, only when the broker
//                         reported a new file.
//   fileSizeFromMetadata  forwarded to the grabNextJson* helpers.
//   thisLockWaitTimeUs    not written anywhere in the visible lines.
//   requireHeader         forwarded to grabNextJsonFromRaw().
//
// Returns noFile immediately when contactFileBroker() flags a server error; otherwise
// the status from contactFileBroker(), downgraded to noFile (or runEnded when the BU
// run directory cannot be stat'ed) if the helper reported that the file was not found.
1810  unsigned int& ls,
1811  std::string& nextFileRaw,
1812  int& rawFd,
1813  uint16_t& rawHeaderSize,
1814  int32_t& serverEventsInNewFile,
1815  int64_t& fileSizeFromMetadata,
1816  uint64_t& thisLockWaitTimeUs,
1817  bool requireHeader) {
1818  EvFDaqDirector::FileStatus fileStatus = noFile;
1819 
1820  //int retval = -1;
1821  //int lock_attempts = 0;
1822  //long total_lock_attempts = 0;
1823 
      // A stop request is signalled by the existence of either stop file; only the
      // plain stop file is parsed for an LS number.
1824  struct stat buf;
1825  int stopFileLS = -1;
1826  int stopFileCheck = stat(stopFilePath_.c_str(), &buf);
1827  int stopFilePidCheck = stat(stopFilePathPid_.c_str(), &buf);
1828  if (stopFileCheck == 0 || stopFilePidCheck == 0) {
1829  if (stopFileCheck == 0)
1830  stopFileLS = readLastLSEntry(stopFilePath_);
1831  else
1832  stopFileLS = 1; //stop without drain if only pid is stopped
1833  if (!stop_ls_override_) {
1834  //if lumisection is higher than in stop file, should quit at next from current
1835  if (stopFileLS >= 0 && (int)ls >= stopFileLS)
1836  stopFileLS = stop_ls_override_ = ls;
1837  } else
1838  stopFileLS = stop_ls_override_;
1839  edm::LogWarning("EvFDaqDirector") << "Detected stop request from hltd. Ending run for this process after LS -: "
1840  << stopFileLS;
1841  //return runEnded;
1842  } else //if file was removed before reaching stop condition, reset this
1843  stop_ls_override_ = 0;
1844 
1845  /* look for EoLS
1846  if (stat(getEoLSFilePathOnFU(currentLumiSection).c_str(),&buf)==0) {
1847  edm::LogWarning("EvFDaqDirector") << "Detected local EoLS for lumisection "<< currentLumiSection ;
1848  ls++;
1849  return noFile;
1850  }
1851  */
1852 
      // NOTE(review): ts_lockbegin is filled in but not read again in the visible lines.
1853  timeval ts_lockbegin;
1854  gettimeofday(&ts_lockbegin, nullptr);
1855 
1856  std::string nextFileJson;
1857  uint32_t serverLS, closedServerLS;
1858  unsigned int serverHttpStatus;
1859  bool serverError;
1860 
1861  //local lock to force index json and EoLS files to appear in order
1863  lockFULocal();
1864 
      // maxLS stays -1 (no limit requested) unless a stop LS is in effect.
1865  int maxLS = stopFileLS < 0 ? -1 : std::max(stopFileLS, (int)currentLumiSection);
1866  bool rawHeader = false;
1867  fileStatus = contactFileBroker(
1868  serverHttpStatus, serverError, serverLS, closedServerLS, nextFileJson, nextFileRaw, rawHeader, maxLS);
1869 
1870  if (serverError) {
1871  //do not update anything
1873  unlockFULocal();
1874  return noFile;
1875  }
1876 
1877  //handle creation of BoLS files if lumisection has changed
1878  if (currentLumiSection == 0) {
1879  if (fileStatus == runEnded)
1880  createLumiSectionFiles(closedServerLS, 0, true, false);
1881  else
1882  createLumiSectionFiles(serverLS, 0, true, false);
1883  } else {
1884  if (closedServerLS >= currentLumiSection) {
1885  //only BoLS files
1886  for (uint32_t i = std::max(currentLumiSection, 1U); i <= closedServerLS; i++)
1887  createLumiSectionFiles(i + 1, i, true, false);
1888  }
1889  }
1890 
1891  bool fileFound = true;
1892 
      // rawHeader is a bool set by contactFileBroker(); it selects between reading the
      // metadata from the raw file itself and reading it from the separate JSON file.
1893  if (fileStatus == newFile) {
1894  if (rawHeader > 0)
1895  serverEventsInNewFile = grabNextJsonFromRaw(
1896  nextFileRaw, rawFd, rawHeaderSize, fileSizeFromMetadata, fileFound, serverLS, false, requireHeader);
1897  else
1898  serverEventsInNewFile = grabNextJsonFile(nextFileJson, nextFileRaw, fileSizeFromMetadata, fileFound);
1899  }
      // NOTE(review): when fileStatus != newFile this tests whatever value the caller
      // passed in for serverEventsInNewFile, since it was not assigned above.
1900  //closing file in case of any error
1901  if (serverEventsInNewFile < 0 && rawFd != -1) {
1902  close(rawFd);
1903  rawFd = -1;
1904  }
1905 
1906  //can unlock because all files have been created locally
1908  unlockFULocal();
1909 
1910  if (!fileFound) {
1911  //catch condition where directory got deleted
1912  fileStatus = noFile;
1913  struct stat buf;
1914  if (stat(bu_run_dir_.c_str(), &buf) != 0) {
1915  edm::LogWarning("EvFDaqDirector") << "BU run directory not found:" << bu_run_dir_;
1916  fileStatus = runEnded;
1917  }
1918  }
1919 
1920  //handle creation of EoLS files if lumisection has changed, this needs to be locked exclusively
1921  //so that EoLS files can not appear locally before index files
1922  if (currentLumiSection == 0) {
1923  lockFULocal2();
1924  if (fileStatus == runEnded) {
1925  createLumiSectionFiles(closedServerLS, 0, false, true);
1926  createLumiSectionFiles(serverLS, closedServerLS, false, true); // +1
1927  } else {
1928  createLumiSectionFiles(serverLS, 0, false, true);
1929  }
1930  unlockFULocal2();
1931  } else {
1932  if (closedServerLS >= currentLumiSection) {
1933  //lock exclusive to create EoLS files
1934  lockFULocal2();
1935  for (uint32_t i = std::max(currentLumiSection, 1U); i <= closedServerLS; i++)
1936  createLumiSectionFiles(i + 1, i, false, true);
1937  unlockFULocal2();
1938  }
1939  }
1940 
      // Publish the new lumisection to the caller. A server LS lower than the caller's
      // current one is ignored (with a one second back-off) for noFile, and is an
      // assertion failure for newFile.
1941  if (fileStatus == runEnded)
1942  ls = std::max(currentLumiSection, serverLS);
1943  else if (fileStatus == newFile) {
1944  assert(serverLS >= ls);
1945  ls = serverLS;
1946  } else if (fileStatus == noFile) {
1947  if (serverLS >= ls)
1948  ls = serverLS;
1949  else {
1950  edm::LogWarning("EvFDaqDirector") << "Server reported LS " << serverLS
1951  << " which is smaller than currently open LS " << ls << ". Ignoring response";
1952  sleep(1);
1953  }
1954  }
1955 
1956  return fileStatus;
1957  }
1958 
// Ensures the directory named by `openPath` exists, creating it (including any
// missing parents) when std::filesystem::is_directory() reports it is absent.
// NOTE(review): the function header (listing line 1959) and the declaration of
// `openPath` (listing line 1962) are missing from this listing -- confirm against
// the original source file.
1960  // create open dir if not already there
1961 
1963  if (!std::filesystem::is_directory(openPath)) {
1964  LogDebug("EvFDaqDirector") << "<open> FU dir not found. Creating... -:" << openPath.string();
1965  std::filesystem::create_directories(openPath);
1966  }
1967  }
1968 
// Parses the JSON document in `file` and returns its "lastLS" entry converted with
// asInt(). Logs an error and returns -1 when the document cannot be parsed.
// NOTE(review): the function header (listing line 1969) and the declaration of
// `reader` (listing line 1972) are missing from this listing -- confirm against the
// original source file.
1970  std::ifstream ij(file);
1971  Json::Value deserializeRoot;
1973 
1974  if (!reader.parse(ij, deserializeRoot)) {
1975  edm::LogError("EvFDaqDirector") << "Cannot deserialize input JSON file -:" << file;
1976  return -1;
1977  }
1978 
      // NOTE(review): when "lastLS" is absent the default passed to get() is an empty
      // string, which is then fed to asInt() -- verify how the JSON library handles
      // that conversion.
1979  int ret = deserializeRoot.get("lastLS", "").asInt();
1980  return ret;
1981  }
1982 
// Probes "<run_dir_>/<run_string_>_ls<NNNN>_EoLS.jsn" for NNNN = 1, 2, 3, ...
// (zero-padded to at least four digits) and returns the first number for which
// stat() fails, i.e. the first index without such a file.
// NOTE(review): the function header (listing line 1983) and the declaration of
// `fullpath` (listing line 1985) are missing from this listing -- confirm against
// the original source file.
1984  std::string fileprefix = run_dir_ + "/" + run_string_ + "_ls";
1986  struct stat buf;
1987  unsigned int lscount = 1;
1988  do {
1989  std::stringstream ss;
1990  ss << fileprefix << std::setfill('0') << std::setw(4) << lscount << "_EoLS.jsn";
1991  fullpath = ss.str();
1992  lscount++;
1993  } while (stat(fullpath.c_str(), &buf) == 0);
      // lscount was already advanced past the index that failed the stat() probe.
1994  return lscount - 1;
1995  }
1996 
1997  //if transferSystem PSet is present in the menu, we require it to be complete and consistent for all specified streams
// NOTE(review): the comment above does not describe the visible body and looks like
// a leftover from other code -- confirm against the original source file. The
// function header (listing line 1998) is missing from this listing.
//
// Opens "<run_dir_>/processing" with O_RDWR | O_CREAT (creating it with the mode
// bits given below if it does not exist) and closes the descriptor straight away.
// NOTE(review): the result of open() is not checked before it is handed to close().
1999  std::string proc_flag = run_dir_ + "/processing";
2000  int proc_flag_fd = open(proc_flag.c_str(), O_RDWR | O_CREAT, S_IRWXU | S_IWGRP | S_IRGRP | S_IWOTH | S_IROTH);
2001  close(proc_flag_fd);
2002  }
2003 
2004  struct flock EvFDaqDirector::make_flock(short type, short whence, off_t start, off_t len, pid_t pid) {
2005 #ifdef __APPLE__
2006  return {start, len, pid, type, whence};
2007 #else
2008  return {type, whence, start, len, pid};
2009 #endif
2010  }
2011 
// Returns true when stat() succeeds on the path stored in input_throttled_file_,
// i.e. when that file currently exists and is accessible.
// NOTE(review): the function header (listing line 2012) is missing from this
// listing -- confirm the name and signature against the original source file.
2013  struct stat buf;
2014  return (stat(input_throttled_file_.c_str(), &buf) == 0);
2015  }
2016 
// Returns true when stat() succeeds on the path formed by appending the decimal
// value of `ls` to discard_ls_filestem_, i.e. when that marker file exists.
// NOTE(review): the function header (listing line 2017) is missing from this
// listing -- confirm the signature against the original source file.
2018  struct stat buf;
2019  return (stat((discard_ls_filestem_ + std::to_string(ls)).c_str(), &buf) == 0);
2020  }
2021 
2022 } // namespace evf
unsigned int nThreads_
Definition: fillJson.h:27
int def(FILE *, FILE *, int)
struct flock fu_rw_flk
unsigned int nConcurrentLumis_
std::vector< std::string > bu_base_dirs_all_
std::string run_string_
LuminosityBlockNumber_t luminosityBlock() const
std::string protocolBufferHistogramFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
std::string bolsFileName(const unsigned int run, const unsigned int ls)
std::string streamerDataChecksumFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
void watchPreallocate(Preallocate::slot_type const &iSlot)
boost::asio::io_service io_service_
bool rawFileHasHeader(std::string const &rawSourcePath, uint16_t &rawHeaderSize)
std::string getOpenInputJsonFilePath(const unsigned int ls, const unsigned int index) const
static void fillDescriptions(edm::ConfigurationDescriptions &descriptions)
std::string fulockfile_
def create(alignables, pedeDump, additionalData, outputFile, config)
std::string getOpenOutputJsonFilePath(const unsigned int ls, std::string const &stream) const
std::string getInputJsonFilePath(const unsigned int ls, const unsigned int index) const
static bool checkFileRead(char *buf, int infile, std::size_t buf_sz, std::string const &path)
jsoncollector::DataPointDefinition * dpd_
std::string getOpenDatFilePath(const unsigned int ls, std::string const &stream) const
void accumulateFileSize(unsigned int lumi, unsigned long fileSize)
std::string getFFFParamsFilePathOnBU() const
std::unique_ptr< boost::asio::ip::tcp::resolver > resolver_
void watchPreGlobalEndLumi(PreGlobalEndLumi::slot_type const &iSlot)
Int asInt() const
ret
prodAgent to be discontinued
std::string getRawFilePath(const unsigned int ls, const unsigned int index) const
std::array< uint8_t, 4 > version_
Definition: FRDFileHeader.h:31
std::string inputRawFileName(const unsigned int run, const unsigned int ls, const unsigned int index)
volatile std::atomic< bool > shutdown_flag
pthread_mutex_t init_lock_
Value get(UInt index, const Value &defaultValue) const
std::string getEoLSFilePathOnFU(const unsigned int ls) const
void removeFile(std::string)
bool lumisectionDiscarded(unsigned int ls)
reader
Definition: DQM.py:105
Represents a JSON value.
Definition: value.h:99
Log< level::Error, false > LogError
uint32_t T const *__restrict__ uint32_t const *__restrict__ int32_t int Histo::index_type cudaStream_t stream
std::string getOpenInitFilePath(std::string const &stream) const
std::string getRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
assert(be >=bs)
bool isExceptionOnData(unsigned int ls)
std::string getOpenProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
Definition: Electron.h:6
unsigned long previousFileSize_
static std::string to_string(const XMLCh *ch)
std::unique_ptr< boost::asio::ip::tcp::resolver::iterator > endpoint_iterator_
std::string getInitTempFilePath(std::string const &stream) const
std::string getEoRFilePathOnFU() const
struct flock fu_rw_fulk
std::string hltSourceDirectory_
unsigned int startFromLS_
static int parseFRDFileHeader(std::string const &rawSourcePath, int &rawFd, uint16_t &rawHeaderSize, uint16_t &rawDataType, uint32_t &lsFromHeader, int32_t &eventsFromHeader, int64_t &fileSizeFromHeader, bool requireHeader, bool retry, bool closeFile)
std::string getEoLSFilePathOnBU(const unsigned int ls) const
std::mutex * fileDeleteLockPtr_
std::string getMergedDatFilePath(const unsigned int ls, std::string const &stream) const
FileStatus getNextFromFileBroker(const unsigned int currentLumiSection, unsigned int &ls, std::string &nextFile, int &rawFd, uint16_t &rawHeaderSize, int32_t &serverEventsInNewFile_, int64_t &fileSize, uint64_t &thisLockWaitTimeUs, bool requireHeader=true)
std::string streamerDataFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
def chmod(path, mode)
Definition: eostools.py:294
std::string getRunOpenDirPath() const
std::string getDatFilePath(const unsigned int ls, std::string const &stream) const
std::string getMergedDatChecksumFilePath(const unsigned int ls, std::string const &stream) const
std::unique_ptr< boost::asio::ip::tcp::socket > socket_
std::string inputJsonFileName(const unsigned int run, const unsigned int ls, const unsigned int index)
std::string stopFilePath_
std::string getProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string getMergedRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::string bu_base_dir_
unsigned int stop_ls_override_
int grabNextJsonFileAndUnlock(std::filesystem::path const &jsonSourcePath)
std::string streamerJsonFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
std::string input_throttled_file_
std::string getBoLSFilePathOnFU(const unsigned int ls) const
std::string eorFileName(const unsigned int run)
int readLastLSEntry(std::string const &file)
std::string getMergedProtocolBufferHistogramFilePath(const unsigned int ls, std::string const &stream) const
std::unique_ptr< boost::asio::ip::tcp::resolver::query > query_
std::string stopFilePathPid_
LuminosityBlockID const & luminosityBlockID() const
Definition: GlobalContext.h:62
unsigned int eolsNFilesIndex_
std::string & baseRunDir()
std::string run_nstring_
void watchPreGlobalBeginRun(PreGlobalBeginRun::slot_type const &iSlot)
std::string getInitFilePath(std::string const &stream) const
void createProcessingNotificationMaybe() const
Log< level::Info, false > LogInfo
void openFULockfileStream(bool create)
std::string getOutputJsonFilePath(const unsigned int ls, std::string const &stream) const
int getNFilesFromEoLS(std::string BUEoLSFile)
FileStatus updateFuLock(unsigned int &ls, std::string &nextFile, uint32_t &fsize, uint16_t &rawHeaderSize, uint64_t &lockWaitTime, bool &setExceptionState)
def ls(path, rec=False)
Definition: eostools.py:349
void preBeginRun(edm::GlobalContext const &globalContext)
std::string rootHistogramFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
std::string initFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
unsigned long long uint64_t
Definition: Time.h:13
void preGlobalEndLumi(edm::GlobalContext const &globalContext)
std::vector< std::string > const & getNames() const
bool bumpFile(unsigned int &ls, unsigned int &index, std::string &nextFile, uint32_t &fsize, uint16_t &rawHeaderSize, int maxLS, bool &setExceptionState)
def load(fileName)
Definition: svgfig.py:547
std::string getOpenRootHistogramFilePath(const unsigned int ls, std::string const &stream) const
void watchPostGlobalEndRun(PostGlobalEndRun::slot_type const &iSlot)
std::string getEoRFileName() const
void add(std::string const &label, ParameterSetDescription const &psetDescription)
def remove(d, key, TELL=False)
Definition: MatrixUtil.py:223
evf::FastMonitoringService * fms_
std::string bu_run_dir_
std::string rootHistogramFileNameWithInstance(const unsigned int run, const unsigned int ls, std::string const &stream, std::string const &instance)
std::list< std::pair< int, std::unique_ptr< InputFile > > > * filesToDeletePtr_
std::string getEoRFilePath() const
def mkdir(path)
Definition: eostools.py:251
std::string getOpenRawFilePath(const unsigned int ls, const unsigned int index) const
std::string findHighestRunDir()
Definition: DirManager.cc:23
char data[epos_bytes_allocation]
Definition: EPOS_Wrapper.h:80
void postEndRun(edm::GlobalContext const &globalContext)
uint16_t getFRDFileHeaderVersion(const std::array< uint8_t, 4 > &id, const std::array< uint8_t, 4 > &version)
Definition: FRDFileHeader.h:81
std::string discard_ls_filestem_
Unserialize a JSON document into a Value.
Definition: reader.h:16
unsigned int getLumisectionToStart() const
int grabNextJsonFile(std::string const &jsonSourcePath, std::string const &rawSourcePath, int64_t &fileSizeFromJson, bool &fileFound)
std::string fileBrokerPort_
void createLumiSectionFiles(const uint32_t lumiSection, const uint32_t currentLumiSection, bool doCreateBoLS, bool doCreateEoLS)
std::string initTempFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
EvFDaqDirector::FileStatus contactFileBroker(unsigned int &serverHttpStatus, bool &serverState, uint32_t &serverLS, uint32_t &closedServerLS, std::string &nextFileJson, std::string &nextFileRaw, bool &rawHeader, int maxLS)
void preallocate(edm::service::SystemBounds const &bounds)
Log< level::Warning, false > LogWarning
std::vector< int > bu_base_dirs_nSources_
void createBoLSFile(const uint32_t lumiSection, bool checkIfExists) const
std::string fileBrokerHost_
std::string protocolBufferHistogramFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
unsigned int fuLockPollInterval_
int grabNextJsonFromRaw(std::string const &rawSourcePath, int &rawFd, uint16_t &rawHeaderSize, int64_t &fileSizeFromHeader, bool &fileFound, uint32_t serverLS, bool closeFile, bool requireHeader=true)
std::string eolsFileName(const unsigned int run, const unsigned int ls)
unsigned int nStreams_
std::string streamerDataFileNameWithPid(const unsigned int run, const unsigned int ls, std::string const &stream)
std::string bu_run_open_dir_
#define LogDebug(id)