CMS 3D CMS Logo

 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Properties Friends Macros Pages
Functions | Variables
FileNamesHelper Namespace Reference

Functions

def getJobID_fromEdmSizeFileName
 
def getJobID_fromFileName
 
def getJobID_fromIgProfLogName
 
def getJobID_fromMemcheckLogName
 
def getJobID_fromRootFileName
 
def getJobID_fromTimeReportLogName
 
def getRootFileSize
 
def read_ConfigurationFromSimulationCandles
 
def read_SimulationCandles
 

Variables

list f_candle_and_step_inJobID = lambda candle, step, x: x[0]
 
string path = "/home/vidma/Desktop/CERN_code/cmssw/data/CMSSW_3_2_0_--usersteps=GEN-SIM,DIGI_lxbuild106.cern.ch_relval/relval/CMSSW_3_2_0/workGENSIMDIGI/TTbar_PU_TimeSize"
 
tuple simCandlesRules
 
tuple test_root_file = re.compile(".root$", re.IGNORECASE)
 
dictionary universal_candle_step_regs = {}
 

Function Documentation

def FileNamesHelper.getJobID_fromEdmSizeFileName (   logfile_name)
Returns the JobID (candle, step, pileup_type, conditions, event_content) parsed from an EdmSize file name.
In the examples below conditions and event_content are empty because no SimulationCandles configuration is found for the file:

* the candle might include one optional underscore:
>>> getJobID_fromEdmSizeFileName("E_1000_GEN,SIM_EdmSize")
('E_1000', 'GEN,SIM', '', '', '')

* otherwise after candle we have two underscores:
>>> getJobID_fromEdmSizeFileName("TTBAR__RAW2DIGI,RECO_EdmSize")
('TTBAR', 'RAW2DIGI,RECO', '', '', '')

* and lastly we have the PILEUP possibility:
>>> getJobID_fromEdmSizeFileName("TTBAR__GEN,SIM_PILEUP_EdmSize")
('TTBAR', 'GEN,SIM', 'PILEUP', '', '')

Definition at line 185 of file FileNamesHelper.py.

References getJobID_fromFileName().

Referenced by parserEdmSize.getEdmReport().

def getJobID_fromEdmSizeFileName(logfile_name):
    """
    Returns the JobID parsed out of an EdmSize file name.

    The name must end in "_EdmSize". Parsing is delegated to
    getJobID_fromFileName(), so the result is the 5-tuple
    (candle, step, pileup_type, conditions, event_content), or five None
    values when the name does not match.

    The examples show the result when no SimulationCandles configuration
    is found for the file, which leaves conditions and event_content empty.

    * the candle might include one optional underscore:
    >>> getJobID_fromEdmSizeFileName("E_1000_GEN,SIM_EdmSize")
    ('E_1000', 'GEN,SIM', '', '', '')

    * otherwise after candle we have two underscores:
    >>> getJobID_fromEdmSizeFileName("TTBAR__RAW2DIGI,RECO_EdmSize")
    ('TTBAR', 'RAW2DIGI,RECO', '', '', '')

    * and lastly we have the PILEUP possibility:
    >>> getJobID_fromEdmSizeFileName("TTBAR__GEN,SIM_PILEUP_EdmSize")
    ('TTBAR', 'GEN,SIM', 'PILEUP', '', '')
    """
    return getJobID_fromFileName(logfile_name, "_EdmSize")
def getJobID_fromEdmSizeFileName
def FileNamesHelper.getJobID_fromFileName (   logfile_name,
  suffix,
  givenPath = "" 
)
Returns the JobID (candle, step, pileup_type, conditions, event_content) out of filename
-- if no pile up returns empty string for pileup type
-- conditions and event_content are empty strings when no SimulationCandles configuration is found (as in the examples below)

* the candle might include one optional underscore:
>>> getJobID_fromFileName("PI-_1000_GEN,SIM.root", r"\.root")
('PI-_1000', 'GEN,SIM', '', '', '')

* otherwise after candle we have two underscores:
>>> getJobID_fromFileName("MINBIAS__GEN,FASTSIM.root", r"\.root")
('MINBIAS', 'GEN,FASTSIM', '', '', '')

* and lastly we have the PILEUP possibility:
>>> getJobID_fromFileName("TTBAR__DIGI_PILEUP.root", r"\.root")
('TTBAR', 'DIGI', 'PILEUP', '', '')

Definition at line 93 of file FileNamesHelper.py.

References read_ConfigurationFromSimulationCandles(), and python.rootplot.root2matplotlib.replace().

Referenced by getJobID_fromEdmSizeFileName(), getJobID_fromMemcheckLogName(), getJobID_fromRootFileName(), and getJobID_fromTimeReportLogName().

93 
def getJobID_fromFileName(logfile_name, suffix, givenPath =""):
    #TODO: join together with the one from parseTimingReport.py
    r"""
    Returns the JobID (candle, step, pileup_type, conditions, event_content) out of filename
    -- if no pile up returns empty string for pileup type

    Parameters:
    logfile_name -- file name, optionally with a directory part; only the
                    base name is matched against the pattern
    suffix       -- regular-expression fragment the base name has to end
                    with; it is interpolated into the pattern as-is, so a
                    literal dot must be escaped by the caller
    givenPath    -- when non-empty, the directory used to look up the
                    SimulationCandles configuration instead of the
                    directory part of logfile_name

    Returns a 5-tuple. All five entries are None when the base name does
    not match. Any '-' in the step is replaced by ','. conditions and
    event_content stay '' unless read_ConfigurationFromSimulationCandles()
    returns a configuration; in that case pileup_type is taken from that
    configuration as well.

    The examples show the result when no configuration is found:

    * the candle might include one optional underscore:
    >>> getJobID_fromFileName("PI-_1000_GEN,SIM.root", r"\.root")
    ('PI-_1000', 'GEN,SIM', '', '', '')

    * otherwise after candle we have two underscores:
    >>> getJobID_fromFileName("MINBIAS__GEN,FASTSIM.root", r"\.root")
    ('MINBIAS', 'GEN,FASTSIM', '', '', '')

    * and lastly we have the PILEUP possibility:
    >>> getJobID_fromFileName("TTBAR__DIGI_PILEUP.root", r"\.root")
    ('TTBAR', 'DIGI', 'PILEUP', '', '')
    """
    import os

    # get the actual filename (no path)
    (path, filename) = os.path.split(logfile_name)
    if givenPath:
        path = givenPath

    if suffix not in universal_candle_step_regs:
        # create and cache one compiled regexp per suffix
        universal_candle_step_regs[suffix] = re.compile(
            r"""
            #candle1_[opt:candle2]_
            ^([^_]+_[^_]*)_

            # step
            ([^_]+)(_PILEUP)?%s$
            """ % suffix, re.VERBOSE)

    result = universal_candle_step_regs[suffix].search(filename)
    if not result:
        return (None, None, None, None, None)

    # Address the groups by index: the suffix is caller-supplied and could
    # itself contain capturing groups after these three.
    candle = result.group(1)
    step = result.group(2).replace('-', ',')
    is_pileup = "PILEUP" if result.group(3) else ""

    # A candle without an inner underscore (like TTBAR but not E_1000) is
    # captured with a trailing underscore, which needs to be removed.
    if candle.endswith('_'):
        candle = candle[:-1]

    # Try to fetch the conditions and the real pileup type, if the
    # SimulationCandles file exists.
    conditions = ''
    event_content = ''
    try:
        conf = read_ConfigurationFromSimulationCandles(path = path, step = step, is_pileup= is_pileup)
    except OSError:
        # Best effort: the directory could not be read, so keep the values
        # derived from the file name alone.
        conf = None
    if conf:
        is_pileup = conf["pileup_type"]
        conditions = conf["conditions"]
        event_content = conf["event_content"]

    return (candle, step, is_pileup, conditions, event_content)
166 
def read_ConfigurationFromSimulationCandles
Definition: search.py:1
def FileNamesHelper.getJobID_fromIgProfLogName (   logfile_name)
Returns the candle and STEP out of .sql3 filename:

everything is given, just have to split it...
like:
TTbar___GEN,FASTSIM___LowLumiPileUp___MC_37Y_V5___RAWSIM___MEM_LIVE___1.sql3
and correct the conditions!

Definition at line 235 of file FileNamesHelper.py.

References read_ConfigurationFromSimulationCandles(), and pileupCalc.upper.

Referenced by cmsPerfSuiteHarvest.process_igprof_dir().

def getJobID_fromIgProfLogName(logfile_name):
    """
    Returns the JobID out of an IgProf .sql3 file name.

    The base name carries its fields separated by three underscores, like:
    TTbar___GEN,FASTSIM___LowLumiPileUp___MC_37Y_V5___RAWSIM___MEM_LIVE___1.sql3

    Only the first three fields (candle, step, pileup) are read from the
    name. The candle is upper-cased. The pileup field "NOPILEUP" becomes ""
    and "LowLumiPileUp" becomes "PILEUP"; any other value is passed on
    unchanged. pileup_type, conditions and event_content in the result come
    from read_ConfigurationFromSimulationCandles(), looked up in the
    directory of logfile_name.

    Returns (candle, step, pileup_type, conditions, event_content), or five
    None values when no matching configuration is found.
    """
    directory, base_name = os.path.split(logfile_name)

    fields = base_name.split("___")
    candle = fields[0].upper()
    step = fields[1]
    raw_pileup = fields[2]
    # Translate the pileup markers used in the file name; unknown markers
    # are kept as they are.
    pileup_type = {"NOPILEUP": "", "LowLumiPileUp": "PILEUP"}.get(raw_pileup, raw_pileup)

    # The conditions and event content embedded in the file name are not
    # used: they are taken from the SimulationCandles file instead.
    conf = read_ConfigurationFromSimulationCandles(path = directory, step = step, is_pileup= pileup_type)
    if not conf:
        return (None, None, None, None, None)
    return (candle, step, conf["pileup_type"], conf["conditions"], conf["event_content"])
269 
""" Get the root file size for the candle, step in current dir """
def read_ConfigurationFromSimulationCandles
def FileNamesHelper.getJobID_fromMemcheckLogName (   logfile_name)
Returns the JobID (candle, step, pileup_type, conditions, event_content) parsed from a memcheck log file name.
The examples show the result when no SimulationCandles configuration is found for the file:

* after candle we have two underscores:
>>> getJobID_fromMemcheckLogName("test_data/TTBAR__RAW2DIGI,RECO_memcheck_vlgd.xml")
('TTBAR', 'RAW2DIGI,RECO', '', '', '')

* and lastly we have the PILEUP possibility:
>>> getJobID_fromMemcheckLogName("TTBAR__DIGI_PILEUP_memcheck_vlgd.xml")
('TTBAR', 'DIGI', 'PILEUP', '', '')

Definition at line 221 of file FileNamesHelper.py.

References getJobID_fromFileName().

Referenced by cmsPerfSuiteHarvest.process_memcheck_dir().

def getJobID_fromMemcheckLogName(logfile_name):
    """
    Returns the JobID parsed out of a memcheck log file name.

    The name must end in "_memcheck_vlgd.xml". Parsing is delegated to
    getJobID_fromFileName(), so the result is the 5-tuple
    (candle, step, pileup_type, conditions, event_content), or five None
    values when the name does not match.

    The examples show the result when no SimulationCandles configuration
    is found for the file, which leaves conditions and event_content empty.

    * after candle we have two underscores:
    >>> getJobID_fromMemcheckLogName("test_data/TTBAR__RAW2DIGI,RECO_memcheck_vlgd.xml")
    ('TTBAR', 'RAW2DIGI,RECO', '', '', '')

    * and lastly we have the PILEUP possibility:
    >>> getJobID_fromMemcheckLogName("TTBAR__DIGI_PILEUP_memcheck_vlgd.xml")
    ('TTBAR', 'DIGI', 'PILEUP', '', '')
    """
    # NOTE: the suffix is used as a regular-expression fragment, so the
    # unescaped '.' before "xml" matches any single character.
    return getJobID_fromFileName(logfile_name, "_memcheck_vlgd.xml")
def getJobID_fromMemcheckLogName
def FileNamesHelper.getJobID_fromRootFileName (   logfile_name)
Returns the JobID (candle, step, pileup_type, conditions, event_content) parsed from a root file name.
The examples show the result when no SimulationCandles configuration is found for the file:

* the candle might include one optional underscore:
>>> getJobID_fromRootFileName("PI-_1000_GEN,SIM.root")
('PI-_1000', 'GEN,SIM', '', '', '')

* otherwise after candle we have two underscores:
>>> getJobID_fromRootFileName("MINBIAS__GEN,FASTSIM.root")
('MINBIAS', 'GEN,FASTSIM', '', '', '')

* and lastly we have the PILEUP possibility:
>>> getJobID_fromRootFileName("TTBAR__DIGI_PILEUP.root")
('TTBAR', 'DIGI', 'PILEUP', '', '')

Definition at line 167 of file FileNamesHelper.py.

References getJobID_fromFileName().

Referenced by getRootFileSize().

def getJobID_fromRootFileName(logfile_name):
    """
    Returns the JobID parsed out of a root file name.

    The name must end in ".root". Parsing is delegated to
    getJobID_fromFileName(), so the result is the 5-tuple
    (candle, step, pileup_type, conditions, event_content), or five None
    values when the name does not match.

    The examples show the result when no SimulationCandles configuration
    is found for the file, which leaves conditions and event_content empty.

    * the candle might include one optional underscore:
    >>> getJobID_fromRootFileName("PI-_1000_GEN,SIM.root")
    ('PI-_1000', 'GEN,SIM', '', '', '')

    * otherwise after candle we have two underscores:
    >>> getJobID_fromRootFileName("MINBIAS__GEN,FASTSIM.root")
    ('MINBIAS', 'GEN,FASTSIM', '', '', '')

    * and lastly we have the PILEUP possibility:
    >>> getJobID_fromRootFileName("TTBAR__DIGI_PILEUP.root")
    ('TTBAR', 'DIGI', 'PILEUP', '', '')
    """
    # The suffix is a regular-expression fragment, hence the escaped dot.
    return getJobID_fromFileName(logfile_name, r"\.root")
def FileNamesHelper.getJobID_fromTimeReportLogName (   logfile_name)
Returns the JobID (candle, step, pileup_type, conditions, event_content) parsed from a TimingReport log file name.
The examples show the result when no SimulationCandles configuration is found for the file:

* the candle might include one optional underscore:
>>> getJobID_fromTimeReportLogName("E_1000_GEN,SIM_TimingReport.log")
('E_1000', 'GEN,SIM', '', '', '')

* otherwise after candle we have two underscores:
>>> getJobID_fromTimeReportLogName("test_data/TTBAR__RAW2DIGI,RECO_TimingReport.log")
('TTBAR', 'RAW2DIGI,RECO', '', '', '')

* and lastly we have the PILEUP possibility:
>>> getJobID_fromTimeReportLogName("TTBAR__DIGI_PILEUP_TimingReport.log")
('TTBAR', 'DIGI', 'PILEUP', '', '')

Definition at line 203 of file FileNamesHelper.py.

References getJobID_fromFileName().

Referenced by parserTimingReport.manual_run(), parserTimingReport.perf_profile(), and cmsPerfSuiteHarvest.process_timesize_dir().

def getJobID_fromTimeReportLogName(logfile_name):
    """
    Returns the JobID parsed out of a TimingReport log file name.

    The name must end in "_TimingReport.log". Parsing is delegated to
    getJobID_fromFileName(), so the result is the 5-tuple
    (candle, step, pileup_type, conditions, event_content), or five None
    values when the name does not match.

    The examples show the result when no SimulationCandles configuration
    is found for the file, which leaves conditions and event_content empty.

    * the candle might include one optional underscore:
    >>> getJobID_fromTimeReportLogName("E_1000_GEN,SIM_TimingReport.log")
    ('E_1000', 'GEN,SIM', '', '', '')

    * otherwise after candle we have two underscores:
    >>> getJobID_fromTimeReportLogName("test_data/TTBAR__RAW2DIGI,RECO_TimingReport.log")
    ('TTBAR', 'RAW2DIGI,RECO', '', '', '')

    * and lastly we have the PILEUP possibility:
    >>> getJobID_fromTimeReportLogName("TTBAR__DIGI_PILEUP_TimingReport.log")
    ('TTBAR', 'DIGI', 'PILEUP', '', '')
    """
    # NOTE: the suffix is used as a regular-expression fragment, so the
    # unescaped '.' before "log" matches any single character.
    return getJobID_fromFileName(logfile_name, "_TimingReport.log")
def getJobID_fromTimeReportLogName
def FileNamesHelper.getRootFileSize (   path,
  candle,
  step 
)

Definition at line 270 of file FileNamesHelper.py.

References f_candle_and_step_inJobID, and getJobID_fromRootFileName().

Referenced by cmsPerfSuiteHarvest.process_timesize_dir().

271 def getRootFileSize(path, candle, step):
272  files = os.listdir(path)
273  root_files = [os.path.join(path, f) for f in files
274  if test_root_file.search(f)
275  and os.path.isfile(os.path.join(path, f)) ]
276 
277  """ get the size of file if it is the root file for current candle and step """
278  try:
279  size = [os.stat(f).st_size for f in root_files
281  except Exception as e:
282  print e
283  return 0
284  return size
list f_candle_and_step_inJobID
def FileNamesHelper.read_ConfigurationFromSimulationCandles (   path,
  step,
  is_pileup 
)

Definition at line 45 of file FileNamesHelper.py.

References parsingRulesHelper.rulesParser(), and split.

Referenced by getJobID_fromFileName(), getJobID_fromIgProfLogName(), and cmsPerfSuiteHarvest.process_timesize_dir().

45 
def read_ConfigurationFromSimulationCandles(path, step, is_pileup):
    """
    Returns the parsed cmsDriver.py configuration matching a step and pileup flag.

    Here we parse SimulationCandles_<version: e.g. CMSSW_3_2_0>.txt found
    in the directory `path`. Each line of the file is run through
    parsingRulesHelper.rulesParser() with simCandlesRules. The first line
    that has no missing required fields, whose "step" equals `step`
    (ignoring surrounding whitespace) and whose "pileup_type" is empty or
    non-empty in agreement with `is_pileup`, wins.

    Parameters:
    path      -- directory that is searched for a file whose name starts
                 with "SimulationCandles_"
    step      -- step string to look for
    is_pileup -- only its truth value is used

    Returns the info dictionary produced by the parser for the matching
    line, with its "conditions" entry normalized, or None when there is no
    SimulationCandles file or no line matches. An error from
    os.listdir(path) is not handled here and propagates to the caller.
    """
    # release:TODO, release_base [path] - we can put it to release [but it's of different granularity]
    # how to reproduce stuff: TODO

    try:
        # get the actual file: the first regular file with the expected prefix
        SimulationCandles_file = [os.path.join(path, f) for f in os.listdir(path)
            if os.path.isfile(os.path.join(path, f)) and f.startswith("SimulationCandles_")][0]
    except IndexError:
        return None

    # Read it; the context manager closes the file even if reading fails.
    with open(SimulationCandles_file, 'r') as candles:
        lines = [s.strip() for s in candles.readlines()]

    # We call a shared helper to parse the file, one line at a time.
    for line in lines:
        info, missing_fields = parsingRulesHelper.rulesParser(simCandlesRules, [line], compileRules = False)

        # Massaging the info dictionary conditions entry to allow for new cmsDriver.py --conditions option:
        if 'auto:' in info['conditions']:
            # Imported lazily: only needed for "auto:" conditions.
            from Configuration.AlCa.autoCond import autoCond
            info['conditions'] = autoCond[ info['conditions'].split(':')[1] ].split("::")[0]
        elif 'FrontierConditions_GlobalTag' in info['conditions']:
            info['conditions']=info['conditions'].split(",")[1]

        # Skip lines that could not be parsed completely.
        if missing_fields:
            continue

        # We have to match only the step and whether it is pile up or not.
        if info["step"].strip() == step.strip() and bool(is_pileup) == bool(info["pileup_type"]):
            return info

    return None
89 
90 
91 
92 
def read_ConfigurationFromSimulationCandles
double split
Definition: MVATrainer.cc:139
def FileNamesHelper.read_SimulationCandles (   path)
Get the actual SimulationCandles_* file in path and return the release version read from its #Version line.

Definition at line 285 of file FileNamesHelper.py.

Referenced by cmsPerfSuiteHarvest.process_igprof_dir(), cmsPerfSuiteHarvest.process_memcheck_dir(), and cmsPerfSuiteHarvest.process_timesize_dir().

def read_SimulationCandles(path):
    """
    Returns the release version recorded in the SimulationCandles file in `path`.

    Here we parse SimulationCandles_<version: e.g. CMSSW_3_2_0>.txt: the
    first regular file in `path` whose name starts with
    "SimulationCandles_" is read, and the value after the colon on its
    first line starting with "#Version" is returned, stripped of
    whitespace (format: #Version : CMSSW_3_2_0).

    Raises IndexError when there is no such file, when the file has no
    "#Version" line, or when that line has no colon. Errors from
    os.listdir() and open() propagate unchanged.
    """
    # release:TODO, release_base [path] - we can put it to release [but it's of different granularity]
    # how to reproduce stuff: TODO

    # get the actual file
    candidates = [os.path.join(path, name) for name in os.listdir(path)
                  if os.path.isfile(os.path.join(path, name)) and name.startswith("SimulationCandles_")]
    SimulationCandles_file = candidates[0]

    # Read it; the context manager closes the file even if reading fails.
    with open(SimulationCandles_file, 'r') as candles:
        lines = candles.readlines()

    # Split each "#Version" line on ':' and keep the stripped pieces.
    version_lines = [[piece.strip() for piece in line.split(":")]
                     for line in lines if line.startswith("#Version")]
    release_version = version_lines[0][1]
    return release_version
302 

Variable Documentation

list FileNamesHelper.f_candle_and_step_inJobID = lambda candle, step, x: x[0]

Definition at line 6 of file FileNamesHelper.py.

Referenced by parserEdmSize.getEdmReport(), and getRootFileSize().

string FileNamesHelper.path = "/home/vidma/Desktop/CERN_code/cmssw/data/CMSSW_3_2_0_--usersteps=GEN-SIM,DIGI_lxbuild106.cern.ch_relval/relval/CMSSW_3_2_0/workGENSIMDIGI/TTbar_PU_TimeSize"

Definition at line 306 of file FileNamesHelper.py.

tuple FileNamesHelper.simCandlesRules
Initial value:
1 = (
2 
3  #e.g.: --conditions FrontierConditions_GlobalTag,MC_31X_V4::All --eventcontent RECOSIM
4  (("cms_driver_options", ), r"""^cmsDriver.py(.+)$"""),
5  #Changing the following to allow for new cmsDriver.py --conditions option (that can optionally drop the FrontierConditions_GlobalTag,)
6  (("", "conditions", ""), r"""^cmsDriver.py(.*)--conditions ([^\s]+)(.*)$""", "req"),
7  (("", "pileup_type", ""), r"""^cmsDriver.py(.*)--pileup=([^\s]+)(.*)$"""),
8  (("", "step", ""), r"""^cmsDriver.py(.*)--step=([^\s]+)(.*)$""", "req"),
9  #not sure if event content is required
10  (("", "event_content", ""), r"""^cmsDriver.py(.*)--eventcontent ([^\s]+)(.*)$""", "req"),
11  (("", "num_events", ""), r"""^cmsDriver.py(.*)-n ([^\s]+)(.*)$""", "req"),
12 
13  #TODO: after changing the splitter to "taskset -c ..." this is no longer included into the part of correct job
14  #(("input_user_root_file", ), r"""^For these tests will use user input file (.+)$"""),
15 )

Definition at line 28 of file FileNamesHelper.py.

tuple FileNamesHelper.test_root_file = re.compile(".root$", re.IGNORECASE)

Definition at line 19 of file FileNamesHelper.py.

dictionary FileNamesHelper.universal_candle_step_regs = {}

Definition at line 18 of file FileNamesHelper.py.