1 from __future__
import print_function
11 print(
'Not injecting to wmagent in --show mode. Need to run the worklfows.')
13 if opt.wmcontrol==
'init':
16 if opt.wmcontrol==
'test':
19 if opt.wmcontrol==
'submit' and opt.nProcs==0:
20 print(
'Not injecting to wmagent in -j 0 mode. Need to run the worklfows.')
22 if opt.wmcontrol==
'force':
23 print(
"This is an expert setting, you'd better know what you're doing")
27 from modules.wma
import upload_to_couch
28 (filePath,labelInCouch,user,group,where) = arguments
29 cacheId=upload_to_couch(filePath,
45 for k
in options.split(
','):
46 if k.startswith(
'dqm:'):
47 self.
dqmgui=k.split(
':',1)[-1]
48 elif k.startswith(
'wma:'):
51 self.
testMode=((mode!=
'submit')
and (mode!=
'force'))
63 self.
wmagent=os.getenv(
'WMAGENT_REQMGR')
69 self.
wmagent =
'cmsweb-testbed.cern.ch' 70 self.
DbsUrl =
"https://"+self.
wmagent+
"/dbs/int/global/DBSReader" 73 self.
dqmgui=
"https://cmsweb.cern.ch/dqm/relval" 78 self.
user = os.getenv(
'USER')
86 if not os.getenv(
'WMCORE_ROOT'):
87 print(
'\n\twmclient is not setup properly. Will not be able to upload or submit requests.\n')
92 print(
'\n\tFound wmclient\n')
95 "RequestType" :
"TaskChain",
96 "SubRequestType" :
"RelVal",
97 "RequestPriority": 500000,
98 "Requestor": self.
user,
100 "CMSSWVersion": os.getenv(
'CMSSW_VERSION'),
101 "Campaign": os.getenv(
'CMSSW_VERSION'),
102 "ScramArch": os.getenv(
'SCRAM_ARCH'),
103 "ProcessingVersion": self.
version,
105 "ConfigCacheUrl": self.
couch,
113 "SizePerEvent" : 1234,
115 "PrepID": os.getenv(
'CMSSW_VERSION')
119 "EnableHarvesting" :
"True",
120 "DQMUploadUrl" : self.
dqmgui,
121 "DQMConfigCacheID" :
None,
127 "ConfigCacheID" :
None,
129 "SplittingAlgo" :
"EventBased",
130 "EventsPerJob" :
None,
131 "RequestNumEvents" :
None,
132 "Seeding" :
"AutomaticSeeding",
133 "PrimaryDataset" :
None,
135 "Multicore" : opt.nThreads,
139 "TaskName" :
"DigiHLT",
140 "ConfigCacheID" :
None,
142 "InputDataset" :
None,
143 "SplittingAlgo" :
"LumiBased",
146 "Multicore" : opt.nThreads,
152 "InputFromOutputModule" :
None,
153 "ConfigCacheID" :
None,
155 "SplittingAlgo" :
"LumiBased",
158 "Multicore" : opt.nThreads,
165 def prepare(self,mReader, directories, mode='init'):
172 wmsplit[
'RECODreHLT']=2
176 wmsplit[
'DIGIUP15_PU50']=1
177 wmsplit[
'RECOUP15_PU50']=1
178 wmsplit[
'DIGIUP15_PU25']=1
179 wmsplit[
'RECOUP15_PU25']=1
180 wmsplit[
'DIGIUP15_PU25HS']=1
181 wmsplit[
'RECOUP15_PU25HS']=1
182 wmsplit[
'DIGIHIMIX']=5
183 wmsplit[
'RECOHIMIX']=5
184 wmsplit[
'RECODSplit']=1
185 wmsplit[
'SingleMuPt10_UP15_ID']=1
186 wmsplit[
'DIGIUP15_ID']=1
187 wmsplit[
'RECOUP15_ID']=1
188 wmsplit[
'TTbar_13_ID']=1
189 wmsplit[
'SingleMuPt10FS_ID']=1
190 wmsplit[
'TTbarFS_ID']=1
191 wmsplit[
'RECODR2_50nsreHLT']=5
192 wmsplit[
'RECODR2_25nsreHLT']=5
193 wmsplit[
'RECODR2_2016reHLT']=5
194 wmsplit[
'RECODR2_50nsreHLT_HIPM']=5
195 wmsplit[
'RECODR2_25nsreHLT_HIPM']=5
196 wmsplit[
'RECODR2_2016reHLT_HIPM']=1
197 wmsplit[
'RECODR2_2016reHLT_skimSingleMu']=1
198 wmsplit[
'RECODR2_2016reHLT_skimDoubleEG']=1
199 wmsplit[
'RECODR2_2016reHLT_skimMuonEG']=1
200 wmsplit[
'RECODR2_2016reHLT_skimJetHT']=1
201 wmsplit[
'RECODR2_2016reHLT_skimMET']=1
202 wmsplit[
'RECODR2_2016reHLT_skimSinglePh']=1
203 wmsplit[
'RECODR2_2016reHLT_skimMuOnia']=1
204 wmsplit[
'RECODR2_2016reHLT_skimSingleMu_HIPM']=1
205 wmsplit[
'RECODR2_2016reHLT_skimDoubleEG_HIPM']=1
206 wmsplit[
'RECODR2_2016reHLT_skimMuonEG_HIPM']=1
207 wmsplit[
'RECODR2_2016reHLT_skimJetHT_HIPM']=1
208 wmsplit[
'RECODR2_2016reHLT_skimMET_HIPM']=1
209 wmsplit[
'RECODR2_2016reHLT_skimSinglePh_HIPM']=1
210 wmsplit[
'RECODR2_2016reHLT_skimMuOnia_HIPM']=1
211 wmsplit[
'RECODR2_2017reHLT_Prompt']=1
212 wmsplit[
'RECODR2_2017reHLT_skimSingleMu_Prompt_Lumi']=1
213 wmsplit[
'RECODR2_2017reHLT_skimDoubleEG_Prompt']=1
214 wmsplit[
'RECODR2_2017reHLT_skimMET_Prompt']=1
215 wmsplit[
'RECODR2_2017reHLT_skimMuOnia_Prompt']=1
216 wmsplit[
'RECODR2_2017reHLT_Prompt_L1TEgDQM']=1
217 wmsplit[
'RECODR2_2018reHLT_Prompt']=1
218 wmsplit[
'RECODR2_2018reHLT_skimSingleMu_Prompt_Lumi']=1
219 wmsplit[
'RECODR2_2018reHLT_skimDoubleEG_Prompt']=1
220 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Prompt']=1
221 wmsplit[
'RECODR2_2018reHLT_skimMET_Prompt']=1
222 wmsplit[
'RECODR2_2018reHLT_skimMuOnia_Prompt']=1
223 wmsplit[
'RECODR2_2018reHLT_skimEGamma_Prompt_L1TEgDQM']=1
224 wmsplit[
'RECODR2_2018reHLT_skimMuonEG_Prompt']=1
225 wmsplit[
'RECODR2_2018reHLT_skimCharmonium_Prompt']=1
226 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Prompt_HEfail']=1
227 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Prompt_BadHcalMitig']=1
228 wmsplit[
'RECODR2_2018reHLTAlCaTkCosmics_Prompt']=1
229 wmsplit[
'RECODR2_2018reHLT_skimDisplacedJet_Prompt']=1
230 wmsplit[
'RECODR2_2018reHLT_ZBPrompt']=1
231 wmsplit[
'RECODR2_2018reHLT_Offline']=1
232 wmsplit[
'RECODR2_2018reHLT_skimSingleMu_Offline_Lumi']=1
233 wmsplit[
'RECODR2_2018reHLT_skimDoubleEG_Offline']=1
234 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Offline']=1
235 wmsplit[
'RECODR2_2018reHLT_skimMET_Offline']=1
236 wmsplit[
'RECODR2_2018reHLT_skimMuOnia_Offline']=1
237 wmsplit[
'RECODR2_2018reHLT_skimEGamma_Offline_L1TEgDQM']=1
238 wmsplit[
'RECODR2_2018reHLT_skimMuonEG_Offline']=1
239 wmsplit[
'RECODR2_2018reHLT_skimCharmonium_Offline']=1
240 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Offline_HEfail']=1
241 wmsplit[
'RECODR2_2018reHLT_skimJetHT_Offline_BadHcalMitig']=1
242 wmsplit[
'RECODR2_2018reHLTAlCaTkCosmics_Offline']=1
243 wmsplit[
'RECODR2_2018reHLT_skimDisplacedJet_Offline']=1
244 wmsplit[
'RECODR2_2018reHLT_ZBOffline']=1
245 wmsplit[
'HLTDR2_50ns']=1
246 wmsplit[
'HLTDR2_25ns']=1
247 wmsplit[
'HLTDR2_2016']=1
248 wmsplit[
'HLTDR2_2017']=1
249 wmsplit[
'HLTDR2_2018']=1
250 wmsplit[
'HLTDR2_2018_BadHcalMitig']=1
251 wmsplit[
'Hadronizer']=1
252 wmsplit[
'DIGIUP15']=1
253 wmsplit[
'RECOUP15']=1
254 wmsplit[
'RECOAODUP15']=5
255 wmsplit[
'DBLMINIAODMCUP15NODQM']=5
256 wmsplit[
'DigiFull']=5
257 wmsplit[
'RecoFull']=5
258 wmsplit[
'DigiFullPU']=1
259 wmsplit[
'RecoFullPU']=1
260 wmsplit[
'RECOHID11']=1
261 wmsplit[
'DigiFullTriggerPU_2026D17PU'] = 1
262 wmsplit[
'RecoFullGlobalPU_2026D17PU']=1
263 wmsplit[
'DIGIUP17']=1
264 wmsplit[
'RECOUP17']=1
265 wmsplit[
'DIGIUP17_PU25']=1
266 wmsplit[
'RECOUP17_PU25']=1
267 wmsplit[
'DIGICOS_UP16']=1
268 wmsplit[
'RECOCOS_UP16']=1
269 wmsplit[
'DIGICOS_UP17']=1
270 wmsplit[
'RECOCOS_UP17']=1
271 wmsplit[
'DIGICOS_UP18']=1
272 wmsplit[
'RECOCOS_UP18']=1
273 wmsplit[
'DIGICOS_UP21']=1
274 wmsplit[
'RECOCOS_UP21']=1
275 wmsplit[
'HYBRIDRepackHI2015VR']=1
276 wmsplit[
'HYBRIDZSHI2015']=1
277 wmsplit[
'RECOHID15']=1
278 wmsplit[
'RECOHID18']=1
283 print(
"Not set up for step splitting")
287 for (n,dir)
in directories.items():
289 print(
"inspecting",dir)
291 for (x,s)
in mReader.workFlowSteps.items():
301 if len( [step
for step
in s[3]
if "HARVESTGEN" in step] )>0:
302 chainDict[
'TimePerEvent']=0.01
303 thisLabel=thisLabel+
"_gen" 305 if len( [step
for step
in s[3]
if "DBLMINIAODMCUP15NODQM" in step] )>0:
306 thisLabel=thisLabel+
"_dblMiniAOD" 312 if 'INPUT' in step
or (
not isinstance(s[2][index],str)):
313 nextHasDSInput=s[2][index]
321 chainDict[
'nowmTasklist'][-1][
'nowmIO']=json.loads(open(
'%s/%s.io'%(dir,step)).
read())
323 print(
"Failed to find",
'%s/%s.io'%(dir,step),
".The workflows were probably not run on cfg not created")
326 chainDict[
'nowmTasklist'][-1][
'PrimaryDataset']=
'RelVal'+s[1].
split(
'+')[0]
327 if not '--relval' in s[2][index]:
328 print(
'Impossible to create task from scratch without splitting information with --relval')
331 arg=s[2][index].
split()
332 ns=
map(int,arg[arg.index(
'--relval')+1].
split(
','))
333 chainDict[
'nowmTasklist'][-1][
'RequestNumEvents'] = ns[0]
334 chainDict[
'nowmTasklist'][-1][
'EventsPerJob'] = ns[1]
335 if 'FASTSIM' in s[2][index]
or '--fast' in s[2][index]:
336 thisLabel+=
'_FastSim' 337 if 'lhe' in s[2][index]
in s[2][index]:
338 chainDict[
'nowmTasklist'][-1][
'LheInputFiles'] =
True 343 chainDict[
'nowmTasklist'][-1][
'nowmIO']=json.loads(open(
'%s/%s.io'%(dir,step)).
read())
345 print(
"Failed to find",
'%s/%s.io'%(dir,step),
".The workflows were probably not run on cfg not created")
347 chainDict[
'nowmTasklist'][-1][
'InputDataset']=nextHasDSInput.dataSet
348 if (
'DQMHLTonRAWAOD' in step) :
349 chainDict[
'nowmTasklist'][-1][
'IncludeParents']=
True 350 splitForThisWf=nextHasDSInput.split
351 chainDict[
'nowmTasklist'][-1][
'LumisPerJob']=splitForThisWf
353 chainDict[
'nowmTasklist'][-1][
'LumisPerJob']=wmsplit[step]
355 if len(nextHasDSInput.run):
356 chainDict[
'nowmTasklist'][-1][
'RunWhitelist']=nextHasDSInput.run
357 if len(nextHasDSInput.ls):
358 chainDict[
'nowmTasklist'][-1][
'LumiList']=nextHasDSInput.ls
360 if '--data' in s[2][index]
and nextHasDSInput.label:
361 thisLabel+=
'_RelVal_%s'%nextHasDSInput.label
362 if 'filter' in chainDict[
'nowmTasklist'][-1][
'nowmIO']:
363 print(
"This has an input DS and a filter sequence: very likely to be the PyQuen sample")
364 processStrPrefix=
'PU_' 365 setPrimaryDs =
'RelVal'+s[1].
split(
'+')[0]
367 chainDict[
'nowmTasklist'][-1][
'PrimaryDataset']=setPrimaryDs
373 chainDict[
'nowmTasklist'][-1][
'nowmIO']=json.loads(open(
'%s/%s.io'%(dir,step)).
read())
375 print(
"Failed to find",
'%s/%s.io'%(dir,step),
".The workflows were probably not run on cfg not created")
378 chainDict[
'nowmTasklist'][-1][
'LumisPerJob']=splitForThisWf
380 chainDict[
'nowmTasklist'][-1][
'LumisPerJob']=wmsplit[step]
383 if 'Hadronizer' in step:
384 chainDict[
'nowmTasklist'][-1][
'LumisPerJob']=wmsplit[
'Hadronizer']
387 chainDict[
'nowmTasklist'][-1][
'TaskName']=step
389 chainDict[
'nowmTasklist'][-1][
'PrimaryDataset']=setPrimaryDs
390 chainDict[
'nowmTasklist'][-1][
'ConfigCacheID']=
'%s/%s.py'%(dir,step)
391 chainDict[
'nowmTasklist'][-1][
'GlobalTag']=chainDict[
'nowmTasklist'][-1][
'nowmIO'][
'GT']
392 chainDict[
'GlobalTag']=chainDict[
'nowmTasklist'][-1][
'nowmIO'][
'GT']
393 if 'NANOEDM' in step :
394 nanoedmGT = chainDict[
'nowmTasklist'][-1][
'nowmIO'][
'GT']
395 if 'NANOMERGE' in step :
396 chainDict[
'GlobalTag'] = nanoedmGT
397 if 'pileup' in chainDict[
'nowmTasklist'][-1][
'nowmIO']:
398 chainDict[
'nowmTasklist'][-1][
'MCPileup']=chainDict[
'nowmTasklist'][-1][
'nowmIO'][
'pileup']
399 if '--pileup ' in s[2][index]:
400 processStrPrefix=
'PU_' 402 processStrPrefix=
'PU25ns_' 404 processStrPrefix=
'PU50ns_' 405 if 'premix_stage2' in s[2][index]
and '--pileup_input' in s[2][index]:
407 processStrPrefix=
'PUpmx25ns_' 408 elif s[2][index].
split()[ s[2][index].
split().
index(
'--pileup_input')+1 ].
find(
'50ns') > 0 :
409 processStrPrefix=
'PUpmx50ns_' 413 chainDict[
'AcquisitionEra'][step]=chainDict[
'CMSSWVersion']
414 chainDict[
'ProcessingString'][step]=processStrPrefix+chainDict[
'nowmTasklist'][-1][
'GlobalTag'].
replace(
'::All',
'').
replace(
'-',
'_')+thisLabel
415 if 'NANOMERGE' in step :
416 chainDict[
'ProcessingString'][step]=processStrPrefix+nanoedmGT.replace(
'::All',
'').
replace(
'-',
'_')+thisLabel
419 chainDict[
'nowmTasklist'][-1][
'AcquisitionEra']=chainDict[
'CMSSWVersion']
420 chainDict[
'nowmTasklist'][-1][
'ProcessingString']=processStrPrefix+chainDict[
'nowmTasklist'][-1][
'GlobalTag'].
replace(
'::All',
'').
replace(
'-',
'_')+thisLabel
421 if 'NANOMERGE' in step :
422 chainDict[
'nowmTasklist'][-1][
'ProcessingString']=processStrPrefix+nanoedmGT.replace(
'::All',
'').
replace(
'-',
'_')+thisLabel
425 chainDict[
'nowmTasklist'][-1][
'Campaign'] = chainDict[
'nowmTasklist'][-1][
'AcquisitionEra']+self.
batchName 428 if (
'DBLMINIAODMCUP15NODQM' in step):
429 chainDict[
'nowmTasklist'][-1][
'ProcessingString']=chainDict[
'nowmTasklist'][-1][
'ProcessingString']+
'_miniAOD' 431 if( chainDict[
'nowmTasklist'][-1][
'Multicore'] ):
438 chainDict[
'nowmTasklist'][-1][
'Memory'] = self.
memoryOffset +
int( chainDict[
'nowmTasklist'][-1][
'Multicore'] -1 ) * self.
memPerCore 442 chainDict[
'RequestString']=
'RV'+chainDict[
'CMSSWVersion']+s[1].
split(
'+')[0]
443 if processStrPrefix
or thisLabel:
444 chainDict[
'RequestString']+=
'_'+processStrPrefix+thisLabel
447 chainDict[
'PrepID'] = chainDict[
'CMSSWVersion']+
'__'+self.
batchTime+
'-'+s[1].
split(
'+')[0]
449 chainDict[
'PrepID'] = chainDict[
'CMSSWVersion']+self.
batchName+
'-'+s[1].
split(
'+')[0]
451 chainDict[
'SubRequestType'] =
"HIRelVal" 458 for i_second
in reversed(
range(len(chainDict[
'nowmTasklist']))):
459 t_second=chainDict[
'nowmTasklist'][i_second]
461 if 'primary' in t_second[
'nowmIO']:
463 primary=t_second[
'nowmIO'][
'primary'][0].
replace(
'file:',
'')
464 for i_input
in reversed(
range(0,i_second)):
465 t_input=chainDict[
'nowmTasklist'][i_input]
466 for (om,o)
in t_input[
'nowmIO'].
items():
470 if (len(t_input[
'TaskName'])>50):
471 if (t_input[
'TaskName'].
find(
'GenSim') != -1):
472 t_input[
'TaskName'] =
'GenSimFull' 473 if (t_input[
'TaskName'].
find(
'Hadronizer') != -1):
474 t_input[
'TaskName'] =
'HadronizerFull' 475 t_second[
'InputTask'] = t_input[
'TaskName']
476 t_second[
'InputFromOutputModule'] = om
478 if t_second[
'TaskName'].startswith(
'HARVEST'):
480 chainDict[
'DQMConfigCacheID']=t_second[
'ConfigCacheID']
500 chainDict[
'AcquisitionEra'] = chainDict[
'AcquisitionEra'].
values()[0]
501 chainDict[
'ProcessingString'] = chainDict[
'ProcessingString'].
values()[0]
503 chainDict[
'AcquisitionEra'] = chainDict[
'nowmTasklist'][0][
'AcquisitionEra']
504 chainDict[
'ProcessingString'] = chainDict[
'nowmTasklist'][0][
'ProcessingString']
508 chainDict[
'Campaign'] = chainDict[
'AcquisitionEra']+self.
batchName 514 if isinstance(i, int)
and i < len(chainDict[
'nowmTasklist']):
515 chainDict[
'nowmTasklist'][i][
'KeepOutput']=
True 516 for (i,t)
in enumerate(chainDict[
'nowmTasklist']):
517 if t[
'TaskName'].startswith(
'HARVEST'):
521 elif t[
'TaskName']
in self.
keep:
523 if t[
'TaskName'].startswith(
'HYBRIDRepackHI2015VR'):
524 t[
'KeepOutput']=
False 527 chainDict[
'Task%d'%(itask)]=t
534 chainDict[
'TaskChain']=itask
536 chainDict.pop(
'nowmTasklist')
543 labelInCouch=self.
label+
'_'+label
544 cacheName=filePath.split(
'/')[-1]
547 print(
'\tFake upload of',filePath,
'to couch with label',labelInCouch)
551 from modules.wma
import upload_to_couch,DATABASE_NAME
553 print(
'\n\tUnable to find wmcontrol modules. Please include it in your python path\n')
558 print(
"Not re-uploading",filePath,
"to",where,
"for",label)
561 print(
"Loading",filePath,
"to",where,
"for",label)
563 pool = multiprocessing.Pool(1)
564 cacheIds = pool.map( upload_to_couch_oneArg, [(filePath,labelInCouch,self.
user,self.
group,where)] )
565 cacheId = cacheIds[0]
570 for (n,d)
in self.chainDicts.items():
572 if it.startswith(
"Task")
and it!=
'TaskChain':
574 couchID=self.
uploadConf(d[it][
'ConfigCacheID'],
575 str(n)+d[it][
'TaskName'],
578 print(d[it][
'ConfigCacheID'],
" uploaded to couchDB for",
str(n),
"with ID",couchID)
579 d[it][
'ConfigCacheID']=couchID
580 if it ==
'DQMConfigCacheID':
581 couchID=self.
uploadConf(d[
'DQMConfigCacheID'],
585 print(d[
'DQMConfigCacheID'],
"uploaded to couchDB for",
str(n),
"with ID",couchID)
586 d[
'DQMConfigCacheID']=couchID
591 from modules.wma
import makeRequest,approveRequest
592 from wmcontrol
import random_sleep
593 print(
'\n\tFound wmcontrol\n')
595 print(
'\n\tUnable to find wmcontrol modules. Please include it in your python path\n')
601 for (n,d)
in self.chainDicts.items():
603 print(
"Only viewing request",n)
604 print(pprint.pprint(d))
607 print(
"For eyes before submitting",n)
608 print(pprint.pprint(d))
609 print(
"Submitting",n,
"...........")
610 workFlow=makeRequest(self.
wmagent,d,encodeDict=
True)
611 print(
"...........",n,
"submitted")
std::vector< std::string_view > split(std::string_view, const char *)
def prepare(self, mReader, directories, mode='init')
def performInjectionOptionTest(opt)
def uploadConf(self, filePath, label, where)
the info are not in the task specific dict but in the general dict t_input.update(copy.deepcopy(self.defaultHarvest)) t_input['DQMConfigCacheID']=t_second['ConfigCacheID']
def replace(string, replacements)
S & print(S &os, JobReport::InputFile const &f)
void find(edm::Handle< EcalRecHitCollection > &hits, DetId thisDet, std::vector< EcalRecHitCollection::const_iterator > &hit, bool debug=false)
def __init__(self, opt, mode='init', options='')
def upload_to_couch_oneArg(arguments)