CMS 3D CMS Logo

MatrixUtil.py
Go to the documentation of this file.
1 from __future__ import print_function
2 import os
class Matrix(dict):
    """Dict of workflows keyed by workflow number (a float).

    Assigning with `m[num] = steps` wraps the value in a WF object; a key
    may only ever be set once — attempting to overwrite prints an error
    and leaves the existing entry untouched.
    """
    def __setitem__(self, key, value):
        if key in self:
            print("ERROR in Matrix")
            print("overwriting", key, "not allowed")
        else:
            wf_num = float(key)
            self.update({wf_num: WF(wf_num, value)})

    def addOverride(self, key, override):
        # Delegate to the stored WF object.
        self[key].addOverride(override)
13 
# the class to collect all possible steps
class Steps(dict):
    """Dict of named cmsDriver steps.

    Duplicate keys are a fatal configuration error: setting an existing
    key prints a message and terminates the process.
    """
    def __setitem__(self, key, value):
        if key not in self:
            self.update({key: value})
        else:
            print("ERROR in Step")
            print("overwriting", key, "not allowed")
            import sys
            sys.exit(-9)

    def overwrite(self, keypair):
        # Alias keypair[0] to the step already stored under keypair[1].
        self.update({keypair[0]: self[keypair[1]]})
30 
class WF(list):
    """A single workflow: a list of step names plus its workflow number.

    Parameters
    ----------
    n : float  -- the workflow number
    l : list   -- the step names making up this workflow
    """
    def __init__(self, n, l):
        self.extend(l)
        self.num = n
        # the actual (resolved) steps of this WF, filled by interpret()
        self.steps = []
        self.overrides = {}

    def addOverride(self, overrides):
        self.overrides = overrides

    def interpret(self, stepsDict):
        """Resolve each step name against stepsDict into self.steps."""
        for s in self:
            print('steps', s, stepsDict[s])
            # Bug fix: was `steps.append(...)`, a NameError unless a global
            # `steps` happened to exist; the initialized-but-unused
            # self.steps is clearly the intended accumulator.
            self.steps.append(stepsDict[s])
45 
46 
47 
def expandLsInterval(lumis):
    """Expand a [first, last] lumisection pair into the inclusive range."""
    first, last = lumis[0], lumis[1]
    return range(first, last + 1)
50 
# Golden-json certification files, located via the CMSSW search path.
# NOTE(review): findFileInPath is defined/imported outside this chunk — confirm.
jsonFile2015 = findFileInPath("DPGAnalysis/Skims/data/Cert_13TeV_16Dec2015ReReco_Collisions15_25ns_50ns_JSON.txt")
jsonFile2016 = findFileInPath("DPGAnalysis/Skims/data/Cert_271036-274240_13TeV_PromptReco_Collisions16_JSON.txt")

import json
# Parsed golden-json content; per the selection code below, keys are run
# numbers as strings mapping to lists of [firstLS, lastLS] segments.
with open(jsonFile2015) as data_file:
    data_json2015 = json.load(data_file)

with open(jsonFile2016) as data_file:
    data_json2016 = json.load(data_file)
61 
# return a portion of the 2015 golden json
# LS for a full run by default; otherwise a subset of which you determined the size
def selectedLS(list_runs=[], maxNum=-1, l_json=data_json2015):
    """Return {run: [[firstLS, lastLS], ...]} for the requested runs.

    Parameters
    ----------
    list_runs : list of int -- runs to select from the json
    maxNum    : int -- approximate cap on the number of lumisections
                (-1, the default, means no cap; a full run per entry)
    l_json    : dict -- parsed golden json ({str(run): [LS segments]})

    Returns None (with a printed message) when nothing passes the selection.
    """
    # Robustness fix: the original indexed list_runs[0] unconditionally and
    # raised IndexError on an empty list.
    if not list_runs:
        print("ERROR: list_runs must be a list of integers")
        return None
    if not isinstance(list_runs[0], int):
        print("ERROR: list_runs must be a list of integers")
        return None
    local_dict = {}
    ls_count = 0

    for run in list_runs:
        if str(run) in l_json:
            runNumber = run
            for LSsegment in l_json[str(run)]:
                ls_count += (LSsegment[-1] - LSsegment[0] + 1)
                # Stop once the LS budget is exhausted (was a bitwise `&`
                # on booleans; `and` is the idiomatic, short-circuiting form).
                if ls_count > maxNum and maxNum != -1:
                    break
                if runNumber in local_dict:
                    local_dict[runNumber].append(LSsegment)
                else:
                    local_dict[runNumber] = [LSsegment]
        else:
            print("run %s is NOT present in json %s\n\n"%(run, l_json))

    if len(local_dict) > 0:
        return local_dict
    else:
        print("No luminosity section interval passed the json and your selection; returning None")
        return None
98 
99 # print "\n\n\n THIS IS WHAT I RETURN: %s \n\n"%( selectedLS([251244,251251]) )
100 
101 
102 
103 
# Default number of events requested for an InputInfo (2 million).
InputInfoNDefault=2000000
106  def __init__(self,dataSet,dataSetParent='',label='',run=[],ls={},files=1000,events=InputInfoNDefault,split=10,location='CAF',ib_blacklist=None,ib_block=None,skimEvents=False) :
107  self.run = run
108  self.ls = ls
109  self.files = files
110  self.events = events
111  self.location = location
112  self.label = label
113  self.dataSet = dataSet
114  self.split = split
115  self.ib_blacklist = ib_blacklist
116  self.ib_block = ib_block
117  self.dataSetParent = dataSetParent
118  self.skimEvents = skimEvents
119 
    def das(self, das_options, dataset):
        """Build the shell command that resolves this input into file names.

        The command pipes `dasgoclient` (or `das-up-to-nevents.py` when
        skimming by event count) through optional blacklist filtering and
        sorting helpers; the caller executes the returned string in a shell.
        """
        if not self.skimEvents and (len(self.run) != 0 or self.ls):
            # run- or LS-restricted query: one das query per run
            queries = self.queries(dataset)
            if len(self.run) != 0:
                command = ";".join(["dasgoclient %s --query '%s'" % (das_options, query) for query in queries])
            else:
                # LS selection: pair each per-run query with its lumi list
                # and filter via das-selected-lumis.py
                lumis = self.lumis()
                commands = []
                while queries:
                    commands.append("dasgoclient %s --query 'lumi,%s' --format json | das-selected-lumis.py %s " % (das_options, queries.pop(), lumis.pop()))
                command = ";".join(commands)
            # group the joined commands into a subshell
            command = "({0})".format(command)
        elif not self.skimEvents:
            command = "dasgoclient %s --query '%s'" % (das_options, self.queries(dataset)[0])
        elif self.skimEvents:
            from os import getenv
            if getenv("JENKINS_PREFIX") is not None:
                # to be assured that whatever happens the files are only those at CERN
                command = "das-up-to-nevents.py -d %s -e %d -pc"%(dataset,self.events)
            else:
                command = "das-up-to-nevents.py -d %s -e %d"%(dataset,self.events)
        # Run filter on DAS output
        if self.ib_blacklist:
            command += " | grep -E -v "
            command += " ".join(["-e '{0}'".format(pattern) for pattern in self.ib_blacklist])
        if not self.skimEvents:
            from os import getenv
            if getenv("CMSSW_USE_IBEOS","false")=="true":
                # route file access through ibeos when the IB EOS cache is enabled
                return "export CMSSW_USE_IBEOS=true; " + command + " | ibeos-lfn-sort"
            return command + " | sort -u"
        else:
            return command
152 
153  def lumiRanges(self):
154  if len(self.run) != 0:
155  return "echo '{\n"+",".join(('"%d":[[1,268435455]]\n'%(x,) for x in self.run))+"}'"
156  if self.ls :
157  return "echo '{\n"+",".join(('"%d" : %s\n'%( int(x),self.ls[x]) for x in self.ls.keys()))+"}'"
158  return None
159 
160  def lumis(self):
161  query_lumis = []
162  if self.ls:
163  for run in sorted(self.ls.keys()):
164  run_lumis = []
165  for rng in self.ls[run]:
166  if isinstance(rng, int):
167  run_lumis.append(str(rng))
168  else:
169  run_lumis.append(str(rng[0])+","+str(rng[1]))
170  query_lumis.append(":".join(run_lumis))
171  return query_lumis
172 
173  def queries(self, dataset):
174  query_by = "block" if self.ib_block else "dataset"
175  query_source = "{0}#{1}".format(dataset, self.ib_block) if self.ib_block else dataset
176 
177  if self.ls :
178  the_queries = []
179  #for query_run in self.ls.keys():
180  # print "run is %s"%(query_run)
181  # if you have a LS list specified, still query das for the full run (multiple ls queries take forever)
182  # and use step1_lumiRanges.log to run only on LS which respect your selection
183 
184  # DO WE WANT T2_CERN ?
185  return ["file {0}={1} run={2}".format(query_by, query_source, query_run) for query_run in sorted(self.ls.keys())]
186  #return ["file {0}={1} run={2} site=T2_CH_CERN".format(query_by, query_source, query_run) for query_run in self.ls.keys()]
187 
188 
189  #
190  #for a_range in self.ls[query_run]:
191  # # print "a_range is %s"%(a_range)
192  # the_queries += ["file {0}={1} run={2} lumi={3} ".format(query_by, query_source, query_run, query_ls) for query_ls in expandLsInterval(a_range) ]
193  #print the_queries
194  return the_queries
195 
196  site = " site=T2_CH_CERN"
197  if "CMSSW_DAS_QUERY_SITES" in os.environ:
198  if os.environ["CMSSW_DAS_QUERY_SITES"]:
199  site = " site=%s" % os.environ["CMSSW_DAS_QUERY_SITES"]
200  else:
201  site = ""
202  if len(self.run) != 0:
203  return ["file {0}={1} run={2}{3}".format(query_by, query_source, query_run, site) for query_run in self.run]
204  #return ["file {0}={1} run={2} ".format(query_by, query_source, query_run) for query_run in self.run]
205  else:
206  return ["file {0}={1}{2}".format(query_by, query_source, site)]
207  #return ["file {0}={1} ".format(query_by, query_source)]
208 
209  def __str__(self):
210  if self.ib_block:
211  return "input from: {0} with run {1}#{2}".format(self.dataSet, self.ib_block, self.run)
212  return "input from: {0} with run {1}".format(self.dataSet, self.run)
213 
214 
# merge dictionaries, with priority on the [0] index
def merge(dictlist, TELL=False):
    """Recursively merge a list of dicts; earlier entries win on key clashes.

    Returns a new dict (shallow copies); the inputs are not modified.
    Set TELL=True for debug printout of each recursion step.
    """
    import copy
    last = len(dictlist) - 1
    if TELL:
        print(last, dictlist)
    if last == 0:
        # single item left: return a shallow copy of it
        return copy.copy(dictlist[0])
    # fold the last two items into one (the earlier one taking priority)
    # and recurse on the shortened list
    remaining = dictlist[0:max(0, last - 1)]
    if TELL:
        print(remaining)
    folded = copy.copy(dictlist[last])
    folded.update(dictlist[last - 1])
    remaining.append(folded)
    return merge(remaining, TELL)
233 
def remove(d, key, TELL=False):
    """Return a deep copy of d with `key` deleted; d itself is untouched."""
    import copy
    clone = copy.deepcopy(d)
    if TELL:
        print("original dict, BEF: %s" % d)
    del clone[key]
    if TELL:
        print("copy-removed dict, AFT: %s" % clone)
    return clone
241 
242 
243 
244 
# Standard conditions option shared by Run-1 MC steps.
stCond={'--conditions':'auto:run1_mc'}
def Kby(N, s):
    """--relval shorthand: N thousand events total, s events per job."""
    return {'--relval': '%s000,%s' % (N, s)}
def Mby(N, s):
    """--relval shorthand: N million events total, s events per job."""
    return {'--relval': '%s000000,%s' % (N, s)}
250 
def changeRefRelease(steps, listOfPairs):
    """Rewrite reference-release strings in every step, in place.

    For each (old, new) pair, substitutes `old` with `new` in the step's
    INPUT dataset name and in its '--pileup_input' option.
    """
    for name in steps:
        step = steps[name]
        if 'INPUT' in step:
            oldDataSet = step['INPUT'].dataSet
            for ref, newRef in listOfPairs:
                if ref in oldDataSet:
                    step['INPUT'].dataSet = oldDataSet.replace(ref, newRef)
        if '--pileup_input' in step:
            for ref, newRef in listOfPairs:
                if ref in step['--pileup_input']:
                    step['--pileup_input'] = step['--pileup_input'].replace(ref, newRef)
262 
def addForAll(steps, d):
    """Merge the options in d into every step, in place."""
    for name in steps:
        steps[name].update(d)
266 
267 
def genvalid(fragment, d, suffix='all', fi='', dataSet=''):
    """Build a generator-validation step config from template dict d.

    Returns a shallow copy of d with the '-s' genvalid sequence suffixed,
    the input set from an LHE article number (fi) or a dataset name
    (dataSet takes precedence), and 'cfg' set to the given fragment.
    """
    import copy
    cfg = copy.copy(d)
    if suffix:
        cfg['-s'] = cfg['-s'].replace('genvalid', 'genvalid_' + suffix)
    if fi:
        cfg['--filein'] = 'lhe:%d' % (fi,)
    if dataSet:
        cfg['--filein'] = 'das:%s' % (dataSet,)
    cfg['cfg'] = fragment
    return cfg
279 
def check_dups(input):
    """Return the set of elements that occur more than once in `input`."""
    # (parameter name kept for interface compatibility, though it shadows
    # the builtin `input`)
    seen = set()
    dups = set()
    for item in input:
        if item in seen:
            dups.add(item)
        else:
            seen.add(item)
    return dups
def queries(self, dataset)
Definition: MatrixUtil.py:173
Definition: merge.py:1
def interpret(self, stepsDict)
Definition: MatrixUtil.py:41
def __setitem__(self, key, value)
Definition: MatrixUtil.py:16
def genvalid(fragment, d, suffix='all', fi='', dataSet='')
Definition: MatrixUtil.py:268
def overwrite(self, keypair)
Definition: MatrixUtil.py:27
def replace(string, replacements)
def __init__(self, n, l)
Definition: MatrixUtil.py:32
def lumiRanges(self)
Definition: MatrixUtil.py:153
def findFileInPath(theFile)
def expandLsInterval(lumis)
Definition: MatrixUtil.py:48
def addForAll(steps, d)
Definition: MatrixUtil.py:263
def das(self, das_options, dataset)
Definition: MatrixUtil.py:120
void print(TMatrixD &m, const char *label=nullptr, bool mathematicaFormat=false)
Definition: Utilities.cc:47
def __setitem__(self, key, value)
Definition: MatrixUtil.py:4
def check_dups(input)
Definition: MatrixUtil.py:280
static std::string join(char **cmd)
Definition: RemoteFile.cc:21
def selectedLS(list_runs=[], maxNum=-1, l_json=data_json2015)
Definition: MatrixUtil.py:64
def __init__(self, dataSet, dataSetParent='', label='', run=[], ls={}, files=1000, events=InputInfoNDefault, split=10, location='CAF', ib_blacklist=None, ib_block=None, skimEvents=False)
Definition: MatrixUtil.py:106
def remove(d, key, TELL=False)
Definition: MatrixUtil.py:234
def changeRefRelease(steps, listOfPairs)
Definition: MatrixUtil.py:251
#define update(a, b)
def Mby(N, s)
Definition: MatrixUtil.py:248
def addOverride(self, key, override)
Definition: MatrixUtil.py:11
def Kby(N, s)
Definition: MatrixUtil.py:246
def addOverride(self, overrides)
Definition: MatrixUtil.py:38
#define str(s)
def merge(dictlist, TELL=False)
Definition: MatrixUtil.py:216