d3/d8b/edmStreamStallGrapher_8py_source.html

 #!/usr/bin/env python
 from __future__ import print_function
 from itertools import groupby
 from operator import attrgetter,itemgetter
 import sys
 from collections import defaultdict
 import six

 #----------------------------------------------
 def printHelp():
     """Return the multi-line usage text for this script (nothing is printed here)."""
     return '''
 To Use: Add the StallMonitor Service to the cmsRun job you want to check for
   stream stalls. Use something like this in the configuration:

   process.add_(cms.Service("StallMonitor", fileName = cms.untracked.string("stallMonitor.log")))

   After running the job, execute this script and pass the name of the
   StallMonitor log file to the script.

   By default, the script will then print an 'ASCII art' stall graph
   which consists of a line of text for each time a module or the
   source stops or starts. Each line contains the name of the module
   which either started or stopped running, and the number of modules
   running on each stream at that moment in time. After that will be
   the time and stream number. Then if a module just started, you
   will also see the amount of time the module spent between finishing
   its prefetching and starting.  The state of a module is represented
   by a symbol:

     plus  ("+") the stream has just finished waiting and is starting a module
     minus ("-") the stream just finished running a module

   If a module had to wait more than 0.1 seconds, the end of the line
   will have "STALLED". Startup actions, e.g. reading conditions,
   may affect results for the first few events.

   Using the command line arguments described above you can make the
   program create a PDF file with actual graphs instead of the 'ASCII art'
   output.

   Once the graph is completed, the program outputs the list of modules
   which had the greatest total stall times. The list is sorted by
   total stall time and written in descending order. In addition, the
   list of all stall times for the module is given.

   There is an inferior alternative (an old obsolete way).
   Instead of using the StallMonitor Service, you can use the
   Tracer Service.  Make sure to use the 'printTimestamps' option
   cms.Service("Tracer", printTimestamps = cms.untracked.bool(True))
   There are problems associated with this and it is not recommended.'''

 # A wait longer than this is reported as a stall (see findStalledModules
 # and createAsciiImage).
 kStallThreshold=100 #in milliseconds
 # Set to True by chooseParser() when the input is recognized as Tracer output.
 kTracerInput=False

 #Stream states
 # Transition codes carried as the second element of every processing-step
 # tuple produced by the parsers.
 kStarted=0                    # begin of module processing
 kFinished=1                   # end of module processing
 kPrefetchEnd=2                # end of module prefetching
 kStartedAcquire=3             # begin of module acquire function
 kFinishedAcquire=4            # end of module acquire function
 kStartedSource=5              # begin of event creation in source
 kFinishedSource=6             # end of event creation in source
 kStartedSourceDelayedRead=7   # begin of delayed read from source
 kFinishedSourceDelayedRead=8  # end of delayed read from source

 #Special names
 # Names used in place of a module name for the two kinds of source activity.
 kSourceFindEvent = "sourceFindEvent"
 kSourceDelayedRead ="sourceDelayedRead"

 #----------------------------------------------
 def processingStepsFromStallMonitorOutput(f,moduleNames):
     """Generate processing steps from the lines of a StallMonitor log.

     Blank lines, lines starting with '#' and 'E'/'e' records are skipped.
     Every other record has the form
         <step> <stream id> <..other fields..> <time since begin job>

     f           -- iterable of text lines
     moduleNames -- mapping from module ID (as written in the log) to module name

     Yields (name, transition, stream, time, isEvent) tuples. Records whose
     step letter is not recognized yield nothing.
     """
     for rawLine in f:
         line = rawLine.strip()
         if not line or line[0] == '#':
             continue
         step, rest = line.split(None, 1)
         fields = rest.split()

         # Ignore these
         if step in ('E', 'e'):
             continue

         # The stream id leads the payload and the timestamp closes it.
         stream = int(fields[0])
         time = int(fields[-1])
         trans = None
         name = None
         isEvent = True

         if step in ('S', 's'):
             # 'S' = begin of event creation in source
             # 's' = end of event creation in source; the start of an event
             #       is the end of the framework part
             name = kSourceFindEvent
             trans = kFinishedSource if step == 's' else kStartedSource
         else:
             # moduleID is the second payload argument for all steps below
             moduleID = fields[1]

             if step in ('p', 'M', 'm'):
                 # 'p' = end of module prefetching
                 # 'M' = begin of module processing
                 # 'm' = end of module processing
                 if step == 'p':
                     trans = kPrefetchEnd
                 else:
                     trans = kFinished if step == 'm' else kStarted
                     # third payload field equal to 0 marks an event transition
                     isEvent = (int(fields[2]) == 0)
                 name = moduleNames[moduleID]
             elif step in ('A', 'a'):
                 # 'A' = begin of module acquire function
                 # 'a' = end of module acquire function
                 trans = kFinishedAcquire if step == 'a' else kStartedAcquire
                 name = moduleNames[moduleID]
             elif step in ('R', 'r'):
                 # 'R' = begin of delayed read from source
                 # 'r' = end of delayed read from source
                 trans = kFinishedSourceDelayedRead if step == 'r' else kStartedSourceDelayedRead
                 name = kSourceDelayedRead

         if trans is None:
             continue
         yield (name, trans, stream, time, isEvent)

 class StallMonitorParser(object):
     """Scan a StallMonitor log once to learn the stream count and module names.

     The constructor reads f until the first 'M' record whose fourth
     space-separated field is '4' (global begin run) or until the end of the
     input, and sets:
       numStreams  -- stream count taken from that 'M' record, or else the
                      largest stream id seen on 'S' records plus one
       maxNameSize -- length of the longest module name, never less than
                      len(kSourceDelayedRead)
     """
     def __init__(self,f):
         numStreams = 0
         numStreamsFromSource = 0
         moduleNames = {}
         for rawl in f:
             l = rawl.strip()
             if l and l[0] == 'M':
                 i = l.split(' ')
                 if i[3] == '4':
                     #found global begin run
                     numStreams = int(i[1])+1
                     break
             if numStreams == 0 and l and l[0] == 'S':
                 s = int(l.split(' ')[1])
                 if s > numStreamsFromSource:
                     numStreamsFromSource = s
             if len(l) > 5 and l[0:2] == "#M":
                 # "#M <id> <name>" lines declare the module id -> name mapping
                 (moduleID,name)=tuple(l[2:].split())
                 moduleNames[moduleID] = name
         self._f = f
         if numStreams == 0:
             numStreams = numStreamsFromSource +1
         self.numStreams =numStreams
         self._moduleNames = moduleNames
         # Measure the names themselves. Iterating over the (id, name) items
         # would measure 2-tuples and always give a length of 2.
         nameLengths = [len(moduleName) for moduleName in moduleNames.values()]
         nameLengths.append(len(kSourceDelayedRead))
         self.maxNameSize = max(nameLengths)

     def processingSteps(self):
         """Create a generator which can step through the file and return each processing step.
         Using a generator reduces the memory overhead when parsing a large file.
             """
         self._f.seek(0)
         return processingStepsFromStallMonitorOutput(self._f,self._moduleNames)

 #----------------------------------------------
 # Utility to get time out of Tracer output text format
 def getTime(line):
     """Return the timestamp of a Tracer log line as integer milliseconds.

     The second space-separated field of line must look like HH:MM:SS[.fff].
     """
     fields = line.split(" ")[1].split(":")
     seconds = int(fields[0])*60*60 + int(fields[1])*60 + float(fields[2])
     # Round instead of truncating: the binary float product can land just
     # below the intended integer (1.001*1000 == 1000.9999999999999), which
     # would lose a millisecond.
     return int(round(1000*seconds))

 #----------------------------------------------
 # The next function parses the Tracer output.
 # Here are some differences to consider if you use Tracer output
 # instead of the StallMonitor output.
 # - The time in the text of the Tracer output is not as precise
 # as the StallMonitor (.01 s vs .001 s)
 # - The MessageLogger bases the time on when the message printed
 # and not when it was initially queued up to print which smears
 # the accuracy of the times.
 # - Both of the previous things can produce some strange effects
 # in the output plots.
 # - The file size of the Tracer text file is much larger.
 # - The CPU work needed to parse the Tracer files is larger.
 # - The Tracer log file is expected to have "++" in the first
 # or fifth line. If there are extraneous lines at the beginning
 # you have to remove them.
 # - The ASCII printout will have one extraneous line
 # near the end for the SourceFindEvent start.
 # - The only advantage I can see is that you have only
 # one output file to handle instead of two, the regular
 # log file and the StallMonitor output.
 # We should probably just delete the Tracer option because it is
 # clearly inferior ...
 def parseTracerOutput(f):
     """Parse the text output of the Tracer Service into processing steps.

     f -- iterable of log lines that also has close(); it is closed before
          this function returns.

     Returns (processingSteps, numStreams, maxNameSize). processingSteps is a
     list of (name, transition, stream, time, isEvent) tuples with time in
     milliseconds relative to the first recognized line and isEvent always True.
     """
     steps = []
     streamCount = 0
     longestName = 0
     firstTime = 0
     streamsWithFirstEvent = set()
     for line in f:
         trans = None
         # We estimate the start and stop of the source
         # by the end of the previous event and start of
         # the event. This is historical, probably because
         # the Tracer output for the begin and end of the
         # source event does not include the stream number.
         if "processing event :" in line:
             name = kSourceFindEvent
             # the end of the source is estimated using the start of the event
             trans = kFinishedSource if "starting:" in line else kStartedSource
         elif "processing event for module" in line:
             isPrefetch = "prefetching" in line
             if "finished:" in line:
                 trans = kPrefetchEnd if isPrefetch else kFinished
             elif isPrefetch:
                 #skip this since we don't care about prefetch starts
                 continue
             else:
                 trans = kStarted
             name = line.split("'")[1]
         elif "processing event acquire for module:" in line:
             trans = kFinishedAcquire if "finished:" in line else kStartedAcquire
             name = line.split("'")[1]
         elif "event delayed read from source" in line:
             trans = kFinishedSourceDelayedRead if "finished:" in line else kStartedSourceDelayedRead
             name = kSourceDelayedRead

         if trans is None:
             continue

         time = getTime(line)
         if firstTime == 0:
             firstTime = time
         time -= firstTime
         streamIndex = line.find("stream = ")
         stream = int(line[streamIndex+9:line.find(" ",streamIndex+10)])
         longestName = max(longestName, len(name))

         if trans == kFinishedSource and stream not in streamsWithFirstEvent:
             # This is wrong but there is no way to estimate the time better
             # because there is no previous event for the first event.
             steps.append((name,kStartedSource,stream,time,True))
             streamsWithFirstEvent.add(stream)

         steps.append((name,trans,stream,time,True))
         streamCount = max(streamCount, stream+1)

     f.close()
     return (steps,streamCount,longestName)

 class TracerParser(object):
     """Parser for Tracer output; the whole input is parsed when the object is built."""
     def __init__(self,f):
         steps, streamCount, nameSize = parseTracerOutput(f)
         self._processingSteps = steps
         self.numStreams = streamCount
         self.maxNameSize = nameSize

     def processingSteps(self):
         """Return the list of processing steps collected by the constructor."""
         return self._processingSteps

 #----------------------------------------------
 def chooseParser(inputFile):
     """Look at the first lines of inputFile and return the matching parser class.

     Returns StallMonitorParser when the first line contains "# Transition" or
     "# Step". Returns TracerParser (and sets the module-level kTracerInput to
     True) when the first or fifth line contains "++". In both cases inputFile
     is rewound to its beginning.

     For any other input the file is closed, a message is printed and the
     program exits with status 1 (SystemExit).
     """
     global kTracerInput

     firstLine = inputFile.readline().rstrip()
     for _ in range(3):
         inputFile.readline()
     # Often the Tracer log file starts with 4 lines not from the Tracer
     fifthLine = inputFile.readline().rstrip()
     inputFile.seek(0) # Rewind back to beginning
     if "# Transition" in firstLine or "# Step" in firstLine:
         print("> ... Parsing StallMonitor output.")
         return StallMonitorParser

     if "++" in firstLine or "++" in fifthLine:
         kTracerInput = True
         print("> ... Parsing Tracer output.")
         return TracerParser

     inputFile.close()
     print("Unknown input format.")
     # sys.exit instead of the bare exit(), which is only installed by the
     # site module for interactive use.
     sys.exit(1)

 #----------------------------------------------
 def readLogFile(inputFile):
     """Return a parser object built on inputFile, using the class picked by chooseParser."""
     parserClass = chooseParser(inputFile)
     parser = parserClass(inputFile)
     return parser

 #----------------------------------------------
 #
 # modules: The time between prefetch finished and 'start processing' is
 #   the time it took to acquire any resources which is by definition the
 #   stall time.
 #
 # source: The source just records how long it spent doing work,
 #   not how long it was stalled. We can get a lower bound on the stall
 #   time for delayed reads by measuring the time the stream was doing
 #   no work up till the start of the source delayed read.
 #
 def findStalledModules(processingSteps, numStreams):
     """Collect, per module name, every wait time above kStallThreshold.

     processingSteps -- iterable of (name, transition, stream, time, isEvent)
     numStreams      -- number of streams; stream ids index lists of this size

     For a module the wait is the time from its prefetch end to its start (or
     acquire start). For a source delayed read that begins while nothing is
     running on the stream, it is the time since the stream last finished
     something.

     Returns a dict mapping name -> list of wait times in the order seen.
     """
     streamTime = [0]*numStreams
     streamState = [0]*numStreams
     stalledModules = {}
     # range (not xrange) so the function also runs under Python 3
     modulesActiveOnStream = [{} for _ in range(numStreams)]
     for n,trans,s,time,isEvent in processingSteps:

         waitTime = None
         modulesOnStream = modulesActiveOnStream[s]
         if trans == kPrefetchEnd:
             modulesOnStream[n] = time
         elif trans == kStarted or trans == kStartedAcquire:
             if n in modulesOnStream:
                 waitTime = time - modulesOnStream.pop(n)
             streamState[s] +=1
         elif trans == kFinished or trans == kFinishedAcquire:
             streamState[s] -=1
             streamTime[s] = time
         elif trans == kStartedSourceDelayedRead:
             if streamState[s] == 0:
                 waitTime = time - streamTime[s]
         elif trans == kStartedSource:
             # a new event begins: forget prefetch times left from the old one
             modulesOnStream.clear()
         elif trans == kFinishedSource or trans == kFinishedSourceDelayedRead:
             streamTime[s] = time
         if waitTime is not None and waitTime > kStallThreshold:
             stalledModules.setdefault(n,[]).append(waitTime)
     return stalledModules


 def createModuleTiming(processingSteps, numStreams):
     """Write the run time of every module execution to 'module-timings.yaml'.

     processingSteps -- iterable of (name, transition, stream, time, isEvent)
     numStreams      -- number of streams; stream ids index a list of this size

     Only kStarted/kFinished transitions are used. For each kFinished the
     elapsed time since the matching kStarted on the same stream is recorded
     in seconds (input times are divided by 1000). A kFinished with no
     recorded start is measured from time 0.
     """
     import yaml
     moduleTimings = defaultdict(list)
     # range (not xrange) so the function also runs under Python 3
     modulesActiveOnStream = [defaultdict(int) for _ in range(numStreams)]
     for n,trans,s,time,isEvent in processingSteps:
         modulesOnStream = modulesActiveOnStream[s]
         if trans == kStarted:
             modulesOnStream[n]=time
         elif trans == kFinished:
             runTime = time - modulesOnStream.pop(n, 0)
             moduleTimings[n].append(runTime/1000.)
     with open('module-timings.yaml', 'w') as outfile:
         outfile.write(yaml.dump(moduleTimings, default_flow_style=True))

 #----------------------------------------------
 def createAsciiImage(processingSteps, numStreams, maxNameSize):
     """Print one text line per start/finish transition (the 'ASCII art' graph).

     processingSteps -- iterable of (name, transition, stream, time, isEvent)
     numStreams      -- number of streams; stream ids index lists of this size
     maxNameSize     -- width used to left-justify the name column

     Each line holds the name, "+" for a start or "-" otherwise, the count of
     running modules on every stream ("*" on the stream of a source find-event
     step), the time in seconds and the stream id. When a wait time is known
     it is appended, followed by "STALLED" if it exceeds kStallThreshold.
     Prefetch-end transitions are recorded but not printed.
     """
     streamTime = [0]*numStreams
     streamState = [0]*numStreams
     # range (not xrange) so the function also runs under Python 3
     modulesActiveOnStreams = [{} for _ in range(numStreams)]
     for n,trans,s,time,isEvent in processingSteps:
         waitTime = None
         modulesActiveOnStream = modulesActiveOnStreams[s]
         if trans == kPrefetchEnd:
             modulesActiveOnStream[n] = time
             continue
         elif trans == kStartedAcquire or trans == kStarted:
             if n in modulesActiveOnStream:
                 waitTime = time - modulesActiveOnStream.pop(n)
             streamState[s] +=1
         elif trans == kFinishedAcquire or trans == kFinished:
             streamState[s] -=1
             streamTime[s] = time
         elif trans == kStartedSourceDelayedRead:
             if streamState[s] == 0:
                 waitTime = time - streamTime[s]
         elif trans == kStartedSource:
             modulesActiveOnStream.clear()
         elif trans == kFinishedSource or trans == kFinishedSourceDelayedRead:
             streamTime[s] = time

         states = "%-*s: " % (maxNameSize,n)
         if trans in (kStartedAcquire, kStarted, kStartedSourceDelayedRead, kStartedSource):
             states +="+ "
         else:
             states +="- "
         for index, state in enumerate(streamState):
             if n==kSourceFindEvent and index == s:
                 states +="* "
             else:
                 states +=str(state)+" "
         states += " -- " + str(time/1000.) + " " + str(s) + " "
         if waitTime is not None:
             states += " %.2f"% (waitTime/1000.)
             if waitTime > kStallThreshold:
                 states += " STALLED"

         print(states)

 #----------------------------------------------
 def printStalledModulesInOrder(stalledModules):
     """Print a table of stalled modules, largest total stall time first.

     stalledModules -- mapping of module name -> list of stall times in
                       milliseconds; each list is sorted in place, descending.

     Each row shows the name, the total stall time and the individual stall
     times, all converted to seconds.
     """
     priorities = []
     maxNameSize = 0
     for name,t in stalledModules.items():
         maxNameSize = max(maxNameSize, len(name))
         t.sort(reverse=True)
         priorities.append((name,sum(t),t))

     # Order by total stall time. A key function replaces the Python-2-only
     # cmp()/sort(cmp=...) pair and gives the same (stable) ordering.
     priorities.sort(key=itemgetter(1), reverse=True)

     nameColumn = "Stalled Module"
     maxNameSize = max(maxNameSize, len(nameColumn))

     stallColumn = "Tot Stall Time"
     stallColumnLength = len(stallColumn)

     print("%-*s" % (maxNameSize, nameColumn), "%-*s"%(stallColumnLength,stallColumn), " Stall Times")
     for n,s,t in priorities:
         paddedName = "%-*s:" % (maxNameSize,n)
         print(paddedName, "%-*.2f"%(stallColumnLength,s/1000.), ", ".join([ "%.2f"%(x/1000.) for x in t]))

 #--------------------------------------------------------
 class Point:
     """A mutable pair of values stored as the attributes x and y."""
     def __init__(self, x_, y_):
         self.x, self.y = x_, y_

     def __str__(self):
         return "(x: {0.x}, y: {0.y})".format(self)

     def __repr__(self):
         # same text as __str__
         return self.__str__()

 #--------------------------------------------------------
 def reduceSortedPoints(ps):
     """Merge consecutive points that share the same x by summing their y.

     ps -- list of points already ordered by x.

     A list with fewer than two points is returned as is. Otherwise a new
     list of new Point objects is returned, without any merged point whose
     y summed to 0.
     """
     if len(ps) < 2:
         return ps
     merged = []
     for xValue, sameX in groupby(ps, key=attrgetter('x')):
         total = sum(p.y for p in sameX)
         if total != 0:
             merged.append(Point(xValue, total))
     return merged

 # -------------------------------------------
 def adjacentDiff(*pairLists):
     """Turn (begin, length, ...) entries into +1/-1 points ordered by x.

     For every entry whose second item is not 0, a Point(begin, 1) and a
     Point(sum(entry), -1) are produced. Entries from all given lists are
     combined and the result is sorted by x.
     """
     result = []
     for entries in pairLists:
         opening = [Point(entry[0], 1) for entry in entries if entry[1] != 0]
         closing = [Point(sum(entry), -1) for entry in entries if entry[1] != 0]
         result.extend(opening)
         result.extend(closing)
     result.sort(key=attrgetter('x'))
     return result

 # Label for the stack graph type; not referenced by the code visible in
 # this part of the file -- NOTE(review): confirm it is still used elsewhere.
 stackType = 'stack'

 # --------------------------------------------
 class Stack:
     """Ordered list of (graphType, points) layers, each built on top of the previous one."""
     def __init__(self):
         self.data = []

     def update(self, graphType, points):
         """Append a layer made of points plus the points of the last layer.

         Note that points itself is extended and sorted in place before the
         reduced result is stored.
         """
         combined = points
         if self.data:
             previousPoints = self.data[-1][1]
             combined += previousPoints

         combined.sort(key=attrgetter('x'))
         self.data.append((graphType, reduceSortedPoints(combined)))

 #---------------------------------------------
 # StreamInfoElement
 class StreamInfoElement:
     """One colored block on a stream: where it begins, how long it lasts, and its color."""
     def __init__(self, begin_, delta_, color_):
         self.begin, self.delta, self.color = begin_, delta_, color_

     def unpack(self):
         """Return the block as a (begin, delta, color) tuple."""
         return (self.begin, self.delta, self.color)

 #----------------------------------------------
 # Consolidating contiguous blocks with the same color
 # drastically reduces the size of the pdf file.
 def consolidateContiguousBlocks(numStreams, streamInfo):
     """Merge back-to-back blocks of the same color on every stream.

     numStreams -- number of streams to process
     streamInfo -- per-stream lists of StreamInfoElement; not modified

     Two neighbouring blocks are merged when they have the same color and the
     second begins exactly where the first ends. Returns a new list of
     per-stream lists holding new StreamInfoElement objects.
     """
     # range (not xrange) so the function also runs under Python 3
     consolidated = [[] for _ in range(numStreams)]

     for s in range(numStreams):
         elements = streamInfo[s]
         if not elements:
             continue
         lastStartTime,lastTimeLength,lastColor = elements[0].unpack()
         for info in elements[1:]:
             start,length,color = info.unpack()
             if color == lastColor and lastStartTime+lastTimeLength == start:
                 lastTimeLength += length
             else:
                 consolidated[s].append(StreamInfoElement(lastStartTime,lastTimeLength,lastColor))
                 lastStartTime = start
                 lastTimeLength = length
                 lastColor = color
         # flush the block still being accumulated
         consolidated[s].append(StreamInfoElement(lastStartTime,lastTimeLength,lastColor))

     return consolidated

 #----------------------------------------------
 # Consolidating contiguous blocks with the same color drastically
 # reduces the size of the pdf file.  Same functionality as the
 # previous function, but with slightly different implementation.
 def mergeContiguousBlocks(blocks):
     """Merge neighbouring (start, length, height) blocks that touch and share a height.

     A block is folded into the one before it when the heights are equal and
     it starts exactly where the previous one ends. Returns a new list of
     tuples; the input list is not modified.
     """
     merged = []
     for start, length, height in blocks:
         if merged:
             prevStart, prevLength, prevHeight = merged[-1]
             if height == prevHeight and prevStart + prevLength == start:
                 # extend the previous block instead of adding a new one
                 merged[-1] = (prevStart, prevLength + length, prevHeight)
                 continue
         merged.append((start, length, height))
     return merged

 #----------------------------------------------
 def plotPerStreamAboveFirstAndPrepareStack(points, allStackTimes, ax, stream, height, streamHeightCut, doPlot, addToStackTimes, color, threadOffset):
     """Plot the rows above the first one for a stream and/or feed the stack data.

     points          -- +1/-1 Point objects marking starts and finishes on the stream
     allStackTimes   -- dict color -> list of (begin, length); extended when
                        addToStackTimes is true
     ax              -- axes object on which broken_barh is called when doPlot is true
     stream, height  -- stream index and height of one row, used for the y span
     streamHeightCut -- intervals with fewer concurrent entries than this are dropped
     color           -- bar color and key into allStackTimes
     threadOffset    -- subtracted from the concurrency count to get how many
                        times an interval is added to allStackTimes
     """
     orderedPoints = reduceSortedPoints(sorted(points, key=attrgetter('x')))
     runningHeight = 0
     blocks = []
     for current, following in zip(orderedPoints, orderedPoints[1:]):
         runningHeight += current.y
         # We make a cut here when plotting because the first row for
         # each stream was already plotted previously and we do not
         # need to plot it again. And also we want to count things
         # properly in allStackTimes. We want to avoid double counting
         # or missing running modules and this is complicated because
         # we counted the modules in the first row already.
         if runningHeight >= streamHeightCut:
             blocks.append((current.x, following.x-current.x, runningHeight))
     # groupby below needs the blocks ordered by their height
     blocks.sort(key=itemgetter(2))
     blocks = mergeContiguousBlocks(blocks)

     for nthreads, sameHeight in groupby(blocks, itemgetter(2)):
         spans = [(block[0], block[1]) for block in sameHeight]
         if doPlot:
             spansInSeconds = [(begin/1000., length/1000.) for begin, length in spans]
             yspan = (stream-0.4+height, height*(nthreads-1))
             ax.broken_barh(spansInSeconds, yspan, facecolors=color, edgecolors=color, linewidth=0)
         if addToStackTimes:
             allStackTimes[color].extend(spans*(nthreads-threadOffset))

 #----------------------------------------------
 def createPDFImage(pdfFile, shownStacks, processingSteps, numStreams, stalledModuleInfo, displayExternalWork, checkOrder):
     """Draw the per-stream activity graph (and optionally a stack plot) and save it.

     pdfFile             -- output file name passed to plt.savefig
     shownStacks         -- when true, add a second plot with the stacked module counts
     processingSteps     -- iterable of (name, transition, stream, time, isEvent)
     numStreams          -- number of streams; stream ids index lists of this size
     stalledModuleInfo   -- mapping whose keys are the names of stalled modules
     displayExternalWork -- when true, track and label external work (after acquire)
     checkOrder          -- when true, drop transitions that arrive out of order

     Colors of the lowest row: green/limegreen = module running (event/other),
     red = a stalled module is running, orange = reading from the source,
     darkviolet = only external work. Blue marks multiple modules running.

     NOTE(review): relies on a module-level name plt (presumably
     matplotlib.pyplot) that is bound outside the code visible here.
     """

     stalledModuleNames = set(stalledModuleInfo)
     # range (not xrange) throughout so the function also runs under Python 3
     streamLowestRow = [[] for x in range(numStreams)]
     modulesActiveOnStreams = [set() for x in range(numStreams)]
     acquireActiveOnStreams = [set() for x in range(numStreams)]
     externalWorkOnStreams  = [set() for x in range(numStreams)]
     previousFinishTime = [None for x in range(numStreams)]
     streamRunningTimes = [[] for x in range(numStreams)]
     streamExternalWorkRunningTimes = [[] for x in range(numStreams)]
     maxNumberOfConcurrentModulesOnAStream = 1
     externalWorkModulesInJob = False
     previousTime = [0 for x in range(numStreams)]

     # The next five variables are only used to check for out of order transitions
     finishBeforeStart = [set() for x in range(numStreams)]
     finishAcquireBeforeStart = [set() for x in range(numStreams)]
     countSource = [0 for x in range(numStreams)]
     countDelayedSource = [0 for x in range(numStreams)]
     countExternalWork = [defaultdict(int) for x in range(numStreams)]

     timeOffset = None
     for n,trans,s,time,isEvent in processingSteps:
         if timeOffset is None:
             # times are plotted relative to the first step
             timeOffset = time
         startTime = None
         time -=timeOffset
         # force the time to monotonically increase on each stream
         if time < previousTime[s]:
             time = previousTime[s]
         previousTime[s] = time

         activeModules = modulesActiveOnStreams[s]
         acquireModules = acquireActiveOnStreams[s]
         externalWorkModules = externalWorkOnStreams[s]

         if trans == kStarted or trans == kStartedSourceDelayedRead or trans == kStartedAcquire or trans == kStartedSource :
             if checkOrder:
                 # Note that the code which checks the order of transitions assumes that
                 # all the transitions exist in the input. It is checking only for order
                 # problems, usually a start before a finish. Problems are fixed and
                 # silently ignored. Nothing gets plotted for transitions that are
                 # in the wrong order.
                 if trans == kStarted:
                     countExternalWork[s][n] -= 1
                     if n in finishBeforeStart[s]:
                         finishBeforeStart[s].remove(n)
                         continue
                 elif trans == kStartedAcquire:
                     if n in finishAcquireBeforeStart[s]:
                         finishAcquireBeforeStart[s].remove(n)
                         continue

             if trans == kStartedSourceDelayedRead:
                 countDelayedSource[s] += 1
                 if countDelayedSource[s] < 1:
                     continue
             elif trans == kStartedSource:
                 countSource[s] += 1
                 if countSource[s] < 1:
                     continue

             # snapshot of what was running before this start
             moduleNames = activeModules.copy()
             moduleNames.update(acquireModules)
             if trans == kStartedAcquire:
                 acquireModules.add(n)
             else:
                 activeModules.add(n)
             streamRunningTimes[s].append(Point(time,1))
             if moduleNames or externalWorkModules:
                 startTime = previousFinishTime[s]
             previousFinishTime[s] = time

             if trans == kStarted and n in externalWorkModules:
                 externalWorkModules.remove(n)
                 streamExternalWorkRunningTimes[s].append(Point(time, -1))
             else:
                 nTotalModules = len(activeModules) + len(acquireModules) + len(externalWorkModules)
                 maxNumberOfConcurrentModulesOnAStream = max(maxNumberOfConcurrentModulesOnAStream, nTotalModules)
         elif trans == kFinished or trans == kFinishedSourceDelayedRead or trans == kFinishedAcquire or trans == kFinishedSource :
             if checkOrder:
                 if trans == kFinished:
                     if n not in activeModules:
                         finishBeforeStart[s].add(n)
                         continue

             if trans == kFinishedSourceDelayedRead:
                 countDelayedSource[s] -= 1
                 if countDelayedSource[s] < 0:
                     continue
             elif trans == kFinishedSource:
                 countSource[s] -= 1
                 if countSource[s] < 0:
                     continue

             if trans == kFinishedAcquire:
                 if checkOrder:
                     countExternalWork[s][n] += 1
                 if displayExternalWork:
                     externalWorkModulesInJob = True
                     if (not checkOrder) or countExternalWork[s][n] > 0:
                         externalWorkModules.add(n)
                         streamExternalWorkRunningTimes[s].append(Point(time,+1))
                 if checkOrder and n not in acquireModules:
                     finishAcquireBeforeStart[s].add(n)
                     continue
             streamRunningTimes[s].append(Point(time,-1))
             startTime = previousFinishTime[s]
             previousFinishTime[s] = time
             # snapshot of what was running up to this finish
             moduleNames = activeModules.copy()
             moduleNames.update(acquireModules)

             if trans == kFinishedAcquire:
                 acquireModules.remove(n)
             elif trans == kFinishedSourceDelayedRead:
                 if countDelayedSource[s] == 0:
                     activeModules.remove(n)
             elif trans == kFinishedSource:
                 if countSource[s] == 0:
                     activeModules.remove(n)
             else:
                 activeModules.remove(n)

         if startTime is not None:
             c="green"
             if not isEvent:
                 c="limegreen"
             if not moduleNames:
                 c = "darkviolet"
             elif (kSourceDelayedRead in moduleNames) or (kSourceFindEvent in moduleNames):
                 c = "orange"
             else:
                 # separate loop variable so the step name n is not overwritten
                 for moduleName in moduleNames:
                     if moduleName in stalledModuleNames:
                         c="red"
                         break
             streamLowestRow[s].append(StreamInfoElement(startTime, time-startTime, c))
     streamLowestRow = consolidateContiguousBlocks(numStreams, streamLowestRow)

     nr = 1
     if shownStacks:
         nr += 1
     fig, ax = plt.subplots(nrows=nr, squeeze=True)
     axStack = None
     if shownStacks:
         [xH,yH] = fig.get_size_inches()
         fig.set_size_inches(xH,yH*4/3)
         ax = plt.subplot2grid((4,1),(0,0), rowspan=3)
         axStack = plt.subplot2grid((4,1),(3,0))

     ax.set_xlabel("Time (sec)")
     ax.set_ylabel("Stream ID")
     ax.set_ylim(-0.5,numStreams-0.5)
     ax.yaxis.set_ticks(list(range(numStreams)))

     height = 0.8/maxNumberOfConcurrentModulesOnAStream
     allStackTimes={'green': [],'limegreen':[], 'red': [], 'blue': [], 'orange': [], 'darkviolet': []}
     for iStream,lowestRow in enumerate(streamLowestRow):
         times=[(x.begin/1000., x.delta/1000.) for x in lowestRow] # Scale from msec to sec.
         colors=[x.color for x in lowestRow]
         # for each stream, plot the lowest row
         ax.broken_barh(times,(iStream-0.4,height),facecolors=colors,edgecolors=colors,linewidth=0)
         # record them also for inclusion in the stack plot
         # the darkviolet ones get counted later so do not count them here
         for info in lowestRow:
             if not info.color == 'darkviolet':
                 allStackTimes[info.color].append((info.begin, info.delta))

     # Now superimpose the number of concurrently running modules on to the graph.
     if maxNumberOfConcurrentModulesOnAStream > 1 or externalWorkModulesInJob:

         for i,perStreamRunningTimes in enumerate(streamRunningTimes):

             perStreamTimesWithExtendedWork = list(perStreamRunningTimes)
             perStreamTimesWithExtendedWork.extend(streamExternalWorkRunningTimes[i])

             plotPerStreamAboveFirstAndPrepareStack(perStreamTimesWithExtendedWork,
                                                    allStackTimes, ax, i, height,
                                                    streamHeightCut=2,
                                                    doPlot=True,
                                                    addToStackTimes=False,
                                                    color='darkviolet',
                                                    threadOffset=1)

             plotPerStreamAboveFirstAndPrepareStack(perStreamRunningTimes,
                                                    allStackTimes, ax, i, height,
                                                    streamHeightCut=2,
                                                    doPlot=True,
                                                    addToStackTimes=True,
                                                    color='blue',
                                                    threadOffset=1)

             plotPerStreamAboveFirstAndPrepareStack(streamExternalWorkRunningTimes[i],
                                                    allStackTimes, ax, i, height,
                                                    streamHeightCut=1,
                                                    doPlot=False,
                                                    addToStackTimes=True,
                                                    color='darkviolet',
                                                    threadOffset=0)

     if shownStacks:
         print("> ... Generating stack")
         stack = Stack()
         for color in ['green','limegreen','blue','red','orange','darkviolet']:
             tmp = allStackTimes[color]
             tmp = reduceSortedPoints(adjacentDiff(tmp))
             stack.update(color, tmp)

         for stk in reversed(stack.data):
             color = stk[0]

             # Now arrange list in a manner that it can be grouped by the height of the block
             height = 0
             xs = []
             for p1,p2 in zip(stk[1], stk[1][1:]):
                 height += p1.y
                 xs.append((p1.x, p2.x-p1.x, height))
             xs.sort(key = itemgetter(2))
             xs = mergeContiguousBlocks(xs)

             for height, xpairs in groupby(xs, itemgetter(2)):
                 finalxs = [(e[0]/1000.,e[1]/1000.) for e in xpairs]
                 # plot the stacked plot, one color and one height on each call to broken_barh
                 axStack.broken_barh(finalxs, (0, height), facecolors=color, edgecolors=color, linewidth=0)

         axStack.set_xlabel("Time (sec)")
         axStack.set_ylabel("# modules")
         axStack.set_xlim(ax.get_xlim())
         # a real boolean: the 'on'/'off' strings are deprecated in matplotlib
         axStack.tick_params(top=False)

     fig.text(0.1, 0.95, "modules running event", color = "green", horizontalalignment = 'left')
     fig.text(0.1, 0.92, "modules running other", color = "limegreen", horizontalalignment = 'left')
     fig.text(0.5, 0.95, "stalled module running", color = "red", horizontalalignment = 'center')
     fig.text(0.9, 0.95, "read from input", color = "orange", horizontalalignment = 'right')
     fig.text(0.5, 0.92, "multiple modules running", color = "blue", horizontalalignment = 'center')
     if displayExternalWork:
         fig.text(0.9, 0.92, "external work", color = "darkviolet", horizontalalignment = 'right')
     print("> ... Saving to file: '{}'".format(pdfFile))
     plt.savefig(pdfFile)

 #=======================================
 if __name__=="__main__":
     # Command-line driver: parse the options, read the log file, then emit
     # either the ASCII-art stall graph or a graphic file, followed by the list
     # of stalled modules and (optionally) the per-module timing dump.
     import argparse
     import re
     import sys

     # Program options
     # The value returned by printHelp() is used verbatim as the epilog
     # (RawDescriptionHelpFormatter keeps its line breaks).
     parser = argparse.ArgumentParser(description='Convert a text file created by cmsRun into a stream stall graph.',
                                      formatter_class=argparse.RawDescriptionHelpFormatter,
                                      epilog=printHelp())
     parser.add_argument('filename',
                         type=argparse.FileType('r'), # open file
                         help='file to process')
     parser.add_argument('-g', '--graph',
                         nargs='?',
                         metavar="'stall.pdf'",
                         const='stall.pdf',
                         dest='graph',
                         help='''Create pdf file of stream stall graph.  If -g is specified
                         by itself, the default file name is \'stall.pdf\'.  Otherwise, the
                         argument to the -g option is the filename.''')
     parser.add_argument('-s', '--stack',
                         action='store_true',
                         help='''Create stack plot, combining all stream-specific info.
                         Can be used only when -g is specified.''')
     # store_false: args.external is True unless -e is given, i.e. external
     # work is displayed by default and -e switches it off.
     parser.add_argument('-e', '--external',
                         action='store_false',
                         help='''Suppress display of external work in graphs.''')
     parser.add_argument('-o', '--order',
                         action='store_true',
                         help='''Enable checks for and repair of transitions in the input that are in the wrong order (for example a finish transition before a corresponding start). This is always enabled for Tracer input, but is usually an unnecessary waste of CPU time and memory with StallMonitor input and by default not enabled.''')
     # NOTE(review): the help text below says 'modules-timings.yaml' while the
     # status message printed further down says 'module-timings.yaml'; confirm
     # the real name against createModuleTiming() and align both strings.
     parser.add_argument('-t', '--timings',
                         action='store_true',
                         help='''Create a dictionary of module labels and their timings from the stall monitor log. Write the dictionary file as a yaml file modules-timings.yaml.''')
     args = parser.parse_args()

     # Process parsed options
     inputFile = args.filename
     pdfFile = args.graph
     shownStacks = args.stack
     displayExternalWork = args.external
     checkOrder = args.order
     doModuleTimings = args.timings

     # A graphic is produced only when -g was given (pdfFile stays None otherwise).
     doGraphic = pdfFile is not None
     if doGraphic:
         import matplotlib
         # Need to force display since problems with CMSSW matplotlib.
         matplotlib.use("PDF")
         import matplotlib.pyplot as plt
         if not re.match(r'^[\w\.]+$', pdfFile):
             print("Malformed file name '{}' supplied with the '-g' option.".format(pdfFile))
             print("Only characters 0-9, a-z, A-Z, '_', and '.' are allowed.")
             # sys.exit rather than the bare exit(): the latter is injected by
             # the 'site' module and is not guaranteed to exist in every run mode.
             sys.exit(1)

         if '.' in pdfFile:
             extension = pdfFile.split('.')[-1]
             # A throw-away figure is needed only to ask its canvas which
             # output formats are available; close it again so it does not
             # linger as an extra open figure.
             probeFigure = plt.figure()
             supported_filetypes = probeFigure.canvas.get_supported_filetypes()
             plt.close(probeFigure)
             if extension not in supported_filetypes:
                 print("A graph cannot be saved to a filename with extension '{}'.".format(extension))
                 print("The allowed extensions are:")
                 for filetype in supported_filetypes:
                     print("   '.{}'".format(filetype))
                 sys.exit(1)

     if pdfFile is None and shownStacks:
         print("The -s (--stack) option can be used only when the -g (--graph) option is specified.")
         sys.exit(1)

     sys.stderr.write(">reading file: '{}'\n".format(inputFile.name))
     reader = readLogFile(inputFile)
     # kTracerInput is a module-level flag defined elsewhere in this file
     # (presumably set while the log is read -- verify); ordering checks are
     # forced on whenever it is true.
     if kTracerInput:
         checkOrder = True
     sys.stderr.write(">processing data\n")
     stalledModules = findStalledModules(reader.processingSteps(), reader.numStreams)


     # reader.processingSteps() is called afresh for every consumer below.
     if not doGraphic:
         sys.stderr.write(">preparing ASCII art\n")
         createAsciiImage(reader.processingSteps(), reader.numStreams, reader.maxNameSize)
     else:
         sys.stderr.write(">creating PDF\n")
         createPDFImage(pdfFile, shownStacks, reader.processingSteps(), reader.numStreams, stalledModules, displayExternalWork, checkOrder)
     printStalledModulesInOrder(stalledModules)
     if doModuleTimings:
         sys.stderr.write(">creating module-timings.yaml\n")
         createModuleTiming(reader.processingSteps(), reader.numStreams)
edmStreamStallGrapher.createPDFImage
def createPDFImage(pdfFile, shownStacks, processingSteps, numStreams, stalledModuleInfo, displayExternalWork, checkOrder)
Definition: edmStreamStallGrapher.py:578

edmStreamStallGrapher.StallMonitorParser.maxNameSize
maxNameSize
Definition: edmStreamStallGrapher.py:165

edmStreamStallGrapher.StreamInfoElement.delta
delta
Definition: edmStreamStallGrapher.py:495

edmStreamStallGrapher.Point
Definition: edmStreamStallGrapher.py:438

edmStreamStallGrapher.Stack.update
def update(self, graphType, points)
Definition: edmStreamStallGrapher.py:481

edmStreamStallGrapher.Point.y
y
Definition: edmStreamStallGrapher.py:441

edmStreamStallGrapher.Point.x
x
Definition: edmStreamStallGrapher.py:440

edmStreamStallGrapher.findStalledModules
def findStalledModules(processingSteps, numStreams)
Definition: edmStreamStallGrapher.py:316

edmStreamStallGrapher.mergeContiguousBlocks
def mergeContiguousBlocks(blocks)
Definition: edmStreamStallGrapher.py:528

edmStreamStallGrapher.consolidateContiguousBlocks
def consolidateContiguousBlocks(numStreams, streamInfo)
Definition: edmStreamStallGrapher.py:504

edm::print
S & print(S &os, JobReport::InputFile const &f)
Definition: JobReport.cc:66

edmStreamStallGrapher.StreamInfoElement.begin
begin
Definition: edmStreamStallGrapher.py:494

edmStreamStallGrapher.Stack.__init__
def __init__(self)
Definition: edmStreamStallGrapher.py:478

edmStreamStallGrapher.StallMonitorParser
Definition: edmStreamStallGrapher.py:139

edmStreamStallGrapher.StreamInfoElement.__init__
def __init__(self, begin_, delta_, color_)
Definition: edmStreamStallGrapher.py:493

edmStreamStallGrapher.TracerParser.maxNameSize
maxNameSize
Definition: edmStreamStallGrapher.py:273

createfilelist.int
int
Definition: createfilelist.py:10

ComparisonHelper::zip
OutputIterator zip(InputIterator1 first1, InputIterator1 last1, InputIterator2 first2, InputIterator2 last2, OutputIterator result, Compare comp)
Definition: L1TStage2CaloLayer1.h:38

edmStreamStallGrapher.Point.__str__
def __str__(self)
Definition: edmStreamStallGrapher.py:443

edmStreamStallGrapher.StreamInfoElement.color
color
Definition: edmStreamStallGrapher.py:496

edmStreamStallGrapher.chooseParser
def chooseParser(inputFile)
Definition: edmStreamStallGrapher.py:278

edmStreamStallGrapher.StallMonitorParser._f
_f
Definition: edmStreamStallGrapher.py:160

edmStreamStallGrapher.createModuleTiming
def createModuleTiming(processingSteps, numStreams)
Definition: edmStreamStallGrapher.py:349

objects.autophobj.float
float
Definition: autophobj.py:147

edmStreamStallGrapher.StallMonitorParser._moduleNames
_moduleNames
Definition: edmStreamStallGrapher.py:164

edmStreamStallGrapher.Point.__repr__
def __repr__(self)
Definition: edmStreamStallGrapher.py:446

edmStreamStallGrapher.printHelp
def printHelp()
Definition: edmStreamStallGrapher.py:10

SiStripPI::max
Definition: SiStripPayloadInspectorHelper.h:178

edmStreamStallGrapher.printStalledModulesInOrder
def printStalledModulesInOrder(stalledModules)
Definition: edmStreamStallGrapher.py:414

edmStreamStallGrapher.Stack
Definition: edmStreamStallGrapher.py:477

edmStreamStallGrapher.createAsciiImage
def createAsciiImage(processingSteps, numStreams, maxNameSize)
Definition: edmStreamStallGrapher.py:370

edmStreamStallGrapher.reduceSortedPoints
def reduceSortedPoints(ps)
Definition: edmStreamStallGrapher.py:450

PVValHelper::add
void add(std::map< std::string, TH1 * > &h, TH1 *hist)
Definition: PVValidationHelpers.cc:12

edmStreamStallGrapher.StallMonitorParser.numStreams
numStreams
Definition: edmStreamStallGrapher.py:163

edmStreamStallGrapher.TracerParser.__init__
def __init__(self, f)
Definition: edmStreamStallGrapher.py:272

mps_setup.append
append
Definition: mps_setup.py:84

join
static std::string join(char **cmd)
Definition: RemoteFile.cc:18

edmStreamStallGrapher.TracerParser
Definition: edmStreamStallGrapher.py:271

edmStreamStallGrapher.StallMonitorParser.processingSteps
def processingSteps(self)
Definition: edmStreamStallGrapher.py:170

edmStreamStallGrapher.processingStepsFromStallMonitorOutput
def processingStepsFromStallMonitorOutput(f, moduleNames)
Definition: edmStreamStallGrapher.py:72

edmStreamStallGrapher.TracerParser.processingSteps
def processingSteps(self)
Definition: edmStreamStallGrapher.py:274

MatrixUtil.remove
def remove(d, key, TELL=False)
Definition: MatrixUtil.py:212

cmsRelvalreport.exit
exit
Definition: cmsRelvalreport.py:1001

edmStreamStallGrapher.readLogFile
def readLogFile(inputFile)
Definition: edmStreamStallGrapher.py:301

edmStreamStallGrapher.getTime
def getTime(line)
Definition: edmStreamStallGrapher.py:179

edmStreamStallGrapher.Point.__init__
def __init__(self, x_, y_)
Definition: edmStreamStallGrapher.py:439

edmStreamStallGrapher.StreamInfoElement.unpack
def unpack(self)
Definition: edmStreamStallGrapher.py:498

edmStreamStallGrapher.StallMonitorParser.__init__
def __init__(self, f)
Definition: edmStreamStallGrapher.py:140

format

edmStreamStallGrapher.adjacentDiff
def adjacentDiff(pairLists)
Definition: edmStreamStallGrapher.py:466

edmStreamStallGrapher.plotPerStreamAboveFirstAndPrepareStack
def plotPerStreamAboveFirstAndPrepareStack(points, allStackTimes, ax, stream, height, streamHeightCut, doPlot, addToStackTimes, color, threadOffset)
Definition: edmStreamStallGrapher.py:549

str
#define str(s)
Definition: TestProcessor.cc:47

edmStreamStallGrapher.Stack.data
data
Definition: edmStreamStallGrapher.py:479

split
double split
Definition: MVATrainer.cc:139

resolutioncreator_cfi.object
object
Definition: resolutioncreator_cfi.py:4

edmStreamStallGrapher.StreamInfoElement
Definition: edmStreamStallGrapher.py:492

list
How EventSelector::AcceptEvent() decides whether to accept an event for output otherwise it is excluding the probing of A single or multiple positive and the trigger will pass if any such matching triggers are PASS or EXCEPTION[A criterion thatmatches no triggers at all is detected and causes a throw.] A single negative with an expectation of appropriate bit checking in the decision and the trigger will pass if any such matching triggers are FAIL or EXCEPTION A wildcarded negative criterion that matches more than one trigger in the trigger list("!*","!HLTx*"if it matches 2 triggers or more) will accept the event if all the matching triggers are FAIL.It will reject the event if any of the triggers are PASS or EXCEPTION(this matches the behavior of"!*"before the partial wildcard feature was incorporated).Triggers which are in the READY state are completely ignored.(READY should never be returned since the trigger paths have been run

edmStreamStallGrapher.parseTracerOutput
def parseTracerOutput(f)
Definition: edmStreamStallGrapher.py:209

timeUnitHelper.unpack
def unpack(i)
Definition: timeUnitHelper.py:17