ATLAS Offline Software
Loading...
Searching...
No Matches
python.HTCondorJobRunner.HTCondorJobRunner Class Reference
Inheritance diagram for python.HTCondorJobRunner.HTCondorJobRunner:
Collaboration diagram for python.HTCondorJobRunner.HTCondorJobRunner:

Public Member Functions

 __init__ (self, **params)
 submitJob (self, jobConfig)
 setParam (self, name, value=None, description=None, isSpecial=None, insertAtFront=False)
 appendParam (self, name, value=None, description=None, isSpecial=None, insertAtFront=False, endOfLine='\n')
 getParam (self, name)
 isSpecialParam (self, name)
 registerToBeCopied (self, paramName)
 checkParams (self)
 showParams (self, maxLineLength=80)
 dumpParams (self, format='%(name) -20s=%(value) s', maxLineLength=0)
 addFiles (self, fileList)
 addFilesToPoolFileCatalog (self, fileList)
 configureJob (self, jobnr, inputList=[])
 configure (self)
 runJob (self, jobnr)
 run (self, jobnr=None)
 getNJobs (self)
 getRunningJobs (self)
 wait (self)
 getOutputFiles (self)
 log (self, subject, body, **data)

Public Attributes

dict params = { }
list paramOrder = [ ]
list paramToBeCopied = [ ]
dict jobs = { }
dict jobStatus = { }

Private Attributes

 __class__

Detailed Description

HTCondorJobRunner - run jobs using the HTCondor batch system

Definition at line 28 of file HTCondorJobRunner.py.

Constructor & Destructor Documentation

◆ __init__()

python.HTCondorJobRunner.HTCondorJobRunner.__init__ ( self,
** params )
Constructor (takes any number of parameters as an argument).

Definition at line 31 of file HTCondorJobRunner.py.

31 def __init__(self,**params):
32 """Constructor (takes any number of parameters as an argument)."""
33 JobRunner.JobRunner.__init__(self)
34
35 # Set user-specified parameters only after HTCondorJobRunner defaults
36 self.setParam('batchqueue','workday','Batch queue')
37 for k in params.keys():
38 self.setParam(k,params[k])
39 self.checkParams()
40

Member Function Documentation

◆ addFiles()

python.JobRunner.JobRunner.addFiles ( self,
fileList )
inherited
Add a list of input files to be processed.

Definition at line 247 of file JobRunner.py.

247 def addFiles(self,fileList):
248 """ Add a list of input files to be processed."""
249 self.getParam('inputfiles').extend(fileList)
250
251

◆ addFilesToPoolFileCatalog()

python.JobRunner.JobRunner.addFilesToPoolFileCatalog ( self,
fileList )
inherited
Add a list of files to be inserted to the POOL file catalog.

Definition at line 252 of file JobRunner.py.

252 def addFilesToPoolFileCatalog(self,fileList):
253 """Add a list of files to be inserted to the POOL file catalog."""
254 self.getParam('filesforpoolcatalog').extend(fileList)
255
256

◆ appendParam()

python.JobRunner.JobRunner.appendParam ( self,
name,
value = None,
description = None,
isSpecial = None,
insertAtFront = False,
endOfLine = '\n' )
inherited
Append to the value of a job parameter. If the parameter doesn't exist yet,
   setParam is called to create it. If it does exist, only the value is updated
   and the description and flag arguments are ignored.

Definition at line 177 of file JobRunner.py.

177 def appendParam(self,name,value=None,description=None,isSpecial=None,insertAtFront=False,endOfLine='\n'):
178 """Append to the value of a job parameter. If the parameter doesn't exist yet,
179 setParam is called to create it. If it does exist, only the value is updated
180 and the description and flag arguments are ignored."""
181 if name in self.params:
182 if value is not None:
183 p = self.params[name]
184 if isinstance(p.value,str) and p.value:
185 p.value = p.value + endOfLine + value
186 else:
187 p.value = p.value + value
188 else:
189 self.setParam(name,value,description,isSpecial,insertAtFront)
190
191

◆ checkParams()

python.JobRunner.JobRunner.checkParams ( self)
inherited
A generic routine for checking job parameters. Check that all parameters
   can be evaluated. May be overrridden by a subclass if desired.

Definition at line 209 of file JobRunner.py.

209 def checkParams(self):
210 """A generic routine for checking job parameters. Check that all parameters
211 can be evaluated. May be overrridden by a subclass if desired."""
212 if len(self.paramOrder)!=len(self.params):
213 raise JobRunnerError ('Inconsistent parameter definition')
214 try:
215 tmp = { }
216 for p in self.paramOrder:
217 value = '' # this is necessary to prevent an exception from picking up the previous value
218 value = self.getParam(p)
219 if isinstance(value,str):
220 tmp[p] = value % tmp
221 else:
222 tmp[p] = value
223 except Exception:
224 raise JobRunnerError ('Unable to evaluate parameter: '+p+' = '+value+' (check parameter order)')
225
226

◆ configure()

python.JobRunner.JobRunner.configure ( self)
inherited
Configure all jobs.

Definition at line 374 of file JobRunner.py.

374 def configure(self):
375 """Configure all jobs."""
376 if self.getParam('filesperjob')==0 or not self.getParam('inputfiles'):
377 raise JobRunnerError ("No input files or illegal parameter 'filesperjob'")
378 lbperjob = self.getParam('lbperjob')
379 if lbperjob:
380 # Bunched job submission with all files from LB range in single job
381 if lbperjob<=0:
382 raise JobRunnerError ('Negative number of luminosity blocks per job not allowed')
383 inputfiles = self.getParam('inputfiles')
384 jobInputDict = {}
385 jobLBDict = {}
386 lbpattern = re.compile(r'lb(\d+)')
387 for f in inputfiles:
388 lbnrs = lbpattern.findall(f)
389
390 if(len(lbnrs) < 1) :
391 raise JobRunnerError ('Unable to determine luminosity block number of file %s' % f)
392
393 if(len(lbnrs) > 2) :
394 raise JobRunnerError ('Too many luminosity block numbers in filename %s' % f)
395
396 lbnr = int(lbnrs[0])
397 if(len(lbnrs) > 1) :
398 lbnrmax = int(lbnrs[1])
399 else :
400 lbnrmax = lbnr
401
402 while (lbnr <= lbnrmax) :
403
404 jobId = int((lbnr-1)/lbperjob)
405 #print ('LB = %4i jobid = %i' % (lbnr,jobId))
406 if jobId not in jobInputDict:
407 jobInputDict[jobId] = [f]
408 jobLBDict[jobId] = [lbnr]
409 else:
410 if f not in jobInputDict[jobId] :
411 jobInputDict[jobId].append(f)
412 if lbnr not in jobLBDict[jobId] :
413 jobLBDict[jobId].append(lbnr)
414
415 lbnr = lbnr+1
416
417 maxJobs = self.getParam('maxjobs')
418 if not maxJobs:
419 maxJobs = len(jobInputDict)
420 for i in sorted(jobInputDict.keys())[:maxJobs]:
421 if i<0:
422 jobnr = 0
423 else:
424 jobnr = i*lbperjob+1 # use first LB number as job number
425 self.setParam('lbList', jobLBDict[i])
426 self.configureJob(jobnr,jobInputDict[i])
427
428 else:
429 # Normal (unbunched job submission)
430 njobs = int(math.ceil(float(len(self.getParam('inputfiles')))/self.getParam('filesperjob')))
431 if self.getParam('maxjobs'):
432 njobs = min(self.getParam('maxjobs'),njobs)
433 print ('\nConfiguring %i job(s) ...' % (njobs))
434 for i in range(njobs):
435 self.configureJob(i)
436
437
if(febId1==febId2)
bool configure(asg::AnaToolHandle< ITrigGlobalEfficiencyCorrectionTool > &tool, ToolHandleArray< IAsgElectronEfficiencyCorrectionTool > &electronEffToolsHandles, ToolHandleArray< IAsgElectronEfficiencyCorrectionTool > &electronSFToolsHandles, ToolHandleArray< CP::IMuonTriggerScaleFactors > &muonToolsHandles, ToolHandleArray< IAsgPhotonEfficiencyCorrectionTool > &photonEffToolsHandles, ToolHandleArray< IAsgPhotonEfficiencyCorrectionTool > &photonSFToolsHandles, const std::string &triggers, const std::map< std::string, std::string > &legsPerTool, unsigned long nToys, bool debug)
#define min(a, b)
Definition cfImp.cxx:40

◆ configureJob()

python.JobRunner.JobRunner.configureJob ( self,
jobnr,
inputList = [] )
inherited
Configure parameters for a single job and write job configuration files. If inputLIst
   is given, this is the list of input files used for the job.

Definition at line 257 of file JobRunner.py.

257 def configureJob(self,jobnr,inputList=[]):
258 """Configure parameters for a single job and write job configuration files. If inputLIst
259 is given, this is the list of input files used for the job."""
260 if jobnr in self.jobs:
261 raise JobRunnerError ('Job number %s already configured' % jobnr)
262 jobConfig = { }
263
264 jobConfig['jobnr'] = jobnr
265 self.setParam('jobnr',jobnr)
266
267 # Check if any input files are available for this job
268 if inputList:
269 jobConfig['inputfiles'] = inputList
270 else:
271 inputfiles = self.getParam('inputfiles')
272 iFirst = self.getParam('filesperjob')*jobnr
273 if iFirst >= len(inputfiles):
274 raise JobRunnerError ('Jobnr = %i too high for available number of files' % jobnr)
275 iLast = iFirst + self.getParam('filesperjob')
276 if iLast > len(inputfiles):
277 iLast=len(inputfiles)
278 jobConfig['inputfiles'] = inputfiles[iFirst:iLast]
279
280 # Update regular parameters
281 for p in self.paramOrder:
282 if self.isSpecialParam(p): continue
283 value = self.getParam(p)
284 if isinstance(value,str):
285 jobConfig[p] = value % jobConfig
286 else:
287 jobConfig[p] = value
288
289 # Define statement to set up the release
290 if jobConfig['setuprelease']:
291 # Use explicit command if given
292 jobConfig['cmdsetup'] = self.getParam('cmdsetup') % jobConfig
293 # otherwise take from CMDSETUP env var if set or assume normal asetup
294 if not jobConfig['cmdsetup']:
295 jobConfig['cmdsetup'] = os.getenv('CMDSETUP','source /afs/cern.ch/atlas/software/dist/AtlasSetup/scripts/asetup.sh %(release)s --noautocdtest') % jobConfig
296 else:
297 jobConfig['cmdsetup'] = ''
298
299 # Collect files to be copied locally, and replace corresponding jobConfig
300 # parameters by base file name (to point to the local copy)
301 jobConfig['cmdcopyfiles'] = self.getParam('cmdcopyfiles') % jobConfig
302 if not jobConfig['cmdcopyfiles']:
303 filestobecopied = ''
304 for p in self.paramToBeCopied:
305 if not jobConfig[p]: continue
306 filestobecopied = ' '.join([filestobecopied,jobConfig[p]])
307 jobConfig[p] = os.path.basename(jobConfig[p])
308 if filestobecopied:
309 jobConfig['cmdcopyfiles'] = 'cp -p '+filestobecopied+' .'
310
311 # Unless the user sets a specific value for parameter cmddefinepoolcatalog, determine
312 # what should be added and create appropriate catalog
313 jobConfig['cmddefinepoolcatalog'] = self.getParam('cmddefinepoolcatalog') % jobConfig
314 if not jobConfig['cmddefinepoolcatalog']:
315 if jobConfig['addinputtopoolcatalog']:
316 argstring = ' '.join(jobConfig['filesforpoolcatalog']+jobConfig['inputfiles']) % jobConfig
317 else:
318 argstring = ' '.join(jobConfig['filesforpoolcatalog']) % jobConfig
319 if argstring:
320 jobConfig['cmddefinepoolcatalog'] = 'pool_insertFileToCatalog '+argstring
321
322 # Define statement used to exit the shell script
323 if jobConfig['returnstatuscode']:
324 jobConfig['cmdexit'] = self.getParam('cmdexit') % jobConfig
325 if not jobConfig['cmdexit']:
326 jobConfig['cmdexit'] = 'exit $status' % jobConfig
327 else:
328 jobConfig['cmdexit'] = ''
329
330 # Generate string with comma-separated list of output files with full name
331 jobConfig['outputfilestring'] = ','.join([jobConfig['outputfileprefix']+f for f in jobConfig['outputfilelist']])
332
333 # Update remaining special parameters
334 if jobConfig['taskpostprocsteps']:
335 jobConfig['doneflag'] = jobConfig['postprocflag']
336 else:
337 jobConfig['doneflag'] = jobConfig['completedflag']
338 jobConfig['script'] = self.getParam('script') % jobConfig
339
340 # Check if job's output files exist already in order to prevent overwriting of data
341 # NOTE: cannot just check for existence of jobdir, since this might be set to the
342 # current directory
343 for f in jobConfig['outputfilelist']:
344 if os.access(jobConfig['outputfileprefix']+f,os.F_OK):
345 raise JobRunnerError ('Job output file %s exists already' % jobConfig[f])
346 for f in ('configfile', 'scriptfile', 'logfile'):
347 if os.access(jobConfig[f],os.F_OK):
348 raise JobRunnerError ('Job configuration or log file %s exists already' % jobConfig[f])
349
350 # Make sure start directory where script and config files will be written to exists
351 os.makedirs('%(jobdir)s' % jobConfig)
352
353 # Write job configuration file
354 config = open(jobConfig['configfile'],'w')
355 config.write('# Job configuration data for job %(jobname)s\n' % jobConfig)
356 config.write('# Generated by JobRunner.py\n\n')
357 if pprint.isreadable(jobConfig):
358 config.write('jobConfig = '+pprint.pformat(jobConfig))
359 else:
360 config.write('jobConfig = '+repr(jobConfig))
361 config.write('\n')
362 config.close()
363
364 # Write script file
365 script = open(jobConfig['scriptfile'],'w')
366 script.write(jobConfig['script'])
367 script.close()
368 os.chmod(jobConfig['scriptfile'],0o755)
369
370 # Record job configuration
371 self.jobs[jobnr] = jobConfig
372
373

◆ dumpParams()

python.JobRunner.JobRunner.dumpParams ( self,
format = '%(name)-20s = %(value)s',
maxLineLength = 0 )
inherited
Dump all parameters into a string in a user-specified format.

Definition at line 236 of file JobRunner.py.

236 def dumpParams(self,format='%(name)-20s = %(value)s',maxLineLength=0):
237 """Dump all parameters into a string in a user-specified format."""
238 dump = ''
239 for p in self.paramOrder:
240 s = format % self.params[p].__dict__
241 if maxLineLength:
242 s = s[0:maxLineLength-3]+'...'
243 dump += s+'\n'
244 return dump
245
246

◆ getNJobs()

python.JobRunner.JobRunner.getNJobs ( self)
inherited

Definition at line 476 of file JobRunner.py.

476 def getNJobs(self):
477 if not self.jobs:
478 return 0
479 else:
480 return len(self.jobs)
481
482

◆ getOutputFiles()

python.JobRunner.JobRunner.getOutputFiles ( self)
inherited
Get a list of all output files.

Definition at line 503 of file JobRunner.py.

503 def getOutputFiles(self):
504 """Get a list of all output files."""
505 outputFiles = [ ]
506 for j in self.jobs:
507 for f in sorted(glob.glob(self.jobs[j]['outputfileprefix']+'*')):
508 outputFiles.append(f)
509 return outputFiles
510
511

◆ getParam()

python.JobRunner.JobRunner.getParam ( self,
name )
inherited
Get value of a parameter by name.

Definition at line 192 of file JobRunner.py.

192 def getParam(self,name):
193 """Get value of a parameter by name."""
194 return self.params[name].value
195
196

◆ getRunningJobs()

python.JobRunner.JobRunner.getRunningJobs ( self)
inherited
Get list of jobs submitted by this JobRunner that are still running

Definition at line 483 of file JobRunner.py.

483 def getRunningJobs(self):
484 """Get list of jobs submitted by this JobRunner that are still running"""
485 runningJobs = [ ]
486 for j in self.jobs:
487 if os.path.exists(self.jobs[j]['subflag']) or os.path.exists(self.jobs[j]['runflag']):
488 runningJobs.append(self.jobs[j]['jobname'])
489 return runningJobs
490
491

◆ isSpecialParam()

python.JobRunner.JobRunner.isSpecialParam ( self,
name )
inherited
Check if parameter requires special treatment.

Definition at line 197 of file JobRunner.py.

197 def isSpecialParam(self,name):
198 """Check if parameter requires special treatment."""
199 return self.params[name].isSpecial
200
201

◆ log()

python.JobRunner.JobRunner.log ( self,
subject,
body,
** data )
inherited
Send a log message to a set of users specified by parameter 'logmail'.

Definition at line 512 of file JobRunner.py.

512 def log(self,subject,body,**data):
513 """Send a log message to a set of users specified by parameter 'logmail'."""
514 if self.getParam('logmail'):
515 msg = 'Generated by JobRunner on host '+socket.gethostname()+' by '+pwd.getpwuid(os.getuid())[0]+' at '+time.asctime()
516 msg += '\n\nCurrent working directory = '+os.getcwd()
517 if body: msg += '\n\n'+body
518 for k in data.keys():
519 if isinstance(data[k],dict):
520 msg += "\n\n%s:" % k
521 items = data[k].keys()
522 items.sort()
523 for i in items:
524 msg += "\n %-20s = %s" % (i,data[k][i])
525 else:
526 msg += "\n\n%-20s = %s" % (k,data[k])
527 subprocess.call("echo '%s' | mail -s '%s' '%s'" %
528 (msg,subject,self.getParam('logmail')), shell=True)
529
530
531#
532# Test code
533#

◆ registerToBeCopied()

python.JobRunner.JobRunner.registerToBeCopied ( self,
paramName )
inherited
Register a parameter holding the name of an input file to be
   copied before a job starts.

Definition at line 202 of file JobRunner.py.

202 def registerToBeCopied(self,paramName):
203 """Register a parameter holding the name of an input file to be
204 copied before a job starts."""
205 if paramName not in self.paramToBeCopied:
206 self.paramToBeCopied.append(paramName)
207
208

◆ run()

python.JobRunner.JobRunner.run ( self,
jobnr = None )
inherited
Run all configured job(s)

Definition at line 465 of file JobRunner.py.

465 def run(self,jobnr=None):
466 """Run all configured job(s)"""
467 if not self.jobs:
468 raise JobRunnerError ('No configured jobs')
469 njobs = len(self.jobs)
470 self.log('JobRunner: starting '+str(njobs)+' jobs',self.dumpParams())
471 for j in sorted(self.jobs.keys()):
472 print ('\nStarting job %i (using %s) ...\n' % (j,self.__class__))
473 self.runJob(j)
474
475
Definition run.py:1

◆ runJob()

python.JobRunner.JobRunner.runJob ( self,
jobnr )
inherited
Run a single configured job.

Definition at line 455 of file JobRunner.py.

455 def runJob(self,jobnr):
456 """Run a single configured job."""
457 if jobnr not in self.jobs:
458 raise JobRunnerError ('Job number %s is not configured' % jobnr)
459 jobConfig = self.jobs[jobnr]
460 subprocess.call('touch '+jobConfig['subflag'], shell=True)
461 status = self.submitJob(jobConfig)
462 self.jobStatus[jobnr] = status
463
464

◆ setParam()

python.JobRunner.JobRunner.setParam ( self,
name,
value = None,
description = None,
isSpecial = None,
insertAtFront = False )
inherited
Set the value of a job parameter. Job parameters may be templates that name
   previously defined job parameters and will be evaluated when a given job
   is configured. Therefore the order in which setParam is called for the different
   parameters is relevant. insertAtFront can be set to True to force early
   evaluation of a given parameter.

Definition at line 157 of file JobRunner.py.

157 def setParam(self,name,value=None,description=None,isSpecial=None,insertAtFront=False):
158 """Set the value of a job parameter. Job parameters may be templates that name
159 previously defined job parameters and will be evaluated when a given job
160 is configured. Therefore the order in which setParam is called for the different
161 parameters is relevant. insertAtFront can be set to True to force early
162 evaluation of a given parameter."""
163 p = self.params[name] = self.params.get(name,JobRunnerParameter(name))
164 if value is not None:
165 p.value = value
166 if description is not None:
167 p.description = description
168 if isSpecial is not None:
169 p.isSpecial=isSpecial
170 if name not in self.paramOrder:
171 if insertAtFront:
172 self.paramOrder.insert(0,name)
173 else:
174 self.paramOrder.append(name)
175
176
T * get(TKey *tobj)
get a TObject* from a TKey* (why can't a TObject be a TKey?)
Definition hcg.cxx:130

◆ showParams()

python.JobRunner.JobRunner.showParams ( self,
maxLineLength = 80 )
inherited
Show current job parameters.

Definition at line 227 of file JobRunner.py.

227 def showParams(self,maxLineLength=80):
228 """Show current job parameters."""
229 for p in self.paramOrder:
230 s = str(self.params[p])
231 if maxLineLength > 0 and len(s) > maxLineLength:
232 s = s[0:maxLineLength-3] + '...'
233 print (s)
234
235

◆ submitJob()

python.HTCondorJobRunner.HTCondorJobRunner.submitJob ( self,
jobConfig )
Submit a JobRunner job as a LSF batch job.

Reimplemented from python.JobRunner.JobRunner.

Definition at line 41 of file HTCondorJobRunner.py.

41 def submitJob(self,jobConfig):
42 """Submit a JobRunner job as a LSF batch job."""
43 condorScript = condorScriptTemplate % jobConfig
44 print (condorScript)
45 script = open('condorSubmit.sub','w')
46 script.write(condorScript)
47 script.close()
48 os.chmod('condorSubmit.sub',0o755)
49 batchCmd = 'condor_submit condorSubmit.sub'
50 print (batchCmd )
51 os.system(batchCmd)
52 return None

◆ wait()

python.JobRunner.JobRunner.wait ( self)
inherited
Wait until all jobs have completed

Definition at line 492 of file JobRunner.py.

492 def wait(self):
493 """Wait until all jobs have completed"""
494 while 1:
495 time.sleep(30)
496 runningJobs = self.getRunningJobs()
497 if not runningJobs: break
498 print()
499 print (time.asctime(),' Waiting for %2s job(s) (%s)' % (len(runningJobs),runningJobs))
500 self.log('JobRunner: finished',self.dumpParams(),outputFiles=self.getOutputFiles())
501
502
void print(char *figname, TCanvas *c1)

Member Data Documentation

◆ __class__

python.JobRunner.JobRunner.__class__
privateinherited

Definition at line 472 of file JobRunner.py.

◆ jobs

python.JobRunner.JobRunner.jobs = { }
inherited

Definition at line 106 of file JobRunner.py.

◆ jobStatus

dict python.JobRunner.JobRunner.jobStatus = { }
inherited

Definition at line 107 of file JobRunner.py.

◆ paramOrder

python.JobRunner.JobRunner.paramOrder = [ ]
inherited

Definition at line 104 of file JobRunner.py.

◆ params

dict python.JobRunner.JobRunner.params = { }
inherited

Definition at line 103 of file JobRunner.py.

◆ paramToBeCopied

list python.JobRunner.JobRunner.paramToBeCopied = [ ]
inherited

Definition at line 105 of file JobRunner.py.


The documentation for this class was generated from the following file: