   2     from crab_logger import Logger
   3     from crab_exceptions import *
   4     from crab_util import *
   5  +  from BlackWhiteListParser import BlackWhiteListParser
   6     import common
   6  -  import PsetManipulator
   7  -  import DataDiscovery
   8  -  import DataDiscovery_DBS2
   9  -  import DataLocation
   7     import Scram
   8
   9  <  import os, string, re, shutil, glob
   9  >  import os, string, glob
  10
  11     class Cmssw(JobType):
  12         def __init__(self, cfg_params, ncjobs):
  13             JobType.__init__(self, 'CMSSW')
  14             common.logger.debug(3,'CMSSW::__init__')
  15
  19  -          # Marco.
  16             self._params = {}
  17             self.cfg_params = cfg_params
  18
  19  +          # init BlackWhiteListParser
  20  +          self.blackWhiteListParser = BlackWhiteListParser(cfg_params)
  21  +
  22             try:
  23                 self.MaxTarBallSize = float(self.cfg_params['EDG.maxtarballsize'])
  24             except KeyError:
  25  <              self.MaxTarBallSize = 100.0
  25  >              self.MaxTarBallSize = 9.5
  26
  27             # number of jobs requested to be created, limit obj splitting
  28             self.ncjobs = ncjobs
  35             self.executable = ''
  36             self.executable_arch = self.scram.getArch()
  37             self.tgz_name = 'default.tgz'
  38  +          self.additional_tgz_name = 'additional.tgz'
  39             self.scriptName = 'CMSSW.sh'
  40             self.pset = ''         # script use case (Daniele)
  41             self.datasetPath = ''  # script use case (Daniele)
  44             self.fjrFileName = 'crab_fjr.xml'
  45
  46             self.version = self.scram.getSWVersion()
  47  +
  48  +          #
  49  +          # Try to block creation in case of arch/version mismatch
  50  +          #
  51  +
  52  +          a = string.split(self.version, "_")
  53  +
  54  +          if int(a[1]) == 1 and (int(a[2]) < 5 and self.executable_arch.find('slc4') == 0):
  55  +              msg = "Error: CMS does not support %s with %s architecture"%(self.version, self.executable_arch)
  56  +              raise CrabException(msg)
  57  +          if int(a[1]) == 1 and (int(a[2]) >= 5 and self.executable_arch.find('slc3') == 0):
  58  +              msg = "Error: CMS does not support %s with %s architecture"%(self.version, self.executable_arch)
  59  +              raise CrabException(msg)
  60  +
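A minimal standalone sketch of the arch/version gate added above, assuming release strings of the form CMSSW_major_minor_patch; the helper name is hypothetical and not part of the patch:

def check_arch_compatibility(version, arch):
    # "CMSSW_1_5_2" -> major 1, minor 5
    parts = version.split("_")
    major, minor = int(parts[1]), int(parts[2])
    if major == 1 and minor < 5 and arch.startswith("slc4"):
        raise ValueError("CMS does not support %s with %s architecture" % (version, arch))
    if major == 1 and minor >= 5 and arch.startswith("slc3"):
        raise ValueError("CMS does not support %s with %s architecture" % (version, arch))

check_arch_compatibility("CMSSW_1_5_2", "slc4_ia32_gcc345")  # passes silently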
  61             common.taskDB.setDict('codeVersion',self.version)
  62             self.setParam_('application', self.version)
  63
  65
  66             ## get DBS mode
  67             try:
  68  <              self.use_dbs_2 = int(self.cfg_params['CMSSW.use_dbs_2'])
  68  >              self.use_dbs_1 = int(self.cfg_params['CMSSW.use_dbs_1'])
  69             except KeyError:
  70  <              self.use_dbs_2 = 0
  70  >              self.use_dbs_1 = 0
  71
  72             try:
  73                 tmp = cfg_params['CMSSW.datasetpath']
  88                 self.setParam_('dataset', 'None')
  89                 self.setParam_('owner', 'None')
  90             else:
  91  <              datasetpath_split = self.datasetPath.split("/")
  92  <              self.setParam_('dataset', datasetpath_split[1])
  93  <              self.setParam_('owner', datasetpath_split[-1])
  94  <
  91  >              try:
  92  >                  datasetpath_split = self.datasetPath.split("/")
  93  >                  # standard style
  94  >                  self.setParam_('datasetFull', self.datasetPath)
  95  >                  if self.use_dbs_1 == 1 :
  96  >                      self.setParam_('dataset', datasetpath_split[1])
  97  >                      self.setParam_('owner', datasetpath_split[-1])
  98  >                  else:
  99  >                      self.setParam_('dataset', datasetpath_split[1])
 100  >                      self.setParam_('owner', datasetpath_split[2])
 101  >              except:
 102  >                  self.setParam_('dataset', self.datasetPath)
 103  >                  self.setParam_('owner', self.datasetPath)
 104  >
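A sketch of the two path layouts this hunk distinguishes, under the assumption (taken from the surrounding code) that DBS-1 paths carry the owner as the last component while DBS-2 paths carry the analogous field in position 2; the function and sample path are illustrative only:

def dataset_and_owner(dataset_path, use_dbs_1):
    parts = dataset_path.split("/")   # a leading "/" makes parts[0] == ""
    if use_dbs_1:
        return parts[1], parts[-1]
    return parts[1], parts[2]

print(dataset_and_owner("/PrimaryDS/ProcessedDS/TIER", use_dbs_1=False))  # ('PrimaryDS', 'ProcessedDS')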
 105             self.setTaskid_()
 106             self.setParam_('taskId', self.cfg_params['taskId'])
 107
 151                     self.output_file.append(tmp)
 152                     pass
 153                 else:
 154  <                  log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available")
 154  >                  log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available\n")
 155                     pass
 156                 pass
 157             except KeyError:
 158  <              log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available")
 158  >              log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available\n")
 159                 pass
 160
 161             # script_exe file as additional file in inputSandbox
 181                 tmp = string.strip(tmp)
 182                 dirname = ''
 183                 if not tmp[0]=="/": dirname = "."
 184  <              files = glob.glob(os.path.join(dirname, tmp))
 184  >              files = []
 185  >              if string.find(tmp,"*")>-1:
 186  >                  files = glob.glob(os.path.join(dirname, tmp))
 187  >                  if len(files)==0:
 188  >                      raise CrabException("No additional input file found with this pattern: "+tmp)
 189  >              else:
 190  >                  files.append(tmp)
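The new wildcard handling, condensed into a self-contained helper (hypothetical name; the patch inlines this logic):

import glob, os

def expand_additional_files(pattern, dirname="."):
    if "*" in pattern:
        matches = glob.glob(os.path.join(dirname, pattern))
        if not matches:
            raise IOError("No additional input file found with this pattern: " + pattern)
        return matches
    return [pattern]   # plain filename: existence is checked later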
 191                 for file in files:
 192                     if not os.path.exists(file):
 193                         raise CrabException("Additional input file not found: "+file)
 194                     pass
 195  <                  storedFile = common.work_space.shareDir()+file
 196  <                  shutil.copyfile(file, storedFile)
 197  <                  self.additional_inbox_files.append(string.strip(storedFile))
 195  >                  # fname = string.split(file, '/')[-1]
 196  >                  # storedFile = common.work_space.pathForTgz()+'share/'+fname
 197  >                  # shutil.copyfile(file, storedFile)
 198  >                  self.additional_inbox_files.append(string.strip(file))
 199                     pass
 200                 pass
 201             common.logger.debug(5,"Additional input files: "+str(self.additional_inbox_files))
 253             except KeyError:
 254                 self.sourceSeedVtx = None
 255                 common.logger.debug(5,"No vertex seed given")
 256  +
 257  +          try:
 258  +              self.sourceSeedG4 = int(cfg_params['CMSSW.g4_seed'])
 259  +          except KeyError:
 260  +              self.sourceSeedG4 = None
 261  +              common.logger.debug(5,"No g4 sim hits seed given")
 262  +
 263  +          try:
 264  +              self.sourceSeedMix = int(cfg_params['CMSSW.mix_seed'])
 265  +          except KeyError:
 266  +              self.sourceSeedMix = None
 267  +              common.logger.debug(5,"No mix seed given")
 268  +
 269             try:
 270                 self.firstRun = int(cfg_params['CMSSW.first_run'])
 271             except KeyError:
 272                 self.firstRun = None
 273                 common.logger.debug(5,"No first run given")
 274             if self.pset != None: #CarlosDaniele
 275  <              self.PsetEdit = PsetManipulator.PsetManipulator(self.pset) #Daniele Pset
 275  >              ver = string.split(self.version,"_")
 276  >              if (int(ver[1])>=1 and int(ver[2])>=5):
 277  >                  import PsetManipulator150 as pp
 278  >              else:
 279  >                  import PsetManipulator as pp
 280  >              PsetEdit = pp.PsetManipulator(self.pset) #Daniele Pset
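The version-dispatched import above as an isolated sketch; it assumes the two CRAB modules PsetManipulator and PsetManipulator150 are importable, and the wrapper name is invented for illustration:

def load_pset_manipulator(version, pset_file):
    # deferred import: only the module matching the release must be loadable
    ver = version.split("_")
    if int(ver[1]) >= 1 and int(ver[2]) >= 5:
        import PsetManipulator150 as pp
    else:
        import PsetManipulator as pp
    return pp.PsetManipulator(pset_file)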
 281
 282             #DBSDLS-start
 283             ## Initialize the variables that are extracted from DBS/DLS and needed in other places of the code
 299                     self.jobSplittingForScript()
 300                 else:
 301                     self.jobSplittingNoInput()
 302  <          else:
 302  >          else:
 303                 self.jobSplittingByBlocks(blockSites)
 304
 305             # modify Pset
 307             try:
 308                 if (self.datasetPath): # standard job
 309                     # allow processing a fraction of events in a file
 310  <                  self.PsetEdit.inputModule("INPUT")
 311  <                  self.PsetEdit.maxEvent("INPUTMAXEVENTS")
 312  <                  self.PsetEdit.skipEvent("INPUTSKIPEVENTS")
 310  >                  PsetEdit.inputModule("INPUT")
 311  >                  PsetEdit.maxEvent("INPUTMAXEVENTS")
 312  >                  PsetEdit.skipEvent("INPUTSKIPEVENTS")
 313                 else: # pythia like job
 314  <                  self.PsetEdit.maxEvent(self.eventsPerJob)
 314  >                  PsetEdit.maxEvent(self.eventsPerJob)
 315                     if (self.firstRun):
 316  <                      self.PsetEdit.pythiaFirstRun("INPUTFIRSTRUN") #First Run
 316  >                      PsetEdit.pythiaFirstRun("INPUTFIRSTRUN") #First Run
 317                     if (self.sourceSeed) :
 318  <                      self.PsetEdit.pythiaSeed("INPUT")
 318  >                      PsetEdit.pythiaSeed("INPUT")
 319                         if (self.sourceSeedVtx) :
 320  <                          self.PsetEdit.pythiaSeedVtx("INPUTVTX")
 320  >                          PsetEdit.vtxSeed("INPUTVTX")
 321  >                      if (self.sourceSeedG4) :
 322  >                          PsetEdit.g4Seed("INPUTG4")
 323  >                      if (self.sourceSeedMix) :
 324  >                          PsetEdit.mixSeed("INPUTMIX")
 325                 # add FrameworkJobReport to parameter-set
 326  <              self.PsetEdit.addCrabFJR(self.fjrFileName)
 327  <              self.PsetEdit.psetWriter(self.configFilename())
 326  >              PsetEdit.addCrabFJR(self.fjrFileName)
 327  >              PsetEdit.psetWriter(self.configFilename())
 328             except:
 329                 msg='Error while manipulating ParameterSet: exiting...'
 330                 raise CrabException(msg)
 331
 332         def DataDiscoveryAndLocation(self, cfg_params):
 333
 334  +          import DataDiscovery
 335  +          import DataDiscovery_DBS2
 336  +          import DataLocation
 337             common.logger.debug(10,"CMSSW::DataDiscoveryAndLocation()")
 338
 339             datasetPath=self.datasetPath
 340
 341             ## Contact the DBS
 342  <          common.logger.message("Contacting DBS...")
 342  >          common.logger.message("Contacting Data Discovery Services ...")
 343             try:
 344
 345  <              if self.use_dbs_2 == 1 :
 290  <                  self.pubdata=DataDiscovery_DBS2.DataDiscovery_DBS2(datasetPath, cfg_params)
 291  <              else :
 345  >              if self.use_dbs_1 == 1 :
 346                     self.pubdata=DataDiscovery.DataDiscovery(datasetPath, cfg_params)
 347  +              else :
 348  +                  self.pubdata=DataDiscovery_DBS2.DataDiscovery_DBS2(datasetPath, cfg_params)
 349                 self.pubdata.fetchDBSInfo()
 350
 351             except DataDiscovery.NotExistingDatasetError, ex :
 367                 msg = 'ERROR ***: failed Data Discovery in DBS : %s'%ex.getErrorMessage()
 368                 raise CrabException(msg)
 369
 314  -          ## get list of all required data in the form of dbs paths (dbs path = /dataset/datatier/owner)
 315  -          common.logger.message("Required data are :"+self.datasetPath)
 316  -
 370             self.filesbyblock=self.pubdata.getFiles()
 371             self.eventsbyblock=self.pubdata.getEventsPerBlock()
 372             self.eventsbyfile=self.pubdata.getEventsPerFile()
 373
 374             ## get max number of events
 375             self.maxEvents=self.pubdata.getMaxEvents() ## self.maxEvents used in Creator.py
 323  -          common.logger.message("The number of available events is %s\n"%self.maxEvents)
 376
 325  -          common.logger.message("Contacting DLS...")
 377             ## Contact the DLS and build a list of sites hosting the fileblocks
 378             try:
 379                 dataloc=DataLocation.DataLocation(self.filesbyblock.keys(),cfg_params)
 391                 allSites.append(oneSite)
 392             allSites = self.uniquelist(allSites)
 393
 394  <          common.logger.message("Sites ("+str(len(allSites))+") hosting part/all of dataset: "+str(allSites))
 395  <          common.logger.debug(6, "List of Sites: "+str(allSites))
 394  >          # screen output
 395  >          common.logger.message("Requested dataset: " + datasetPath + " has " + str(self.maxEvents) + " events in " + str(len(self.filesbyblock.keys())) + " blocks.\n")
 396  >
 397             return sites
 398
 399         def jobSplittingByBlocks(self, blockSites):
 455             jobCount = 0
 456             list_of_lists = []
 457
 458  +          # list tracking which jobs belong to which block
 459  +          jobsOfBlock = {}
 460  +
 461             # ---- Iterate over the blocks in the dataset until ---- #
 462             # ---- we've met the requested total # of events    ---- #
 463             while ( (eventsRemaining > 0) and (blockCount < numBlocksInDataset) and (jobCount < totalNumberOfJobs)):
 464                 block = blocks[blockCount]
 465                 blockCount += 1
 466  +              if block not in jobsOfBlock.keys() :
 467  +                  jobsOfBlock[block] = []
 468
 469                 if self.eventsbyblock.has_key(block) :
 470                     numEventsInBlock = self.eventsbyblock[block]
 514                         common.logger.debug(3,"Job "+str(jobCount+1)+" can run over "+str(filesEventCount - jobSkipEventCount)+" events (last file in block).")
 515                         self.jobDestination.append(blockSites[block])
 516                         common.logger.debug(5,"Job "+str(jobCount+1)+" Destination: "+str(self.jobDestination[jobCount]))
 517  +                      # fill jobs of block dictionary
 518  +                      jobsOfBlock[block].append(jobCount+1)
 519                         # reset counter
 520                         jobCount = jobCount + 1
 521                         totalEventCount = totalEventCount + filesEventCount - jobSkipEventCount
 539                         common.logger.debug(3,"Job "+str(jobCount+1)+" can run over "+str(eventsPerJobRequested)+" events.")
 540                         self.jobDestination.append(blockSites[block])
 541                         common.logger.debug(5,"Job "+str(jobCount+1)+" Destination: "+str(self.jobDestination[jobCount]))
 542  +                      jobsOfBlock[block].append(jobCount+1)
 543                         # reset counter
 544                         jobCount = jobCount + 1
 545                         totalEventCount = totalEventCount + eventsPerJobRequested
 560                         common.logger.debug(3,"Job "+str(jobCount+1)+" can run over "+str(eventsPerJobRequested)+" events.")
 561                         self.jobDestination.append(blockSites[block])
 562                         common.logger.debug(5,"Job "+str(jobCount+1)+" Destination: "+str(self.jobDestination[jobCount]))
 563  +                      jobsOfBlock[block].append(jobCount+1)
 564                         # increase counter
 565                         jobCount = jobCount + 1
 566                         totalEventCount = totalEventCount + eventsPerJobRequested
 578             self.ncjobs = self.total_number_of_jobs = jobCount
 579             if (eventsRemaining > 0 and jobCount < totalNumberOfJobs ):
 580                 common.logger.message("Could not run on all requested events because some blocks not hosted at allowed sites.")
 581  <          common.logger.message("\n"+str(jobCount)+" job(s) can run on "+str(totalEventCount)+" events.\n")
 581  >          common.logger.message(str(jobCount)+" job(s) can run on "+str(totalEventCount)+" events.\n")
 582  >
 583  >          # screen output
 584  >          screenOutput = "List of jobs and available destination sites:\n\n"
 585  >
 586  >          # keep track of blocks with no sites, to print a warning at the end
 587  >          noSiteBlock = []
 588  >          bloskNoSite = []
 589  >
 590  >          blockCounter = 0
 591  >          for block in blocks:
 592  >              if block in jobsOfBlock.keys() :
 593  >                  blockCounter += 1
 594  >                  screenOutput += "Block %5i: jobs %20s: sites: %s\n" % (blockCounter,spanRanges(jobsOfBlock[block]),','.join(self.blackWhiteListParser.checkWhiteList(self.blackWhiteListParser.checkBlackList(blockSites[block],block),block)))
 595  >                  if len(self.blackWhiteListParser.checkWhiteList(self.blackWhiteListParser.checkBlackList(blockSites[block],block),block)) == 0:
 596  >                      noSiteBlock.append( spanRanges(jobsOfBlock[block]) )
 597  >                      bloskNoSite.append( blockCounter )
 598
 599  +          common.logger.message(screenOutput)
 600  +          if len(noSiteBlock) > 0 and len(bloskNoSite) > 0:
 601  +              msg = 'WARNING: No sites are hosting any part of data for block:\n '
 602  +              virgola = ""
 603  +              if len(bloskNoSite) > 1:
 604  +                  virgola = ","
 605  +              for block in bloskNoSite:
 606  +                  msg += ' ' + str(block) + virgola
 607  +              msg += '\n Related jobs:\n '
 608  +              virgola = ""
 609  +              if len(noSiteBlock) > 1:
 610  +                  virgola = ","
 611  +              for range_jobs in noSiteBlock:
 612  +                  msg += str(range_jobs) + virgola
 613  +              msg += '\n will not be submitted and this block of data can not be analyzed!\n'
 614  +              common.logger.message(msg)
 615  +
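A compact sketch of the bookkeeping this hunk adds: map each block to its jobs, then report blocks whose (black/white-list filtered) site list is empty; ', '.join(...) stands in for the manual comma ("virgola") handling, and all names are illustrative:

def blocks_without_sites(jobs_of_block, sites_of_block):
    return [(b, jobs) for b, jobs in jobs_of_block.items() if not sites_of_block.get(b)]

pairs = blocks_without_sites({"b1": [1, 2], "b2": [3]}, {"b1": ["T2_XX"], "b2": []})
warning = ", ".join("block %s (jobs %s)" % (b, j) for b, j in pairs)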
 616             self.list_of_args = list_of_lists
 617             return
 618
 621         Perform job splitting based on number of events per job
 622         """
 623         common.logger.debug(5,'Splitting per events')
 624  <      common.logger.message('Required '+str(self.eventsPerJob)+' events per job ')
 625  <      common.logger.message('Required '+str(self.theNumberOfJobs)+' jobs in total ')
 626  <      common.logger.message('Required '+str(self.total_number_of_events)+' events in total ')
 624  >
 625  >      if (self.selectEventsPerJob):
 626  >          common.logger.message('Required '+str(self.eventsPerJob)+' events per job ')
 627  >      if (self.selectNumberOfJobs):
 628  >          common.logger.message('Required '+str(self.theNumberOfJobs)+' jobs in total ')
 629  >      if (self.selectTotalNumberEvents):
 630  >          common.logger.message('Required '+str(self.total_number_of_events)+' events in total ')
 631
 632         if (self.total_number_of_events < 0):
 633             msg='Cannot split jobs per Events with "-1" as total number of events'
 661             ## Since there is no input, any site is good
 662             # self.jobDestination.append(["Any"])
 663             self.jobDestination.append([""]) #must be empty to write correctly the xml
 664  <          args=''
 664  >          args=[]
 665             if (self.firstRun):
 666                 ## pythia first run
 667                 #self.list_of_args.append([(str(self.firstRun)+str(i))])
 668  <              args=args+(str(self.firstRun)+str(i))
 668  >              args.append(str(self.firstRun)+str(i))
 669             else:
 670                 ## no first run
 671                 #self.list_of_args.append([str(i)])
 672  <              args=args+str(i)
 672  >              args.append(str(i))
 673             if (self.sourceSeed):
 674  +              args.append(str(self.sourceSeed)+str(i))
 675                 if (self.sourceSeedVtx):
 676  <                  ## pythia + vtx random seed
 677  <                  #self.list_of_args.append([
 678  <                  #     str(self.sourceSeed)+str(i),
 679  <                  #     str(self.sourceSeedVtx)+str(i)
 680  <                  #     ])
 681  <                  args=args+str(',')+str(self.sourceSeed)+str(i)+str(',')+str(self.sourceSeedVtx)+str(i)
 682  <              else:
 683  <                  ## only pythia random seed
 684  <                  #self.list_of_args.append([(str(self.sourceSeed)+str(i))])
 685  <                  args=args +str(',')+str(self.sourceSeed)+str(i)
 686  <          else:
 687  <              ## no random seed
 589  <              if str(args)=='': args=args+(str(self.firstRun)+str(i))
 590  <              arguments=args.split(',')
 591  <              if len(arguments)==3:self.list_of_args.append([str(arguments[0]),str(arguments[1]),str(arguments[2])])
 592  <              elif len(arguments)==2:self.list_of_args.append([str(arguments[0]),str(arguments[1])])
 593  <              else :self.list_of_args.append([str(arguments[0])])
 676  >                  ## + vtx random seed
 677  >                  args.append(str(self.sourceSeedVtx)+str(i))
 678  >              if (self.sourceSeedG4):
 679  >                  ## + G4 random seed
 680  >                  args.append(str(self.sourceSeedG4)+str(i))
 681  >              if (self.sourceSeedMix):
 682  >                  ## + Mix random seed
 683  >                  args.append(str(self.sourceSeedMix)+str(i))
 684  >              pass
 685  >          pass
 686  >          self.list_of_args.append(args)
 687  >          pass
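The list-based argument building that replaces the old comma-joined string, reduced to a sketch (hypothetical helper; seeds default to None, matching the config lookups above):

def build_job_args(i, first_run=None, seed=None, vtx=None, g4=None, mix=None):
    args = []
    args.append(str(first_run) + str(i) if first_run else str(i))
    for s in (seed, vtx, g4, mix):   # each optional seed appends one more argument
        if s:
            args.append(str(s) + str(i))
    return args

assert build_job_args(3, first_run=10, seed=123, vtx=456) == ['103', '1233', '4563']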
 688
 689  <      # print self.list_of_args
 689  >      # print self.list_of_args
 690
 691         return
 692
 781             try: # create tar ball
 782                 tar = tarfile.open(self.tgzNameWithPath, "w:gz")
 783                 ## First find the executable
 784  <              if (executable != ''):
 784  >              if (self.executable != ''):
 785                     exeWithPath = self.scram.findFile_(executable)
 786                     if ( not exeWithPath ):
 787                         raise CrabException('User executable '+executable+' not found')
 791                     # the exe is private, so we must ship
 792                     common.logger.debug(5,"Exe "+exeWithPath+" to be tarred")
 793                     path = swArea+'/'
 794  <                  exe = string.replace(exeWithPath, path,'')
 795  <                  tar.add(path+exe,executable)
 794  >                  # distinguish case when script is in user project area or given by full path somewhere else
 795  >                  if exeWithPath.find(path) >= 0 :
 796  >                      exe = string.replace(exeWithPath, path,'')
 797  >                      tar.add(path+exe,exe)
 798  >                  else :
 799  >                      tar.add(exeWithPath,os.path.basename(executable))
 800                     pass
 801                 else:
 802                     # the exe is from release, we'll find it on WN
 827                 pa = os.environ['CRABDIR'] + '/' + 'ProdAgentApi'
 828                 if os.path.isdir(pa):
 829                     tar.add(pa,paDir)
 830  +
 831  +              ### FEDE FOR DBS PUBLICATION
 832  +              ## Add PRODCOMMON dir to tar
 833  +              prodcommonDir = 'ProdCommon'
 834  +              prodcommonPath = os.environ['CRABDIR'] + '/' + 'ProdCommon'
 835  +              if os.path.isdir(prodcommonPath):
 836  +                  tar.add(prodcommonPath,prodcommonDir)
 837  +              #############################
 838
 839                 common.logger.debug(5,"Files added to "+self.tgzNameWithPath+" : "+str(tar.getnames()))
 840                 tar.close()
 860
 861             return
 862
 863  +      def additionalInputFileTgz(self):
 864  +          """
 865  +          Put all additional files into a tar ball and return its name
 866  +          """
 867  +          import tarfile
 868  +          tarName= common.work_space.pathForTgz()+'share/'+self.additional_tgz_name
 869  +          tar = tarfile.open(tarName, "w:gz")
 870  +          for file in self.additional_inbox_files:
 871  +              tar.add(file,string.split(file,'/')[-1])
 872  +          common.logger.debug(5,"Files added to "+self.additional_tgz_name+" : "+str(tar.getnames()))
 873  +          tar.close()
 874  +          return tarName
 875  +
 876         def wsSetupEnvironment(self, nj):
 877             """
 878             Returns part of a job script which prepares
 884             ## OLI_Daniele at this level middleware already known
 885
 886             txt += 'if [ $middleware == LCG ]; then \n'
 887  +          txt += ' echo "### First set SCRAM ARCH and BUILD_ARCH to ' + self.executable_arch + ' ###"\n'
 888  +          txt += ' export SCRAM_ARCH='+self.executable_arch+'\n'
 889  +          txt += ' export BUILD_ARCH='+self.executable_arch+'\n'
 890             txt += self.wsSetupCMSLCGEnvironment_()
 891             txt += 'elif [ $middleware == OSG ]; then\n'
 892             txt += ' WORKING_DIR=`/bin/mktemp -d $OSG_WN_TMP/cms_XXXXXXXXXXXX`\n'
 893             txt += ' echo "Created working directory: $WORKING_DIR"\n'
 894             txt += ' if [ ! -d $WORKING_DIR ] ;then\n'
 895             txt += ' echo "SET_CMS_ENV 10016 ==> OSG $WORKING_DIR could not be created on WN `hostname`"\n'
 896  <          txt += ' echo "JOB_EXIT_STATUS = 10016"\n'
 897  <          txt += ' echo "JobExitCode=10016" | tee -a $RUNTIME_AREA/$repo\n'
 898  <          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 896  >          txt += ' echo "JOB_EXIT_STATUS = 10016"\n'
 897  >          txt += ' echo "JobExitCode=10016" | tee -a $RUNTIME_AREA/$repo\n'
 898  >          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 899             txt += ' rm -f $RUNTIME_AREA/$repo \n'
 900             txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
 901             txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
 905             txt += ' echo "Change to working directory: $WORKING_DIR"\n'
 906             txt += ' cd $WORKING_DIR\n'
 907             txt += self.wsSetupCMSOSGEnvironment_()
 908  +          txt += ' echo "### Set SCRAM ARCH to ' + self.executable_arch + ' ###"\n'
 909  +          txt += ' export SCRAM_ARCH='+self.executable_arch+'\n'
 910             txt += 'fi\n'
 911
 912             # Prepare JobType-specific part
 929             txt += ' cd $RUNTIME_AREA\n'
 930             txt += ' /bin/rm -rf $WORKING_DIR\n'
 931             txt += ' if [ -d $WORKING_DIR ] ;then\n'
 932  <          txt += ' echo "SET_CMS_ENV 10018 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after CMSSW CMSSW_0_6_1 not found on `hostname`"\n'
 933  <          txt += ' echo "JOB_EXIT_STATUS = 10018"\n'
 934  <          txt += ' echo "JobExitCode=10018" | tee -a $RUNTIME_AREA/$repo\n'
 935  <          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 932  >          txt += ' echo "SET_CMS_ENV 10018 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after CMSSW CMSSW_0_6_1 not found on `hostname`"\n'
 933  >          txt += ' echo "JOB_EXIT_STATUS = 10018"\n'
 934  >          txt += ' echo "JobExitCode=10018" | tee -a $RUNTIME_AREA/$repo\n'
 935  >          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 936             txt += ' rm -f $RUNTIME_AREA/$repo \n'
 937             txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
 938             txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
 941             txt += ' exit 1 \n'
 942             txt += 'fi \n'
 943             txt += 'echo "CMSSW_VERSION = '+self.version+'"\n'
 820  -          txt += 'export SCRAM_ARCH='+self.executable_arch+'\n'
 944             txt += 'cd '+self.version+'\n'
 945  +          ########## FEDE FOR DBS2 ######################
 946  +          txt += 'SOFTWARE_DIR=`pwd`\n'
 947  +          txt += 'echo SOFTWARE_DIR=$SOFTWARE_DIR \n'
 948  +          ###############################################
 949             ### needed grep for bug in scramv1 ###
 950             txt += scram+' runtime -sh\n'
 951             txt += 'eval `'+scram+' runtime -sh | grep -v SCRAMRT_LSB_JOBNAME`\n'
 971             txt += ' cd $RUNTIME_AREA\n'
 972             txt += ' /bin/rm -rf $WORKING_DIR\n'
 973             txt += ' if [ -d $WORKING_DIR ] ;then\n'
 974  <          txt += ' echo "SET_EXE_ENV 50114 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after Too few arguments for CRAB job wrapper"\n'
 975  <          txt += ' echo "JOB_EXIT_STATUS = 50114"\n'
 976  <          txt += ' echo "JobExitCode=50114" | tee -a $RUNTIME_AREA/$repo\n'
 977  <          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 974  >          txt += ' echo "SET_EXE_ENV 50114 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after Too few arguments for CRAB job wrapper"\n'
 975  >          txt += ' echo "JOB_EXIT_STATUS = 50114"\n'
 976  >          txt += ' echo "JobExitCode=50114" | tee -a $RUNTIME_AREA/$repo\n'
 977  >          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
 978             txt += ' rm -f $RUNTIME_AREA/$repo \n'
 979             txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
 980             txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
 986
 987             # Prepare job-specific part
 988             job = common.job_list[nj]
 989  +          ### FEDE FOR DBS OUTPUT PUBLICATION
 990  +          if (self.datasetPath):
 991  +              txt += '\n'
 992  +              txt += 'DatasetPath='+self.datasetPath+'\n'
 993  +
 994  +              datasetpath_split = self.datasetPath.split("/")
 995  +
 996  +              txt += 'PrimaryDataset='+datasetpath_split[1]+'\n'
 997  +              txt += 'DataTier='+datasetpath_split[2]+'\n'
 998  +              #txt += 'ProcessedDataset='+datasetpath_split[3]+'\n'
 999  +              txt += 'ApplicationFamily=cmsRun\n'
1000  +
1001  +          else:
1002  +              txt += 'DatasetPath=MCDataTier\n'
1003  +              txt += 'PrimaryDataset=null\n'
1004  +              txt += 'DataTier=null\n'
1005  +              #txt += 'ProcessedDataset=null\n'
1006  +              txt += 'ApplicationFamily=MCDataTier\n'
1007             if self.pset != None: #CarlosDaniele
1008                 pset = os.path.basename(job.configFilename())
1009                 txt += '\n'
1010  +              txt += 'cp $RUNTIME_AREA/'+pset+' .\n'
1011                 if (self.datasetPath): # standard job
1012                     #txt += 'InputFiles=$2\n'
1013                     txt += 'InputFiles=${args[1]}\n'
1014                     txt += 'MaxEvents=${args[2]}\n'
1015                     txt += 'SkipEvents=${args[3]}\n'
1016                     txt += 'echo "Inputfiles:<$InputFiles>"\n'
1017  <                  txt += 'sed "s#{\'INPUT\'}#$InputFiles#" $RUNTIME_AREA/'+pset+' > pset_tmp_1.cfg\n'
1017  >                  txt += 'sed "s#{\'INPUT\'}#$InputFiles#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1018                     txt += 'echo "MaxEvents:<$MaxEvents>"\n'
1019  <                  txt += 'sed "s#INPUTMAXEVENTS#$MaxEvents#" pset_tmp_1.cfg > pset_tmp_2.cfg\n'
1019  >                  txt += 'sed "s#INPUTMAXEVENTS#$MaxEvents#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1020                     txt += 'echo "SkipEvents:<$SkipEvents>"\n'
1021  <                  txt += 'sed "s#INPUTSKIPEVENTS#$SkipEvents#" pset_tmp_2.cfg > pset.cfg\n'
1021  >                  txt += 'sed "s#INPUTSKIPEVENTS#$SkipEvents#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1022                 else: # pythia like job
1023  <                  if (self.sourceSeed):
1024  <                      txt += 'FirstRun=${args[1]}\n'
1023  >                  seedIndex=1
1024  >                  if (self.firstRun):
1025  >                      txt += 'FirstRun=${args['+str(seedIndex)+']}\n'
1026                         txt += 'echo "FirstRun: <$FirstRun>"\n'
1027  <                      txt += 'sed "s#\<INPUTFIRSTRUN\>#$FirstRun#" $RUNTIME_AREA/'+pset+' > tmp_1.cfg\n'
1028  <                  else:
1029  <                      txt += '# Copy untouched pset\n'
 883  <                      txt += 'cp $RUNTIME_AREA/'+pset+' tmp_1.cfg\n'
1027  >                      txt += 'sed "s#\<INPUTFIRSTRUN\>#$FirstRun#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1028  >                      seedIndex=seedIndex+1
1029  >
1030                     if (self.sourceSeed):
1031  <                      # txt += 'Seed=$2\n'
1032  <                      txt += 'Seed=${args[2]}\n'
1033  <                      txt += 'echo "Seed: <$Seed>"\n'
1034  <                      txt += 'sed "s#\<INPUT\>#$Seed#" tmp_1.cfg > tmp_2.cfg\n'
1031  >                      txt += 'Seed=${args['+str(seedIndex)+']}\n'
1032  >                      txt += 'sed "s#\<INPUT\>#$Seed#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1033  >                      seedIndex=seedIndex+1
1034  >                      ## the following seeds are not always present
1035                         if (self.sourceSeedVtx):
1036  <                          # txt += 'VtxSeed=$3\n'
 891  <                          txt += 'VtxSeed=${args[3]}\n'
1036  >                          txt += 'VtxSeed=${args['+str(seedIndex)+']}\n'
1037                             txt += 'echo "VtxSeed: <$VtxSeed>"\n'
1038  <                          txt += 'sed "s#INPUTVTX#$VtxSeed#" tmp_2.cfg > pset.cfg\n'
1039  <                      else:
1040  <                          txt += 'mv tmp_2.cfg pset.cfg\n'
1041  <                  else:
1042  <                      txt += 'mv tmp_1.cfg pset.cfg\n'
1043  <                      # txt += '# Copy untouched pset\n'
1044  <                      # txt += 'cp $RUNTIME_AREA/'+pset+' pset.cfg\n'
1045  <
1038  >                          txt += 'sed "s#\<INPUTVTX\>#$VtxSeed#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1039  >                          seedIndex += 1
1040  >                      if (self.sourceSeedG4):
1041  >                          txt += 'G4Seed=${args['+str(seedIndex)+']}\n'
1042  >                          txt += 'echo "G4Seed: <$G4Seed>"\n'
1043  >                          txt += 'sed "s#\<INPUTG4\>#$G4Seed#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1044  >                          seedIndex += 1
1045  >                      if (self.sourceSeedMix):
1046  >                          txt += 'mixSeed=${args['+str(seedIndex)+']}\n'
1047  >                          txt += 'echo "MixSeed: <$mixSeed>"\n'
1048  >                          txt += 'sed "s#\<INPUTMIX\>#$mixSeed#" '+pset+' > tmp && mv -f tmp '+pset+'\n'
1049  >                          seedIndex += 1
1050  >                      pass
1051  >                  pass
1052  >              txt += 'mv -f '+pset+' pset.cfg\n'
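Each placeholder is now rewritten in place with the same one-line shell idiom; a sketch of the generator (hypothetical helper) showing the "sed ... > tmp && mv -f tmp ..." pattern the hunk repeats for every optional seed:

def sed_in_place(placeholder, shell_var, pset):
    # emits one line of wrapper script that substitutes the placeholder,
    # then atomically replaces the pset so edits can be chained
    return 'sed "s#' + placeholder + '#$' + shell_var + '#" ' + pset + ' > tmp && mv -f tmp ' + pset + '\n'

line = sed_in_place('\\<INPUTVTX\\>', 'VtxSeed', 'pset.cfg')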
1053
1054             if len(self.additional_inbox_files) > 0:
1055  <              for file in self.additional_inbox_files:
1056  <                  relFile = file.split("/")[-1]
1057  <                  txt += 'if [ -e $RUNTIME_AREA/'+relFile+' ] ; then\n'
 906  <                  txt += ' cp $RUNTIME_AREA/'+relFile+' .\n'
 907  <                  txt += ' chmod +x '+relFile+'\n'
 908  <                  txt += 'fi\n'
1055  >              txt += 'if [ -e $RUNTIME_AREA/'+self.additional_tgz_name+' ] ; then\n'
1056  >              txt += ' tar xzvf $RUNTIME_AREA/'+self.additional_tgz_name+'\n'
1057  >              txt += 'fi\n'
1058             pass
1059
1060             if self.pset != None: #CarlosDaniele
1065                 txt += 'cat pset.cfg\n'
1066                 txt += 'echo "****** end pset.cfg ********"\n'
1067                 txt += '\n'
1068  +              ### FEDE FOR DBS OUTPUT PUBLICATION
1069  +              txt += 'PSETHASH=`EdmConfigHash < pset.cfg` \n'
1070  +              txt += 'echo "PSETHASH = $PSETHASH" \n'
1071  +              ##############
1072  +              txt += '\n'
1073                 # txt += 'echo "***** cat pset1.cfg *********"\n'
1074                 # txt += 'cat pset1.cfg\n'
1075                 # txt += 'echo "****** end pset1.cfg ********"\n'
1111             txt += ' echo "Successful untar" \n'
1112             txt += 'fi \n'
1113             txt += '\n'
1114  <          txt += 'echo "Include ProdAgentApi in PYTHONPATH"\n'
1114  >          txt += 'echo "Include ProdAgentApi and PRODCOMMON in PYTHONPATH"\n'
1115             txt += 'if [ -z "$PYTHONPATH" ]; then\n'
1116  <          txt += ' export PYTHONPATH=ProdAgentApi\n'
1116  >          #### FEDE FOR DBS OUTPUT PUBLICATION
1117  >          txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdAgentApi:$SOFTWARE_DIR/ProdCommon\n'
1118  >          #txt += ' export PYTHONPATH=`pwd`/ProdAgentApi:`pwd`/ProdCommon\n'
1119  >          #txt += ' export PYTHONPATH=ProdAgentApi\n'
1120             txt += 'else\n'
1121  <          txt += ' export PYTHONPATH=ProdAgentApi:${PYTHONPATH}\n'
1121  >          txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdAgentApi:$SOFTWARE_DIR/ProdCommon:${PYTHONPATH}\n'
1122  >          #txt += ' export PYTHONPATH=`pwd`/ProdAgentApi:`pwd`/ProdCommon:${PYTHONPATH}\n'
1123  >          #txt += ' export PYTHONPATH=ProdAgentApi:${PYTHONPATH}\n'
1124  >          txt += 'echo "PYTHONPATH=$PYTHONPATH"\n'
1125  >          ###################
1126             txt += 'fi\n'
1127             txt += '\n'
1128
1145         def executableArgs(self):
1146             if self.scriptExe: #CarlosDaniele
1147                 return self.scriptExe + " $NJob"
1148  <          else:
1149  <              return " -p pset.cfg"
1148  >          else:
1149  >              # if >= CMSSW_1_5_X, add -e
1150  >              version_array = self.scram.getSWVersion().split('_')
1151  >              major = 0
1152  >              minor = 0
1153  >              try:
1154  >                  major = int(version_array[1])
1155  >                  minor = int(version_array[2])
1156  >              except:
1157  >                  msg = "Cannot parse CMSSW version string: " + "_".join(version_array) + " for major and minor release number!"
1158  >                  raise CrabException(msg)
1159  >              if major >= 1 and minor >= 5 :
1160  >                  return " -e -p pset.cfg"
1161  >              else:
1162  >                  return " -p pset.cfg"
1163
1164         def inputSandbox(self, nj):
1165             """
1177             if not self.pset is None:
1178                 inp_box.append(common.work_space.pathForTgz() + 'job/' + self.configFilename())
1179             ## additional input files
1180  <          for file in self.additional_inbox_files:
1181  <              inp_box.append(file)
1180  >          tgz = self.additionalInputFileTgz()
1181  >          inp_box.append(tgz)
1182             return inp_box
1183
1184         def outputSandbox(self, nj):
1208             txt += '# directory content\n'
1209             txt += 'ls \n'
1210
1211  <          for fileWithSuffix in (self.output_file+self.output_file_sandbox):
1211  >          txt += 'output_exit_status=0\n'
1212  >
1213  >          for fileWithSuffix in (self.output_file_sandbox):
1214                 output_file_num = self.numberFile_(fileWithSuffix, '$NJob')
1215                 txt += '\n'
1216                 txt += '# check output file\n'
1217  <              txt += 'ls '+fileWithSuffix+'\n'
1218  <              txt += 'ls_result=$?\n'
1219  <              txt += 'if [ $ls_result -ne 0 ] ; then\n'
1220  <              txt += ' echo "ERROR: Problem with output file"\n'
1217  >              txt += 'if [ -e ./'+fileWithSuffix+' ] ; then\n'
1218  >              txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA\n'
1219  >              txt += ' cp $RUNTIME_AREA/'+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1220  >              txt += 'else\n'
1221  >              txt += ' exit_status=60302\n'
1222  >              txt += ' echo "ERROR: Problem with output file '+fileWithSuffix+'"\n'
1223                 if common.scheduler.boss_scheduler_name == 'condor_g':
1224                     txt += ' if [ $middleware == OSG ]; then \n'
1225                     txt += ' echo "prepare dummy output file"\n'
1226                     txt += ' echo "Processing of job output failed" > $RUNTIME_AREA/'+output_file_num+'\n'
1227                     txt += ' fi \n'
1228  +              txt += 'fi\n'
1229  +
1230  +          for fileWithSuffix in (self.output_file):
1231  +              output_file_num = self.numberFile_(fileWithSuffix, '$NJob')
1232  +              txt += '\n'
1233  +              txt += '# check output file\n'
1234  +              txt += 'if [ -e ./'+fileWithSuffix+' ] ; then\n'
1235  +              txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA\n'
1236  +              txt += ' cp $RUNTIME_AREA/'+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1237                 txt += 'else\n'
1238  <              txt += ' cp '+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1238  >              txt += ' exit_status=60302\n'
1239  >              txt += ' echo "ERROR: Problem with output file '+fileWithSuffix+'"\n'
1240  >              txt += ' echo "JOB_EXIT_STATUS = $exit_status"\n'
1241  >              txt += ' output_exit_status=$exit_status\n'
1242  >              if common.scheduler.boss_scheduler_name == 'condor_g':
1243  >                  txt += ' if [ $middleware == OSG ]; then \n'
1244  >                  txt += ' echo "prepare dummy output file"\n'
1245  >                  txt += ' echo "Processing of job output failed" > $RUNTIME_AREA/'+output_file_num+'\n'
1246  >                  txt += ' fi \n'
1247                 txt += 'fi\n'
1248  <
1249  <          txt += 'cd $RUNTIME_AREA\n'
1248  >          file_list = []
1249  >          for fileWithSuffix in (self.output_file):
1250  >              file_list.append(self.numberFile_(fileWithSuffix, '$NJob'))
1251  >
1252  >          txt += 'file_list="'+string.join(file_list,' ')+'"\n'
1253             txt += 'cd $RUNTIME_AREA\n'
1056  -          ### OLI_DANIELE
1057  -          txt += 'if [ $middleware == OSG ]; then\n'
1058  -          txt += ' cd $RUNTIME_AREA\n'
1059  -          txt += ' echo "Remove working directory: $WORKING_DIR"\n'
1060  -          txt += ' /bin/rm -rf $WORKING_DIR\n'
1061  -          txt += ' if [ -d $WORKING_DIR ] ;then\n'
1062  -          txt += ' echo "SET_EXE 60999 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after cleanup of WN"\n'
1063  -          txt += ' echo "JOB_EXIT_STATUS = 60999"\n'
1064  -          txt += ' echo "JobExitCode=60999" | tee -a $RUNTIME_AREA/$repo\n'
1065  -          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
1066  -          txt += ' rm -f $RUNTIME_AREA/$repo \n'
1067  -          txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
1068  -          txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
1069  -          txt += ' fi\n'
1070  -          txt += 'fi\n'
1071  -          txt += '\n'
1072  -
1073  -          file_list = ''
1074  -          ## Add to filelist only files to be possibly copied to SE
1075  -          for fileWithSuffix in self.output_file:
1076  -              output_file_num = self.numberFile_(fileWithSuffix, '$NJob')
1077  -              file_list=file_list+output_file_num+' '
1078  -          file_list=file_list[:-1]
1079  -          txt += 'file_list="'+file_list+'"\n'
1080  -
1254             return txt
1255
1256         def numberFile_(self, file, txt):
1261             # take away last extension
1262             name = p[0]
1263             for x in p[1:-1]:
1264  <              name=name+"."+x
1264  >              name=name+"."+x
1265             # add "_txt"
1266             if len(p)>1:
1267  <              ext = p[len(p)-1]
1268  <              result = name + '_' + txt + "." + ext
1267  >              ext = p[len(p)-1]
1268  >              result = name + '_' + txt + "." + ext
1269             else:
1270  <              result = name + '_' + txt
1270  >              result = name + '_' + txt
1271
1272             return result
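numberFile_ in brief: the job tag is spliced in before the last extension, or appended when there is none (standalone restatement for illustration, not patch code):

def number_file(name, tag):
    parts = name.split(".")
    if len(parts) > 1:
        return ".".join(parts[:-1]) + "_" + tag + "." + parts[-1]
    return name + "_" + tag

assert number_file("output.root", "$NJob") == "output_$NJob.root"
assert number_file("logfile", "3") == "logfile_3"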
1273
1280             req='Member("VO-cms-' + \
1281                 self.version + \
1282                 '", other.GlueHostApplicationSoftwareRunTimeEnvironment)'
1283  +          ## SL add requirement for OS version only if SL4
1284  +          #reSL4 = re.compile( r'slc4' )
1285  +          if self.executable_arch: # and reSL4.search(self.executable_arch):
1286  +              req+=' && Member("VO-cms-' + \
1287  +                  self.executable_arch + \
1288  +                  '", other.GlueHostApplicationSoftwareRunTimeEnvironment)'
1289
1290             req = req + ' && (other.GlueHostNetworkAdapterOutboundIP)'
1291
1305             txt += ' echo "### SETUP CMS OSG ENVIRONMENT ###"\n'
1306             txt += ' if [ -f $GRID3_APP_DIR/cmssoft/cmsset_default.sh ] ;then\n'
1307             txt += ' # Use $GRID3_APP_DIR/cmssoft/cmsset_default.sh to setup cms software\n'
1308  +          txt += ' export SCRAM_ARCH='+self.executable_arch+'\n'
1309             txt += ' source $GRID3_APP_DIR/cmssoft/cmsset_default.sh '+self.version+'\n'
1310             txt += ' elif [ -f $OSG_APP/cmssoft/cms/cmsset_default.sh ] ;then\n'
1311             txt += ' # Use $OSG_APP/cmssoft/cms/cmsset_default.sh to setup cms software\n'
1312  +          txt += ' export SCRAM_ARCH='+self.executable_arch+'\n'
1313             txt += ' source $OSG_APP/cmssoft/cms/cmsset_default.sh '+self.version+'\n'
1314             txt += ' else\n'
1315             txt += ' echo "SET_CMS_ENV 10020 ==> ERROR $GRID3_APP_DIR/cmssoft/cmsset_default.sh and $OSG_APP/cmssoft/cms/cmsset_default.sh file not found"\n'
1325             txt += ' cd $RUNTIME_AREA\n'
1326             txt += ' /bin/rm -rf $WORKING_DIR\n'
1327             txt += ' if [ -d $WORKING_DIR ] ;then\n'
1328  <          txt += ' echo "SET_CMS_ENV 10017 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after $GRID3_APP_DIR/cmssoft/cmsset_default.sh and $OSG_APP/cmssoft/cms/cmsset_default.sh file not found"\n'
1329  <          txt += ' echo "JOB_EXIT_STATUS = 10017"\n'
1330  <          txt += ' echo "JobExitCode=10017" | tee -a $RUNTIME_AREA/$repo\n'
1331  <          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
1332  <          txt += ' rm -f $RUNTIME_AREA/$repo \n'
1333  <          txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
1334  <          txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
1328  >          txt += ' echo "SET_CMS_ENV 10017 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after $GRID3_APP_DIR/cmssoft/cmsset_default.sh and $OSG_APP/cmssoft/cms/cmsset_default.sh file not found"\n'
1329  >          txt += ' echo "JOB_EXIT_STATUS = 10017"\n'
1330  >          txt += ' echo "JobExitCode=10017" | tee -a $RUNTIME_AREA/$repo\n'
1331  >          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
1332  >          txt += ' rm -f $RUNTIME_AREA/$repo \n'
1333  >          txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
1334  >          txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
1335             txt += ' fi\n'
1336             txt += '\n'
1337             txt += ' exit 1\n'
1390             txt += ' echo "### END SETUP CMS LCG ENVIRONMENT ###"\n'
1391             return txt
1392
1393  +      ### FEDE FOR DBS OUTPUT PUBLICATION
1394  +      def modifyReport(self, nj):
1395  +          """
1396  +          insert the part of the script that modifies the FrameworkJob Report
1397  +          """
1398  +
1399  +          txt = ''
1400  +          try:
1401  +              publish_data = int(self.cfg_params['USER.publish_data'])
1402  +          except KeyError:
1403  +              publish_data = 0
1404  +          if (publish_data == 1):
1405  +              txt += 'echo "Modify Job Report" \n'
1406  +              #txt += 'chmod a+x $RUNTIME_AREA/'+self.version+'/ProdAgentApi/FwkJobRep/ModifyJobReport.py\n'
1407  +              ################ FEDE FOR DBS2 #############################################
1408  +              txt += 'chmod a+x $SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py\n'
1409  +              #############################################################################
1410  +              #try:
1411  +              #    publish_data = int(self.cfg_params['USER.publish_data'])
1412  +              #except KeyError:
1413  +              #    publish_data = 0
1414  +
1415  +              txt += 'if [ -z "$SE" ]; then\n'
1416  +              txt += ' SE="" \n'
1417  +              txt += 'fi \n'
1418  +              txt += 'if [ -z "$SE_PATH" ]; then\n'
1419  +              txt += ' SE_PATH="" \n'
1420  +              txt += 'fi \n'
1421  +              txt += 'echo "SE = $SE"\n'
1422  +              txt += 'echo "SE_PATH = $SE_PATH"\n'
1423  +
1424  +              #if (publish_data == 1):
1425  +              #processedDataset = self.cfg_params['USER.processed_datasetname']
1426  +              processedDataset = self.cfg_params['USER.publish_data_name']
1427  +              txt += 'ProcessedDataset='+processedDataset+'\n'
1428  +              #### LFN=/store/user/<user>/processedDataset_PSETHASH
1429  +              txt += 'if [ "$SE_PATH" == "" ]; then\n'
1430  +              #### FEDE: added slash in LFN ##############
1431  +              txt += ' FOR_LFN=/copy_problems/ \n'
1432  +              txt += 'else \n'
1433  +              txt += ' tmp=`echo $SE_PATH | awk -F \'store\' \'{print$2}\'` \n'
1434  +              ##### FEDE TO BE CHANGED, BECAUSE STORE IS HARDCODED!!!! ########
1435  +              txt += ' FOR_LFN=/store$tmp \n'
1436  +              txt += 'fi \n'
1437  +              txt += 'echo "ProcessedDataset = $ProcessedDataset"\n'
1438  +              txt += 'echo "FOR_LFN = $FOR_LFN" \n'
1439  +              txt += 'echo "CMSSW_VERSION = $CMSSW_VERSION"\n\n'
1440  +              #txt += 'echo "$RUNTIME_AREA/'+self.version+'/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH"\n'
1441  +              txt += 'echo "$SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH"\n'
1442  +              txt += '$SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH\n'
1443  +              #txt += '$RUNTIME_AREA/'+self.version+'/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH\n'
1444  +
1445  +              txt += 'modifyReport_result=$?\n'
1446  +              txt += 'echo modifyReport_result = $modifyReport_result\n'
1447  +              txt += 'if [ $modifyReport_result -ne 0 ]; then\n'
1448  +              txt += ' exit_status=1\n'
1449  +              txt += ' echo "ERROR: Problem with ModifyJobReport"\n'
1450  +              txt += 'else\n'
1451  +              txt += ' mv NewFrameworkJobReport.xml crab_fjr_$NJob.xml\n'
1452  +              txt += 'fi\n'
1453  +          else:
1454  +              txt += 'echo "no data publication required"\n'
1455  +              #txt += 'ProcessedDataset=no_data_to_publish \n'
1456  +              #### FEDE: added slash in LFN ##############
1457  +              #txt += 'FOR_LFN=/local/ \n'
1458  +              #txt += 'echo "ProcessedDataset = $ProcessedDataset"\n'
1459  +              #txt += 'echo "FOR_LFN = $FOR_LFN" \n'
1460  +          return txt
1461  +
1462  +      def cleanEnv(self):
1463  +          ### OLI_DANIELE
1464  +          txt = ''
1465  +          txt += 'if [ $middleware == OSG ]; then\n'
1466  +          txt += ' cd $RUNTIME_AREA\n'
1467  +          txt += ' echo "Remove working directory: $WORKING_DIR"\n'
1468  +          txt += ' /bin/rm -rf $WORKING_DIR\n'
1469  +          txt += ' if [ -d $WORKING_DIR ] ;then\n'
1470  +          txt += ' echo "SET_EXE 60999 ==> OSG $WORKING_DIR could not be deleted on WN `hostname` after cleanup of WN"\n'
1471  +          txt += ' echo "JOB_EXIT_STATUS = 60999"\n'
1472  +          txt += ' echo "JobExitCode=60999" | tee -a $RUNTIME_AREA/$repo\n'
1473  +          txt += ' dumpStatus $RUNTIME_AREA/$repo\n'
1474  +          txt += ' rm -f $RUNTIME_AREA/$repo \n'
1475  +          txt += ' echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
1476  +          txt += ' echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
1477  +          txt += ' fi\n'
1478  +          txt += 'fi\n'
1479  +          txt += '\n'
1480  +          return txt
1481  +
1482         def setParam_(self, param, value):
1483             self._params[param] = value
1484
1491         def getTaskid(self):
1492             return self._taskId
1493
1224  -      #######################################################################
1494         def uniquelist(self, old):
1495             """
1496             remove duplicates from a list
1499             for e in old:
1500                 nd[e]=0
1501             return nd.keys()
1502  +
1503  +
1504  +      def checkOut(self, limit):
1505  +          """
1506  +          check the dimension of the output files
1507  +          """
1508  +          txt = 'echo "*****************************************"\n'
1509  +          txt += 'echo "** Starting output sandbox limit check **"\n'
1510  +          txt += 'echo "*****************************************"\n'
1511  +          allOutFiles = ""
1512  +          listOutFiles = []
1513  +          for fileOut in (self.output_file+self.output_file_sandbox):
1514  +              if fileOut.find('crab_fjr') == -1:
1515  +                  allOutFiles = allOutFiles + " " + self.numberFile_(fileOut, '$NJob')
1516  +                  listOutFiles.append(self.numberFile_(fileOut, '$NJob'))
1517  +          txt += 'echo "OUTPUT files: '+str(allOutFiles)+'";\n'
1518  +          txt += 'ls -gGhrta;\n'
1519  +          txt += 'sum=0;\n'
1520  +          txt += 'for file in '+str(allOutFiles)+' ; do\n'
1521  +          txt += ' if [ -e $file ]; then\n'
1522  +          txt += ' tt=`ls -gGrta $file | awk \'{ print $3 }\'`\n'
1523  +          txt += ' sum=`expr $sum + $tt`\n'
1524  +          txt += ' else\n'
1525  +          txt += ' echo "WARNING: output file $file not found!"\n'
1526  +          txt += ' fi\n'
1527  +          txt += 'done\n'
1528  +          txt += 'echo "Total Output dimension: $sum";\n'
1529  +          txt += 'limit='+str(limit)+';\n'
1530  +          txt += 'echo "OUTPUT FILES LIMIT SET TO: $limit";\n'
1531  +          txt += 'if [ $limit -lt $sum ]; then\n'
1532  +          txt += ' echo "WARNING: output files are too big - something will be lost;"\n'
1533  +          txt += ' echo " checking the output file sizes..."\n'
1534  +          """
1535  +          txt += ' dim=0;\n'
1536  +          txt += ' exclude=0;\n'
1537  +          txt += ' for files in '+str(allOutFiles)+' ; do\n'
1538  +          txt += ' sumTemp=0;\n'
1539  +          txt += ' for file2 in '+str(allOutFiles)+' ; do\n'
1540  +          txt += ' if [ $file != $file2 ]; then\n'
1541  +          txt += ' tt=`ls -gGrta $file2 | awk \'{ print $3 }\';`\n'
1542  +          txt += ' sumTemp=`expr $sumTemp + $tt`;\n'
1543  +          txt += ' fi\n'
1544  +          txt += ' done\n'
1545  +          txt += ' if [ $sumTemp -lt $limit ]; then\n'
1546  +          txt += ' if [ $dim -lt $sumTemp ]; then\n'
1547  +          txt += ' dim=$sumTemp;\n'
1548  +          txt += ' exclude=$file;\n'
1549  +          txt += ' fi\n'
1550  +          txt += ' fi\n'
1551  +          txt += ' done\n'
1552  +          txt += ' echo "Dimension calculated: $dim"; echo "File to exclude: $exclude";\n'
1553  +          """
1554  +          txt += ' tot=0;\n'
1555  +          txt += ' for file2 in '+str(allOutFiles)+' ; do\n'
1556  +          txt += ' tt=`ls -gGrta $file2 | awk \'{ print $3 }\';`\n'
1557  +          txt += ' tot=`expr $tot + $tt`;\n'
1558  +          txt += ' if [ $limit -lt $tot ]; then\n'
1559  +          txt += ' tot=`expr $tot - $tt`;\n'
1560  +          txt += ' fileLast=$file;\n'
1561  +          txt += ' break;\n'
1562  +          txt += ' fi\n'
1563  +          txt += ' done\n'
1564  +          txt += ' echo "Dimension calculated: $tot"; echo "First file to exclude: $file";\n'
1565  +          txt += ' flag=0;\n'
1566  +          txt += ' for filess in '+str(allOutFiles)+' ; do\n'
1567  +          txt += ' if [ $fileLast = $filess ]; then\n'
1568  +          txt += ' flag=1;\n'
1569  +          txt += ' fi\n'
1570  +          txt += ' if [ $flag -eq 1 ]; then\n'
1571  +          txt += ' rm -f $filess;\n'
1572  +          txt += ' fi\n'
1573  +          txt += ' done\n'
1574  +          txt += ' ls -agGhrt;\n'
1575  +          txt += ' echo "WARNING: output files are too big: they cannot be put in the output_sandbox.";\n'
1576  +          txt += ' echo "JOB_EXIT_STATUS = 70000";\n'
1577  +          txt += ' exit_status=70000;\n'
1578  +          txt += 'else\n'
1579  +          txt += ' echo "Total Output dimension $sum is fine.";\n'
1580  +          txt += 'fi\n'
1581  +          txt += 'echo "*****************************************"\n'
1582  +          txt += 'echo "*** Ending output sandbox limit check ***"\n'
1583  +          txt += 'echo "*****************************************"\n'
1584  +          return txt
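The shell emitted by checkOut() accumulates file sizes and deletes everything from the first file that pushes the running total over the limit; the same policy in plain Python, as an illustrative sketch only:

def files_to_drop(sizes, limit):
    # sizes: ordered list of (filename, bytes)
    total, kept = 0, 0
    for name, size in sizes:
        if total + size > limit:
            return [n for n, _ in sizes[kept:]]
        total += size
        kept += 1
    return []

assert files_to_drop([("a.root", 40), ("b.root", 50), ("c.root", 30)], 100) == ["c.root"]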