[ViewVC] Diff of: cvsroot/COMP/CRAB/python/cms_cmssw.py

Comparing COMP/CRAB/python/cms_cmssw.py (file contents):
Revision 1.139 by ewv, Tue Nov 20 17:06:50 2007 UTC vs.
Revision 1.157 by spiga, Sun Feb 17 20:13:00 2008 UTC

#	Line 13 \| Line 13 \| class Cmssw(JobType):
13		JobType.__init__(self, 'CMSSW')
14		common.logger.debug(3,'CMSSW::__init__')
15
16	+	self.argsList = []
17	+
18		self._params = {}
19		self.cfg_params = cfg_params
18	–
20		# init BlackWhiteListParser
21		self.blackWhiteListParser = BlackWhiteListParser(cfg_params)
22
23	<	try:
23	<	self.MaxTarBallSize = float(self.cfg_params['EDG.maxtarballsize'])
24	<	except KeyError:
25	<	self.MaxTarBallSize = 9.5
23	>	self.MaxTarBallSize = float(self.cfg_params.get('EDG.maxtarballsize',9.5))
24
25		# number of jobs requested to be created, limit obj splitting
26		self.ncjobs = ncjobs
#	Line 63 \| Line 61 \| class Cmssw(JobType):
61
62		### collect Data cards
63
64	<	try:
67	<	tmp = cfg_params['CMSSW.datasetpath']
68	<	log.debug(6, "CMSSW::CMSSW(): datasetPath = "+tmp)
69	<	if string.lower(tmp)=='none':
70	<	self.datasetPath = None
71	<	self.selectNoInput = 1
72	<	else:
73	<	self.datasetPath = tmp
74	<	self.selectNoInput = 0
75	<	except KeyError:
64	>	if not cfg_params.has_key('CMSSW.datasetpath'):
65		msg = "Error: datasetpath not defined "
66		raise CrabException(msg)
67	+	tmp = cfg_params['CMSSW.datasetpath']
68	+	log.debug(6, "CMSSW::CMSSW(): datasetPath = "+tmp)
69	+	if string.lower(tmp)=='none':
70	+	self.datasetPath = None
71	+	self.selectNoInput = 1
72	+	else:
73	+	self.datasetPath = tmp
74	+	self.selectNoInput = 0
75
76		# ML monitoring
77		# split dataset path style: /PreProdR3Minbias/SIM/GEN-SIM
#	Line 82 \| Line 79 \| class Cmssw(JobType):
79		self.setParam_('dataset', 'None')
80		self.setParam_('owner', 'None')
81		else:
82	+	## SL what is supposed to fail here?
83		try:
84		datasetpath_split = self.datasetPath.split("/")
85		# standard style
#	Line 92 \| Line 90 \| class Cmssw(JobType):
90		self.setParam_('dataset', self.datasetPath)
91		self.setParam_('owner', self.datasetPath)
92
93	<	self.setTaskid_()
96	<	self.setParam_('taskId', self.cfg_params['taskId'])
93	>	self.setParam_('taskId', common.taskDB.dict('taskId'))
94
95		self.dataTiers = []
96
97		## now the application
98	<	try:
99	<	self.executable = cfg_params['CMSSW.executable']
100	<	self.setParam_('exe', self.executable)
104	<	log.debug(6, "CMSSW::CMSSW(): executable = "+self.executable)
105	<	msg = "Default executable cmsRun overridden. Switch to " + self.executable
106	<	log.debug(3,msg)
107	<	except KeyError:
108	<	self.executable = 'cmsRun'
109	<	self.setParam_('exe', self.executable)
110	<	msg = "User executable not defined. Use cmsRun"
111	<	log.debug(3,msg)
112	<	pass
98	>	self.executable = cfg_params.get('CMSSW.executable','cmsRun')
99	>	self.setParam_('exe', self.executable)
100	>	log.debug(6, "CMSSW::CMSSW(): executable = "+self.executable)
101
102	<	try:
115	<	self.pset = cfg_params['CMSSW.pset']
116	<	log.debug(6, "Cmssw::Cmssw(): PSet file = "+self.pset)
117	<	if self.pset.lower() != 'none' :
118	<	if (not os.path.exists(self.pset)):
119	<	raise CrabException("User defined PSet file "+self.pset+" does not exist")
120	<	else:
121	<	self.pset = None
122	<	except KeyError:
102	>	if not cfg_params.has_key('CMSSW.pset'):
103		raise CrabException("PSet file missing. Cannot run cmsRun ")
104	+	self.pset = cfg_params['CMSSW.pset']
105	+	log.debug(6, "Cmssw::Cmssw(): PSet file = "+self.pset)
106	+	if self.pset.lower() != 'none' :
107	+	if (not os.path.exists(self.pset)):
108	+	raise CrabException("User defined PSet file "+self.pset+" does not exist")
109	+	else:
110	+	self.pset = None
111
112		# output files
113		## stuff which must be returned always via sandbox
#	Line 130 \| Line 117 \| class Cmssw(JobType):
117		self.output_file_sandbox.append(self.fjrFileName)
118
119		# other output files to be returned via sandbox or copied to SE
120	<	try:
121	<	self.output_file = []
122	<	tmp = cfg_params['CMSSW.output_file']
123	<	if tmp != '':
124	<	tmpOutFiles = string.split(cfg_params['CMSSW.output_file'],',')
125	<	log.debug(7, 'cmssw::cmssw(): output files '+str(tmpOutFiles))
126	<	for tmp in tmpOutFiles:
127	<	tmp=string.strip(tmp)
141	<	self.output_file.append(tmp)
142	<	pass
143	<	else:
144	<	log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available\n")
120	>	self.output_file = []
121	>	tmp = cfg_params.get('CMSSW.output_file',None)
122	>	if tmp :
123	>	tmpOutFiles = string.split(tmp,',')
124	>	log.debug(7, 'cmssw::cmssw(): output files '+str(tmpOutFiles))
125	>	for tmp in tmpOutFiles:
126	>	tmp=string.strip(tmp)
127	>	self.output_file.append(tmp)
128		pass
129	<	pass
147	<	except KeyError:
129	>	else:
130		log.message("No output file defined: only stdout/err and the CRAB Framework Job Report will be available\n")
131	<	pass
131	>	pass
132
133		# script_exe file as additional file in inputSandbox
134	<	try:
135	<	self.scriptExe = cfg_params['USER.script_exe']
136	<	if self.scriptExe != '':
137	<	if not os.path.isfile(self.scriptExe):
138	<	msg ="ERROR. file "+self.scriptExe+" not found"
139	<	raise CrabException(msg)
158	<	self.additional_inbox_files.append(string.strip(self.scriptExe))
159	<	except KeyError:
160	<	self.scriptExe = ''
134	>	self.scriptExe = cfg_params.get('USER.script_exe',None)
135	>	if self.scriptExe :
136	>	if not os.path.isfile(self.scriptExe):
137	>	msg ="ERROR. file "+self.scriptExe+" not found"
138	>	raise CrabException(msg)
139	>	self.additional_inbox_files.append(string.strip(self.scriptExe))
140
141		#CarlosDaniele
142		if self.datasetPath == None and self.pset == None and self.scriptExe == '' :
#	Line 165 \| Line 144 \| class Cmssw(JobType):
144		raise CrabException(msg)
145
146		## additional input files
147	<	try:
147	>	if cfg_params.has_key('USER.additional_input_files'):
148		tmpAddFiles = string.split(cfg_params['USER.additional_input_files'],',')
149		for tmp in tmpAddFiles:
150		tmp = string.strip(tmp)
#	Line 189 \| Line 168 \| class Cmssw(JobType):
168		pass
169		pass
170		common.logger.debug(5,"Additional input files: "+str(self.additional_inbox_files))
171	<	except KeyError:
193	<	pass
194	<
195	<	# files per job
196	<	try:
197	<	if (cfg_params['CMSSW.files_per_jobs']):
198	<	raise CrabException("files_per_jobs no longer supported. Quitting.")
199	<	except KeyError:
200	<	pass
171	>	pass
172
173		## Events per job
174	<	try:
174	>	if cfg_params.has_key('CMSSW.events_per_job'):
175		self.eventsPerJob =int( cfg_params['CMSSW.events_per_job'])
176		self.selectEventsPerJob = 1
177	<	except KeyError:
177	>	else:
178		self.eventsPerJob = -1
179		self.selectEventsPerJob = 0
180
181		## number of jobs
182	<	try:
182	>	if cfg_params.has_key('CMSSW.number_of_jobs'):
183		self.theNumberOfJobs =int( cfg_params['CMSSW.number_of_jobs'])
184		self.selectNumberOfJobs = 1
185	<	except KeyError:
185	>	else:
186		self.theNumberOfJobs = 0
187		self.selectNumberOfJobs = 0
188
189	<	try:
189	>	if cfg_params.has_key('CMSSW.total_number_of_events'):
190		self.total_number_of_events = int(cfg_params['CMSSW.total_number_of_events'])
191		self.selectTotalNumberEvents = 1
192	<	except KeyError:
192	>	else:
193		self.total_number_of_events = 0
194		self.selectTotalNumberEvents = 0
195
#	Line 232 \| Line 203 \| class Cmssw(JobType):
203		raise CrabException(msg)
204
205		## source seed for pythia
206	<	try:
236	<	self.sourceSeed = int(cfg_params['CMSSW.pythia_seed'])
237	<	except KeyError:
238	<	self.sourceSeed = None
239	<	common.logger.debug(5,"No seed given")
206	>	self.sourceSeed = cfg_params.get('CMSSW.pythia_seed',None)
207
208	<	try:
242	<	self.sourceSeedVtx = int(cfg_params['CMSSW.vtx_seed'])
243	<	except KeyError:
244	<	self.sourceSeedVtx = None
245	<	common.logger.debug(5,"No vertex seed given")
208	>	self.sourceSeedVtx = cfg_params.get('CMSSW.vtx_seed',None)
209
210	<	try:
248	<	self.sourceSeedG4 = int(cfg_params['CMSSW.g4_seed'])
249	<	except KeyError:
250	<	self.sourceSeedG4 = None
251	<	common.logger.debug(5,"No g4 sim hits seed given")
210	>	self.sourceSeedG4 = cfg_params.get('CMSSW.g4_seed',None)
211
212	<	try:
213	<	self.sourceSeedMix = int(cfg_params['CMSSW.mix_seed'])
214	<	except KeyError:
256	<	self.sourceSeedMix = None
257	<	common.logger.debug(5,"No mix seed given")
212	>	self.sourceSeedMix = cfg_params.get('CMSSW.mix_seed',None)
213	>
214	>	self.firstRun = cfg_params.get('CMSSW.first_run',None)
215
259	–	try:
260	–	self.firstRun = int(cfg_params['CMSSW.first_run'])
261	–	except KeyError:
262	–	self.firstRun = None
263	–	common.logger.debug(5,"No first run given")
216		if self.pset != None: #CarlosDaniele
217		import PsetManipulator as pp
218		PsetEdit = pp.PsetManipulator(self.pset) #Daniele Pset
219
220	+	# Copy/return
221	+
222	+	self.copy_data = int(cfg_params.get('USER.copy_data',0))
223	+	self.return_data = int(cfg_params.get('USER.return_data',0))
224	+
225		#DBSDLS-start
226		## Initialize the variables that are extracted from DBS/DLS and needed in other places of the code
227		self.maxEvents=0 # max events available ( --> check the requested nb. of evts in Creator.py)
#	Line 326 \| Line 283 \| class Cmssw(JobType):
283		## Contact the DBS
284		common.logger.message("Contacting Data Discovery Services ...")
285		try:
329	–
286		self.pubdata=DataDiscovery.DataDiscovery(datasetPath, cfg_params)
287		self.pubdata.fetchDBSInfo()
288
#	Line 369 \| Line 325 \| class Cmssw(JobType):
325
326		return sites
327
328	+	def setArgsList(self, argsList):
329	+	self.argsList = argsList
330	+
331		def jobSplittingByBlocks(self, blockSites):
332		"""
333		Perform job splitting. Jobs run over an integer number of files
#	Line 581 \| Line 540 \| class Cmssw(JobType):
540		for range_jobs in noSiteBlock:
541		msg += str(range_jobs) + virgola
542		msg += '\n will not be submitted and this block of data can not be analyzed!\n'
543	+	if self.cfg_params.has_key('EDG.se_white_list'):
544	+	msg += 'WARNING: SE White List: '+self.cfg_params['EDG.se_white_list']+'\n'
545	+	msg += '(Hint: By whitelisting you force the job to run at this particular site(s).\n'
546	+	msg += 'Please check if the dataset is available at this site!)\n'
547	+	if self.cfg_params.has_key('EDG.ce_white_list'):
548	+	msg += 'WARNING: CE White List: '+self.cfg_params['EDG.ce_white_list']+'\n'
549	+	msg += '(Hint: By whitelisting you force the job to run at this particular site(s).\n'
550	+	msg += 'Please check if the dataset is available at this site!)\n'
551	+
552		common.logger.message(msg)
553
554		self.list_of_args = list_of_lists
#	Line 650 \| Line 618 \| class Cmssw(JobType):
618		self.list_of_args.append(args)
619		pass
620
653	–	# print self.list_of_args
654	–
621		return
622
623
#	Line 786 \| Line 752 \| class Cmssw(JobType):
752		common.logger.debug(5,"data "+root+"/data"+" to be tarred")
753		tar.add(root+"/data",root[swAreaLen:]+"/data")
754
755	<	## Add ProdAgent dir to tar
756	<	paDir = 'ProdAgentApi'
757	<	pa = os.environ['CRABDIR'] + '/' + 'ProdAgentApi'
758	<	if os.path.isdir(pa):
759	<	tar.add(pa,paDir)
755	>	### Removed ProdAgent Api dependencies ###
756	>	### Add ProdAgent dir to tar
757	>	#paDir = 'ProdAgentApi'
758	>	#pa = os.environ['CRABDIR'] + '/' + 'ProdAgentApi'
759	>	#if os.path.isdir(pa):
760	>	# tar.add(pa,paDir)
761
762	<	### FEDE FOR DBS PUBLICATION
796	<	## Add PRODCOMMON dir to tar
762	>	## Add ProdCommon dir to tar
763		prodcommonDir = 'ProdCommon'
764		prodcommonPath = os.environ['CRABDIR'] + '/' + 'ProdCommon'
765		if os.path.isdir(prodcommonPath):
766		tar.add(prodcommonPath,prodcommonDir)
801	–	#############################
767
768		common.logger.debug(5,"Files added to "+self.tgzNameWithPath+" : "+str(tar.getnames()))
769		tar.close()
#	Line 898 \| Line 863 \| class Cmssw(JobType):
863		txt += 'echo ">>> current directory (SOFTWARE_DIR): $SOFTWARE_DIR" \n'
864		###############################################
865		### needed grep for bug in scramv1 ###
901	–	txt += scram+' runtime -sh\n'
866		txt += 'eval `'+scram+' runtime -sh \| grep -v SCRAMRT_LSB_JOBNAME`\n'
903	–	txt += 'echo $PATH\n'
904	–
867		# Handle the arguments:
868		txt += "\n"
869		txt += "## number of arguments (first argument always jobnumber)\n"
870		txt += "\n"
871	<	txt += "if [ $nargs -lt 2 ]\n"
871	>	txt += "if [ $nargs -lt "+str(len(self.argsList[nj].split()))+" ]\n"
872		txt += "then\n"
873		txt += " echo 'SET_EXE_ENV 1 ==> ERROR Too few arguments' +$nargs+ \n"
874		txt += ' echo "JOB_EXIT_STATUS = 50113"\n'
#	Line 1045 \| Line 1007 \| class Cmssw(JobType):
1007		txt += ' echo "Successful untar" \n'
1008		txt += 'fi \n'
1009		txt += '\n'
1010	<	txt += 'echo ">>> Include ProdAgentApi and PRODCOMMON in PYTHONPATH:"\n'
1010	>	#### Removed ProdAgent API dependencies
1011	>	txt += 'echo ">>> Include ProdCommon in PYTHONPATH:"\n'
1012		txt += 'if [ -z "$PYTHONPATH" ]; then\n'
1013		#### FEDE FOR DBS OUTPUT PUBLICATION
1014	<	txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdAgentApi:$SOFTWARE_DIR/ProdCommon\n'
1014	>	txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdCommon\n'
1015		txt += 'else\n'
1016	<	txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdAgentApi:$SOFTWARE_DIR/ProdCommon:${PYTHONPATH}\n'
1016	>	txt += ' export PYTHONPATH=$SOFTWARE_DIR/ProdCommon:${PYTHONPATH}\n'
1017		txt += 'echo "PYTHONPATH=$PYTHONPATH"\n'
1018		###################
1019		txt += 'fi\n'
#	Line 1135 \| Line 1098 \| class Cmssw(JobType):
1098		"""
1099
1100		txt = '\n'
1101	<	txt += 'echo" >>> directory content:"\n'
1101	>	txt += 'echo ">>> current directory (SOFTWARE_DIR): $SOFTWARE_DIR" \n'
1102	>	txt += 'echo ">>> current directory content:"\n'
1103		txt += 'ls \n'
1104	<	txt = '\n'
1104	>	txt += '\n'
1105
1106		txt += 'output_exit_status=0\n'
1107
#	Line 1146 \| Line 1110 \| class Cmssw(JobType):
1110		txt += '\n'
1111		txt += '# check output file\n'
1112		txt += 'if [ -e ./'+fileWithSuffix+' ] ; then\n'
1113	<	txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA\n'
1114	<	txt += ' cp $RUNTIME_AREA/'+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1113	>	txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1114	>	txt += ' ln -s $RUNTIME_AREA/'+output_file_num+' $RUNTIME_AREA/'+fileWithSuffix+'\n'
1115		txt += 'else\n'
1116		txt += ' exit_status=60302\n'
1117	<	txt += ' echo "ERROR: Problem with output file '+fileWithSuffix+'"\n'
1118	<	if common.scheduler.boss_scheduler_name == 'condor_g':
1117	>	txt += ' echo "ERROR: Output file '+fileWithSuffix+' not found"\n'
1118	>	if common.scheduler.name().upper() == 'CONDOR_G':
1119		txt += ' if [ $middleware == OSG ]; then \n'
1120		txt += ' echo "prepare dummy output file"\n'
1121		txt += ' echo "Processing of job output failed" > $RUNTIME_AREA/'+output_file_num+'\n'
#	Line 1163 \| Line 1127 \| class Cmssw(JobType):
1127		txt += '\n'
1128		txt += '# check output file\n'
1129		txt += 'if [ -e ./'+fileWithSuffix+' ] ; then\n'
1130	<	txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA\n'
1131	<	txt += ' cp $RUNTIME_AREA/'+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1130	>	if (self.copy_data == 1): # For OSG nodes, file is in $WORKING_DIR, should not be moved to $RUNTIME_AREA
1131	>	txt += ' mv '+fileWithSuffix+' '+output_file_num+'\n'
1132	>	txt += ' ln -s `pwd`/'+output_file_num+' $RUNTIME_AREA/'+fileWithSuffix+'\n'
1133	>	else:
1134	>	txt += ' mv '+fileWithSuffix+' $RUNTIME_AREA/'+output_file_num+'\n'
1135	>	txt += ' ln -s $RUNTIME_AREA/'+output_file_num+' $RUNTIME_AREA/'+fileWithSuffix+'\n'
1136		txt += 'else\n'
1137		txt += ' exit_status=60302\n'
1138	<	txt += ' echo "ERROR: Problem with output file '+fileWithSuffix+'"\n'
1138	>	txt += ' echo "ERROR: Output file '+fileWithSuffix+' not found"\n'
1139		txt += ' echo "JOB_EXIT_STATUS = $exit_status"\n'
1140		txt += ' output_exit_status=$exit_status\n'
1141	<	if common.scheduler.boss_scheduler_name == 'condor_g':
1141	>	if common.scheduler.name().upper() == 'CONDOR_G':
1142		txt += ' if [ $middleware == OSG ]; then \n'
1143		txt += ' echo "prepare dummy output file"\n'
1144		txt += ' echo "Processing of job output failed" > $RUNTIME_AREA/'+output_file_num+'\n'
#	Line 1181 \| Line 1149 \| class Cmssw(JobType):
1149		file_list.append(self.numberFile_(fileWithSuffix, '$NJob'))
1150
1151		txt += 'file_list="'+string.join(file_list,' ')+'"\n'
1152	+	txt += '\n'
1153	+	txt += 'echo ">>> current directory (SOFTWARE_DIR): $SOFTWARE_DIR" \n'
1154	+	txt += 'echo ">>> current directory content:"\n'
1155	+	txt += 'ls \n'
1156	+	txt += '\n'
1157		txt += 'cd $RUNTIME_AREA\n'
1158		txt += 'echo ">>> current directory (RUNTIME_AREA): $RUNTIME_AREA"\n'
1159		return txt
#	Line 1318 \| Line 1291 \| class Cmssw(JobType):
1291		if (publish_data == 1):
1292		txt += 'echo ">>> Modify Job Report:" \n'
1293		################ FEDE FOR DBS2 #############################################
1294	<	txt += 'chmod a+x $SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py\n'
1294	>	#txt += 'chmod a+x $SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py\n'
1295	>	txt += 'chmod a+x $SOFTWARE_DIR/ProdCommon/ProdCommon/FwkJobRep/ModifyJobReport.py\n'
1296		#############################################################################
1297
1298		txt += 'if [ -z "$SE" ]; then\n'
#	Line 1344 \| Line 1318 \| class Cmssw(JobType):
1318		txt += 'echo "ProcessedDataset = $ProcessedDataset"\n'
1319		txt += 'echo "FOR_LFN = $FOR_LFN" \n'
1320		txt += 'echo "CMSSW_VERSION = $CMSSW_VERSION"\n\n'
1321	<	#txt += 'echo "$RUNTIME_AREA/'+self.version+'/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH"\n'
1322	<	txt += 'echo "$SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH"\n'
1349	<	txt += '$SOFTWARE_DIR/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH\n'
1350	<	#txt += '$RUNTIME_AREA/'+self.version+'/ProdAgentApi/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH\n'
1321	>	txt += 'echo "$SOFTWARE_DIR/ProdCommon/ProdCommon/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH"\n'
1322	>	txt += '$SOFTWARE_DIR/ProdCommon/ProdCommon/FwkJobRep/ModifyJobReport.py crab_fjr_$NJob.xml $NJob $FOR_LFN $PrimaryDataset $DataTier $ProcessedDataset $ApplicationFamily $executable $CMSSW_VERSION $PSETHASH $SE $SE_PATH\n'
1323
1324		txt += 'modifyReport_result=$?\n'
1325		txt += 'echo modifyReport_result = $modifyReport_result\n'
#	Line 1384 \| Line 1356 \| class Cmssw(JobType):
1356		def getParams(self):
1357		return self._params
1358
1387	–	def setTaskid_(self):
1388	–	self._taskId = self.cfg_params['taskId']
1389	–
1390	–	def getTaskid(self):
1391	–	return self._taskId
1392	–
1359		def uniquelist(self, old):
1360		"""
1361		remove duplicates from a list
#	Line 1404 \| Line 1370 \| class Cmssw(JobType):
1370		"""
1371		check the dimension of the output files
1372		"""
1373	<	txt += 'echo ">>> Starting output sandbox limit check :"\n'
1408	<	allOutFiles = ""
1373	>	txt = 'echo ">>> Starting output sandbox limit check :"\n'
1374		listOutFiles = []
1375	<	for fileOut in (self.output_file+self.output_file_sandbox):
1376	<	if fileOut.find('crab_fjr') == -1:
1377	<	allOutFiles = allOutFiles + " " + self.numberFile_(fileOut, '$NJob')
1378	<	listOutFiles.append(self.numberFile_(fileOut, '$NJob'))
1379	<	txt += 'echo "OUTPUT files: '+str(allOutFiles)+'";\n'
1375	>	txt += 'stdoutFile=`ls *stdout` \n'
1376	>	txt += 'stderrFile=`ls *stderr` \n'
1377	>	if (self.return_data == 1):
1378	>	for file in (self.output_file+self.output_file_sandbox):
1379	>	listOutFiles.append(self.numberFile_(file, '$NJob'))
1380	>	listOutFiles.append('$stdoutFile')
1381	>	listOutFiles.append('$stderrFile')
1382	>	else:
1383	>	for file in (self.output_file_sandbox):
1384	>	listOutFiles.append(self.numberFile_(file, '$NJob'))
1385	>	listOutFiles.append('$stdoutFile')
1386	>	listOutFiles.append('$stderrFile')
1387	>
1388	>	txt += 'echo "OUTPUT files: '+string.join(listOutFiles,' ')+'"\n'
1389	>	txt += 'filesToCheck="'+string.join(listOutFiles,' ')+'"\n'
1390	>	# txt += 'echo "OUTPUT files: '+str(allOutFiles)+'";\n'
1391		txt += 'ls -gGhrta;\n'
1392		txt += 'sum=0;\n'
1393	<	txt += 'for file in '+str(allOutFiles)+' ; do\n'
1393	>	txt += 'for file in $filesToCheck ; do\n'
1394		txt += ' if [ -e $file ]; then\n'
1395		txt += ' tt=`ls -gGrta $file \| awk \'{ print $3 }\'`\n'
1396		txt += ' sum=`expr $sum + $tt`\n'
#	Line 1428 \| Line 1404 \| class Cmssw(JobType):
1404		txt += 'if [ $limit -lt $sum ]; then\n'
1405		txt += ' echo "WARNING: output files have to big size - something will be lost;"\n'
1406		txt += ' echo " checking the output file sizes..."\n'
1431	–	"""
1432	–	txt += ' dim=0;\n'
1433	–	txt += ' exclude=0;\n'
1434	–	txt += ' for files in '+str(allOutFiles)+' ; do\n'
1435	–	txt += ' sumTemp=0;\n'
1436	–	txt += ' for file2 in '+str(allOutFiles)+' ; do\n'
1437	–	txt += ' if [ $file != $file2 ]; then\n'
1438	–	txt += ' tt=`ls -gGrta $file2 \| awk \'{ print $3 }\';`\n'
1439	–	txt += ' sumTemp=`expr $sumTemp + $tt`;\n'
1440	–	txt += ' fi\n'
1441	–	txt += ' done\n'
1442	–	txt += ' if [ $sumTemp -lt $limit ]; then\n'
1443	–	txt += ' if [ $dim -lt $sumTemp ]; then\n'
1444	–	txt += ' dim=$sumTemp;\n'
1445	–	txt += ' exclude=$file;\n'
1446	–	txt += ' fi\n'
1447	–	txt += ' fi\n'
1448	–	txt += ' done\n'
1449	–	txt += ' echo "Dimension calculated: $dim"; echo "File to exclude: $exclude";\n'
1450	–	"""
1407		txt += ' tot=0;\n'
1408	<	txt += ' for file2 in '+str(allOutFiles)+' ; do\n'
1409	<	txt += ' tt=`ls -gGrta $file2 \| awk \'{ print $3 }\';`\n'
1408	>	txt += ' for filefile in $filesToCheck ; do\n'
1409	>	txt += ' dimFile=`ls -gGrta $filefile \| awk \'{ print $3 }\';`\n'
1410		txt += ' tot=`expr $tot + $tt`;\n'
1411	<	txt += ' if [ $limit -lt $tot ]; then\n'
1412	<	txt += ' tot=`expr $tot - $tt`;\n'
1413	<	txt += ' fileLast=$file;\n'
1414	<	txt += ' break;\n'
1415	<	txt += ' fi\n'
1416	<	txt += ' done\n'
1417	<	txt += ' echo "Dimension calculated: $tot"; echo "First file to exclude: $file";\n'
1418	<	txt += ' flag=0;\n'
1463	<	txt += ' for filess in '+str(allOutFiles)+' ; do\n'
1464	<	txt += ' if [ $fileLast = $filess ]; then\n'
1465	<	txt += ' flag=1;\n'
1466	<	txt += ' fi\n'
1467	<	txt += ' if [ $flag -eq 1 ]; then\n'
1468	<	txt += ' rm -f $filess;\n'
1411	>	txt += ' if [ $limit -lt $dimFile ]; then\n'
1412	>	txt += ' echo "deleting file: $filefile";\n'
1413	>	txt += ' rm -f $filefile\n'
1414	>	txt += ' elif [ $limit -lt $tot ]; then\n'
1415	>	txt += ' echo "deleting file: $filefile";\n'
1416	>	txt += ' rm -f $filefile\n'
1417	>	txt += ' else\n'
1418	>	txt += ' echo "saving file: $filefile"\n'
1419		txt += ' fi\n'
1420		txt += ' done\n'
1421	+
1422		txt += ' ls -agGhrt;\n'
1423		txt += ' echo "WARNING: output files are too big in dimension: can not put in the output_sandbox.";\n'
1424		txt += ' echo "JOB_EXIT_STATUS = 70000";\n'

Diff Legend

– Removed lines
+ Added lines
< Changed lines (old revision)
> Changed lines (new revision)

Comparing COMP/CRAB/python/cms_cmssw.py (file contents): Revision 1.139 by ewv, Tue Nov 20 17:06:50 2007 UTC vs. Revision 1.157 by spiga, Sun Feb 17 20:13:00 2008 UTC

Diff Legend

Comparing COMP/CRAB/python/cms_cmssw.py (file contents):
Revision 1.139 by ewv, Tue Nov 20 17:06:50 2007 UTC vs.
Revision 1.157 by spiga, Sun Feb 17 20:13:00 2008 UTC