ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.37 by fanzago, Tue Mar 4 11:09:13 2008 UTC vs.
Revision 1.79 by farinafa, Wed Apr 21 08:50:52 2010 UTC

# Line 1 | Line 1
1 + """
2 + CRAB interface to BossLite gLite Scheduler
3 + """
4 +
5 + __revision__ = "$Id$"
6 + __version__ = "$Revision$"
7 +
8   from SchedulerGrid import SchedulerGrid
2 from crab_logger import Logger
9   from crab_exceptions import *
10   from crab_util import *
11 < from GliteConfig import *
11 > import EdgLoggingInfo
12   import common
13 + from WMCore.SiteScreening.BlackWhiteListParser import CEBlackWhiteListParser
14  
15   import os, sys, time
16  
# Line 11 | Line 18 | class SchedulerGlite(SchedulerGrid):
18      def __init__(self, name="GLITE"):
19          SchedulerGrid.__init__(self,name)
20  
21 +        self.OSBsize = 55000000
22 +
23      def configure(self,cfg_params):
24          SchedulerGrid.configure(self, cfg_params)
25 <        self.environment_unique_identifier = 'GLITE_WMS_JOBID'
25 >        self.environment_unique_identifier = '$GLITE_WMS_JOBID'
26 >
27 >    def realSchedParams(self,cfg_params):
28 >        """
29 >        Return dictionary with specific parameters, to use
30 >        with real scheduler
31 >        """
32 >        self.rb_param_file=''
33 >        if (not cfg_params.has_key('GRID.rb')):
34 >            cfg_params['GRID.rb']='CERN'
35 >        self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("GRID.rb"))
36 >        self.wms_service=cfg_params.get("GRID.wms_service",'')
37 >        self.skipWMSAuth=cfg_params.get("GRID.skipwmsauth",1)
38 >        params = { 'service' : self.wms_service, \
39 >                   'config' : self.rb_param_file, \
40 >                   'skipWMSAuth' : self.skipWMSAuth
41 >                 }
42 >        return  params
43 >
44  
45      def rb_configure(self, RB):
46 +        url ='http://cmsdoc.cern.ch/cms/LCG/crab/config/'
47 +        from Downloader import Downloader
48 +        import httplib
49 +        common.logger.debug('Downloading config files for WMS: '+url)
50 +        ## 25-Jun-2009 SL: patch to use Cream enabled WMS
51 +        if ( self.cfg_params.get('GRID.use_cream',None) ):
52 +            RB='CREAM'
53          if not RB: return None
20        glite_config = None
54          rb_param_file = None
55 +        configFileName = 'glite_wms_'+str(RB)+'.conf'
56  
57 <        gliteConfig = GliteConfig(RB)
58 <        glite_config = gliteConfig.config()
57 >        results = Downloader(url)
58 >        try:
59 >            gliteConfig  = results.filePath(configFileName)
60 >        except httplib.HTTPException, ex:
61 >            raise CrabException( "Problem getting RB config file: %s, reason:"%(configFileName, ex) )
62  
63 <        if (glite_config ):
64 <            rb_param_file = 'WMSconfig = '+glite_config+';\n'
63 >        if (gliteConfig ):
64 >            rb_param_file = gliteConfig
65          return rb_param_file
66  
67      def ce_list(self):
68          """
69 <        Returns string with requirement CE related    
69 >        Returns string with requirement CE related
70          """
71 <        req = ''  
71 >        ceParser = CEBlackWhiteListParser(self.EDG_ce_white_list,
72 >                                          self.EDG_ce_black_list, common.logger())
73 >        req = ''
74 >        ce_white_list = []
75 >        ce_black_list = []
76          if self.EDG_ce_white_list:
77 <            ce_white_list = self.EDG_ce_white_list
77 >            ce_white_list = ceParser.whiteList()
78              tmpCe=[]
79              concString = '&&'
80              for ce in ce_white_list:
# Line 52 | Line 93 | class SchedulerGlite(SchedulerGrid):
93                      req += ") "
94  
95          if self.EDG_ce_black_list:
96 <            ce_black_list = self.EDG_ce_black_list
96 >            ce_black_list = ceParser.blackList()
97              tmpCe=[]
98              concString = '&&'
99              for ce in ce_black_list:
# Line 60 | Line 101 | class SchedulerGlite(SchedulerGrid):
101              if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
102  
103          # requirement added to skip gliteCE
104 <        req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
104 >        # not more needed
105 > #       req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
106 >        retWL = ','.join(ce_white_list)
107 >        retBL = ','.join(ce_black_list)
108 >        if not retWL:
109 >            retWL = None
110 >        if not retBL:
111 >            retBL = None
112  
113 <        return req
113 >        return req, retWL, retBL
114  
115 <    def se_list(self, id):
115 >    def se_list(self, dest):
116 >        """
117 >        Returns string with requirement SE related
118          """
119 <        Returns string with requirement SE related    
70 <        """  
71 <        hostList=self.findSites_(id)
119 >        hostList=self.findSites_(dest)
120          req=''
121          reqtmp=[]
122          concString = '||'
# Line 82 | Line 130 | class SchedulerGlite(SchedulerGrid):
130  
131      def jdlParam(self):
132          """
133 <        Returns
134 <        """
133 >        Returns
134 >        """
135          req=''
136          if self.EDG_addJdlParam:
137 <            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
137 >            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
138              for p in self.EDG_addJdlParam:
139 <             #   param_file.write(string.strip(p)+';\n')
92 <                req+=string.strip(p)+';\n' ## BL--DS
139 >                req+=string.strip(p)+';\n'
140          return req
141  
142      def specific_req(self):
143          """
144          Returns string with specific requirements
145 <        """
145 >        """
146          req=''
147          if self.EDG_clock_time:
148              if (not req == ' '): req = req + ' && '
# Line 104 | Line 151 | class SchedulerGlite(SchedulerGrid):
151          if self.EDG_cpu_time:
152              if (not req == ' '): req = req + ' && '
153              req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
154 <        
154 >
155          return req
156  
157 <    def sched_parameter(self):
157 >    def sched_parameter(self,i,task):
158          """
159          Returns string with requirements and scheduler-specific parameters
160          """
161 <        index = int(common._db.nJobs()) - 1
115 <        job = common.job_list[index]
116 <        jbt = job.type()
117 <
118 <      ### To Be Removed BL--DS
119 <      #  lastDest=''
120 <      #  first = []
121 <      #  last  = []
122 <      #  for n in range(common.jobDB.nJobs()):
123 <      #      currDest=common.jobDB.destination(n)
124 <      #      if (currDest!=lastDest):
125 <      #          lastDest = currDest
126 <      #          first.append(n)
127 <      #          if n != 0:last.append(n-1)
128 <      #  if len(first)>len(last) :last.append(common.jobDB.nJobs())
161 >        dest=  task.jobs[i-1]['dlsDestination']
162  
163 <        req = ''
164 <        req = req + jbt.getRequirements()
163 >        req=''
164 >        req +=task['jobType']
165  
133        if self.EDG_requirements:
134            if (not req == ' '): req = req +  ' && '
135            req = req + self.EDG_requirements
166          sched_param=''
167 <        sched_param='""pippo""'
168 <
169 <        ### Temporary Problem with quote and py2sqlite.... under investigation..        
170 <        for i in range(index):
171 <           # sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(i) +\
172 <           #                                 self.ce_list() +';\n' ## BL--DS
173 <           # if self.EDG_addJdlParam: sched_param+=self.jdlParam() ## BL--DS
174 <           # if (self.rb_param_file): sched_param+=self.rb_param_file ## BL--DS
175 <           # print sched_param
176 <            run_jobReq={'schedulerAttributes':sched_param}## DS--BL
177 <            common._db.updateRunJob_(i,run_jobReq)        
178 <
179 <    def wsSetupEnvironment(self):
180 <        """
181 <        Returns part of a job script which does scheduler-specific work.
182 <        """
183 <        txt = ''
184 <        txt += '# strip arguments\n'
185 <        txt += 'echo "strip arguments"\n'
186 <        txt += 'args=("$@")\n'
187 <        txt += 'nargs=$#\n'
188 <        txt += 'shift $nargs\n'
189 <        txt += "# job number (first parameter for job wrapper)\n"
190 <        txt += "NJob=${args[0]}; export NJob\n"
191 <
192 <        txt += '# job identification to DashBoard \n'
193 <        #txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
194 <        #txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
195 <        #txt += 'MonitorID=`echo ' + self._taskId + '`\n'
196 <        txt += 'MonitorJobID=${NJob}_$GLITE_WMS_JOBID \n'
197 <        txt += 'SyncGridJobId=$GLITE_WMS_JOBID \n'
198 <        txt += 'MonitorID='+self._taskId+' \n'
199 <        txt += 'echo "MonitorJobID=$MonitorJobID" > $RUNTIME_AREA/$repo \n'
200 <        txt += 'echo "SyncGridJobId=$SyncGridJobId" >> $RUNTIME_AREA/$repo \n'
201 <        txt += 'echo "MonitorID=$MonitorID" >> $RUNTIME_AREA/$repo\n'
202 <        #txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
203 <        #txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
204 <        #txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
205 <
206 <        #txt += 'echo "middleware discovery: " \n'
207 <        txt += 'echo ">>> GridFlavour discovery: " \n'
208 <        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
209 <        txt += '    middleware=LCG\n'
210 <        #txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
211 <        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" >> $RUNTIME_AREA/$repo \n'
212 <        #txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
213 <        txt += '    echo "GridFlavour=$middleware" | tee -a $RUNTIME_AREA/$repo \n'
214 <        #txt += '    echo ">>> middleware =$middleware" \n'
215 <        txt += 'elif [ $OSG_APP ]; then \n'
216 <        txt += '    middleware=OSG \n'
217 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
218 <        txt += '        SyncCE="$OSG_JOB_CONTACT"; \n'
219 <        #txt += '        echo "SyncCE=$SyncCE" | tee -a $RUNTIME_AREA/$repo ;\n'
220 <        txt += '        echo "SyncCE=$SyncCE" >> $RUNTIME_AREA/$repo ;\n'
167 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(dest) +\
168 >                                        self.ce_list()[0] +';\n'
169 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam()
170 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
171 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
172 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
173 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
174 >
175 >        return sched_param
176 >
177 >    def decodeLogInfo(self, file):
178 >        """
179 >        Parse logging info file and return main info
180 >        """
181 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
182 >        reason = loggingInfo.decodeReason(file)
183 >        return reason
184 >
185 >    def findSites_(self, sites):
186 >        itr4 =[]
187 >        if len(sites)>0 and sites[0]=="":
188 >            return itr4
189 >        if sites != [""]:
190 >            replicas = self.blackWhiteListParser.checkBlackList(sites)
191 >            if len(replicas)!=0:
192 >                replicas = self.blackWhiteListParser.checkWhiteList(replicas)
193 >
194 >            itr4 = replicas
195 >        return itr4
196 >
197 >    def delegateProxy(self):
198 >        self.boss().delegateProxy()  
199 >        return
200 >
201 >    def wsExitFunc(self):
202 >        """
203 >        """
204 >        txt = '\n'
205 >
206 >        txt += '#\n'
207 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
208 >        txt += '#\n\n'
209 >
210 >        txt += 'func_exit() { \n'
211 >        txt += self.wsExitFunc_common()
212 >        ### specific Glite check for OSB
213 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
214 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
215 >        txt += '    rm ${out_files}.tgz\n'
216 >        txt += '    size=`expr $tmp_size`\n'
217 >        txt += '    echo "Total Output dimension: $size"\n'
218 >        txt += '    limit='+str(self.OSBsize) +' \n'
219 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
220 >        txt += '    if [ "$limit" -lt "$size" ]; then\n'
221 >        txt += '        exceed=1\n'
222 >        txt += '        job_exit_code=70000\n'
223 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
224 >        txt += '    else\n'
225 >        txt += '        exceed=0\n'
226 >        txt += '        echo "Total Output dimension $size is fine."\n'
227 >        txt += '    fi\n'
228 >
229 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
230 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
231 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
232 >        txt += '    if [ $exceed -ne 1 ]; then\n'
233 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
234          txt += '    else\n'
235 <        txt += '        echo "not reporting SyncCE";\n'
236 <        txt += '    fi\n';
237 <        txt += '    echo "GridFlavour=$middleware" | tee -a $RUNTIME_AREA/$repo \n'
238 <        #txt += '    echo ">>> middleware =$middleware" \n'
196 <        txt += 'else \n'
197 <        txt += '    echo "ERROR ==> GridFlavour not identified" \n'
198 <        txt += '    job_exit_code=10030\n'
199 <        txt += '    func_exit \n'
200 <        #txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
201 <        #txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
202 <        #txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
203 <        #txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
204 <        #txt += '    exit 1 \n'
205 <        txt += 'fi \n'
206 <
207 <        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
208 <
209 <        txt += '\n\n'
210 <
211 <        txt += 'export VO='+self.VO+'\n'
212 <        txt += 'if [ $middleware == LCG ]; then\n'
213 <        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
214 <        txt += '    echo "CloseCEs = $CloseCEs"\n'
215 <        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
216 <        txt += '    echo "CE = $CE"\n'
217 <        txt += 'elif [ $middleware == OSG ]; then \n'
218 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
219 <        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
220 <        txt += '    else \n'
221 <        txt += '        echo "ERROR ==> OSG mode in setting CE name from OSG_JOB_CONTACT" \n'
222 <        txt += '        job_exit_code=10099\n'
223 <        txt += '        func_exit \n'
224 <        #txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
225 <        #txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
226 <        #txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
227 <        #txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
228 <        #txt += '        exit 1 \n'
229 <        txt += '    fi \n'
230 <        txt += 'fi \n'
235 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
236 >        txt += '    fi\n'
237 >        txt += '    python $RUNTIME_AREA/fillCrabFjr.py $RUNTIME_AREA/crab_fjr_$NJob.xml --errorcode $job_exit_code \n'
238 >        txt += '    exit $job_exit_code\n'
239  
240 +        txt += '}\n'
241          return txt
242  
243 <    def loggingInfo(self, id):
244 <        """
245 <        retrieve the logging info from logging and bookkeeping and return it
246 <        """
247 <        self.checkProxy()
248 <        cmd = 'glite-job-logging-info -v 3 ' + id
249 <        cmd_out = runCommand(cmd)
250 <        return cmd_out
251 <
252 <    def queryDetailedStatus(self, id):
253 <        """ Query a detailed status of the job with id """
254 <        cmd = 'glite-job-status '+id
255 <        cmd_out = runCommand(cmd)
256 <        return cmd_out
248 <
249 <
250 <    def tOut(self, list):
251 <        return 180
243 >    def listMatch(self, dest, full):
244 >        matching='fast'
245 >        
246 >        if self.boss().schedulerConfig['name'] == 'SchedulerGLite' :
247 >            taskId=common._db.getTask()
248 >            req=str(self.sched_parameter(1,taskId))
249 >            sites = self.boss().schedSession().matchResources(taskId, requirements=req)
250 >        else :
251 >            sites = SchedulerGrid.listMatch(self, dest, full)
252 >            
253 >        if full == True: matching='full'
254 >        common.logger.debug("list of available site ( "+str(matching) +" matching ) : "+str(sites))
255 >        
256 >        return sites

Diff Legend

(no marker) Removed lines
+ Added lines
< Changed lines (old text, Revision 1.37)
> Changed lines (new text, Revision 1.79)