ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.35 by fanzago, Mon Mar 3 16:41:24 2008 UTC vs.
Revision 1.64 by spiga, Sat Nov 8 11:57:03 2008 UTC

# Line 1 | Line 1
1 + """
2 + CRAB interface to BossLite gLite Scheduler
3 + """
4 +
5 + __revision__ = "$Id$"
6 + __version__ = "$Revision$"
7 +
8   from SchedulerGrid import SchedulerGrid
9   from crab_logger import Logger
10   from crab_exceptions import *
11   from crab_util import *
12   from GliteConfig import *
13 + import EdgLoggingInfo
14   import common
15  
16   import os, sys, time
# Line 11 | Line 19 | class SchedulerGlite(SchedulerGrid):
19      def __init__(self, name="GLITE"):
20          SchedulerGrid.__init__(self,name)
21  
22 +        self.OSBsize = 55000000
23 +
24      def configure(self,cfg_params):
25          SchedulerGrid.configure(self, cfg_params)
26 <        self.environment_unique_identifier = 'GLITE_WMS_JOBID'
26 >        self.environment_unique_identifier = '$GLITE_WMS_JOBID'
27 >
28 >    def realSchedParams(self,cfg_params):
29 >        """
30 >        Return dictionary with specific parameters, to use
31 >        with real scheduler
32 >        """
33 >        self.rb_param_file=''
34 >        if (not cfg_params.has_key('EDG.rb')):
35 >            cfg_params['EDG.rb']='CERN'
36 >        self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("EDG.rb"))
37 >        self.wms_service=cfg_params.get("EDG.wms_service",'')
38 >        self.skipWMSAuth=cfg_params.get("EDG.skipwmsauth",1)
39 >        params = { 'service' : self.wms_service, \
40 >                   'config' : self.rb_param_file, \
41 >                   'skipWMSAuth' : self.skipWMSAuth
42 >                 }
43 >        return  params
44 >
45  
46      def rb_configure(self, RB):
47          if not RB: return None
# Line 24 | Line 52 | class SchedulerGlite(SchedulerGrid):
52          glite_config = gliteConfig.config()
53  
54          if (glite_config ):
55 <            rb_param_file = 'WMSconfig = '+glite_config+';\n'
55 >            rb_param_file = glite_config
56          return rb_param_file
57  
58 <    def sched_parameter(self):
58 >    def ce_list(self):
59          """
60 <        Returns file with requirements and scheduler-specific parameters
60 >        Returns string with requirement CE related
61          """
34        index = int(common.jobDB.nJobs()) - 1
35        job = common.job_list[index]
36        jbt = job.type()
37
38        lastDest=''
39        first = []
40        last  = []
41        for n in range(common.jobDB.nJobs()):
42            currDest=common.jobDB.destination(n)
43            if (currDest!=lastDest):
44                lastDest = currDest
45                first.append(n)
46                if n != 0:last.append(n-1)
47        if len(first)>len(last) :last.append(common.jobDB.nJobs())
48
62          req = ''
50        req = req + jbt.getRequirements()
51
52
53        if self.EDG_requirements:
54            if (not req == ' '): req = req +  ' && '
55            req = req + self.EDG_requirements
56
63          if self.EDG_ce_white_list:
64              ce_white_list = self.EDG_ce_white_list
65              tmpCe=[]
66              concString = '&&'
67              for ce in ce_white_list:
68                  tmpCe.append('RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId)')
63            ### MATTY' FIX: if more then one CE: && -> ||
64            #print "list CE: " + str(tmpCe)
69              if len(tmpCe) == 1:
70                  req +=  " && (" + concString.join(tmpCe) + ") "
71              elif len(tmpCe) > 1:
72                  firstCE = 0
73                  for reqTemp in tmpCe:
70                    #print reqTemp
74                      if firstCE == 0:
72                        #print "adding: "+str(" && ( (" + reqTemp + ") ")
75                          req += " && ( (" + reqTemp + ") "
76                          firstCE = 1
77                      elif firstCE > 0:
76                        #print "adding: "+str(" || (" + reqTemp + ") ")
78                          req += " || (" + reqTemp + ") "
79                  if firstCE > 0:
80                      req += ") "
80            ## old code
81 #            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
81  
82          if self.EDG_ce_black_list:
83              ce_black_list = self.EDG_ce_black_list
# Line 86 | Line 85 | class SchedulerGlite(SchedulerGrid):
85              concString = '&&'
86              for ce in ce_black_list:
87                  tmpCe.append('(!RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId))')
88 <            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
88 >            if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
89 >
90 >        # requirement added to skip gliteCE
91 >        req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
92 >
93 >        return req,self.EDG_ce_white_list,self.EDG_ce_black_list
94 >
95 >    def se_list(self, dest):
96 >        """
97 >        Returns string with requirement SE related
98 >        """
99 >        hostList=self.findSites_(dest)
100 >        req=''
101 >        reqtmp=[]
102 >        concString = '||'
103 >
104 >        for arg in hostList:
105 >            reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
106 >
107 >        if len(reqtmp): req += " && (" + concString.join(reqtmp) + ") "
108  
109 +        return req
110 +
111 +    def jdlParam(self):
112 +        """
113 +        Returns
114 +        """
115 +        req=''
116 +        if self.EDG_addJdlParam:
117 +            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
118 +            for p in self.EDG_addJdlParam:
119 +                req+=string.strip(p)+';\n'
120 +        return req
121 +
122 +    def specific_req(self):
123 +        """
124 +        Returns string with specific requirements
125 +        """
126 +        req=''
127          if self.EDG_clock_time:
128              if (not req == ' '): req = req + ' && '
129              req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
# Line 96 | Line 132 | class SchedulerGlite(SchedulerGrid):
132              if (not req == ' '): req = req + ' && '
133              req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
134  
135 <        for i in range(len(first)): # Add loop DS
100 <            self.param='sched_param_'+str(i)+'.clad'
101 <            param_file = open(common.work_space.shareDir()+'/'+self.param, 'w')
102 <
103 <            itr4=self.findSites_(first[i])
104 <            reqSites=''
105 <            reqtmp=[]
106 <            concString = '||'
107 <
108 <            #############
109 <            # MC Changed matching syntax to avoid gang matching
110 <            #############
111 <            for arg in itr4:
112 <                reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
113 <
114 <            if len(reqtmp): reqSites = reqSites + " && (" + concString.join(reqtmp) + ") "
115 <
116 <            # requirement added to skip gliteCE
117 <            reqSites = reqSites + '&& (!RegExp("blah", other.GlueCEUniqueId));\n'
118 <
119 <            param_file.write('Requirements = ' + req + reqSites )
120 <
121 <            if (self.rb_param_file):
122 <                param_file.write(self.rb_param_file)
123 <
124 <            if self.EDG_addJdlParam:
125 <                if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
126 <                for p in self.EDG_addJdlParam:
127 <                    param_file.write(string.strip(p)+';\n')
128 <
129 <            param_file.close()
130 <
131 <    def wsSetupEnvironment(self):
132 <        """
133 <        Returns part of a job script which does scheduler-specific work.
134 <        """
135 <        txt = ''
136 <        txt += '# strip arguments\n'
137 <        txt += 'echo "strip arguments"\n'
138 <        txt += 'args=("$@")\n'
139 <        txt += 'nargs=$#\n'
140 <        txt += 'shift $nargs\n'
141 <        txt += "# job number (first parameter for job wrapper)\n"
142 <        txt += "NJob=${args[0]}; export NJob\n"
143 <
144 <        txt += '# job identification to DashBoard \n'
145 <        #txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
146 <        #txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
147 <        #txt += 'MonitorID=`echo ' + self._taskId + '`\n'
148 <        txt += 'MonitorJobID=${NJob}_$GLITE_WMS_JOBID \n'
149 <        txt += 'SyncGridJobId=$GLITE_WMS_JOBID \n'
150 <        txt += 'MonitorID='+self._taskId+' \n'
151 <        txt += 'echo "MonitorJobID=$MonitorJobID" > $RUNTIME_AREA/$repo \n'
152 <        txt += 'echo "SyncGridJobId=$SyncGridJobId" >> $RUNTIME_AREA/$repo \n'
153 <        txt += 'echo "MonitorID=$MonitorID" >> $RUNTIME_AREA/$repo\n'
154 <        #txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
155 <        #txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
156 <        #txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
157 <
158 <        #txt += 'echo "middleware discovery: " \n'
159 <        txt += 'echo ">>> GridFlavour discovery: " \n'
160 <        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
161 <        txt += '    middleware=LCG\n'
162 <        #txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
163 <        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" >> $RUNTIME_AREA/$repo \n'
164 <        #txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
165 <        txt += '    echo "GridFlavour=$middleware" | tee -a $RUNTIME_AREA/$repo \n'
166 <        #txt += '    echo ">>> middleware =$middleware" \n'
167 <        txt += 'elif [ $OSG_APP ]; then \n'
168 <        txt += '    middleware=OSG \n'
169 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
170 <        txt += '        SyncCE="$OSG_JOB_CONTACT"; \n'
171 <        #txt += '        echo "SyncCE=$SyncCE" | tee -a $RUNTIME_AREA/$repo ;\n'
172 <        txt += '        echo "SyncCE=$SyncCE" >> $RUNTIME_AREA/$repo ;\n'
173 <        txt += '    else\n'
174 <        txt += '        echo "not reporting SyncCE";\n'
175 <        txt += '    fi\n';
176 <        txt += '    echo "GridFlavour=$middleware" | tee -a $RUNTIME_AREA/$repo \n'
177 <        #txt += '    echo ">>> middleware =$middleware" \n'
178 <        txt += 'else \n'
179 <        txt += '    echo "ERROR ==> GridFlavour not identified" \n'
180 <        txt += '    job_exit_code=10030\n'
181 <        txt += '    func_exit \n'
182 <        #txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
183 <        #txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
184 <        #txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
185 <        #txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
186 <        #txt += '    exit 1 \n'
187 <        txt += 'fi \n'
188 <
189 <        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
190 <
191 <        txt += '\n\n'
192 <
193 <        txt += 'export VO='+self.VO+'\n'
194 <        txt += 'if [ $middleware == LCG ]; then\n'
195 <        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
196 <        txt += '    echo "CloseCEs = $CloseCEs"\n'
197 <        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
198 <        txt += '    echo "CE = $CE"\n'
199 <        txt += 'elif [ $middleware == OSG ]; then \n'
200 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
201 <        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
202 <        txt += '    else \n'
203 <        txt += '        echo "ERROR ==> OSG mode in setting CE name from OSG_JOB_CONTACT" \n'
204 <        txt += '        job_exit_code=10099\n'
205 <        txt += '        func_exit \n'
206 <        #txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
207 <        #txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
208 <        #txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
209 <        #txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
210 <        #txt += '        exit 1 \n'
211 <        txt += '    fi \n'
212 <        txt += 'fi \n'
135 >        return req
136  
137 <        return txt
137 >    def sched_parameter(self,i,task):
138 >        """
139 >        Returns string with requirements and scheduler-specific parameters
140 >        """
141 >        dest=  task.jobs[i-1]['dlsDestination']
142 >
143 >        req=''
144 >        req +=task['jobType']
145 >
146 >        sched_param=''
147 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(dest) +\
148 >                                        self.ce_list()[0] +';\n'
149 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam()
150 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
151 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
152 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
153 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
154  
155 <    def loggingInfo(self, id):
155 >        return sched_param
156 >
157 >    def decodeLogInfo(self, file):
158          """
159 <        retrieve the logging info from logging and bookkeeping and return it
159 >        Parse logging info file and return main info
160          """
161 <        self.checkProxy()
162 <        cmd = 'glite-job-logging-info -v 3 ' + id
163 <        cmd_out = runCommand(cmd)
223 <        return cmd_out
224 <
225 <    def queryDetailedStatus(self, id):
226 <        """ Query a detailed status of the job with id """
227 <        cmd = 'glite-job-status '+id
228 <        cmd_out = runCommand(cmd)
229 <        return cmd_out
161 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
162 >        reason = loggingInfo.decodeReason(file)
163 >        return reason
164  
165 <    def findSites_(self, n):
165 >    def findSites_(self, sites):
166          itr4 =[]
233        sites = common.jobDB.destination(n)
167          if len(sites)>0 and sites[0]=="":
168              return itr4
169          if sites != [""]:
170 <            ##Addedd Daniele
238 <            replicas = self.blackWhiteListParser.checkBlackList(sites,n)
170 >            replicas = self.blackWhiteListParser.checkBlackList(sites)
171              if len(replicas)!=0:
172 <                replicas = self.blackWhiteListParser.checkWhiteList(replicas,n)
172 >                replicas = self.blackWhiteListParser.checkWhiteList(replicas)
173  
174              itr4 = replicas
243            #####
175          return itr4
176  
177 <    def tOut(self, list):
178 <        return 180
177 >
178 >    def wsExitFunc(self):
179 >        """
180 >        """
181 >        txt = '\n'
182 >
183 >        txt += '#\n'
184 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
185 >        txt += '#\n\n'
186 >
187 >        txt += 'func_exit() { \n'
188 >        txt += self.wsExitFunc_common()
189 >        ### specific Glite check for OSB
190 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
191 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
192 >        txt += '    rm ${out_files}.tgz\n'
193 >        txt += '    size=`expr $tmp_size`\n'
194 >        txt += '    echo "Total Output dimension: $size"\n'
195 >        txt += '    limit='+str(self.OSBsize) +' \n'
196 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
197 >        txt += '    if [ "$limit" -lt "$size" ]; then\n'
198 >        txt += '        exceed=1\n'
199 >        txt += '        job_exit_code=70000\n'
200 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
201 >        txt += '    else\n'
202 >        txt += '        exceed=0\n'
203 >        txt += '        echo "Total Output dimension $size is fine."\n'
204 >        txt += '    fi\n'
205 >
206 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
207 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
208 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
209 >        txt += '    if [ $exceed -ne 1 ]; then\n'
210 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
211 >        txt += '    else\n'
212 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
213 >        txt += '    fi\n'
214 >        txt += '    exit $job_exit_code\n'
215 >
216 >        txt += '}\n'
217 >        return txt

Diff Legend

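(no marker, old-revision line number) Removed lines
+ Added lines
< Changed lines (text as in the old revision, 1.35)
> Changed lines (text as in the new revision, 1.64)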