ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.21 by fanzago, Fri Oct 5 12:55:05 2007 UTC vs.
Revision 1.73 by spiga, Thu Jan 14 10:24:17 2010 UTC

# Line 1 | Line 1
1 < from SchedulerEdg import SchedulerEdg
2 < from crab_logger import Logger
1 > """
2 > CRAB interface to BossLite gLite Scheduler
3 > """
4 >
5 > __revision__ = "$Id$"
6 > __version__ = "$Revision$"
7 >
8 > from SchedulerGrid import SchedulerGrid
9   from crab_exceptions import *
10   from crab_util import *
11   from GliteConfig import *
12 + import EdgLoggingInfo
13   import common
14 + from WMCore.SiteScreening.BlackWhiteListParser import CEBlackWhiteListParser
15  
16   import os, sys, time
17  
18 < class SchedulerGlite(SchedulerEdg):
19 <    def __init__(self):
20 <        SchedulerEdg.__init__(self)
18 > class SchedulerGlite(SchedulerGrid):
19 >    def __init__(self, name="GLITE"):
20 >        SchedulerGrid.__init__(self,name)
21 >
22 >        self.OSBsize = 55000000
23 >
24 >    def configure(self,cfg_params):
25 >        SchedulerGrid.configure(self, cfg_params)
26 >        self.environment_unique_identifier = '$GLITE_WMS_JOBID'
27 >
28 >    def realSchedParams(self,cfg_params):
29 >        """
30 >        Return dictionary with specific parameters, to use
31 >        with real scheduler
32 >        """
33 >        self.rb_param_file=''
34 >        if (not cfg_params.has_key('GRID.rb')):
35 >            cfg_params['GRID.rb']='CERN'
36 >        self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("GRID.rb"))
37 >        self.wms_service=cfg_params.get("GRID.wms_service",'')
38 >        self.skipWMSAuth=cfg_params.get("GRID.skipwmsauth",1)
39 >        params = { 'service' : self.wms_service, \
40 >                   'config' : self.rb_param_file, \
41 >                   'skipWMSAuth' : self.skipWMSAuth
42 >                 }
43 >        return  params
44 >
45  
46      def rb_configure(self, RB):
47 <        self.glite_config = ''
48 <        self.rb_param_file = ''
47 >        ## 25-Jun-2009 SL: patch to use Cream enabled WMS
48 >        if ( self.cfg_params.get('GRID.use_cream',None) ):
49 >            RB='CREAM'
50 >        if not RB: return None
51 >        glite_config = None
52 >        rb_param_file = None
53  
54          gliteConfig = GliteConfig(RB)
55 <        self.glite_config = gliteConfig.config()
55 >        glite_config = gliteConfig.config()
56  
57 <        if (self.glite_config != ''):
58 <            self.rb_param_file = 'WMSconfig = '+self.glite_config+';\n'
59 <            #print "rb_param_file = ", self.rb_param_file
24 <        return self.rb_param_file
25 <
26 <    def sched_parameter(self):
27 <        """
28 <        Returns file with requirements and scheduler-specific parameters
29 <        """
30 <        index = int(common.jobDB.nJobs()) - 1
31 <        job = common.job_list[index]
32 <        jbt = job.type()
33 <        
34 <        lastDest=''
35 <        first = []
36 <        last  = []
37 <        for n in range(common.jobDB.nJobs()):
38 <            currDest=common.jobDB.destination(n)
39 <            if (currDest!=lastDest):
40 <                lastDest = currDest
41 <                first.append(n)
42 <                if n != 0:last.append(n-1)
43 <        if len(first)>len(last) :last.append(common.jobDB.nJobs())
44 <  
45 <        req = ''
46 <        req = req + jbt.getRequirements()
47 <  
48 <  
49 <        if self.EDG_requirements:
50 <            if (not req == ' '): req = req +  ' && '
51 <            req = req + self.EDG_requirements
57 >        if (glite_config ):
58 >            rb_param_file = glite_config
59 >        return rb_param_file
60  
61 +    def ce_list(self):
62 +        """
63 +        Returns string with requirement CE related
64 +        """
65 +        ceParser = CEBlackWhiteListParser(self.EDG_ce_white_list,
66 +                                          self.EDG_ce_black_list, common.logger())
67 +        req = ''
68 +        ce_white_list = []
69 +        ce_black_list = []
70          if self.EDG_ce_white_list:
71 <            ce_white_list = string.split(self.EDG_ce_white_list,',')
71 >            ce_white_list = ceParser.whiteList()
72              tmpCe=[]
73              concString = '&&'
74              for ce in ce_white_list:
75                  tmpCe.append('RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId)')
59            ### MATTY' FIX: if more then one CE: && -> ||
60            #print "list CE: " + str(tmpCe)
76              if len(tmpCe) == 1:
77                  req +=  " && (" + concString.join(tmpCe) + ") "
78              elif len(tmpCe) > 1:
79                  firstCE = 0
80                  for reqTemp in tmpCe:
66                    #print reqTemp
81                      if firstCE == 0:
68                        #print "adding: "+str(" && ( (" + reqTemp + ") ")
82                          req += " && ( (" + reqTemp + ") "
83                          firstCE = 1
84                      elif firstCE > 0:
72                        #print "adding: "+str(" || (" + reqTemp + ") ")
85                          req += " || (" + reqTemp + ") "
86                  if firstCE > 0:
87                      req += ") "
88 <            ## old code
77 < #            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
78 <        
88 >
89          if self.EDG_ce_black_list:
90 <            ce_black_list = string.split(self.EDG_ce_black_list,',')
90 >            ce_black_list = ceParser.blackList()
91              tmpCe=[]
92              concString = '&&'
93              for ce in ce_black_list:
94                  tmpCe.append('(!RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId))')
95 <            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
95 >            if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
96 >
97 >        # requirement added to skip gliteCE
98 >        # no longer needed
99 > #       req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
100 >        retWL = ','.join(ce_white_list)
101 >        retBL = ','.join(ce_black_list)
102 >        if not retWL:
103 >            retWL = None
104 >        if not retBL:
105 >            retBL = None
106  
107 +        return req, retWL, retBL
108 +
109 +    def se_list(self, dest):
110 +        """
111 +        Returns the SE-related requirement string built from the sites found for dest
112 +        """
113 +        hostList=self.findSites_(dest)
114 +        req=''
115 +        reqtmp=[]
116 +        concString = '||'
117 +
118 +        for arg in hostList:
119 +            reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
120 +
121 +        if len(reqtmp): req += " && (" + concString.join(reqtmp) + ") "
122 +
123 +        return req
124 +
125 +    def jdlParam(self):
126 +        """
127 +        Returns the additional JDL parameters, one per line, each terminated by ';'
128 +        """
129 +        req=''
130 +        if self.EDG_addJdlParam:
131 +            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
132 +            for p in self.EDG_addJdlParam:
133 +                req+=string.strip(p)+';\n'
134 +        return req
135 +
136 +    def specific_req(self):
137 +        """
138 +        Returns string with specific requirements
139 +        """
140 +        req=''
141          if self.EDG_clock_time:
142              if (not req == ' '): req = req + ' && '
143              req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
# Line 91 | Line 145 | class SchedulerGlite(SchedulerEdg):
145          if self.EDG_cpu_time:
146              if (not req == ' '): req = req + ' && '
147              req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
94                
95        for i in range(len(first)): # Add loop DS
96            self.param='sched_param_'+str(i)+'.clad'
97            param_file = open(common.work_space.shareDir()+'/'+self.param, 'w')
98
99            itr4=self.findSites_(first[i])
100            reqSites=''
101            reqtmp=[]  
102            concString = '||'
103
104            #############
105            # MC Changed matching syntax to avoid gang matching
106            #############
107            for arg in itr4:
108                reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
109
110            if len(reqtmp): reqSites = reqSites + " && (" + concString.join(reqtmp) + ") "
111
112            # requirement added to skip gliteCE
113            reqSites = reqSites + '&& (!RegExp("blah", other.GlueCEUniqueId));\n'
114
115            param_file.write('Requirements = ' + req + reqSites )
116  
117            if (self.rb_param_file != ''):
118                param_file.write(self.rb_param_file)  
119
120            if len(self.EDG_addJdlParam):
121                for p in self.EDG_addJdlParam:
122                    param_file.write(p)
123
124            param_file.close()  
125
126    def wsSetupEnvironment(self):
127        """
128        Returns part of a job script which does scheduler-specific work.
129        """
130        txt = ''
131        txt += '# strip arguments\n'
132        txt += 'echo "strip arguments"\n'
133        txt += 'args=("$@")\n'
134        txt += 'nargs=$#\n'
135        txt += 'shift $nargs\n'
136        txt += "# job number (first parameter for job wrapper)\n"
137        txt += "NJob=${args[0]}\n"
138
139        txt += '# job identification to DashBoard \n'
140        txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
141        txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
142        txt += 'MonitorID=`echo ' + self._taskId + '`\n'
143        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
144        txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
145        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
146
147        txt += 'echo "middleware discovery " \n'
148        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
149        txt += '    middleware=LCG \n'
150        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
151        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
152        txt += '    echo "middleware =$middleware" \n'
153        txt += 'elif [ $GRID3_APP_DIR ]; then\n'
154        txt += '    middleware=OSG \n'
155        txt += '    echo "SyncCE=`echo $GLITE_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
156        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
157        txt += '    echo "middleware =$middleware" \n'
158        txt += 'elif [ $OSG_APP ]; then \n'
159        txt += '    middleware=OSG \n'
160        txt += '    echo "SyncCE=`echo $GLITE_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
161        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
162        txt += '    echo "middleware =$middleware" \n'
163        txt += 'else \n'
164        txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
165        txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
166        txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
167        txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
168        txt += '    rm -f $RUNTIME_AREA/$repo \n'
169        txt += '    echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
170        txt += '    echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
171        txt += '    exit 1 \n'
172        txt += 'fi \n'
173
174        txt += '# report first time to DashBoard \n'
175        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
176        txt += 'rm -f $RUNTIME_AREA/$repo \n'
177        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
178        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
179        
180        txt += '\n\n'
181
182        #if int(self.copy_data) == 1:
183        #   if self.SE:
184        #      txt += 'export SE='+self.SE+'\n'
185        #      txt += 'echo "SE = $SE"\n'
186        #   if self.SE_PATH:
187        #      if ( self.SE_PATH[-1] != '/' ) : self.SE_PATH = self.SE_PATH + '/'
188        #      txt += 'export SE_PATH='+self.SE_PATH+'\n'
189        #      txt += 'echo "SE_PATH = $SE_PATH"\n'
190
191        txt += 'export VO='+self.VO+'\n'
192        ### some line for LFC catalog setting
193        #txt += 'if [ $middleware == LCG ]; then \n'
194        #txt += '    if [[ $LCG_CATALOG_TYPE != \''+self.lcg_catalog_type+'\' ]]; then\n'
195        #txt += '        export LCG_CATALOG_TYPE='+self.lcg_catalog_type+'\n'
196        #txt += '    fi\n'
197        #txt += '    if [[ $LFC_HOST != \''+self.lfc_host+'\' ]]; then\n'
198        #txt += '        export LFC_HOST='+self.lfc_host+'\n'
199        #txt += '    fi\n'
200        #txt += '    if [[ $LFC_HOME != \''+self.lfc_home+'\' ]]; then\n'
201        #txt += '        export LFC_HOME='+self.lfc_home+'\n'
202        #txt += '    fi\n'
203        #txt += 'elif [ $middleware == OSG ]; then\n'
204        #txt += '    echo "LFC catalog setting to be implemented for OSG"\n'
205        #txt += 'fi\n'
206        #####
207        #if int(self.register_data) == 1:
208        #   txt += 'if [ $middleware == LCG ]; then \n'
209        #   txt += '    export LFN='+self.LFN+'\n'
210        #   txt += '    lfc-ls $LFN\n'
211        #   txt += '    result=$?\n'
212        #   txt += '    echo $result\n'
213        #   ### creation of LFN dir in LFC catalog, under /grid/cms dir  
214        #   txt += '    if [ $result != 0 ]; then\n'
215        #   txt += '       lfc-mkdir $LFN\n'
216        #   txt += '       result=$?\n'
217        #   txt += '       echo $result\n'
218        #   txt += '    fi\n'
219        #   txt += 'elif [ $middleware == OSG ]; then\n'
220        #   txt += '    echo " Files registration to be implemented for OSG"\n'
221        #   txt += 'fi\n'
222        #   txt += '\n'
223        #   if self.VO:
224        #      txt += 'export VO='+self.VO+'\n'
225        #   if self.LFN:
226        #      txt += 'if [ $middleware == LCG ]; then \n'
227        #      txt += '    export LFN='+self.LFN+'\n'
228        #      txt += 'fi\n'
229        #      txt += '\n'
230
231        txt += 'if [ $middleware == LCG ]; then\n'
232        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
233        txt += '    echo "CloseCEs = $CloseCEs"\n'
234        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
235        txt += '    echo "CE = $CE"\n'
236        txt += 'elif [ $middleware == OSG ]; then \n'
237        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
238        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
239        txt += '    else \n'
240        txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
241        txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
242        txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
243        txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
244        txt += '        rm -f $RUNTIME_AREA/$repo \n'
245        txt += '        echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
246        txt += '        echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
247        txt += '        exit 1 \n'
248        txt += '    fi \n'
249        txt += 'fi \n'
148  
149 <        return txt
150 <        
151 <    def loggingInfo(self, id):
149 >        return req
150 >
151 >    def sched_parameter(self,i,task):
152 >        """
153 >        Returns string with requirements and scheduler-specific parameters
154 >        """
155 >        dest=  task.jobs[i-1]['dlsDestination']
156 >
157 >        req=''
158 >        req +=task['jobType']
159 >
160 >        sched_param=''
161 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(dest) +\
162 >                                        self.ce_list()[0] +';\n'
163 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam()
164 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
165 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
166 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
167 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
168 >
169 >        return sched_param
170 >
171 >    def decodeLogInfo(self, file):
172          """
173 <        retrieve the logging info from logging and bookkeeping and return it
173 >        Parse logging info file and return main info
174          """
175 <        self.checkProxy()
176 <        cmd = 'glite-job-logging-info -v 3 ' + id
177 <        cmd_out = runCommand(cmd)
178 <        return cmd_out
179 <
180 <    def queryDetailedStatus(self, id):
263 <        """ Query a detailed status of the job with id """
264 <        cmd = 'glite-job-status '+id
265 <        cmd_out = runCommand(cmd)
266 <        return cmd_out
267 <
268 <    def findSites_(self, n):
269 <        itr4 = []
270 <        sites = common.jobDB.destination(n)
175 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
176 >        reason = loggingInfo.decodeReason(file)
177 >        return reason
178 >
179 >    def findSites_(self, sites):
180 >        itr4 =[]
181          if len(sites)>0 and sites[0]=="":
182              return itr4
183 <        if sites != [""]:
184 <            ##Addedd Daniele
275 <            replicas = self.blackWhiteListParser.checkBlackList(sites,n)
183 >        if sites != [""]:
184 >            replicas = self.blackWhiteListParser.checkBlackList(sites)
185              if len(replicas)!=0:
186 <                replicas = self.blackWhiteListParser.checkWhiteList(replicas,n)
187 <              
188 <            if len(replicas)==0:
280 <                msg = 'No sites remaining that host any part of the requested data! Exiting... '
281 <                raise CrabException(msg)
282 <            itr4 = replicas
283 <            #####        
186 >                replicas = self.blackWhiteListParser.checkWhiteList(replicas)
187 >
188 >            itr4 = replicas
189          return itr4
190  
191 <    def submitTout(self, list):
192 <        return 180
191 >    def delegateProxy(self):
192 >        self.boss().delegateProxy()  
193 >        return
194 >
195 >    def wsExitFunc(self):
196 >        """Returns the shell text defining func_exit(), to be executed before the job exits
197 >        """
198 >        txt = '\n'
199 >
200 >        txt += '#\n'
201 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
202 >        txt += '#\n\n'
203 >
204 >        txt += 'func_exit() { \n'
205 >        txt += self.wsExitFunc_common()
206 >        ### specific Glite check for OSB
207 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
208 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
209 >        txt += '    rm ${out_files}.tgz\n'
210 >        txt += '    size=`expr $tmp_size`\n'
211 >        txt += '    echo "Total Output dimension: $size"\n'
212 >        txt += '    limit='+str(self.OSBsize) +' \n'
213 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
214 >        txt += '    if [ "$limit" -lt "$size" ]; then\n'
215 >        txt += '        exceed=1\n'
216 >        txt += '        job_exit_code=70000\n'
217 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
218 >        txt += '    else\n'
219 >        txt += '        exceed=0\n'
220 >        txt += '        echo "Total Output dimension $size is fine."\n'
221 >        txt += '    fi\n'
222 >
223 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
224 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
225 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
226 >        txt += '    if [ $exceed -ne 1 ]; then\n'
227 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
228 >        txt += '    else\n'
229 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
230 >        txt += '    fi\n'
231 >        txt += '    python $RUNTIME_AREA/fillCrabFjr.py $RUNTIME_AREA/crab_fjr_$NJob.xml --errorcode $job_exit_code \n'
232 >        txt += '    exit $job_exit_code\n'
233 >
234 >        txt += '}\n'
235 >        return txt

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines