ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.13 by slacapra, Wed Feb 28 14:10:33 2007 UTC vs.
Revision 1.85 by belforte, Thu Jun 14 15:50:46 2012 UTC

# Line 1 | Line 1
1 < from SchedulerEdg import SchedulerEdg
2 < from crab_logger import Logger
1 > """
2 > CRAB interface to BossLite gLite Scheduler
3 > """
4 >
5 > __revision__ = "$Id$"
6 > __version__ = "$Revision$"
7 >
8 > from SchedulerGrid import SchedulerGrid
9   from crab_exceptions import *
10   from crab_util import *
11 < from GliteConfig import *
11 > import EdgLoggingInfo
12   import common
13 + from WMCore.SiteScreening.BlackWhiteListParser import CEBlackWhiteListParser
14  
15   import os, sys, time
16  
17 < class SchedulerGlite(SchedulerEdg):
18 <    def __init__(self):
19 <        SchedulerEdg.__init__(self)
17 > class SchedulerGlite(SchedulerGrid):
18 >    def __init__(self, name="GLITE"):
19 >        SchedulerGrid.__init__(self,name)
20 >
21 >        self.EDG_retry_count        = 0
22 >        self.EDG_shallow_retry_count= -1
23 >        self.OSBsize = 55*1000*1000  # 55MB
24 >
25 >    def configure(self,cfg_params):
26 >        SchedulerGrid.configure(self, cfg_params)
27 >        self.environment_unique_identifier = '$GLITE_WMS_JOBID'
28  
29 <    def rb_configure(self, RB):
30 <        self.glite_config = ''
31 <        self.rb_param_file = ''
29 >    def realSchedParams(self,cfg_params):
30 >        """
31 >        Return dictionary with specific parameters, to use
32 >        with real scheduler
33 >        """
34 >        self.rb_param_file=''
35 >        if (not cfg_params.has_key('GRID.rb')):
36 >            cfg_params['GRID.rb']='CERN'
37 >        self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("GRID.rb"))
38 >        self.wms_service=cfg_params.get("GRID.wms_service",'')
39 >        self.skipWMSAuth=cfg_params.get("GRID.skipwmsauth",1)
40 >        params = { 'service' : self.wms_service, \
41 >                   'config' : self.rb_param_file, \
42 >                   'skipWMSAuth' : self.skipWMSAuth
43 >                 }
44 >        return  params
45  
18        gliteConfig = GliteConfig(RB)
19        self.glite_config = gliteConfig.config()
46  
47 <        if (self.glite_config != ''):
48 <            self.rb_param_file = 'WMSconfig = '+self.glite_config+';\n'
49 <            #print "rb_param_file = ", self.rb_param_file
50 <        return self.rb_param_file
47 >    def rb_configure(self, RB):
48 >        url ='http://cmsdoc.cern.ch/cms/LCG/crab/config/'
49 >        from Downloader import Downloader
50 >        import httplib
51 >        common.logger.debug('Downloading config files for WMS: '+url)
52 >        ## 25-Jun-2009 SL: patch to use Cream enabled WMS
53 >        if ( self.cfg_params.get('GRID.use_cream',None) ):
54 >            RB='CREAM'
55 >        if not RB: return None
56 >        rb_param_file = None
57 >        configFileName = 'glite_wms_'+str(RB)+'.conf'
58 >
59 >        results = Downloader(url)
60 >        try:
61 >            gliteConfig  = results.filePath(configFileName)
62 >        except httplib.HTTPException, ex:
63 >            raise CrabException( "Problem getting RB config file: %s, reason:"%(configFileName, ex) )
64 >
65 >        if (gliteConfig ):
66 >            rb_param_file = gliteConfig
67 >        return rb_param_file
68  
69 <    def sched_parameter(self):
69 >    def ce_list(self):
70          """
71 <        Returns file with requirements and scheduler-specific parameters
71 >        Returns string with requirement CE related
72          """
73 <        index = int(common.jobDB.nJobs()) - 1
74 <        job = common.job_list[index]
32 <        jbt = job.type()
33 <        
34 <        lastDest=''
35 <        first = []
36 <        last  = []
37 <        for n in range(common.jobDB.nJobs()):
38 <            currDest=common.jobDB.destination(n)
39 <            if (currDest!=lastDest):
40 <                lastDest = currDest
41 <                first.append(n)
42 <                if n != 0:last.append(n-1)
43 <        if len(first)>len(last) :last.append(common.jobDB.nJobs())
44 <  
73 >        ceParser = CEBlackWhiteListParser(self.EDG_ce_white_list,
74 >                                          self.EDG_ce_black_list, common.logger())
75          req = ''
76 <        req = req + jbt.getRequirements()
77 <  
48 <  
49 <        if self.EDG_requirements:
50 <            if (not req == ' '): req = req +  ' && '
51 <            req = req + self.EDG_requirements
52 <
76 >        ce_white_list = []
77 >        ce_black_list = []
78          if self.EDG_ce_white_list:
79 <            ce_white_list = string.split(self.EDG_ce_white_list,',')
79 >            ce_white_list = ceParser.whiteList()
80              tmpCe=[]
81              concString = '&&'
82              for ce in ce_white_list:
83                  tmpCe.append('RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId)')
84 <            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
85 <        
84 >            if len(tmpCe) == 1:
85 >                req +=  " && (" + concString.join(tmpCe) + ") "
86 >            elif len(tmpCe) > 1:
87 >                firstCE = 0
88 >                for reqTemp in tmpCe:
89 >                    if firstCE == 0:
90 >                        req += " && ( (" + reqTemp + ") "
91 >                        firstCE = 1
92 >                    elif firstCE > 0:
93 >                        req += " || (" + reqTemp + ") "
94 >                if firstCE > 0:
95 >                    req += ") "
96 >
97          if self.EDG_ce_black_list:
98 <            ce_black_list = string.split(self.EDG_ce_black_list,',')
98 >            ce_black_list = ceParser.blackList()
99              tmpCe=[]
100              concString = '&&'
101              for ce in ce_black_list:
102                  tmpCe.append('(!RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId))')
103 <            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
103 >            if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
104 >
105 >        # requirement added to skip gliteCE
106 >        # not more needed
107 > #       req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
108 >        retWL = ','.join(ce_white_list)
109 >        retBL = ','.join(ce_black_list)
110 >        if not retWL:
111 >            retWL = None
112 >        if not retBL:
113 >            retBL = None
114 >
115 >        return req, retWL, retBL
116  
117 +    def se_list(self, dest):
118 +        """
119 +        Returns string with requirement SE related
120 +        """
121 +        hostList=self.findSites_(dest)
122 +        req=''
123 +        reqtmp=[]
124 +        concString = '||'
125 +
126 +        for arg in hostList:
127 +            reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
128 +
129 +        if len(reqtmp): req += " && (" + concString.join(reqtmp) + ") "
130 +
131 +        return req
132 +
133 +    def jdlParam(self):
134 +        """
135 +        Returns
136 +        """
137 +        req=''
138 +        if self.EDG_addJdlParam:
139 +            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
140 +            for p in self.EDG_addJdlParam:
141 +                req+=string.strip(p)+';\n'
142 +        return req
143 +
144 +    def specific_req(self):
145 +        """
146 +        Returns string with specific requirements
147 +        """
148 +        req=''
149          if self.EDG_clock_time:
150              if (not req == ' '): req = req + ' && '
151              req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
# Line 73 | Line 153 | class SchedulerGlite(SchedulerEdg):
153          if self.EDG_cpu_time:
154              if (not req == ' '): req = req + ' && '
155              req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
76                
77        for i in range(len(first)): # Add loop DS
78            self.param='sched_param_'+str(i)+'.clad'
79            param_file = open(common.work_space.shareDir()+'/'+self.param, 'w')
80
81            itr4=self.findSites_(first[i])
82            reqSites=''
83            reqtmp=[]  
84            concString = '||'
85
86            #############
87            # MC Changed matching syntax to avoid gang matching
88            #############
89            for arg in itr4:
90                reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
91
92            if len(reqtmp): reqSites = reqSites + " && (" + concString.join(reqtmp) + ") "
93
94            # requirement added to skip gliteCE
95            reqSites = reqSites + '&& (!RegExp("blah", other.GlueCEUniqueId));\n'
96
97            param_file.write('Requirements = ' + req + reqSites )
98  
99            if (self.rb_param_file != ''):
100                param_file.write(self.rb_param_file)  
101
102            if len(self.EDG_addJdlParam):
103                for p in self.EDG_addJdlParam:
104                    param_file.write(p)
105
106            param_file.close()  
107
108    def wsSetupEnvironment(self):
109        """
110        Returns part of a job script which does scheduler-specific work.
111        """
112        txt = ''
113        txt += '# strip arguments\n'
114        txt += 'echo "strip arguments"\n'
115        txt += 'args=("$@")\n'
116        txt += 'nargs=$#\n'
117        txt += 'shift $nargs\n'
118        txt += "# job number (first parameter for job wrapper)\n"
119        txt += "NJob=${args[0]}\n"
120
121        txt += '# job identification to DashBoard \n'
122        txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
123        txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
124        txt += 'MonitorID=`echo ' + self._taskId + '`\n'
125        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
126        txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
127        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
128
129        txt += 'echo "middleware discovery " \n'
130        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
131        txt += '    middleware=LCG \n'
132        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
133        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
134        txt += '    echo "middleware =$middleware" \n'
135        txt += 'elif [ $GRID3_APP_DIR ]; then\n'
136        txt += '    middleware=OSG \n'
137        txt += '    echo "SyncCE=`echo $EDG_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
138        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
139        txt += '    echo "middleware =$middleware" \n'
140        txt += 'elif [ $OSG_APP ]; then \n'
141        txt += '    middleware=OSG \n'
142        txt += '    echo "SyncCE=`echo $EDG_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
143        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
144        txt += '    echo "middleware =$middleware" \n'
145        txt += 'else \n'
146        txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
147        txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
148        txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
149        txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
150        txt += '    rm -f $RUNTIME_AREA/$repo \n'
151        txt += '    echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
152        txt += '    echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
153        txt += '    exit 1 \n'
154        txt += 'fi \n'
155
156        txt += '# report first time to DashBoard \n'
157        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
158        txt += 'rm -f $RUNTIME_AREA/$repo \n'
159        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
160        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
161        
162        txt += '\n\n'
156  
157 <        if int(self.copy_data) == 1:
165 <           if self.SE:
166 <              txt += 'export SE='+self.SE+'\n'
167 <              txt += 'echo "SE = $SE"\n'
168 <           if self.SE_PATH:
169 <              if ( self.SE_PATH[-1] != '/' ) : self.SE_PATH = self.SE_PATH + '/'
170 <              txt += 'export SE_PATH='+self.SE_PATH+'\n'
171 <              txt += 'echo "SE_PATH = $SE_PATH"\n'
172 <
173 <        txt += 'export VO='+self.VO+'\n'
174 <        ### some line for LFC catalog setting
175 <        txt += 'if [ $middleware == LCG ]; then \n'
176 <        txt += '    if [[ $LCG_CATALOG_TYPE != \''+self.lcg_catalog_type+'\' ]]; then\n'
177 <        txt += '        export LCG_CATALOG_TYPE='+self.lcg_catalog_type+'\n'
178 <        txt += '    fi\n'
179 <        txt += '    if [[ $LFC_HOST != \''+self.lfc_host+'\' ]]; then\n'
180 <        txt += '        export LFC_HOST='+self.lfc_host+'\n'
181 <        txt += '    fi\n'
182 <        txt += '    if [[ $LFC_HOME != \''+self.lfc_home+'\' ]]; then\n'
183 <        txt += '        export LFC_HOME='+self.lfc_home+'\n'
184 <        txt += '    fi\n'
185 <        txt += 'elif [ $middleware == OSG ]; then\n'
186 <        txt += '    echo "LFC catalog setting to be implemented for OSG"\n'
187 <        txt += 'fi\n'
188 <        #####
189 <        if int(self.register_data) == 1:
190 <           txt += 'if [ $middleware == LCG ]; then \n'
191 <           txt += '    export LFN='+self.LFN+'\n'
192 <           txt += '    lfc-ls $LFN\n'
193 <           txt += '    result=$?\n'
194 <           txt += '    echo $result\n'
195 <           ### creation of LFN dir in LFC catalog, under /grid/cms dir  
196 <           txt += '    if [ $result != 0 ]; then\n'
197 <           txt += '       lfc-mkdir $LFN\n'
198 <           txt += '       result=$?\n'
199 <           txt += '       echo $result\n'
200 <           txt += '    fi\n'
201 <           txt += 'elif [ $middleware == OSG ]; then\n'
202 <           txt += '    echo " Files registration to be implemented for OSG"\n'
203 <           txt += 'fi\n'
204 <           txt += '\n'
205 <
206 <           if self.VO:
207 <              txt += 'export VO='+self.VO+'\n'
208 <           if self.LFN:
209 <              txt += 'if [ $middleware == LCG ]; then \n'
210 <              txt += '    export LFN='+self.LFN+'\n'
211 <              txt += 'fi\n'
212 <              txt += '\n'
213 <
214 <        txt += 'if [ $middleware == LCG ]; then\n'
215 <        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
216 <        txt += '    echo "CloseCEs = $CloseCEs"\n'
217 <        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
218 <        txt += '    echo "CE = $CE"\n'
219 <        txt += 'elif [ $middleware == OSG ]; then \n'
220 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
221 <        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
222 <        txt += '    else \n'
223 <        txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
224 <        txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
225 <        txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
226 <        txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
227 <        txt += '        rm -f $RUNTIME_AREA/$repo \n'
228 <        txt += '        echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
229 <        txt += '        echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
230 <        txt += '        exit 1 \n'
231 <        txt += '    fi \n'
232 <        txt += 'fi \n'
157 >        return req
158  
159 <        return txt
235 <        
236 <    def loggingInfo(self, id):
159 >    def sched_parameter(self,i,task):
160          """
161 <        retrieve the logging info from logging and bookkeeping and return it
161 >        Returns string with requirements and scheduler-specific parameters
162          """
163 <        self.checkProxy()
241 <        cmd = 'glite-job-logging-info -v 3 ' + id
242 <        cmd_out = runCommand(cmd)
243 <        return cmd_out
244 <
245 <    def queryDetailedStatus(self, id):
246 <        """ Query a detailed status of the job with id """
247 <        cmd = 'glite-job-status '+id
248 <        cmd_out = runCommand(cmd)
249 <        return cmd_out
163 >        dest=  task.jobs[i-1]['dlsDestination']
164  
165 <    def findSites_(self, n):
166 <        sites = common.jobDB.destination(n)
165 >        req=''
166 >        #req +=task['jobType']
167 >        ####### FEDE FOR BUG 73010 ############
168 >        try:
169 >            #print "task['jobType'] = ", task['jobType']
170 >            req +=task['jobType']
171 >        except TypeError:
172 >            msg = "Error: wrong or missing task info. Your created task can not be submitted. Please check your configuration file and create the task again.  \n "
173 >            raise CrabException(msg)
174 >        #######################################
175 >
176 >        sched_param=''
177 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(dest) +\
178 >                                        self.ce_list()[0] +';\n'
179 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam()
180 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
181 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
182 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
183 >        sched_param+='DefaultNodeRetryCount = '+str(self.EDG_retry_count)+';\n'
184 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
185 >        sched_param+='DefaultNodeShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
186 >
187 >        return sched_param
188 >
189 >    def decodeLogInfo(self, file):
190 >        """
191 >        Parse logging info file and return main info
192 >        """
193 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
194 >        reason = loggingInfo.decodeReason(file)
195 >        return reason
196 >
197 >    def findSites_(self, sites):
198 >        itr4 =[]
199          if len(sites)>0 and sites[0]=="":
200 <            return []
200 >            return itr4
201 >        if sites != [""]:
202 >            replicas = self.blackWhiteListParser.checkBlackList(sites)
203 >            if len(replicas)!=0:
204 >                replicas = self.blackWhiteListParser.checkWhiteList(replicas)
205 >
206 >            itr4 = replicas
207 >        return itr4
208 >
209 >    def delegateProxy(self):
210 >        self.boss().delegateProxy()  
211 >        return
212 >
213 >    def wsExitFunc(self):
214 >        """
215 >        """
216 >        txt = '\n'
217 >
218 >        txt += '#\n'
219 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
220 >        txt += '#\n\n'
221 >
222 >        txt += 'func_exit() { \n'
223 >        txt += self.wsExitFunc_common()
224 >        ### specific Glite check for OSB
225 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
226 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
227 >        txt += '    rm ${out_files}.tgz\n'
228 >        txt += '    size=`expr $tmp_size`\n'
229 >        txt += '    echo "Total Output dimension: $size"\n'
230 >        txt += '    limit='+str(self.OSBsize) +' \n'
231 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
232 >        txt += '    if [ "$limit" -lt "$size" ]; then\n'
233 >        txt += '        exceed=1\n'
234 >        txt += '        job_exit_code=70000\n'
235 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
236 >        txt += '    else\n'
237 >        txt += '        exceed=0\n'
238 >        txt += '        echo "Total Output dimension $size is fine."\n'
239 >        txt += '    fi\n'
240 >
241 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
242 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
243 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
244 >        txt += '    if [ $exceed -ne 1 ]; then\n'
245 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
246 >        txt += '    else\n'
247 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
248 >        txt += '    fi\n'
249 >        txt += '    python $RUNTIME_AREA/fillCrabFjr.py $RUNTIME_AREA/crab_fjr_$NJob.xml --errorcode $job_exit_code \n'
250 >        txt += '    exit $job_exit_code\n'
251 >
252 >        txt += '}\n'
253 >        return txt
254 >
255 >    def listMatch(self, dest, full):
256 >        matching='fast'
257 >        
258 >        if self.boss().schedulerConfig['name'] == 'SchedulerGLite' :
259 >            taskId=common._db.getTask()
260 >            req=str(self.sched_parameter(1,taskId))
261 >            sites = self.boss().schedSession().matchResources(taskId, requirements=req)
262 >        else :
263 >            sites = SchedulerGrid.listMatch(self, dest, full)
264 >            
265 >        if full == True: matching='full'
266 >        common.logger.debug("list of available site ( "+str(matching) +" matching ) : "+str(sites))
267 >        
268          return sites

Diff Legend

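Removed lines — present only in revision 1.13; they carry no marker character in this text rendering (unchanged context lines are unmarked too)
+ Added lines — present only in revision 1.85
< Changed lines — the text as it was in revision 1.13
> Changed lines — the text as it is in revision 1.85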