ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.4 by fanzago, Wed Oct 11 15:45:53 2006 UTC vs.
Revision 1.65 by ewv, Mon Dec 8 17:53:32 2008 UTC

# Line 1 | Line 1
1 < #from Scheduler import Scheduler
2 < from SchedulerEdg import SchedulerEdg
1 > """
2 > CRAB interface to BossLite gLite Scheduler
3 > """
4 >
5 > __revision__ = "$Id$"
6 > __version__ = "$Revision$"
7 >
8 > from SchedulerGrid import SchedulerGrid
9   from crab_logger import Logger
10   from crab_exceptions import *
11   from crab_util import *
6 #from EdgConfig import *
12   from GliteConfig import *
13 + import EdgLoggingInfo
14   import common
15 + from WMCore.SiteScreening.BlackWhiteListParser import CEBlackWhiteListParser
16  
17   import os, sys, time
18  
19 < class SchedulerGlite(SchedulerEdg):
20 <    def __init__(self):
21 <        SchedulerEdg.__init__(self)
19 > class SchedulerGlite(SchedulerGrid):
20 >    def __init__(self, name="GLITE"):
21 >        SchedulerGrid.__init__(self,name)
22 >
23 >        self.OSBsize = 55000000
24 >
25 >    def configure(self,cfg_params):
26 >        SchedulerGrid.configure(self, cfg_params)
27 >        self.environment_unique_identifier = '$GLITE_WMS_JOBID'
28 >
29 >    def realSchedParams(self,cfg_params):
30 >        """
31 >        Return dictionary with specific parameters, to use
32 >        with real scheduler
33 >        """
34 >        self.rb_param_file=''
35 >        if (not cfg_params.has_key('EDG.rb')):
36 >            cfg_params['EDG.rb']='CERN'
37 >        self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("EDG.rb"))
38 >        self.wms_service=cfg_params.get("EDG.wms_service",'')
39 >        self.skipWMSAuth=cfg_params.get("EDG.skipwmsauth",1)
40 >        params = { 'service' : self.wms_service, \
41 >                   'config' : self.rb_param_file, \
42 >                   'skipWMSAuth' : self.skipWMSAuth
43 >                 }
44 >        return  params
45 >
46  
47      def rb_configure(self, RB):
48 <        self.glite_config = ''
49 <        self.rb_param_file = ''
48 >        if not RB: return None
49 >        glite_config = None
50 >        rb_param_file = None
51  
52          gliteConfig = GliteConfig(RB)
53 <        self.glite_config = gliteConfig.config()
53 >        glite_config = gliteConfig.config()
54  
55 <        if (self.glite_config != ''):
56 <            self.rb_param_file = 'WMSconfig = '+self.glite_config+';'
57 <            #print "rb_param_file = ", self.rb_param_file
58 <        return self.rb_param_file
59 <
60 <    def sched_parameter(self):
61 <        """
62 <        Returns file with requirements and scheduler-specific parameters
63 <        """
64 <        index = int(common.jobDB.nJobs()) - 1
33 <        job = common.job_list[index]
34 <        jbt = job.type()
35 <        
36 <        lastDest=''
37 <        first = []
38 <        last  = []
39 <        for n in range(common.jobDB.nJobs()):
40 <            currDest=common.jobDB.destination(n)
41 <            if (currDest!=lastDest):
42 <                lastDest = currDest
43 <                first.append(n)
44 <                if n != 0:last.append(n-1)
45 <        if len(first)>len(last) :last.append(common.jobDB.nJobs())
46 <  
55 >        if (glite_config ):
56 >            rb_param_file = glite_config
57 >        return rb_param_file
58 >
59 >    def ce_list(self):
60 >        """
61 >        Returns string with requirement CE related
62 >        """
63 >        ceParser = CEBlackWhiteListParser(self.EDG_ce_white_list,
64 >                                          self.EDG_ce_black_list, common.logger)
65          req = ''
66 <        req = req + jbt.getRequirements()
67 <    
50 <        if self.EDG_requirements:
51 <            if (req == ' '):
52 <                req = req + self.EDG_requirements
53 <            else:
54 <                req = req +  ' && ' + self.EDG_requirements
66 >        ce_white_list = []
67 >        ce_black_list = []
68          if self.EDG_ce_white_list:
69 <            ce_white_list = string.split(self.EDG_ce_white_list,',')
70 <            for i in range(len(ce_white_list)):
71 <                if i == 0:
72 <                    if (req == ' '):
73 <                        req = req + '((RegExp("' + ce_white_list[i] + '", other.GlueCEUniqueId))'
74 <                    else:
75 <                        req = req +  ' && ((RegExp("' + ce_white_list[i] + '", other.GlueCEUniqueId))'
76 <                    pass
77 <                else:
78 <                    req = req +  ' || (RegExp("' + ce_white_list[i] + '", other.GlueCEUniqueId))'
79 <            req = req + ')'
80 <        
69 >            ce_white_list = ceParser.whiteList()
70 >            tmpCe=[]
71 >            concString = '&&'
72 >            for ce in ce_white_list:
73 >                tmpCe.append('RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId)')
74 >            if len(tmpCe) == 1:
75 >                req +=  " && (" + concString.join(tmpCe) + ") "
76 >            elif len(tmpCe) > 1:
77 >                firstCE = 0
78 >                for reqTemp in tmpCe:
79 >                    if firstCE == 0:
80 >                        req += " && ( (" + reqTemp + ") "
81 >                        firstCE = 1
82 >                    elif firstCE > 0:
83 >                        req += " || (" + reqTemp + ") "
84 >                if firstCE > 0:
85 >                    req += ") "
86 >
87          if self.EDG_ce_black_list:
88 <            ce_black_list = string.split(self.EDG_ce_black_list,',')
88 >            ce_black_list = ceParser.blackList()
89 >            tmpCe=[]
90 >            concString = '&&'
91              for ce in ce_black_list:
92 <                if (req == ' '):
93 <                    req = req + '(!RegExp("' + ce + '", other.GlueCEUniqueId))'
94 <                else:
95 <                    req = req +  ' && (!RegExp("' + ce + '", other.GlueCEUniqueId))'
96 <                pass
92 >                tmpCe.append('(!RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId))')
93 >            if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
94 >
95 >        # requirement added to skip gliteCE
96 >        req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
97 >
98 >        return req, ','.join(ce_white_list), ','.join(ce_black_list)
99 >
100 >    def se_list(self, dest):
101 >        """
102 >        Returns string with requirement SE related
103 >        """
104 >        hostList=self.findSites_(dest)
105 >        req=''
106 >        reqtmp=[]
107 >        concString = '||'
108 >
109 >        for arg in hostList:
110 >            reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
111 >
112 >        if len(reqtmp): req += " && (" + concString.join(reqtmp) + ") "
113 >
114 >        return req
115 >
116 >    def jdlParam(self):
117 >        """
118 >        Returns
119 >        """
120 >        req=''
121 >        if self.EDG_addJdlParam:
122 >            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
123 >            for p in self.EDG_addJdlParam:
124 >                req+=string.strip(p)+';\n'
125 >        return req
126 >
127 >    def specific_req(self):
128 >        """
129 >        Returns string with specific requirements
130 >        """
131 >        req=''
132          if self.EDG_clock_time:
133 <            if (req == ' '):
134 <                req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
79 <            else:
80 <                req = req + ' && other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
133 >            if (not req == ' '): req = req + ' && '
134 >            req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
135  
136          if self.EDG_cpu_time:
137 <            if (req == ' '):
138 <                req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
85 <            else:
86 <                req = req + ' && other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
87 <                
88 <        for i in range(len(first)): # Add loop DS
89 <            self.param='sched_param_'+str(i)+'.clad'
90 <            param_file = open(common.work_space.shareDir()+'/'+self.param, 'w')
91 <
92 <            itr4=self.findSites_(first[i])
93 <            req1=[]  
94 <            j = 0
95 <            concString = '||'
96 <            for arg in itr4:
97 <                #############
98 <                # MC Changed matching syntax to avoid gang matching
99 <                #############
100 <                req1.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
101 <            if len(req1): req = req + " && (" + concString.join(req1) + ')'
102 <            req = req + ';\n'
103 <            param_file.write('Requirements = ' + req )
104 <  
105 < #            if (self.edg_config and self.edg_config_vo != ''):
106 < #               param_file.write('RBconfig = "'+self.edg_config+'";\n')  
107 < #                param_file.write('RBconfigVO = "'+self.edg_config_vo+'";')
108 <
109 <            if (self.rb_param_file != ''):
110 <                param_file.write(self.rb_param_file)  
111 <
112 <
113 <            param_file.close()  
114 <
115 <    def wsSetupEnvironment(self):
116 <        """
117 <        Returns part of a job script which does scheduler-specific work.
118 <        """
119 <        txt = ''
120 <        txt += '# strip arguments\n'
121 <        txt += 'echo "strip arguments"\n'
122 <        txt += 'args=("$@")\n'
123 <        txt += 'nargs=$#\n'
124 <        txt += 'shift $nargs\n'
125 <        txt += "# job number (first parameter for job wrapper)\n"
126 <        txt += "NJob=${args[0]}\n"
127 <
128 <        txt += '# job identification to DashBoard \n'
129 <        txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
130 <        txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
131 <        txt += 'MonitorID=`echo ' + self._taskId + '`\n'
132 <        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
133 <        txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
134 <        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
135 <
136 <        txt += 'echo "middleware discovery " \n'
137 <        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
138 <        txt += '    middleware=LCG \n'
139 <        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
140 <        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
141 <        txt += '    echo "middleware =$middleware" \n'
142 <        txt += 'elif [ $GRID3_APP_DIR ]; then\n'
143 <        txt += '    middleware=OSG \n'
144 <        txt += '    echo "SyncCE=`echo $EDG_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
145 <        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
146 <        txt += '    echo "middleware =$middleware" \n'
147 <        txt += 'elif [ $OSG_APP ]; then \n'
148 <        txt += '    middleware=OSG \n'
149 <        txt += '    echo "SyncCE=`echo $EDG_WL_LOG_DESTINATION`" | tee -a $RUNTIME_AREA/$repo \n'
150 <        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
151 <        txt += '    echo "middleware =$middleware" \n'
152 <        txt += 'else \n'
153 <        txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
154 <        txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
155 <        txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
156 <        txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
157 <        txt += '    rm -f $RUNTIME_AREA/$repo \n'
158 <        txt += '    echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
159 <        txt += '    echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
160 <        txt += '    exit 1 \n'
161 <        txt += 'fi \n'
162 <
163 <        txt += '# report first time to DashBoard \n'
164 <        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
165 <        txt += 'rm -f $RUNTIME_AREA/$repo \n'
166 <        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
167 <        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
168 <        
169 <        txt += '\n\n'
170 <
171 <        if int(self.copy_data) == 1:
172 <           if self.SE:
173 <              txt += 'export SE='+self.SE+'\n'
174 <              txt += 'echo "SE = $SE"\n'
175 <           if self.SE_PATH:
176 <              if ( self.SE_PATH[-1] != '/' ) : self.SE_PATH = self.SE_PATH + '/'
177 <              txt += 'export SE_PATH='+self.SE_PATH+'\n'
178 <              txt += 'echo "SE_PATH = $SE_PATH"\n'
179 <
180 <        txt += 'export VO='+self.VO+'\n'
181 <        ### some line for LFC catalog setting
182 <        txt += 'if [ $middleware == LCG ]; then \n'
183 <        txt += '    if [[ $LCG_CATALOG_TYPE != \''+self.lcg_catalog_type+'\' ]]; then\n'
184 <        txt += '        export LCG_CATALOG_TYPE='+self.lcg_catalog_type+'\n'
185 <        txt += '    fi\n'
186 <        txt += '    if [[ $LFC_HOST != \''+self.lfc_host+'\' ]]; then\n'
187 <        txt += '        export LFC_HOST='+self.lfc_host+'\n'
188 <        txt += '    fi\n'
189 <        txt += '    if [[ $LFC_HOME != \''+self.lfc_home+'\' ]]; then\n'
190 <        txt += '        export LFC_HOME='+self.lfc_home+'\n'
191 <        txt += '    fi\n'
192 <        txt += 'elif [ $middleware == OSG ]; then\n'
193 <        txt += '    echo "LFC catalog setting to be implemented for OSG"\n'
194 <        txt += 'fi\n'
195 <        #####
196 <        if int(self.register_data) == 1:
197 <           txt += 'if [ $middleware == LCG ]; then \n'
198 <           txt += '    export LFN='+self.LFN+'\n'
199 <           txt += '    lfc-ls $LFN\n'
200 <           txt += '    result=$?\n'
201 <           txt += '    echo $result\n'
202 <           ### creation of LFN dir in LFC catalog, under /grid/cms dir  
203 <           txt += '    if [ $result != 0 ]; then\n'
204 <           txt += '       lfc-mkdir $LFN\n'
205 <           txt += '       result=$?\n'
206 <           txt += '       echo $result\n'
207 <           txt += '    fi\n'
208 <           txt += 'elif [ $middleware == OSG ]; then\n'
209 <           txt += '    echo " Files registration to be implemented for OSG"\n'
210 <           txt += 'fi\n'
211 <           txt += '\n'
212 <
213 <           if self.VO:
214 <              txt += 'export VO='+self.VO+'\n'
215 <           if self.LFN:
216 <              txt += 'if [ $middleware == LCG ]; then \n'
217 <              txt += '    export LFN='+self.LFN+'\n'
218 <              txt += 'fi\n'
219 <              txt += '\n'
220 <
221 <        txt += 'if [ $middleware == LCG ]; then\n'
222 <        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
223 <        txt += '    echo "CloseCEs = $CloseCEs"\n'
224 <        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
225 <        txt += '    echo "CE = $CE"\n'
226 <        txt += 'elif [ $middleware == OSG ]; then \n'
227 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
228 <        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
229 <        txt += '    else \n'
230 <        txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
231 <        txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
232 <        txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
233 <        txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
234 <        txt += '        rm -f $RUNTIME_AREA/$repo \n'
235 <        txt += '        echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
236 <        txt += '        echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
237 <        txt += '        exit 1 \n'
238 <        txt += '    fi \n'
239 <        txt += 'fi \n'
137 >            if (not req == ' '): req = req + ' && '
138 >            req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
139  
140 <        return txt
141 <        
142 <    def loggingInfo(self, id):
140 >        return req
141 >
142 >    def sched_parameter(self,i,task):
143 >        """
144 >        Returns string with requirements and scheduler-specific parameters
145 >        """
146 >        dest=  task.jobs[i-1]['dlsDestination']
147 >
148 >        req=''
149 >        req +=task['jobType']
150 >
151 >        sched_param=''
152 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(dest) +\
153 >                                        self.ce_list()[0] +';\n'
154 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam()
155 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
156 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
157 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
158 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
159 >
160 >        return sched_param
161 >
162 >    def decodeLogInfo(self, file):
163          """
164 <        retrieve the logging info from logging and bookkeeping and return it
164 >        Parse logging info file and return main info
165          """
166 <        self.checkProxy()
167 <        cmd = 'glite-job-logging-info -v 2 ' + id
168 <        cmd_out = runCommand(cmd)
250 <        return cmd_out
251 <
252 <    def queryDetailedStatus(self, id):
253 <        """ Query a detailed status of the job with id """
254 <        cmd = 'glite-job-status '+id
255 <        cmd_out = runCommand(cmd)
256 <        return cmd_out
166 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
167 >        reason = loggingInfo.decodeReason(file)
168 >        return reason
169  
170 <    def findSites_(self, n):
171 <        sites = common.jobDB.destination(n)
170 >    def findSites_(self, sites):
171 >        itr4 =[]
172          if len(sites)>0 and sites[0]=="":
173 <            return []
174 <        return sites
173 >            return itr4
174 >        if sites != [""]:
175 >            replicas = self.blackWhiteListParser.checkBlackList(sites)
176 >            if len(replicas)!=0:
177 >                replicas = self.blackWhiteListParser.checkWhiteList(replicas)
178 >
179 >            itr4 = replicas
180 >        return itr4
181 >
182 >
183 >    def wsExitFunc(self):
184 >        """
185 >        """
186 >        txt = '\n'
187 >
188 >        txt += '#\n'
189 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
190 >        txt += '#\n\n'
191 >
192 >        txt += 'func_exit() { \n'
193 >        txt += self.wsExitFunc_common()
194 >        ### specific Glite check for OSB
195 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
196 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
197 >        txt += '    rm ${out_files}.tgz\n'
198 >        txt += '    size=`expr $tmp_size`\n'
199 >        txt += '    echo "Total Output dimension: $size"\n'
200 >        txt += '    limit='+str(self.OSBsize) +' \n'
201 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
202 >        txt += '    if [ "$limit" -lt "$size" ]; then\n'
203 >        txt += '        exceed=1\n'
204 >        txt += '        job_exit_code=70000\n'
205 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
206 >        txt += '    else\n'
207 >        txt += '        exceed=0\n'
208 >        txt += '        echo "Total Output dimension $size is fine."\n'
209 >        txt += '    fi\n'
210 >
211 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
212 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
213 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
214 >        txt += '    if [ $exceed -ne 1 ]; then\n'
215 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
216 >        txt += '    else\n'
217 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
218 >        txt += '    fi\n'
219 >        txt += '    exit $job_exit_code\n'
220 >
221 >        txt += '}\n'
222 >        return txt

Diff Legend

Removed lines
+ Added lines
< Changed lines (text as in the old revision, 1.4)
> Changed lines (text as in the new revision, 1.65)