ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/COMP/CRAB/python/SchedulerGlite.py
(Generate patch)

Comparing COMP/CRAB/python/SchedulerGlite.py (file contents):
Revision 1.28 by ewv, Wed Nov 14 16:35:21 2007 UTC vs.
Revision 1.51 by spiga, Sat May 3 17:14:17 2008 UTC

# Line 1 | Line 1
1 < from SchedulerEdg import SchedulerEdg
1 > from SchedulerGrid import SchedulerGrid
2   from crab_logger import Logger
3   from crab_exceptions import *
4   from crab_util import *
5   from GliteConfig import *
6 + import EdgLoggingInfo
7   import common
8  
9   import os, sys, time
10  
11 < class SchedulerGlite(SchedulerEdg):
12 <    def __init__(self):
13 <        SchedulerEdg.__init__(self)
11 > class SchedulerGlite(SchedulerGrid):
12 >    def __init__(self, name="GLITE"):
13 >        SchedulerGrid.__init__(self,name)
14  
15 <    def rb_configure(self, RB):
15 <        self.glite_config = ''
16 <        self.rb_param_file = ''
17 <
18 <        gliteConfig = GliteConfig(RB)
19 <        self.glite_config = gliteConfig.config()
15 >        self.OSBsize = 55000
16  
17 <        if (self.glite_config != ''):
18 <            self.rb_param_file = 'WMSconfig = '+self.glite_config+';\n'
19 <            #print "rb_param_file = ", self.rb_param_file
20 <        return self.rb_param_file
17 >    def configure(self,cfg_params):
18 >        SchedulerGrid.configure(self, cfg_params)
19 >        self.checkProxy()
20 >        self.environment_unique_identifier = 'GLITE_WMS_JOBID'
21  
22 <    def sched_parameter(self):
22 >    def realSchedParams(self,cfg_params):
23          """
24 <        Returns file with requirements and scheduler-specific parameters
24 >        Return dictionary with specific parameters, to use
25 >        with real scheduler  
26          """
27 <        index = int(common.jobDB.nJobs()) - 1
28 <        job = common.job_list[index]
29 <        jbt = job.type()
30 <
31 <        lastDest=''
32 <        first = []
33 <        last  = []
34 <        for n in range(common.jobDB.nJobs()):
35 <            currDest=common.jobDB.destination(n)
39 <            if (currDest!=lastDest):
40 <                lastDest = currDest
41 <                first.append(n)
42 <                if n != 0:last.append(n-1)
43 <        if len(first)>len(last) :last.append(common.jobDB.nJobs())
27 >        self.rb_param_file=''
28 >        if (cfg_params.has_key('EDG.rb')):
29 >            self.rb_param_file=common.scheduler.rb_configure(cfg_params.get("EDG.rb"))
30 >        self.wms_service=cfg_params.get("EDG.wms_service",'')
31 >        params = { 'service' : self.wms_service, \
32 >                   'config' : self.rb_param_file
33 >                 }
34 >        return  params
35 >      
36  
37 <        req = ''
38 <        req = req + jbt.getRequirements()
37 >    def rb_configure(self, RB):
38 >        if not RB: return None
39 >        glite_config = None
40 >        rb_param_file = None
41  
42 +        gliteConfig = GliteConfig(RB)
43 +        glite_config = gliteConfig.config()
44  
45 <        if self.EDG_requirements:
46 <            if (not req == ' '): req = req +  ' && '
47 <            req = req + self.EDG_requirements
45 >        if (glite_config ):
46 >            rb_param_file = glite_config
47 >        return rb_param_file
48  
49 +    def ce_list(self):
50 +        """
51 +        Returns string with requirement CE related
52 +        """
53 +        req = ''
54          if self.EDG_ce_white_list:
55 <            ce_white_list = string.split(self.EDG_ce_white_list,',')
55 >            ce_white_list = self.EDG_ce_white_list
56              tmpCe=[]
57              concString = '&&'
58              for ce in ce_white_list:
59                  tmpCe.append('RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId)')
59            ### MATTY' FIX: if more then one CE: && -> ||
60            #print "list CE: " + str(tmpCe)
60              if len(tmpCe) == 1:
61                  req +=  " && (" + concString.join(tmpCe) + ") "
62              elif len(tmpCe) > 1:
63                  firstCE = 0
64                  for reqTemp in tmpCe:
66                    #print reqTemp
65                      if firstCE == 0:
68                        #print "adding: "+str(" && ( (" + reqTemp + ") ")
66                          req += " && ( (" + reqTemp + ") "
67                          firstCE = 1
68                      elif firstCE > 0:
72                        #print "adding: "+str(" || (" + reqTemp + ") ")
69                          req += " || (" + reqTemp + ") "
70                  if firstCE > 0:
71                      req += ") "
76            ## old code
77 #            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
72  
73          if self.EDG_ce_black_list:
74 <            ce_black_list = string.split(self.EDG_ce_black_list,',')
74 >            ce_black_list = self.EDG_ce_black_list
75              tmpCe=[]
76              concString = '&&'
77              for ce in ce_black_list:
78                  tmpCe.append('(!RegExp("' + string.strip(ce) + '", other.GlueCEUniqueId))')
79 <            if len(tmpCe): req = req + " && (" + concString.join(tmpCe) + ") "
79 >            if len(tmpCe): req += " && (" + concString.join(tmpCe) + ") "
80 >
81 >        # requirement added to skip gliteCE
82 >        req += '&& (!RegExp("blah", other.GlueCEUniqueId))'
83 >
84 >        return req,self.EDG_ce_white_list,self.EDG_ce_black_list
85 >
86 >    def se_list(self, id, dest):
87 >        """
88 >        Returns string with requirement SE related
89 >        """
90 >        hostList=self.findSites_(id,dest)
91 >        req=''
92 >        reqtmp=[]
93 >        concString = '||'
94 >
95 >        for arg in hostList:
96 >            reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
97  
98 +        if len(reqtmp): req += " && (" + concString.join(reqtmp) + ") "
99 +
100 +        return req
101 +
102 +    def jdlParam(self):
103 +        """
104 +        Returns
105 +        """
106 +        req=''
107 +        if self.EDG_addJdlParam:
108 +            if self.EDG_addJdlParam[-1] == '': self.EDG_addJdlParam= self.EDG_addJdlParam[:-1]
109 +            for p in self.EDG_addJdlParam:
110 +             #   param_file.write(string.strip(p)+';\n')
111 +                req+=string.strip(p)+';\n' ## BL--DS
112 +        return req
113 +
114 +    def specific_req(self):
115 +        """
116 +        Returns string with specific requirements
117 +        """
118 +        req=''
119          if self.EDG_clock_time:
120              if (not req == ' '): req = req + ' && '
121              req = req + 'other.GlueCEPolicyMaxWallClockTime>='+self.EDG_clock_time
# Line 92 | Line 124 | class SchedulerGlite(SchedulerEdg):
124              if (not req == ' '): req = req + ' && '
125              req = req + ' other.GlueCEPolicyMaxCPUTime>='+self.EDG_cpu_time
126  
127 <        for i in range(len(first)): # Add loop DS
96 <            self.param='sched_param_'+str(i)+'.clad'
97 <            param_file = open(common.work_space.shareDir()+'/'+self.param, 'w')
98 <
99 <            itr4=self.findSites_(first[i])
100 <            reqSites=''
101 <            reqtmp=[]
102 <            concString = '||'
103 <
104 <            #############
105 <            # MC Changed matching syntax to avoid gang matching
106 <            #############
107 <            for arg in itr4:
108 <                reqtmp.append(' Member("'+arg+'" , other.GlueCESEBindGroupSEUniqueID) ')
109 <
110 <            if len(reqtmp): reqSites = reqSites + " && (" + concString.join(reqtmp) + ") "
111 <
112 <            # requirement added to skip gliteCE
113 <            reqSites = reqSites + '&& (!RegExp("blah", other.GlueCEUniqueId));\n'
114 <
115 <            param_file.write('Requirements = ' + req + reqSites )
116 <
117 <            if (self.rb_param_file != ''):
118 <                param_file.write(self.rb_param_file)
119 <
120 <            if len(self.EDG_addJdlParam):
121 <                for p in self.EDG_addJdlParam:
122 <                    param_file.write(p)
123 <
124 <            param_file.close()
125 <
126 <    def wsSetupEnvironment(self):
127 <        """
128 <        Returns part of a job script which does scheduler-specific work.
129 <        """
130 <        txt = ''
131 <        txt += '# strip arguments\n'
132 <        txt += 'echo "strip arguments"\n'
133 <        txt += 'args=("$@")\n'
134 <        txt += 'nargs=$#\n'
135 <        txt += 'shift $nargs\n'
136 <        txt += "# job number (first parameter for job wrapper)\n"
137 <        txt += "NJob=${args[0]}\n"
138 <
139 <        txt += '# job identification to DashBoard \n'
140 <        txt += 'MonitorJobID=`echo ${NJob}_$GLITE_WMS_JOBID`\n'
141 <        txt += 'SyncGridJobId=`echo $GLITE_WMS_JOBID`\n'
142 <        txt += 'MonitorID=`echo ' + self._taskId + '`\n'
143 <        txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
144 <        txt += 'echo "SyncGridJobId=`echo $SyncGridJobId`" | tee -a $RUNTIME_AREA/$repo \n'
145 <        txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
146 <
147 <        txt += 'echo "middleware discovery: " \n'
148 <        txt += 'if [ $VO_CMS_SW_DIR ]; then \n'
149 <        txt += '    middleware=LCG \n'
150 <        txt += '    echo "SyncCE=`glite-brokerinfo getCE`" | tee -a $RUNTIME_AREA/$repo \n'
151 <        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
152 <        txt += '    echo ">>> middleware =$middleware" \n'
153 <        txt += 'elif [ $OSG_APP ]; then \n'
154 <        txt += '    middleware=OSG \n'
155 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
156 <        txt += '        SyncCE="$OSG_JOB_CONTACT"; \n'
157 <        txt += '        echo "SyncCE=$SyncCE" | tee -a $RUNTIME_AREA/$repo ;\n'
158 <        txt += '    else\n'
159 <        txt += '        echo "not reporting SyncCE";\n'
160 <        txt += '    fi\n';
161 <        txt += '    echo "GridFlavour=`echo $middleware`" | tee -a $RUNTIME_AREA/$repo \n'
162 <        txt += '    echo ">>> middleware =$middleware" \n'
163 <        txt += 'else \n'
164 <        txt += '    echo "SET_CMS_ENV 10030 ==> middleware not identified" \n'
165 <        txt += '    echo "JOB_EXIT_STATUS = 10030" \n'
166 <        txt += '    echo "JobExitCode=10030" | tee -a $RUNTIME_AREA/$repo \n'
167 <        txt += '    dumpStatus $RUNTIME_AREA/$repo \n'
168 <        txt += '    exit 1 \n'
169 <        txt += 'fi \n'
170 <
171 <        txt += 'dumpStatus $RUNTIME_AREA/$repo \n'
172 <        #txt += 'rm -f $RUNTIME_AREA/$repo \n'
173 <        #txt += 'echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
174 <        #txt += 'echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
175 <
176 <        txt += '\n\n'
177 <
178 <        #if int(self.copy_data) == 1:
179 <        #   if self.SE:
180 <        #      txt += 'export SE='+self.SE+'\n'
181 <        #      txt += 'echo "SE = $SE"\n'
182 <        #   if self.SE_PATH:
183 <        #      if ( self.SE_PATH[-1] != '/' ) : self.SE_PATH = self.SE_PATH + '/'
184 <        #      txt += 'export SE_PATH='+self.SE_PATH+'\n'
185 <        #      txt += 'echo "SE_PATH = $SE_PATH"\n'
186 <
187 <        txt += 'export VO='+self.VO+'\n'
188 <        ### some line for LFC catalog setting
189 <        #txt += 'if [ $middleware == LCG ]; then \n'
190 <        #txt += '    if [[ $LCG_CATALOG_TYPE != \''+self.lcg_catalog_type+'\' ]]; then\n'
191 <        #txt += '        export LCG_CATALOG_TYPE='+self.lcg_catalog_type+'\n'
192 <        #txt += '    fi\n'
193 <        #txt += '    if [[ $LFC_HOST != \''+self.lfc_host+'\' ]]; then\n'
194 <        #txt += '        export LFC_HOST='+self.lfc_host+'\n'
195 <        #txt += '    fi\n'
196 <        #txt += '    if [[ $LFC_HOME != \''+self.lfc_home+'\' ]]; then\n'
197 <        #txt += '        export LFC_HOME='+self.lfc_home+'\n'
198 <        #txt += '    fi\n'
199 <        #txt += 'elif [ $middleware == OSG ]; then\n'
200 <        #txt += '    echo "LFC catalog setting to be implemented for OSG"\n'
201 <        #txt += 'fi\n'
202 <        #####
203 <        #if int(self.register_data) == 1:
204 <        #   txt += 'if [ $middleware == LCG ]; then \n'
205 <        #   txt += '    export LFN='+self.LFN+'\n'
206 <        #   txt += '    lfc-ls $LFN\n'
207 <        #   txt += '    result=$?\n'
208 <        #   txt += '    echo $result\n'
209 <        #   ### creation of LFN dir in LFC catalog, under /grid/cms dir
210 <        #   txt += '    if [ $result != 0 ]; then\n'
211 <        #   txt += '       lfc-mkdir $LFN\n'
212 <        #   txt += '       result=$?\n'
213 <        #   txt += '       echo $result\n'
214 <        #   txt += '    fi\n'
215 <        #   txt += 'elif [ $middleware == OSG ]; then\n'
216 <        #   txt += '    echo " Files registration to be implemented for OSG"\n'
217 <        #   txt += 'fi\n'
218 <        #   txt += '\n'
219 <        #   if self.VO:
220 <        #      txt += 'export VO='+self.VO+'\n'
221 <        #   if self.LFN:
222 <        #      txt += 'if [ $middleware == LCG ]; then \n'
223 <        #      txt += '    export LFN='+self.LFN+'\n'
224 <        #      txt += 'fi\n'
225 <        #      txt += '\n'
226 <
227 <        txt += 'if [ $middleware == LCG ]; then\n'
228 <        txt += '    CloseCEs=`glite-brokerinfo getCE`\n'
229 <        txt += '    echo "CloseCEs = $CloseCEs"\n'
230 <        txt += '    CE=`echo $CloseCEs | sed -e "s/:.*//"`\n'
231 <        txt += '    echo "CE = $CE"\n'
232 <        txt += 'elif [ $middleware == OSG ]; then \n'
233 <        txt += '    if [ $OSG_JOB_CONTACT ]; then \n'
234 <        txt += '        CE=`echo $OSG_JOB_CONTACT | /usr/bin/awk -F\/ \'{print $1}\'` \n'
235 <        txt += '    else \n'
236 <        txt += '        echo "SET_CMS_ENV 10099 ==> OSG mode: ERROR in setting CE name from OSG_JOB_CONTACT" \n'
237 <        txt += '        echo "JOB_EXIT_STATUS = 10099" \n'
238 <        txt += '        echo "JobExitCode=10099" | tee -a $RUNTIME_AREA/$repo \n'
239 <        txt += '        dumpStatus $RUNTIME_AREA/$repo \n'
240 <        #txt += '        rm -f $RUNTIME_AREA/$repo \n'
241 <        #txt += '        echo "MonitorJobID=`echo $MonitorJobID`" | tee -a $RUNTIME_AREA/$repo \n'
242 <        #txt += '        echo "MonitorID=`echo $MonitorID`" | tee -a $RUNTIME_AREA/$repo\n'
243 <        txt += '        exit 1 \n'
244 <        txt += '    fi \n'
245 <        txt += 'fi \n'
127 >        return req
128  
129 <        return txt
129 >    def sched_fix_parameter(self):
130 >        """
131 >        Returns string with requirements and scheduler-specific parameters
132 >        """
133 >        index = int(common._db.nJobs())
134 >        job = common.job_list[index-1]
135 >        jbt = job.type()
136 >        req = ''
137 >        req = req + jbt.getRequirements()
138  
139 <    def loggingInfo(self, id):
139 >        if self.EDG_requirements:
140 >            if (not req == ' '): req = req +  ' && '
141 >            req = req + self.EDG_requirements
142 >
143 >        Task_Req={'jobType':req}## DS--BL
144 >        common._db.updateTask_(Task_Req)
145 >
146 >    def sched_parameter(self,i,task):
147          """
148 <        retrieve the logging info from logging and bookkeeping and return it
148 >        Returns string with requirements and scheduler-specific parameters
149          """
150 <        self.checkProxy()
151 <        cmd = 'glite-job-logging-info -v 3 ' + id
152 <        cmd_out = runCommand(cmd)
153 <        return cmd_out
154 <
155 <    def queryDetailedStatus(self, id):
156 <        """ Query a detailed status of the job with id """
157 <        cmd = 'glite-job-status '+id
158 <        cmd_out = runCommand(cmd)
159 <        return cmd_out
160 <
161 <    def findSites_(self, n):
162 <        itr4 = []
163 <        sites = common.jobDB.destination(n)
150 >        dest=  task.jobs[i-1]['dlsDestination'] ## DS--BL
151 >
152 >        req=''
153 >        req +=task['jobType']
154 >
155 >        sched_param=''
156 >        sched_param+='Requirements = ' + req +self.specific_req() + self.se_list(i,dest) +\
157 >                                        self.ce_list()[0] +';\n' ## BL--DS
158 >        if self.EDG_addJdlParam: sched_param+=self.jdlParam() ## BL--DS
159 >        sched_param+='MyProxyServer = "' + self.proxyServer + '";\n'
160 >        sched_param+='VirtualOrganisation = "' + self.VO + '";\n'
161 >        sched_param+='RetryCount = '+str(self.EDG_retry_count)+';\n'
162 >        sched_param+='ShallowRetryCount = '+str(self.EDG_shallow_retry_count)+';\n'
163 >
164 >        return sched_param
165 >
166 >    def decodeLogInfo(self, file):
167 >        """
168 >        Parse logging info file and return main info
169 >        """
170 >        loggingInfo = EdgLoggingInfo.EdgLoggingInfo()
171 >        reason = loggingInfo.decodeReason(file)
172 >        return reason
173 >
174 >    def findSites_(self, n, sites):
175 >        itr4 =[]
176          if len(sites)>0 and sites[0]=="":
177              return itr4
178          if sites != [""]:
# Line 272 | Line 181 | class SchedulerGlite(SchedulerEdg):
181              if len(replicas)!=0:
182                  replicas = self.blackWhiteListParser.checkWhiteList(replicas,n)
183  
275            #if len(replicas)==0:
276                #msg = 'No sites remaining that host any part of the requested data! Exiting... '
277                #raise CrabException(msg)
184              itr4 = replicas
185              #####
186          return itr4
187  
188 <    def tOut(self, list):
189 <        return 180
188 >    
189 >    def wsExitFunc(self):
190 >        """
191 >        """
192 >        txt = '\n'
193 >
194 >        txt += '#\n'
195 >        txt += '# EXECUTE THIS FUNCTION BEFORE EXIT \n'
196 >        txt += '#\n\n'
197 >
198 >        txt += 'func_exit() { \n'
199 >        txt += self.wsExitFunc_common()
200 >        ### specific Glite check for OSB
201 >        txt += '    tar zcvf ${out_files}.tgz  ${final_list}\n'
202 >        txt += '    tmp_size=`ls -gGrta ${out_files}.tgz | awk \'{ print $3 }\'`\n'
203 >        txt += '    rm ${out_files}.tgz\n'  
204 >        txt += '    size=`expr $tmp_size`\n'
205 >        txt += '    echo "Total Output dimension: $size"\n'
206 >        txt += '    limit='+str(self.OSBsize) +' \n'  
207 >        txt += '    echo "WARNING: output files size limit is set to: $limit"\n'
208 >        txt += '    if [ $limit -lt $sum ]; then\n'
209 >        txt += '        exceed=1\n'
210 >        txt += '        job_exit_code=70000\n'
211 >        txt += '        echo "Output Sanbox too big. Produced output is lost "\n'
212 >        txt += '    else\n'
213 >        txt += '        exceed=0\n'
214 >        txt += '        echo "Total Output dimension $sum is fine."\n'
215 >        txt += '    fi\n'
216 >
217 >        txt += '    echo "JOB_EXIT_STATUS = $job_exit_code"\n'
218 >        txt += '    echo "JobExitCode=$job_exit_code" >> $RUNTIME_AREA/$repo\n'
219 >        txt += '    dumpStatus $RUNTIME_AREA/$repo\n'
220 >        txt += '    if [ $exceed -ne 1 ]; then\n'
221 >        txt += '        tar zcvf ${out_files}.tgz  ${final_list}\n'
222 >        txt += '    else\n'
223 >        txt += '        tar zcvf ${out_files}.tgz CMSSW_${NJob}.stdout CMSSW_${NJob}.stderr\n'
224 >        txt += '    fi\n'
225 >        txt += '    exit $job_exit_code\n'
226 >
227 >        txt += '}\n'
228 >        return txt
229 >
230 >    def userName(self):
231 >        """ return the user name """
232 >        tmp=runCommand("voms-proxy-info -identity")
233 >        return tmp.strip()

Diff Legend

(no marker, old-revision line number) Removed lines
+ Added lines
< Changed lines (old text, revision 1.28)
> Changed lines (new text, revision 1.51)