1 |
gutsche |
1.1 |
#!/usr/bin/env python
|
2 |
|
|
|
3 |
|
|
import sys, getopt, string
|
4 |
|
|
|
5 |
fanzago |
1.6 |
from ProdCommon.FwkJobRep.ReportParser import readJobReport
|
6 |
gutsche |
1.2 |
from DashboardAPI import apmonSend, apmonFree
|
7 |
|
|
|
8 |
gutsche |
1.1 |
|
9 |
|
|
def main(argv) :
|
10 |
|
|
"""
|
11 |
|
|
parseCrabFjr
|
12 |
|
|
|
13 |
gutsche |
1.2 |
- parse CRAB FrameworkJobReport on WN: { 'protocol' : { 'action' : [attempted,succedeed,total-size,total-time,min-time,max-time] , ... } , ... }
|
14 |
|
|
- report parameters to DashBoard using DashBoardApi.py: for all 'read' actions of all protocols, report MBPS
|
15 |
|
|
- return ExitStatus and dump of DashBoard report separated by semi-colon to WN wrapper script
|
16 |
gutsche |
1.1 |
|
17 |
|
|
required parameters:
|
18 |
|
|
--input : input FJR xml file
|
19 |
gutsche |
1.2 |
--MonitorID : DashBoard MonitorID
|
20 |
|
|
--MonitorJobID : DashBoard MonitorJobID
|
21 |
gutsche |
1.1 |
|
22 |
|
|
optional parameters:
|
23 |
|
|
--help : help
|
24 |
|
|
--debug : debug statements
|
25 |
|
|
|
26 |
|
|
"""
|
27 |
|
|
|
28 |
|
|
# defaults
|
29 |
|
|
input = ''
|
30 |
gutsche |
1.2 |
MonitorID = ''
|
31 |
|
|
MonitorJobID = ''
|
32 |
gutsche |
1.1 |
debug = 0
|
33 |
|
|
|
34 |
|
|
try:
|
35 |
gutsche |
1.2 |
opts, args = getopt.getopt(argv, "", ["input=", "MonitorID=", "MonitorJobID=", "debug", "help"])
|
36 |
gutsche |
1.1 |
except getopt.GetoptError:
|
37 |
|
|
print main.__doc__
|
38 |
|
|
sys.exit(2)
|
39 |
|
|
|
40 |
|
|
# check command line parameter
|
41 |
|
|
for opt, arg in opts :
|
42 |
|
|
if opt == "--help" :
|
43 |
|
|
print main.__doc__
|
44 |
|
|
sys.exit()
|
45 |
|
|
elif opt == "--input" :
|
46 |
|
|
input = arg
|
47 |
gutsche |
1.2 |
elif opt == "--MonitorID" :
|
48 |
|
|
MonitorID = arg
|
49 |
|
|
elif opt == "--MonitorJobID" :
|
50 |
|
|
MonitorJobID = arg
|
51 |
gutsche |
1.1 |
elif opt == "--debug" :
|
52 |
|
|
debug = 1
|
53 |
|
|
|
54 |
gutsche |
1.2 |
if input == '' or MonitorID == '' or MonitorJobID == '':
|
55 |
gutsche |
1.1 |
print main.__doc__
|
56 |
|
|
sys.exit()
|
57 |
|
|
|
58 |
|
|
# load FwkJobRep
|
59 |
|
|
jobReport = readJobReport(input)[0]
|
60 |
|
|
|
61 |
gutsche |
1.5 |
exit_status = ''
|
62 |
gutsche |
1.1 |
|
63 |
fanzago |
1.7 |
##### temporary fix for FJR incomplete ####
|
64 |
|
|
fjr = open (input)
|
65 |
|
|
len_fjr = len(fjr.readlines())
|
66 |
|
|
if (len_fjr <= 6):
|
67 |
|
|
### 50115 - cmsRun did not produce a valid/readable job report at runtime
|
68 |
|
|
exit_status = str(50115)
|
69 |
|
|
else:
|
70 |
|
|
# get ExitStatus of last error
|
71 |
|
|
if len(jobReport.errors) != 0 :
|
72 |
|
|
exit_status = str(jobReport.errors[-1]['ExitStatus'])
|
73 |
|
|
else :
|
74 |
|
|
exit_status = str(0)
|
75 |
gutsche |
1.1 |
|
76 |
|
|
# get i/o statistics
|
77 |
|
|
storageStatistics = str(jobReport.storageStatistics)
|
78 |
|
|
|
79 |
gutsche |
1.2 |
# dashboard report dictionary
|
80 |
|
|
dashboard_report = {}
|
81 |
|
|
|
82 |
|
|
# check if storageStatistics is valid
|
83 |
|
|
if storageStatistics.find('Storage statistics:') != -1 :
|
84 |
|
|
# report form: { 'protocol' : { 'action' : [attempted,succedeed,total-size,total-time,min-time,max-time] , ... } , ... }
|
85 |
|
|
report = {}
|
86 |
|
|
data = storageStatistics.split('Storage statistics:')[1]
|
87 |
|
|
data_fields = data.split(';')
|
88 |
|
|
for data_field in data_fields:
|
89 |
|
|
# parse: format protocol/action = attepted/succedeed/total-size/total-time/min-time/max-time
|
90 |
|
|
key = data_field.split('=')[0].strip()
|
91 |
|
|
item = data_field.split('=')[1].strip()
|
92 |
|
|
protocol = str(key.split('/')[0].strip())
|
93 |
|
|
action = str(key.split('/')[1].strip())
|
94 |
|
|
item_array = item.split('/')
|
95 |
|
|
attempted = str(item_array[0].strip())
|
96 |
|
|
succeeded = str(item_array[1].strip())
|
97 |
|
|
total_size = str(item_array[2].strip().split('MB')[0])
|
98 |
|
|
total_time = str(item_array[3].strip().split('ms')[0])
|
99 |
|
|
min_time = str(item_array[4].strip().split('ms')[0])
|
100 |
|
|
max_time = str(item_array[5].strip().split('ms')[0])
|
101 |
|
|
# add to report
|
102 |
|
|
if protocol in report.keys() :
|
103 |
|
|
if action in report[protocol].keys() :
|
104 |
|
|
print 'protocol/action:',protocol,'/',action,'listed twice in report, taking the first'
|
105 |
|
|
else :
|
106 |
|
|
report[protocol][action] = [attempted,succeeded,total_size,total_time,min_time,max_time]
|
107 |
|
|
else :
|
108 |
gutsche |
1.3 |
report[protocol] = {action : [attempted,succeeded,total_size,total_time,min_time,max_time] }
|
109 |
gutsche |
1.2 |
|
110 |
|
|
if debug :
|
111 |
|
|
for protocol in report.keys() :
|
112 |
|
|
print 'protocol:',protocol
|
113 |
|
|
for action in report[protocol].keys() :
|
114 |
|
|
print 'action:',action,'measurement:',report[protocol][action]
|
115 |
|
|
|
116 |
|
|
# extract information to be sent to DashBoard
|
117 |
|
|
# per protocol and for action=read, calculate MBPS
|
118 |
|
|
# dashboard key is io_action
|
119 |
|
|
dashboard_report['MonitorID'] = MonitorID
|
120 |
|
|
dashboard_report['MonitorJobID'] = MonitorJobID
|
121 |
|
|
for protocol in report.keys() :
|
122 |
gutsche |
1.3 |
for action in report[protocol].keys() :
|
123 |
|
|
try: size = float(report[protocol][action][2])
|
124 |
|
|
except: size = 'NULL'
|
125 |
gutsche |
1.4 |
try: time = float(report[protocol][action][3])/1000
|
126 |
gutsche |
1.3 |
except: time = 'NULL'
|
127 |
|
|
dashboard_report['io_'+protocol+'_'+action] = str(size)+'_'+str(time)
|
128 |
gutsche |
1.2 |
|
129 |
|
|
if debug :
|
130 |
gutsche |
1.3 |
ordered = dashboard_report.keys()
|
131 |
|
|
ordered.sort()
|
132 |
|
|
for key in ordered:
|
133 |
|
|
print key,'=',dashboard_report[key]
|
134 |
gutsche |
1.2 |
|
135 |
|
|
# send to DashBoard
|
136 |
|
|
apmonSend(MonitorID, MonitorJobID, dashboard_report)
|
137 |
|
|
apmonFree()
|
138 |
|
|
|
139 |
|
|
# prepare exit string
|
140 |
|
|
exit_string = str(exit_status)
|
141 |
|
|
for key in dashboard_report.keys() :
|
142 |
|
|
exit_string += ';' + str(key) + '=' + str(dashboard_report[key])
|
143 |
|
|
|
144 |
gutsche |
1.5 |
|
145 |
|
|
|
146 |
gutsche |
1.2 |
return exit_string
|
147 |
gutsche |
1.1 |
|
148 |
|
|
|
149 |
|
|
if __name__ == '__main__' :
|
150 |
gutsche |
1.2 |
exit_status = main(sys.argv[1:])
|
151 |
|
|
# output for wrapper script
|
152 |
|
|
print exit_status
|
153 |
gutsche |
1.1 |
|
154 |
|
|
|