ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/UserCode/OSUT3Analysis/AnaTools/scripts/mergeHists
Revision: 1.24
Committed: Fri Apr 12 05:18:05 2013 UTC (12 years ago) by ahart
Branch: MAIN
CVS Tags: V02-02-00, V02-01-01, V02-01-00, V01-01-00, V01-00-01, V01-00-00, V00-01-00
Changes since 1.23: +10 -3 lines
Log Message:
The "weight" option can now be passed a comma-separated list of weights, one for each input file.

File Contents

# Content
1 #!/usr/bin/env perl
2
3 use strict;
4 use Getopt::Long;
5 use POSIX;
6
7 sub processArgs;
8 sub printHelp;
9 sub getRunList;
10 sub countEvents;
11
# Parse the command line.  With "bundling" configured, single-letter options
# may be grouped behind one dash.
my %opt;
Getopt::Long::Configure ("bundling");
GetOptions (\%opt, "cutflow|c=s", "luminosity|l=s", "prefix|p=s", "weight|w=s", "xsection|x=s", "help|h");

# The prefix names the output file, so the help text is printed (and the
# program exits) when it is missing.
printHelp () if $opt{"help"} || !$opt{"prefix"};

# Expand the command-line arguments into a flat list of files.
my $files = processArgs (\@ARGV);
my %rootFiles;            # argument => list of ROOT files to merge for it
my %weights;              # argument => weight for its merged histograms
my @weights;              # every weight computed, in the order files are seen
my $nGoodJobs = 0;        # Condor logs that report a return value
my $nBadJobs = 0;         # Condor logs that report a signal
my $nIncompleteJobs = 0;  # Condor logs that report neither
my $counting = 0;         # set once any Condor log is seen; enables the job summary
my %exitCodes;            # directory => job number => return value
my %signals;              # directory => job number => signal
my %partial;              # directory => job number => 1 for unfinished jobs
my %crossSections;        # directory => first line of crossSectionInPicobarn.txt
my %dirs;                 # argument => directory of the last ROOT file seen for it
my $integratedLuminosity = 10000;
$integratedLuminosity = $opt{"luminosity"} if $opt{"luminosity"};
my $cutFlow = "cutFlow";
$cutFlow = $opt{"cutflow"} if $opt{"cutflow"};

# First pass over the files: read the job status out of the Condor logs and
# pick up the cross section stored in each directory.
foreach my $file (@$files)
{
  next if $file eq ".";
  next if $file eq "..";
  my $dir = $file;
  $dir =~ s/^(.*)\/[^\/]*$/$1/;
  if ($file =~ m/^.*\/condor_[^_]*\.log$/)
  {
    my $jobNumber = $file;
    $jobNumber =~ s/^.*\/condor_([^_]*)\.log$/$1/;

    # Slurp the whole log.  An unreadable log is reported and then handled
    # like an empty one, i.e., the job is counted as unfinished.
    my $fileContents = "";
    if (open (my $log, "<", $file))
    {
      local $/;
      my $slurped = <$log>;
      close ($log);
      $fileContents = $slurped if defined $slurped;
    }
    else
    {
      print "WARNING: Could not open $file: $!\n";
    }
    $fileContents =~ s/\n/ /g;
    $counting = 1;
    if ($fileContents =~ m/return value/)
    {
      # The greedy leading ".*" keeps the last "(return value N)" in the log.
      $fileContents =~ s/.*\(return value ([^)]*)\).*/$1/g;
      $nGoodJobs++;
      print "WARNING: Nonzero exit code for job $jobNumber. (return value $fileContents)\n" if $fileContents != 0;
      $exitCodes{$dir}{$jobNumber} = $fileContents;
    }
    elsif ($fileContents =~ m/signal/)
    {
      $fileContents =~ s/.*\(signal ([^)]*)\).*/$1/g;
      $nBadJobs++;
      print "WARNING: Skipping job $jobNumber. (signal $fileContents)\n";
      $signals{$dir}{$jobNumber} = $fileContents;
    }
    else
    {
      $nIncompleteJobs++;
      $partial{$dir}{$jobNumber} = 1;
    }
  }
  if ($file =~ m/^.*\/crossSectionInPicobarn\.txt$/)
  {
    if (open (my $crossSectionFile, "<", $file))
    {
      # Only the first line of the file is used.
      my $crossSection = <$crossSectionFile>;
      close ($crossSectionFile);
      chomp ($crossSection) if defined $crossSection;
      $crossSections{$dir} = $crossSection;
    }
    else
    {
      print "WARNING: Could not open $file: $!\n";
    }
  }
}
# Second pass over the files: collect the usable ROOT files for each
# command-line argument and work out the weight for that argument.
foreach my $file (@$files)
{
  next if $file eq ".";
  next if $file eq "..";
  my $dir = $file;
  $dir =~ s/^(.*)\/[^\/]*$/$1/;
  my $badJob = 0;
  my $jobNumber;
  if ($file =~ m/^.*_[^_]*\.root$/)
  {
    # The job number is whatever sits between the last underscore and ".root".
    $jobNumber = $file;
    $jobNumber =~ s/^.*_([^_]*)\.root$/$1/;
    $badJob = (defined $signals{$dir} && defined $signals{$dir}{$jobNumber}) || (defined $partial{$dir} && defined $partial{$dir}{$jobNumber});
  }
  # Output of jobs that were killed by a signal or never finished is ignored.
  next if $badJob;
  next if !($file =~ m/^.*\.root$/);

  foreach my $arg (@ARGV)
  {
    # A file belongs to an argument when it is that argument or lies beneath
    # it.  The comparison is done on a path boundary so that, e.g., files in
    # "sample10" are not also attributed to "sample1".  processArgs has
    # already stripped trailing slashes from @ARGV in place.
    next if !($file eq $arg || index ($file, "$arg/") == 0);

    $dirs{$arg} = $dir;
    if (countEvents ($file, $cutFlow) < 0)
    {
      $nGoodJobs--;
      $nBadJobs++;
      # Not every ROOT file name carries a job number.
      my $jobLabel = defined $jobNumber ? $jobNumber : $file;
      print "WARNING: Skipping job $jobLabel. (bad ROOT file)\n";
      last;
    }
    push (@{$rootFiles{$arg}}, $file);

    # Order of precedence: --weight, then --xsection, then the cross section
    # found in the file's directory, and finally no weighting at all.
    my $weight = 1.0;
    if ($opt{"weight"})
    {
      # For a comma-separated list the per-argument weight stays at 1; the
      # list itself is handed to the final merge.
      $weight = $opt{"weight"} if !($opt{"weight"} =~ m/,/);
    }
    elsif ($opt{"xsection"})
    {
      $weight = $opt{"xsection"} * $integratedLuminosity;
    }
    elsif (defined $crossSections{$dir})
    {
      $weight = $crossSections{$dir} * $integratedLuminosity;
    }
    push (@weights, $weight);
    $weights{$arg} = $weight;
  }
}
if (!%rootFiles)
{
  print "Found no ROOT files to merge!\n";
  exit;
}
# Merge the ROOT files of each argument into one temporary file, divide the
# argument's weight by the number of events processed, and finally merge the
# temporary files into PREFIX.root using those weights.
my %nTotalEvents;
my $nTotalEvents = 0;
my @mergedFiles;
my @mergedWeights;

# A comma-separated --weight list replaces the computed weights in the final
# merge.  Its i-th entry goes with the i-th argument, so entries of arguments
# that end up being skipped have to be dropped.
my $haveWeightList = $opt{"weight"} && $opt{"weight"} =~ m/,/;
my @listedWeights = $haveWeightList ? split (/,/, $opt{"weight"}) : ();
my @keptListedWeights;
my $nSkipped = 0;

for (my $i = 0; $i < @ARGV; $i++)
{
  my $arg = $ARGV[$i];

  # An argument may have contributed no usable ROOT file at all;
  # dereferencing its missing list would abort the program under "strict".
  if (!defined $rootFiles{$arg} || !@{$rootFiles{$arg}})
  {
    print "WARNING: Found no ROOT files to merge for $arg. Skipping it.\n";
    $nSkipped++;
    next;
  }

  my $tmpName = $arg . "_" . "$opt{'prefix'}.root";
  $tmpName =~ s/\//_/g;

  # The list form of system bypasses the shell, so file names containing
  # spaces or shell metacharacters are passed through unharmed.
  if (system ("mergeTFileServiceHistograms", "-i", @{$rootFiles{$arg}}, "-o", $tmpName) != 0)
  {
    print "WARNING: mergeTFileServiceHistograms failed for $arg.\n";
  }
  my $count = countEvents ($tmpName, $cutFlow);

  # The weight is divided by the event count only when it was derived from a
  # cross section.  Without a positive count that division is impossible (or
  # would flip the sign of the weight), so the sample is left out.
  my $normalize = !$opt{"weight"} && ($opt{"xsection"} || defined $crossSections{$dirs{$arg}});
  if ($normalize && $count <= 0)
  {
    print "WARNING: Could not count the events for $arg. Skipping it.\n";
    unlink ($tmpName);
    delete $weights{$arg};
    $nSkipped++;
    next;
  }

  system ("cutFlowLimits", $tmpName);
  $nTotalEvents{$arg} = $count;
  $nTotalEvents += $count if $count > 0;
  $weights{$arg} /= $count if $normalize;
  push (@mergedFiles, $tmpName);
  push (@mergedWeights, $weights{$arg});
  push (@keptListedWeights, defined $listedWeights[$i] ? $listedWeights[$i] : 1.0) if $haveWeightList;
}
if (!@mergedFiles)
{
  print "Found no ROOT files to merge!\n";
  exit;
}

my $mergedFiles = join (" ", @mergedFiles);
my $mergedWeights = join (",", @mergedWeights);
if ($haveWeightList)
{
  # When nothing was skipped the user's list is forwarded exactly as given.
  $mergedWeights = $nSkipped ? join (",", @keptListedWeights) : $opt{"weight"};
}
if (system ("mergeTFileServiceHistograms", "-i", @mergedFiles, "-o", "$opt{'prefix'}.root", "-w", $mergedWeights) != 0)
{
  print "WARNING: mergeTFileServiceHistograms failed to create $opt{'prefix'}.root.\n";
}

# The per-argument files were only intermediate products.
foreach my $mergedFile (@mergedFiles)
{
  unlink ("$mergedFile");
}
# Summary: cross sections, effective luminosities, and weights per sample,
# followed by the job statistics when Condor logs were found.
print "=============================================\n";

# Samples are reported by the last component of their path, in sorted order
# so that the output is reproducible from run to run.
my $shortName = sub
{
  my $name = shift;
  $name =~ s/^.*\/([^\/]*)$/$1/;
  return $name;
};
my @samples = sort keys %weights;

# Each section is printed only if at least one sample has a weight other
# than 1.
my $output = "Cross-section of samples:\n";
my $printOutput = 0;
foreach my $arg (@samples)
{
  # Report the value the weighting is based on: --xsection when given,
  # otherwise the cross section found in the sample's directory.  Samples
  # without a known cross section are left out instead of being shown as 0.
  my $crossSection = $opt{"xsection"};
  $crossSection = $crossSections{$dirs{$arg}} if !$crossSection && defined $dirs{$arg};
  next if !defined $crossSection;
  # The sample name is passed as an argument so that a "%" in it cannot be
  # mistaken for a format directive.
  $output .= sprintf (" %s: %.5g pb\n", $shortName->($arg), $crossSection);
  $printOutput = 1 if $weights{$arg} != 1;
}
print $output if $printOutput;

$output = "Effective luminosities of samples:\n";
$printOutput = 0;
foreach my $arg (@samples)
{
  next if $weights{$arg} == 1;
  # A weight of zero has no finite effective luminosity.
  next if $weights{$arg} == 0;
  $output .= sprintf (" %s: %.5g/fb\n", $shortName->($arg), $integratedLuminosity / (1000.0 * $weights{$arg}));
  $printOutput = 1;
}
print $output if $printOutput;

$output = sprintf ("Weights for target luminosity of %g/fb:\n", $integratedLuminosity / 1000.0);
$printOutput = 0;
foreach my $arg (@samples)
{
  next if $weights{$arg} == 1;
  $output .= sprintf (" %s: %.5g\n", $shortName->($arg), $weights{$arg});
  $printOutput = 1;
}
print $output if $printOutput;

# The job statistics are meaningful only if Condor logs were found.
my $goodEvents = countEvents ("$opt{'prefix'}.root", $cutFlow);
print "$nGoodJobs jobs ran successfully over $nTotalEvents ($goodEvents weighted) events.\n" if $counting;
print "$nBadJobs jobs failed to run.\n" if $counting;
print "$nIncompleteJobs jobs have not finished.\n" if $counting;
print "=============================================\n";
192
# Recursively expands a list of files and directories into a flat list of
# files.
#
# Takes a reference to an array of paths.  Trailing slashes are stripped from
# the elements of that array IN PLACE; the main program relies on this when
# it compares file names against @ARGV.  Prints a message and exits if one of
# the given paths does not exist.
#
# Returns a reference to an array holding every non-directory path found.
sub
processArgs
{
  my $argv = shift;

  my @files;
  foreach my $arg (@$argv)
  {
    # $arg aliases the caller's element, so this edits the caller's array.
    $arg =~ s/\/*$//;
    if (!(-e $arg))
    {
      print "$arg does not exist!\n";
      exit;
    }
    next if ($arg =~ m/\/\.$/ || $arg =~ m/\/\.\.$/);
    if (!(-d $arg))
    {
      push (@files, $arg);
      next;
    }

    # A lexical handle is used because this subroutine calls itself.
    my $dirHandle;
    if (!opendir ($dirHandle, $arg))
    {
      print "WARNING: Could not read directory $arg: $!\n";
      next;
    }
    my @entries = readdir ($dirHandle);
    closedir ($dirHandle);

    my @children;
    foreach my $entry (@entries)
    {
      next if $entry eq "." || $entry eq "..";
      my $child = "$arg/$entry";
      # An entry that fails the existence test (e.g., a dangling symbolic
      # link) must not reach the recursive call, which would end the whole
      # program with "does not exist!".
      if (!(-e $child))
      {
        print "WARNING: Skipping $child, which does not exist (dangling symbolic link?).\n";
        next;
      }
      push (@children, $child);
    }
    my $newFiles = processArgs (\@children);
    push (@files, @$newFiles);
  }

  return \@files;
}
228
# Prints the usage message to standard output and terminates the program.
sub
printHelp
{
  # Refer to the script by its base name.
  (my $exeName = $0) =~ s/^.*\/([^\/]*)$/$1/;

  my @description = (
    "Usage: $exeName [OPTION]... -p PREFIX DIRECTORIES_AND_FILES",
    "Merges ROOT files containing histograms. If there are Condor logs in the",
    "specified directories, checks for nonzero return values. If the directories",
    "where created by \"osusub\", uses the cross section from the database to weight",
    "all histograms.",
    "",
    "Mandatory arguments to long options are mandatory for short options too.",
  );
  print "$_\n" foreach @description;

  # Each row holds an option column and a description column; continuation
  # rows have a blank option column.
  my @optionTable = (
    [" -c, --cutflow HISTOGRAM", "name of histogram to use for the cutflow (default:"],
    [" ", "cutFlow)"],
    [" -h, --help", "print this help message"],
    [" -l, --luminosity", "integrated luminosity to which the histograms are"],
    [" ", "weighted (default: 10000/pb)"],
    [" -p, --prefix PREFIX", "output is named PREFIX.root"],
    [" -w, --weight WEIGHT", "scale the output by WEIGHT, overriding the"],
    [" ", "automatic weighting using the cross section from"],
    [" ", "the database; WEIGHT may be a single number or a"],
    [" ", "comma-separated list, one for each input file"],
    [" -x, --xsection XSECTION", "use XSECTION to weight the histograms instead of"],
    [" ", "the value in the database"],
  );
  foreach my $row (@optionTable)
  {
    printf ("%-29s%s\n", $row->[0], $row->[1]);
  }

  exit;
}
257
# Extracts the ROOT file names from a run list.
#
# Takes the name of a text file.  Every line containing "file:" followed
# later by ".root" contributes one entry: the text between the last "file:"
# and the last ".root", with ".root" appended.  All other lines are ignored.
#
# Returns a reference to an array of the extracted names (without trailing
# newlines).  If the file cannot be opened, a warning is printed and the
# array is empty.
sub
getRunList
{
  my $runListFile = shift;

  my @runList;
  my $runListHandle;
  if (!open ($runListHandle, "<", $runListFile))
  {
    print "WARNING: Could not open $runListFile: $!\n";
    return \@runList;
  }
  while (my $line = <$runListHandle>)
  {
    # "." does not match a newline, so without this the line terminator
    # would survive the extraction and end up in the file name.
    chomp ($line);
    next if !($line =~ m/.*file:(.*)\.root/);
    push (@runList, "$1.root");
  }
  close ($runListHandle);

  return \@runList;
}
276
# Runs "getEventsFromCutFlow FILE CUTFLOW" and returns the number it reports.
#
# Takes the name of a ROOT file and the name of the cutflow histogram.
#
# Returns the text following the last ": " of the program's output, with
# newlines removed.  Returns -1 if the program cannot be started or if its
# output contains one of its known error messages (which is then printed).
sub
countEvents
{
  my $file = shift;
  my $cutFlow = shift;

  # The list form of a pipe open does not go through the shell, so file
  # names containing spaces or shell metacharacters arrive intact.
  my $pipe;
  if (!open ($pipe, "-|", "getEventsFromCutFlow", $file, $cutFlow))
  {
    print "Failed to run getEventsFromCutFlow: $!\n";
    return -1;
  }
  my $output = do { local $/; <$pipe> };
  close ($pipe);
  $output = "" if !defined $output;

  if ($output =~ m/Did not find a histogram named/ || $output =~ m/appears to be empty/ || $output =~ m/Failed to open/)
  {
    print $output;
    return -1;
  }
  $output =~ s/^.*: (.*)$/$1/;
  $output =~ s/\n//g;

  return $output;
}