ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/UserCode/OSUT3Analysis/AnaTools/scripts/mergeHists
Revision: 1.8
Committed: Thu Dec 13 10:51:30 2012 UTC (12 years, 4 months ago) by ahart
Branch: MAIN
Changes since 1.7: +21 -8 lines
Log Message:
Do not skip jobs with a nonzero exit code, but do skip jobs which exited from receiving a signal.

File Contents

# User Rev Content
1 ahart 1.1 #!/usr/bin/env perl
2    
3     use strict;
4     use Getopt::Long;
5 ahart 1.3 use POSIX;
6    
7     sub processArgs;
8     sub printHelp;
9     sub getRunList;
10     sub countEvents;
11 ahart 1.1
# Parse the command line.  Short options may be bundled; every option except
# --help takes a string argument.
my %opt;
Getopt::Long::Configure ("bundling");
GetOptions (
  \%opt,
  "cutflow|c=s",
  "luminosity|l=s",
  "prefix|p=s",
  "weight|w=s",
  "xsection|x=s",
  "help|h",
);

# The output prefix is mandatory; without it (or with --help) show the usage
# text.  printHelp exits, so nothing below runs in that case.
if ($opt{"help"} || !$opt{"prefix"})
  {
    printHelp ();
  }

# Flat list of every file found under the remaining arguments.
my $files = processArgs (\@ARGV);

# ROOT files to merge and the per-file weights passed alongside them.
my @rootFiles;
my @weights;

# Job bookkeeping filled in while scanning the Condor logs.  $counting is set
# as soon as one log yields a status, and gates the summary at the end.
my $nGoodJobs = 0;
my $nBadJobs = 0;
my $counting = 0;
my %exitCodes;      # {directory}{job number} => return value
my %signals;        # {directory}{job number} => terminating signal
my %crossSections;  # {directory} => contents of crossSectionInPicobarn.txt

# Tunables with their defaults (the help text gives the luminosity in 1/pb).
my $integratedLuminosity = $opt{"luminosity"} ? $opt{"luminosity"} : 10000;
my $cutFlow = $opt{"cutflow"} ? $opt{"cutflow"} : "cutFlow";
# First pass over the inputs: read the outcome of each job from its Condor
# log (condor_N.log) and pick up the cross section stored next to the
# histograms (crossSectionInPicobarn.txt).
#
#   * A job that terminated with a return value is counted as good, whether
#     the value is zero or not; a nonzero value only triggers a warning.
#   * A job that was terminated by a signal is counted as bad and recorded in
#     %signals so that its ROOT file is left out of the merge.
foreach my $file (@$files)
  {
    next if $file eq "." || $file eq "..";

    # Directory part of the path; job numbers are only unique per directory.
    (my $dir = $file) =~ s/^(.*)\/[^\/]*$/$1/;

    if ($file =~ m/^.*\/condor_([^_]*)\.log$/)
      {
        my $jobNumber = $1;

        # Slurp the log and flatten it to one line so the greedy patterns
        # below find the LAST status reported in the log.
        my $logText = "";
        if (open (my $log, "<", $file))
          {
            local $/;
            my $text = <$log>;
            $logText = $text if defined $text;
            close ($log);
          }
        else
          {
            print "WARNING: Could not read $file: $!\n";
          }
        $logText =~ s/\n/ /g;

        # A return value takes precedence over a signal, so the two cases
        # are mutually exclusive for a given log.
        if ($logText =~ m/.*\(return value ([^)]*)\)/)
          {
            my $returnValue = $1;
            $nGoodJobs++;
            if ($returnValue != 0)
              {
                print "WARNING: Nonzero exit code for job $jobNumber. (return value $returnValue)\n";
              }
            $exitCodes{$dir}{$jobNumber} = $returnValue;
            $counting = 1;
          }
        elsif ($logText =~ m/.*\(signal ([^)]*)\)/)
          {
            my $signal = $1;
            $nBadJobs++;
            print "WARNING: Skipping job $jobNumber. (signal $signal)\n";
            $signals{$dir}{$jobNumber} = $signal;
            $counting = 1;
          }
      }

    if ($file =~ m/^.*\/crossSectionInPicobarn\.txt$/)
      {
        # Only the first line of the file is used.
        if (open (my $xsecFile, "<", $file))
          {
            my $crossSection = <$xsecFile>;
            close ($xsecFile);
            if (defined $crossSection)
              {
                chomp ($crossSection);
                $crossSections{$dir} = $crossSection;
              }
          }
        else
          {
            print "WARNING: Could not read $file: $!\n";
          }
      }
  }
# Second pass: select the ROOT files to merge.  A file named *_N.root is
# dropped when job N in the same directory was terminated by a signal; jobs
# with a nonzero return value are deliberately kept.
foreach my $file (@$files)
  {
    next if $file eq "." || $file eq "..";
    next if $file !~ m/^.*\.root$/;

    (my $dir = $file) =~ s/^(.*)\/[^\/]*$/$1/;
    if ($file =~ m/^.*_([^_]*)\.root$/)
      {
        my $jobNumber = $1;
        next if defined $signals{$dir} && defined $signals{$dir}{$jobNumber};
      }

    push (@rootFiles, $file);
    push (@weights, 1.0);
  }
if (!@rootFiles)
  {
    print "Found no ROOT files to merge!\n";
    exit;
  }

# Unweighted merge, done only to count the total number of processed events;
# the resulting file is removed again once it has been counted.
my $rootFiles = join (" ", @rootFiles);
my $weights = join (",", @weights);

# List-form system bypasses the shell, so file names containing spaces or
# shell metacharacters reach the merger intact.
if (system ("mergeTFileServiceHistograms", "-i", @rootFiles, "-o", "$opt{'prefix'}.root", "-w", $weights) != 0)
  {
    print "WARNING: mergeTFileServiceHistograms did not finish cleanly (status $?).\n";
  }
my $nTotalEvents = countEvents ("$opt{'prefix'}.root", $cutFlow);
unlink ("$opt{'prefix'}.root");
@weights = ();
# Final pass: compute one weight per selected ROOT file and redo the merge.
# Weight precedence:
#   1. --weight, used verbatim;
#   2. --xsection * luminosity / total events;
#   3. the directory's crossSectionInPicobarn.txt * luminosity / total events;
#   4. 1.0 when none of the above is available.
# Iterating @rootFiles keeps the weights aligned with the files handed to the
# merger.

# countEvents returns -1 when the cutflow histogram is missing, and the count
# may also be 0 or empty; dividing by such a value would abort the script or
# produce nonsensical weights, so fall back to unit weights in that case.
my $canNormalize = defined $nTotalEvents && $nTotalEvents > 0;
my $warnedAboutNormalization = 0;

foreach my $file (@rootFiles)
  {
    (my $dir = $file) =~ s/^(.*)\/[^\/]*$/$1/;

    my $crossSection;
    if ($opt{"xsection"})
      {
        $crossSection = $opt{"xsection"};
      }
    elsif (defined $crossSections{$dir})
      {
        $crossSection = $crossSections{$dir};
      }

    my $weight = 1.0;
    if ($opt{"weight"})
      {
        $weight = $opt{"weight"};
      }
    elsif (defined $crossSection)
      {
        if ($canNormalize)
          {
            $weight = ($crossSection * $integratedLuminosity) / $nTotalEvents;
          }
        elsif (!$warnedAboutNormalization)
          {
            print "WARNING: Could not determine the total number of events; histograms are not normalized to the cross section.\n";
            $warnedAboutNormalization = 1;
          }
      }
    push (@weights, $weight);
  }

# List-form system bypasses the shell, so unusual file names are passed
# through unchanged.
if (system ("mergeTFileServiceHistograms", "-i", @rootFiles, "-o", "$opt{'prefix'}.root", "-w", join (",", @weights)) != 0)
  {
    print "WARNING: mergeTFileServiceHistograms did not finish cleanly (status $?).\n";
  }
my $goodEvents = countEvents ("$opt{'prefix'}.root", $cutFlow);

# The job summary is only meaningful when at least one Condor log was parsed.
print "$nGoodJobs jobs ran successfully over $nTotalEvents ($goodEvents weighted) events.\n" if $counting;
print "$nBadJobs jobs failed to run.\n" if $counting;
133 ahart 1.1
# Expand a list of paths into a flat list of files.
#
# Takes a reference to an array of file and directory names.  Directories are
# descended into recursively; everything else is returned as is.  Trailing
# slashes are removed from each name before it is used, and the "." and ".."
# entries found while reading a directory are skipped.  The caller's array is
# left untouched.
#
# Prints a message and exits the program if a path does not exist.  A
# directory that cannot be opened is reported and skipped.
#
# Returns a reference to the array of file names found.
sub
processArgs
{
  my $argv = shift;

  my @files;
  foreach my $rawArg (@$argv)
    {
      # Work on a copy: the loop variable aliases the caller's element.
      (my $arg = $rawArg) =~ s/\/*$//;
      if (!(-e $arg))
        {
          print "$arg does not exist!\n";
          exit;
        }
      next if ($arg =~ m/\/\.$/ || $arg =~ m/\/\.\.$/);
      if (-d $arg)
        {
          my $dirHandle;
          if (!opendir ($dirHandle, $arg))
            {
              print "WARNING: Could not open directory $arg: $!\n";
              next;
            }
          # Prefix each entry with its directory so the recursive call sees
          # full paths.
          my @dirContents = map { "$arg/$_" } readdir ($dirHandle);
          closedir ($dirHandle);
          my $newFiles = processArgs (\@dirContents);
          push (@files, @$newFiles);
        }
      else
        {
          push (@files, $arg);
        }
    }

  return \@files;
}
169    
# Print the usage message to standard output and exit the program.
#
# The executable name shown in the usage line is the basename of $0.
sub
printHelp
{
  (my $exeName = $0) =~ s/^.*\/([^\/]*)$/$1/;

  print "Usage: $exeName [OPTION]... -p PREFIX DIRECTORIES_AND_FILES\n";
  print "Merges ROOT files containing histograms. If there are Condor logs in the\n";
  print "specified directories, checks for nonzero return values. If the directories\n";
  print "were created by \"osusub\", uses the cross section from the database to weight\n";
  print "all histograms.\n";
  print "\n";
  print "Mandatory arguments to long options are mandatory for short options too.\n";

  # One row per output line: option column (padded to 29 characters) and
  # description column.  Continuation rows have a blank option column.
  my @optionRows = (
    [" -c, --cutflow HISTOGRAM", "name of histogram to use for the cutflow (default:"],
    [" ", "cutFlow)"],
    [" -h, --help", "print this help message"],
    [" -l, --luminosity", "integrated luminosity to which the histograms are"],
    [" ", "weighted (default: 10000/pb)"],
    [" -p, --prefix PREFIX", "output is named PREFIX.root"],
    [" -w, --weight WEIGHT", "scale the output by WEIGHT, overriding the"],
    [" ", "automatic weighting using the cross section from"],
    [" ", "the database"],
    [" -x, --xsection XSECTION", "use XSECTION to weight the histograms instead of"],
    [" ", "the value in the database"],
  );
  foreach my $row (@optionRows)
    {
      printf "%-29s%s\n", $row->[0], $row->[1];
    }

  exit;
}
197 ahart 1.3
# Extract the ROOT file names listed in a run-list file.
#
# Takes the name of a text file.  Every line containing "file:" followed
# later on the same line by ".root" contributes one entry: the text between
# the last such "file:" and the last ".root", with ".root" appended.  Other
# lines are ignored.  Entries carry no trailing newline.
#
# If the file cannot be opened a warning is printed and the list is empty.
#
# Returns a reference to the array of file names.
sub
getRunList
{
  my $runListFile = shift;

  my @runList;
  my $runListHandle;
  if (!open ($runListHandle, "<", $runListFile))
    {
      print "WARNING: Could not read $runListFile: $!\n";
      return \@runList;
    }
  while (my $line = <$runListHandle>)
    {
      # Both .* are greedy and cannot cross a newline, so this selects the
      # last "file:" and the last ".root" on the line.
      next if !($line =~ m/.*file:(.*)\.root/);
      push (@runList, "$1.root");
    }
  close ($runListHandle);

  return \@runList;
}
216    
# Ask the external "getEventsFromCutFlow" program how many events a merged
# file contains.
#
# Arguments: the ROOT file name and the name of the cutflow histogram.  Both
# are passed to the program as separate arguments without going through a
# shell, so names containing spaces or shell metacharacters are safe.
#
# Returns the text following the last ": " of the program's single-line
# output.  Returns -1 if the program reports that the histogram was not
# found (its message is echoed) or if the program could not be started.
sub
countEvents
{
  my $file = shift;
  my $cutFlow = shift;

  my $pipe;
  if (!open ($pipe, "-|", "getEventsFromCutFlow", $file, $cutFlow))
    {
      print "WARNING: Could not run getEventsFromCutFlow: $!\n";
      return -1;
    }
  my $output = do { local $/; <$pipe> };
  $output = "" if !defined $output;
  close ($pipe);

  if ($output =~ m/Did not find a histogram named/)
    {
      print $output;
      return -1;
    }
  # Keep only what follows the last ": " of the line, then drop newlines.
  $output =~ s/^.*: (.*)$/$1/;
  $output =~ s/\n//g;

  return $output;
}