ViewVC Help
View File | Revision Log | Show Annotations | Root Listing
root/cvsroot/UserCode/VHbb/python/evaluateMVA.py
Revision: 1.18
Committed: Wed Nov 28 13:04:59 2012 UTC (12 years, 5 months ago) by nmohr
Content type: text/x-python
Branch: MAIN
Changes since 1.17: +89 -148 lines
Log Message:
Different vars in MVA evaluation

File Contents

# User Rev Content
1 peller 1.1 #!/usr/bin/env python
2     import sys
3     import os
4     import ROOT
5     from array import array
6     from math import sqrt
7     from copy import copy
8     #suppres the EvalInstace conversion warning bug
9     import warnings
10     warnings.filterwarnings( action='ignore', category=RuntimeWarning, message='creating converter.*' )
11 nmohr 1.9 from optparse import OptionParser
12 nmohr 1.6 from BetterConfigParser import BetterConfigParser
13 peller 1.1 import pickle
14    
15     #CONFIGURE
16 nmohr 1.18 ROOT.gROOT.SetBatch(True)
17 peller 1.17 print 'hello'
18 peller 1.1 #load config
19 nmohr 1.9 #os.mkdir(path+'/sys')
20 nmohr 1.10 argv = sys.argv
21 nmohr 1.9 parser = OptionParser()
22 nmohr 1.10 parser.add_option("-U", "--update", dest="update", default=0,
23     help="update infofile")
24     parser.add_option("-D", "--discr", dest="discr", default="",
25     help="discriminators to be added")
26 peller 1.17 #parser.add_option("-I", "--inpath", dest="inpath", default="",
27     # help="path to samples")
28     #parser.add_option("-O", "--outpath", dest="outpath", default="",
29     # help="path where to store output samples")
30 nmohr 1.10 parser.add_option("-S", "--samples", dest="names", default="",
31     help="samples you want to run on")
32 nmohr 1.11 parser.add_option("-C", "--config", dest="config", default=[], action="append",
33 nmohr 1.10 help="configuration file")
34 nmohr 1.9 (opts, args) = parser.parse_args(argv)
35 nmohr 1.18
36     from samplesclass import sample
37     from mvainfos import mvainfo
38     from progbar import progbar
39     from printcolor import printc
40    
41 nmohr 1.10 if opts.config =="":
42 nmohr 1.9 opts.config = "config"
43 nmohr 1.6 config = BetterConfigParser()
44 peller 1.14 #config.read('./config7TeV_ZZ')
45 nmohr 1.9 config.read(opts.config)
46     anaTag = config.get("Analysis","tag")
47 peller 1.1
48     #get locations:
49     Wdir=config.get('Directories','Wdir')
50 nmohr 1.13 MVASubdir=config.get('Directories','MVAdir')
51 nmohr 1.15 samplesinfo=config.get('Directories','samplesinfo')
52 peller 1.1
53     #systematics
54    
55    
56 peller 1.17 INpath = config.get('Directories','MVAin')
57     OUTpath = config.get('Directories','MVAout')
58    
59 nmohr 1.15 infofile = open(samplesinfo,'r')
60 nmohr 1.9 info = pickle.load(infofile)
61     infofile.close()
62 nmohr 1.10 arglist=opts.discr #RTight_blavla,bsbsb
63 peller 1.1
64 nmohr 1.10 namelistIN=opts.names
65 peller 1.4 namelist=namelistIN.split(',')
66    
67 nmohr 1.10 doinfo=bool(int(opts.update))
68 peller 1.1
69     MVAlist=arglist.split(',')
70 nmohr 1.18
71 peller 1.1
72     #CONFIG
73     #factory
74     factoryname=config.get('factory','factoryname')
75     #MVA
76     MVAinfos=[]
77 nmohr 1.18 MVAdir=config.get('Directories','vhbbpath')
78 peller 1.1 for MVAname in MVAlist:
79 nmohr 1.12 MVAinfofile = open(MVAdir+'/data/'+factoryname+'_'+MVAname+'.info','r')
80 peller 1.1 MVAinfos.append(pickle.load(MVAinfofile))
81     MVAinfofile.close()
82    
83     longe=40
84     #Workdir
85     workdir=ROOT.gDirectory.GetPath()
86    
87     #Apply samples
88 nmohr 1.15 infofile = open(samplesinfo,'r')
89 peller 1.1 Ainfo = pickle.load(infofile)
90     infofile.close()
91    
92 nmohr 1.18
93     class MvaEvaluater:
94     def __init__(self, config, MVAinfo):
95     self.varset = MVAinfo.varset
96     #Define reader
97     self.reader = ROOT.TMVA.Reader("!Color:!Silent")
98     MVAdir=config.get('Directories','vhbbpath')
99     self.systematics=config.get('systematics','systematics').split(' ')
100     self.MVA_Vars={}
101     self.MVAname = MVAinfo.MVAname
102     for systematic in self.systematics:
103     self.MVA_Vars[systematic]=config.get(self.varset,systematic)
104     self.MVA_Vars[systematic]=self.MVA_Vars[systematic].split(' ')
105     #define variables and specatators
106     self.MVA_var_buffer = []
107     for i in range(len( self.MVA_Vars['Nominal'])):
108     self.MVA_var_buffer.append(array( 'f', [ 0 ] ))
109     self.reader.AddVariable( self.MVA_Vars['Nominal'][i],self.MVA_var_buffer[i])
110     self.reader.BookMVA(MVAinfo.MVAname,MVAdir+'/data/'+MVAinfo.getweightfile())
111     #--> Now the MVA is booked
112    
113     def setBranches(self,tree,job):
114     #Set formulas for all vars
115     self.MVA_formulas={}
116     for systematic in self.systematics:
117     if job.type == 'DATA' and not systematic == 'Nominal': continue
118     self.MVA_formulas[systematic]=[]
119     for j in range(len( self.MVA_Vars['Nominal'])):
120     self.MVA_formulas[systematic].append(ROOT.TTreeFormula("MVA_formula%s_%s"%(j,systematic),self.MVA_Vars[systematic][j],tree))
121    
122     def evaluate(self,MVAbranches,job):
123     #Evaluate all vars and fill the branches
124     for systematic in self.systematics:
125     for j in range(len( self.MVA_Vars['Nominal'])):
126     if job.type == 'DATA' and not systematic == 'Nominal': continue
127     self.MVA_var_buffer[j][0] = self.MVA_formulas[systematic][j].EvalInstance()
128     MVAbranches[self.systematics.index(systematic)] = self.reader.EvaluateMVA(self.MVAname)
129    
130    
131     theMVAs = []
132     for mva in MVAinfos:
133     theMVAs.append(MvaEvaluater(config,mva))
134    
135    
136 peller 1.1 #eval
137 peller 1.4 for job in Ainfo:
138 peller 1.8 if eval(job.active):
139     if job.name in namelist:
140     #get trees:
141 peller 1.17 print INpath+'/'+job.prefix+job.identifier+'.root'
142 nmohr 1.18 input = ROOT.TFile.Open(INpath+'/'+job.prefix+job.identifier+'.root','read')
143 peller 1.17 print OUTpath+'/'+job.prefix+job.identifier+'.root'
144 nmohr 1.18 outfile = ROOT.TFile.Open(OUTpath+'/'+job.prefix+job.identifier+'.root','recreate')
145 peller 1.4 input.cd()
146 peller 1.8 obj = ROOT.TObject
147     for key in ROOT.gDirectory.GetListOfKeys():
148     input.cd()
149     obj = key.ReadObj()
150     #print obj.GetName()
151     if obj.GetName() == job.tree:
152     continue
153     outfile.cd()
154     #print key.GetName()
155     obj.Write(key.GetName())
156     tree = input.Get(job.tree)
157     nEntries = tree.GetEntries()
158 peller 1.4 outfile.cd()
159 peller 1.8 newtree = tree.CloneTree(0)
160 nmohr 1.18
161 peller 1.4
162 nmohr 1.18 #Set branch adress for all vars
163     for i in range(0,len(theMVAs)):
164     theMVAs[i].setBranches(tree,job)
165     outfile.cd()
166     #Setup Branches
167     MVAbranches=[]
168     for i in range(0,len(theMVAs)):
169     if job.type == 'Data':
170 peller 1.8 MVAbranches.append(array('f',[0]))
171     newtree.Branch(MVAinfos[i].MVAname,MVAbranches[i],'nominal/F')
172     else:
173 nmohr 1.18 MVAbranches.append(array('f',[0]*11))
174     newtree.Branch(theMVAs[i].MVAname,MVAbranches[i],'nominal:JER_up:JER_down:JES_up:JES_down:beff_up:beff_down:bmis_up:bmis_down:beff1_up:beff1_down/F')
175     MVA_formulas_Nominal = []
176     print '\n--> ' + job.name +':'
177     #progbar setup
178     if nEntries >= longe:
179     step=int(nEntries/longe)
180     long=longe
181     else:
182     long=nEntries
183     step = 1
184     bar=progbar(long)
185     #Fill event by event:
186     for entry in range(0,nEntries):
187     if entry % step == 0:
188     bar.move()
189     #load entry
190     tree.GetEntry(entry)
191 peller 1.8
192 nmohr 1.18 for i in range(0,len(theMVAs)):
193     theMVAs[i].evaluate(MVAbranches[i],job)
194     #Fill:
195     newtree.Fill()
196     newtree.AutoSave()
197     outfile.Close()
198    
199 peller 1.4 print '\n'
200 peller 1.1
201     #Update Info:
202     if doinfo:
203     for job in Ainfo:
204     for MVAinfo in MVAinfos:
205     job.addcomment('Added MVA %s'%MVAinfo.MVAname)
206 peller 1.4 job.addpath(MVAdir)
207 nmohr 1.15 infofile = open(samplesinfo,'w')
208 peller 1.1 pickle.dump(Ainfo,infofile)
209     infofile.close()
210    
211