1 |
// $Id: runSimpleFileCataloger.C,v 1.2 2012/03/29 23:41:59 paus Exp $
|
2 |
|
3 |
#if !defined(__CINT__) || defined(__MAKECINT__)
|
4 |
#include <TROOT.h>
|
5 |
#include <TSystem.h>
|
6 |
#include <TFile.h>
|
7 |
#include <TTree.h>
|
8 |
#include <TBranch.h>
|
9 |
#include <TBasket.h>
|
10 |
#include <TCanvas.h>
|
11 |
#include <TPie.h>
|
12 |
#endif
|
13 |
|
14 |
const TString slash = "/";
|
15 |
const TString hadoopDoor = "root://xrootd.cmsaf.mit.edu/";
|
16 |
|
17 |
void analyzeBranchSizes(const char *dir, const char *file);
|
18 |
|
19 |
//--------------------------------------------------------------------------------------------------
|
20 |
void runSizeAnalyzer(const char *dir = "/mnt/hadoop/cmsprod/filefi/025/r11b-pho-j16-v1",
|
21 |
const char *file = "FA6DDCFE-1D43-E111-8E71-002590200900.root")
|
22 |
{
|
23 |
// -----------------------------------------------------------------------------------------------
|
24 |
// This script runs a full cataloging action on the given directory
|
25 |
// -----------------------------------------------------------------------------------------------
|
26 |
analyzeBranchSizes(dir,file);
|
27 |
return;
|
28 |
}
|
29 |
|
30 |
//--------------------------------------------------------------------------------------------------
|
31 |
Long64_t RawBytes(TBranch* branch, UInt_t recursion=0)
|
32 |
{
|
33 |
Long64_t totBytes = branch->GetTotBytes();
|
34 |
TObjArray *subBranches = branch->GetListOfBranches();
|
35 |
for (Int_t i=0; i<subBranches->GetEntries(); ++i) {
|
36 |
TBranch *subBranch = (TBranch*)subBranches->At(i);
|
37 |
totBytes += RawBytes(subBranch, recursion+1);
|
38 |
}
|
39 |
return totBytes;
|
40 |
}
|
41 |
|
42 |
//--------------------------------------------------------------------------------------------------
|
43 |
Long64_t ZipBytes(TBranch* branch, Double_t ratio, UInt_t recursion=0)
|
44 |
{
|
45 |
//TBasket* currentBasket = branch->GetBasket(branch->GetReadBasket());
|
46 |
//currentBasket->SetWriteMode();
|
47 |
//branch->WriteBasket(currentBasket,0);
|
48 |
|
49 |
Long64_t totBytes = branch->GetZipBytes();
|
50 |
TObjArray *subBranches = branch->GetListOfBranches();
|
51 |
for (Int_t i=0; i<subBranches->GetEntries(); ++i) {
|
52 |
TBranch *subBranch = (TBranch*) subBranches->At(i);
|
53 |
totBytes += ZipBytes(subBranch,ratio,recursion+1);
|
54 |
}
|
55 |
return totBytes;
|
56 |
}
|
57 |
|
58 |
//--------------------------------------------------------------------------------------------------
|
59 |
void analyzeBranchSizes(const char *dir, const char *file)
|
60 |
{
|
61 |
TString fileName = TString(dir) + slash + + TString(file);
|
62 |
if (fileName.Index("castor/cern.ch") != -1)
|
63 |
fileName = TString("castor:") + fileName;
|
64 |
if (fileName.Index("mnt/hadoop/cms/store") != -1) {
|
65 |
fileName.Remove(0,15);
|
66 |
fileName = hadoopDoor + fileName;
|
67 |
}
|
68 |
|
69 |
TFile* f = TFile::Open(fileName.Data());
|
70 |
TTree* tree = (TTree*) f->FindObjectAny("Events");
|
71 |
printf("XX-CATALOG-XX %s %lld\n",fileName.Data(),tree->GetEntries());
|
72 |
|
73 |
Long64_t evtRawSize = tree->GetTotBytes();
|
74 |
Long64_t evtZipSize = tree->GetZipBytes();
|
75 |
|
76 |
Double_t evtComp = (Double_t) evtRawSize/evtZipSize;
|
77 |
|
78 |
TObjArray *evtBranches = tree->GetListOfBranches();
|
79 |
UInt_t nBranches = evtBranches->GetEntries();
|
80 |
|
81 |
Long64_t rawTotal = 0;
|
82 |
Long64_t zipTotal = 0;
|
83 |
|
84 |
printf("\nSizes in bytes\n");
|
85 |
printf( "===============\n");
|
86 |
for (UInt_t i=0; i<nBranches; ++i) {
|
87 |
TBranch* branch = (TBranch*) evtBranches->At(i);
|
88 |
Long64_t branchSizeZip = ZipBytes(branch, evtComp);
|
89 |
Long64_t branchSizeRaw = RawBytes(branch);
|
90 |
|
91 |
printf("%-40s Size = %10lld %10lld\n",branch->GetName(),branchSizeRaw,branchSizeZip);
|
92 |
|
93 |
rawTotal += branchSizeRaw;
|
94 |
zipTotal += branchSizeZip;
|
95 |
|
96 |
}
|
97 |
|
98 |
printf("\nSizes relative to total in percent\n");
|
99 |
printf( "==================================\n");
|
100 |
for (UInt_t i=0; i<nBranches; ++i) {
|
101 |
TBranch* branch = (TBranch*) evtBranches->At(i);
|
102 |
Long64_t branchSizeZip = ZipBytes(branch, evtComp);
|
103 |
Long64_t branchSizeRaw = RawBytes(branch);
|
104 |
|
105 |
printf("%-40s Size = %10f %10f\n",branch->GetName(),
|
106 |
100*double(branchSizeRaw)/double(rawTotal),
|
107 |
100*double(branchSizeZip)/double(zipTotal));
|
108 |
}
|
109 |
|
110 |
|
111 |
TTree* allTree = (TTree*) f->FindObjectAny("AllEvents");
|
112 |
if (allTree)
|
113 |
printf("XX-CATALOG-XX %s %lld %lld\n",fileName.Data(),tree->GetEntries(),allTree->GetEntries());
|
114 |
else
|
115 |
printf("\n WARNING -- All event tree not found in this file.\n\n");
|
116 |
}
|