Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
correlationscatters.cxx
Go to the documentation of this file.
2#include "TMVA/Config.h"
3
4
5
6// this macro plots the correlations (as scatter plots) of
7// the various input variable combinations used in TMVA (e.g. running
8// TMVAnalysis.C). Signal and Background are plotted separately
9
10// input: - Input file (result from TMVA),
11// - normal/decorrelated/PCA
12// - use of TMVA plotting TStyle
13void TMVA::correlationscatters(TString dataset, TString fin , TString var,
14 TString dirName_, TString /*title */ ,
15 Bool_t isRegression ,
16 Bool_t useTMVAStyle )
17{
18 // set style and remove existing canvas'
19 TMVAGlob::Initialize( useTMVAStyle );
20
21 TString extension = dirName_;
22 extension.ReplaceAll( "InputVariables", "" );
23 extension.ReplaceAll( " ", "" );
24 if (extension == "") extension = "_Id"; // use 'Id' for 'idendtity transform'
25
26 var.ReplaceAll( extension, "" );
27 cout << "Called macro \"correlationscatters\" for variable: \"" << var
28 << "\", transformation type \"" << dirName_
29 << "\" (extension: \"" << extension << "\")" << endl;
30
31 // checks if file with name "fin" is already open, and if not opens one
32 TFile* file = TMVAGlob::OpenFile( fin );
33
34 TString dirName = dirName_ + "/CorrelationPlots";
35
36 // find out number of input variables
37 TDirectory* vardir = (TDirectory*)file->GetDirectory(dataset.Data())->Get("InputVariables_Id");
38 if (!vardir) {
39 cout << "ERROR: no such directory: \"InputVariables\"" << endl;
40 return;
41 }
42 Int_t noVars = TMVAGlob::GetNumberOfInputVariables( vardir ); // subtraction of target(s) no longer necessary
43
44 TDirectory* dir = (TDirectory*)file->GetDirectory(dataset.Data())->Get( dirName );
45 if (dir==0) {
46 cout << "No information about " << extension << " available in " << fin << endl;
47 return;
48 }
49 dir->cd();
50
51 TListIter keyIt(dir->GetListOfKeys());
52 Int_t noPlots = noVars - 1;
53
54 cout << "noPlots: " << noPlots << " --> noVars: " << noVars << endl;
55 if (noVars != Int_t(noVars)) {
56 cout << "*** Warning: problem in inferred number of variables ... not an integer *** " << endl;
57 }
58
59 // define Canvas layout here!
60 // default setting
61 Int_t xPad; // no of plots in x
62 Int_t yPad; // no of plots in y
63 Int_t width; // size of canvas
65 switch (noPlots) {
66 case 1:
67 xPad = 1; yPad = 1; width = 400; height = width; break;
68 case 2:
69 xPad = 2; yPad = 1; width = 700; height = 0.55*width; break;
70 case 3:
71 xPad = 3; yPad = 1; width = 800; height = 0.4*width; break;
72 case 4:
73 xPad = 2; yPad = 2; width = 600; height = width; break;
74 default:
75 xPad = 3; yPad = 2; width = 800; height = 0.55*width; break;
76 }
77 Int_t noPadPerCanv = xPad * yPad ;
78
79 // counter variables
80 Int_t countCanvas = 0;
81
82 // loop over all objects in "input_variables" directory
83 TString thename[2] = { "_Signal", "_Background" };
84 if (isRegression) thename[0] = "_Regression";
85 for (UInt_t itype = 0; itype < 2; itype++) {
86
87 TIter next(gDirectory->GetListOfKeys());
88 TKey * key = 0;
89 TCanvas* canv = 0;
90
91 Int_t countPad = 0;
92
93 while ( (key = (TKey*)next()) ) {
94
95 if (key->GetCycle() != 1) continue;
96
97 // make sure, that we only look at histograms
98 TClass *cl = gROOT->GetClass(key->GetClassName());
99 if (!cl->InheritsFrom("TH1")) continue;
100 TH1 *scat = (TH1*)key->ReadObj();
101 TString hname = scat->GetName();
102
103 // check for all signal histograms
104 if (! (hname.EndsWith( thename[itype] + extension ) &&
105 hname.Contains( TString("_") + var + "_" ) && hname.BeginsWith("scat_")) ) {
106 scat->Delete();
107 continue;
108 }
109
110 // found a new signal plot
111
112 // create new canvas
113 if (countPad%noPadPerCanv==0) {
114 ++countCanvas;
115 TString ext = extension; ext.Remove( 0, 1 );
116 canv = new TCanvas( TString::Format("canvas%d", countCanvas),
117 TString::Format("Correlation profiles for '%s'-transformed %s variables",
118 ext.Data(), (isRegression ? "" : (itype==0) ? "signal" : "background")),
119 countCanvas*50+200, countCanvas*20, width, height );
120 canv->Divide(xPad,yPad);
121 }
122
123 if (!canv) continue;
124
125 canv->cd(countPad++%noPadPerCanv+1);
126
127 // find the corredponding backgrouns histo
128 TString bgname = hname;
129 bgname.ReplaceAll("scat_","prof_");
130 TH1 *prof = (TH1*)gDirectory->Get(bgname);
131 if (prof == NULL) {
132 cout << "ERROR!!! couldn't find background histo for" << hname << endl;
133 //exit(1);
134 return;
135 }
136 // this is set but not stored during plot creation in MVA_Factory
138
139 // chop off "signal"
140 TMVAGlob::SetFrameStyle( scat, 1.2 );
141
142 // normalise both signal and background
143 scat->Scale( 1.0/scat->GetSumOfWeights() );
144
145 // finally plot and overlay
146 scat->SetMarkerColor( 4);
147 scat->Draw("col");
148 prof->SetMarkerColor( gConfig().fVariablePlotting.fUsePaperStyle ? 1 : 2 );
149 prof->SetMarkerSize( 0.2 );
150 prof->SetLineColor( gConfig().fVariablePlotting.fUsePaperStyle ? 1 : 2 );
151 prof->SetLineWidth( gConfig().fVariablePlotting.fUsePaperStyle ? 2 : 1 );
152 prof->SetFillStyle( 3002 );
153 prof->SetFillColor( 46 );
154 prof->Draw("samee1");
155 // redraw axes
156 scat->Draw("sameaxis");
157
158 // save canvas to file
159 if (countPad%noPadPerCanv==0) {
160 canv->Update();
161
162 TString fname = TString::Format( "%s/plots/correlationscatter_%s_%s_c%i",dataset.Data(),var.Data(), extension.Data(), countCanvas );
164 TMVAGlob::imgconv( canv, fname );
165 }
166 }
167 if (countPad%noPadPerCanv!=0) {
168 canv->Update();
169
170 TString fname = TString::Format( "%s/plots/correlationscatter_%s_%s_c%i",dataset.Data(),var.Data(), extension.Data(), countCanvas );
172 TMVAGlob::imgconv( canv, fname );
173 }
174 }
175}
bool Bool_t
Definition RtypesCore.h:63
int Int_t
Definition RtypesCore.h:45
unsigned int UInt_t
Definition RtypesCore.h:46
#define gDirectory
Definition TDirectory.h:384
Option_t Option_t width
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t height
#define gROOT
Definition TROOT.h:406
const char * extension
Definition civetweb.c:8026
virtual void SetFillColor(Color_t fcolor)
Set the fill area color.
Definition TAttFill.h:37
virtual void SetFillStyle(Style_t fstyle)
Set the fill area style.
Definition TAttFill.h:39
virtual void SetLineWidth(Width_t lwidth)
Set the line width.
Definition TAttLine.h:43
virtual void SetLineColor(Color_t lcolor)
Set the line color.
Definition TAttLine.h:40
virtual void SetMarkerColor(Color_t mcolor=1)
Set the marker color.
Definition TAttMarker.h:38
virtual void SetMarkerSize(Size_t msize=1)
Set the marker size.
Definition TAttMarker.h:45
The Canvas class.
Definition TCanvas.h:23
TVirtualPad * cd(Int_t subpadnumber=0) override
Set current canvas & pad.
Definition TCanvas.cxx:716
void Update() override
Update canvas pad buffers.
Definition TCanvas.cxx:2483
TClass instances represent classes, structs and namespaces in the ROOT type system.
Definition TClass.h:81
Bool_t InheritsFrom(const char *cl) const override
Return kTRUE if this class inherits from a class with name "classname".
Definition TClass.cxx:4874
static TClass * GetClass(const char *name, Bool_t load=kTRUE, Bool_t silent=kFALSE)
Static method returning pointer to TClass of the specified class name.
Definition TClass.cxx:2968
TDirectory * GetDirectory(const char *apath, Bool_t printError=false, const char *funcname="GetDirectory") override
Find a directory named "apath".
Describe directory structure in memory.
Definition TDirectory.h:45
virtual Bool_t cd()
Change current directory to "this" directory.
virtual TList * GetListOfKeys() const
Definition TDirectory.h:223
A ROOT file is composed of a header, followed by consecutive data records (TKey instances) with a wel...
Definition TFile.h:53
TH1 is the base class of all histogram classes in ROOT.
Definition TH1.h:59
void Draw(Option_t *option="") override
Draw this histogram with options.
Definition TH1.cxx:3062
virtual void Scale(Double_t c1=1, Option_t *option="")
Multiply this histogram by a constant c1.
Definition TH1.cxx:6568
virtual Double_t GetSumOfWeights() const
Return the sum of weights excluding under/overflows.
Definition TH1.cxx:7881
Book space in a file, create I/O buffers, to fill them, (un)compress them.
Definition TKey.h:28
virtual const char * GetClassName() const
Definition TKey.h:75
Short_t GetCycle() const
Return cycle number associated to this key.
Definition TKey.cxx:577
virtual TObject * ReadObj()
To read a TObject* from the file.
Definition TKey.cxx:758
Iterator of linked list.
Definition TList.h:191
const char * GetName() const override
Returns name of object.
Definition TNamed.h:47
virtual void Delete(Option_t *option="")
Delete this object.
Definition TObject.cxx:248
void Divide(Int_t nx=1, Int_t ny=1, Float_t xmargin=0.01, Float_t ymargin=0.01, Int_t color=0) override
Automatic pad generation by division.
Definition TPad.cxx:1153
Basic string class.
Definition TString.h:139
Bool_t EndsWith(const char *pat, ECaseCompare cmp=kExact) const
Return true if string ends with the specified string.
Definition TString.cxx:2244
const char * Data() const
Definition TString.h:376
TString & ReplaceAll(const TString &s1, const TString &s2)
Definition TString.h:704
Bool_t BeginsWith(const char *s, ECaseCompare cmp=kExact) const
Definition TString.h:623
TString & Remove(Ssiz_t pos)
Definition TString.h:685
static TString Format(const char *fmt,...)
Static method which formats a string using a printf style format descriptor and return a TString.
Definition TString.cxx:2378
Bool_t Contains(const char *pat, ECaseCompare cmp=kExact) const
Definition TString.h:632
void Initialize(Bool_t useTMVAStyle=kTRUE)
Definition tmvaglob.cxx:176
Int_t GetNumberOfInputVariables(TDirectory *dir)
Definition tmvaglob.cxx:420
void plot_logo(Float_t v_scale=1.0, Float_t skew=1.0)
Definition tmvaglob.cxx:270
void SetSignalAndBackgroundStyle(TH1 *sig, TH1 *bkg, TH1 *all=nullptr)
Definition tmvaglob.cxx:8
TFile * OpenFile(const TString &fin)
Definition tmvaglob.cxx:192
void SetFrameStyle(TH1 *frame, Float_t scale=1.0)
Definition tmvaglob.cxx:77
void imgconv(TCanvas *c, const TString &fname)
Definition tmvaglob.cxx:212
Config & gConfig()
void correlationscatters(TString dataset, TString fin, TString var="var3", TString dirName_="InputVariables_Id", TString title="TMVA Input Variable", Bool_t isRegression=kFALSE, Bool_t useTMVAStyle=kTRUE)