-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSpecialSampleAsErrorBand.cpp
263 lines (227 loc) · 9.32 KB
/
SpecialSampleAsErrorBand.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
//File: SpecialSampleAsErrorBand.cpp
//Brief: A program to add an error band to a set of histograms using
// the same histograms produced with a special (Gaudi) sample.
//Author: Andrew Olivier [email protected]
#define USAGE "SpecialSampleAsErrorBand <standardFile> <CVWithSpecialSampleFlux> <nameOfBand> <specialSampleFile> [additionalSpecialSampleUniverses]\n"\
"SpecialSampleAsErrorBand <standardFile> <CVWithSpecialSampleFlux> <nameOfBand> <specialSampleFile> [scaleFactor=1.0]"
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Woverloaded-virtual"
//PlotUtils includes
#include "PlotUtils/MnvH1D.h"
#include "PlotUtils/MnvH2D.h"
#pragma GCC diagnostic pop
//ROOT includes
#include "TFile.h"
#include "TDirectory.h"
#include "TKey.h"
#include "TParameter.h"
//Feature needed with pre-ROOT6 PlotUtils.
#ifndef NCINTEX
#include "Cintex/Cintex.h"
#endif
//c++ includes
#include <iostream>
//Convince the STL to talk to TIter so I can use std::find_if()
namespace std
{
template <>
struct iterator_traits<TIter>
{
using value_type = TObject;
using pointer = TObject*;
using reference = TObject&;
using iterator_category = forward_iterator_tag;
};
}
//Think of this like the bash command line utility 'find dir -name "*"',
//but for TObjects in ROOT files. It also requires that every object
//is of type OBJ. If you're using this with multiple OBJs and performance
//matters, you should rewrite it.
template <class OBJ>
std::vector<OBJ*> find(TDirectory& dir)
{
std::vector<OBJ*> found;
auto& keys = *dir.GetListOfKeys();
for(auto obj: keys)
{
auto key = static_cast<TKey*>(obj);
auto asObj = dynamic_cast<OBJ*>(key->ReadObj());
auto asDir = dynamic_cast<TDirectory*>(key->ReadObj());
if(asObj) found.push_back(asObj);
else if(asDir)
{
auto recurse = find<OBJ>(*asDir);
found.insert(found.end(), recurse.begin(), recurse.end());
}
}
return found;
}
template <class MNVH>
MNVH* cloneWithNewBand(const MNVH* hist, const bool isFluxDifferent, const std::string& bandName, const double cvPOT, const std::unique_ptr<TFile>& originalCV, const std::vector<std::unique_ptr<TFile>>& specialSamples, const float scaleFactor)
{
MNVH* withNewBand = new MNVH(*hist);
using hist_t = typename std::remove_const<typename std::remove_pointer<decltype(hist->GetVertErrorBand(bandName)->GetHist(0))>::type>::type;
std::vector<hist_t*> univs;
for(auto& sample: specialSamples)
{
auto found = dynamic_cast<MNVH*>(sample->Get(hist->GetName()));
if(!found) throw std::runtime_error(std::string("Failed to find a histogram named ") + hist->GetName() + " in " + sample->GetName());
const auto specialPOT = dynamic_cast<TParameter<double>*>(sample->Get("POTUsed"));
if(!specialPOT) throw std::runtime_error(std::string("Found histogram but failed to find POT in ") + sample->GetName());
found->Scale(cvPOT / specialPOT->GetVal());
univs.push_back(static_cast<hist_t*>(found->GetCVHistoWithStatError().Clone())); //Store just the CV
}
const hist_t* originalCVHist = nullptr;
if(!isFluxDifferent) originalCVHist = static_cast<hist_t*>(hist->GetCVHistoWithStatError().Clone());
else
{
const MNVH* originalHist = dynamic_cast<MNVH*>(originalCV->Get(hist->GetName()));
if(!originalHist) throw std::runtime_error(std::string("Failed to find a histogram named ") + hist->GetName() + " in the CV with matching flux (file named " + originalCV->GetName() + ")");
originalCVHist = static_cast<hist_t*>(originalHist->GetCVHistoWithStatError().Clone());
}
//Because we don't have a good procedure for 1-universe error bands,
//create a second symmetric universe from the special sample universe
//and the difference with the CV.
if(univs.size() == 1)
{
const auto origUniv = univs.front();
auto otherUniv = static_cast<hist_t*>(origUniv->Clone());
otherUniv->SetDirectory(nullptr);
otherUniv->Add(originalCVHist, -1.);
otherUniv->Add(originalCVHist, otherUniv, 1., -scaleFactor); //TODO: turn these back on after debugging
univs.push_back(otherUniv);
//Now, apply any scale factor to the "up shift" universe
origUniv->Add(originalCVHist, -1);
origUniv->Add(originalCVHist, origUniv, 1., scaleFactor);
}
//If applying a special sample as a systematic to
//a histogram that isn't from the matching flux conditions,
//multiply by the ratio of CVs.
if(isFluxDifferent)
{
for(auto band: univs)
{
band->Multiply(band, hist);
band->Divide(band, originalCVHist);
}
}
withNewBand->AddVertErrorBand(bandName, univs);
return withNewBand;
}
int main(const int argc, const char** argv)
{
#ifndef NCINTEX
ROOT::Cintex::Cintex::Enable(); //Needed to look up dictionaries for PlotUtils classes like MnvH1D
#endif
TH1::AddDirectory(false);
//Check arguments
if(argc < 2 || !strcmp(argv[1], "-h") || !strcmp(argv[1], "--help") || argc < 5)
{
std::cout << USAGE << "\n";
return 0;
}
const std::string fileName = argv[1];
auto inFile = TFile::Open(fileName.c_str(), "READ");
if(!inFile)
{
std::cerr << fileName << ": no such file or directory.\n\n" << USAGE << "\n";
return 2;
}
const std::string originalFileName = argv[2];
std::unique_ptr<TFile> originalFile(TFile::Open(fileName.c_str(), "READ"));
if(!originalFile)
{
std::cerr << originalFileName << ": no such file or directory.\n\n" << USAGE << "\n";
return 2;
}
const bool isFluxDifferent = (originalFileName == fileName);
const std::string newBandName = argv[3];
//There are 2 uses cases that could trigger if there are exactly 6 arguments: 2 universes or 1 universe and a scale factor.
//Decide by trying to interpret argument 5 as a scale factor. If it's not a scale factor, then assume that
//all arguments after 3 are universe file names.
//TODO: Check whether 5th argument is another universe file or a scale factor here
float scaleFactor = 1.;
bool foundScaleFactor = false;
if(argc == 6) //The only valid use case with a scale factor
{
try
{
scaleFactor = std::stof(argv[5]);
foundScaleFactor = true;
}
catch(const std::invalid_argument& /*e*/) {}
}
std::vector<std::unique_ptr<TFile>> specialSamples;
const int lastFile = foundScaleFactor?5:argc; //If I found a scale factor in argument 5, then don't process it as a file name
for(int whichSample = 4; whichSample < lastFile; ++whichSample)
{
auto file = TFile::Open(argv[whichSample], "READ");
if(!file)
{
std::cerr << "Failed to open a special sample file named " << argv[whichSample] << "\n";
return 2;
}
specialSamples.emplace_back(file);
}
auto all1D = find<PlotUtils::MnvH1D>(*inFile);
auto all2D = find<PlotUtils::MnvH2D>(*inFile);
const auto allParameters = find<TParameter<double>>(*inFile);
//const auto allStrings = find<TNamed>(*inFile);
const auto cvPOT = dynamic_cast<TParameter<double>*>(inFile->Get("POTUsed"));
if(!cvPOT)
{
std::cerr << "Failed to find POT information in CV file named " << inFile->GetName() << ".\n";
return 2;
}
const size_t lastSlash = fileName.rfind('/');
const auto outFileName = fileName.substr(lastSlash + 1, fileName.rfind('.') - lastSlash - 1) + "_with_" + newBandName + ".root";
auto outFile = TFile::Open(outFileName.c_str(), "CREATE");
if(!outFile)
{
std::cerr << "Couldn't create " << outFileName << " in the current directory. Does it already exist?\n";
return 4;
}
//auto isFlux = [](const auto hist) { return std::string(hist->GetName()).find("reweightedflux") != std::string::npos; };
auto isConstantHist = [](const auto hist)
{
const std::string histName(hist->GetName());
if(histName.find("reweightedflux") != std::string::npos) return true;
if(histName.find("FiducialNucleons") != std::string::npos) return true;
return false;
};
//Make the swap
try
{
outFile->cd();
for(const auto hist: all1D)
{
if(!isConstantHist(hist)) cloneWithNewBand(hist, isFluxDifferent, newBandName, cvPOT->GetVal(), originalFile, specialSamples, scaleFactor)->Write();
else
{
hist->AddVertErrorBandAndFillWithCV(newBandName, std::max(specialSamples.size(), 2ul));
hist->Write(); //Don't modify the flux because the special sample might have different flux from the CV sample
}
}
for(const auto hist: all2D)
{
if(!isConstantHist(hist)) cloneWithNewBand(hist, isFluxDifferent, newBandName, cvPOT->GetVal(), originalFile, specialSamples, scaleFactor)->Write();
else
{
hist->AddVertErrorBandAndFillWithCV(newBandName, std::max(specialSamples.size(), 2ul));
hist->Write(); //Don't modify the flux because the special sample might have different flux from the CV sample
}
}
}
catch(const std::runtime_error& e)
{
std::cerr << "Failed to insert new error band, " << newBandName << ", because:\n" << e.what() << "\n";
return 5;
}
//Copy TParameters (POT information) and TStrings (bookkeeping) to the new file.
for(auto par: allParameters) par->Write();
//for(auto str: allStrings) str->Write(); //TODO: I need all TNamed that aren't also TH1s
//Write the swapped histograms to a new file.
//TODO: With the same directory structure
outFile->Write();
return 0;
}