48using Clock = std::chrono::high_resolution_clock;
55 auto result = std::shared_ptr<TH1D>(
static_cast<TH1D *
>(
h.GetPtr()->Clone()));
56 result->SetDirectory(
nullptr);
64constexpr const char *kRawDataUrl =
"http://root.cern./files/tutorials/GlobalLandTemperaturesByCity.csv";
65constexpr const char *kNTupleFileName =
"GlobalLandTemperaturesByCity.root";
71 std::cout <<
"Converting " << kRawDataUrl <<
" to " << kNTupleFileName << std::endl;
73 auto t1 = Clock::now();
76 auto model = RNTupleModel::Create();
79 auto fieldYear = model->MakeField<std::uint32_t>(
"Year");
80 auto fieldMonth = model->MakeField<std::uint32_t>(
"Month");
81 auto fieldDay = model->MakeField<std::uint32_t>(
"Day");
82 auto fieldAvgTemp = model->MakeField<
float>(
"AverageTemperature");
83 auto fieldTempUncrty = model->MakeField<
float>(
"AverageTemperatureUncertainty");
84 auto fieldCity = model->MakeField<std::string>(
"City");
85 auto fieldCountry = model->MakeField<std::string>(
"Country");
86 auto fieldLat = model->MakeField<
float>(
"Latitude");
87 auto fieldLong = model->MakeField<
float>(
"Longitude");
91 auto ntuple = RNTupleWriter::Recreate(std::move(model),
"GlobalTempData", kNTupleFileName);
97 auto file = RRawFile::Create(kRawDataUrl, options);
99 constexpr int kMaxCharsPerLine = 128;
100 while (file->Readln(record)) {
101 if (record.length() >= kMaxCharsPerLine)
102 throw std::runtime_error(
"record too long: " + record);
107 std::replace(record.begin(), record.end(),
',',
' ');
108 char country[kMaxCharsPerLine];
109 char city[kMaxCharsPerLine];
111 sscanf(record.c_str(),
"%u-%u-%u %f %f %s %s %fN %fE", fieldYear.get(), fieldMonth.get(), fieldDay.get(),
112 fieldAvgTemp.get(), fieldTempUncrty.get(), country, city, fieldLat.get(), fieldLong.get());
117 *fieldCountry = country;
122 if (++nRecords % 1000000 == 0)
123 std::cout <<
" ... converted " << nRecords <<
" records" << std::endl;
127 std::cout << nSkipped <<
" records skipped" << std::endl;
128 std::cout << nRecords <<
" records processed" << std::endl;
130 auto t2 = Clock::now();
131 std::cout << std::endl
132 <<
"Processing Time: " << std::chrono::duration_cast<std::chrono::seconds>(t2 -
t1).count() <<
" seconds\n"
142 df.Display()->Print();
145 auto min_value = df.Min(
"AverageTemperature");
146 auto max_value = df.Max(
"AverageTemperature");
149 auto fnWinter = [](
int month) {
return month == 12 || month == 1 || month == 2; };
150 auto fnSpring = [](
int month) {
return month == 3 || month == 4 || month == 5; };
151 auto fnSummer = [](
int month) {
return month == 6 || month == 7 || month == 8; };
152 auto fnFall = [](
int month) {
return month == 9 || month == 10 || month == 11; };
155 auto dfWinter = df.Filter(fnWinter, {
"Month"});
156 auto dfSpring = df.Filter(fnSpring, {
"Month"});
157 auto dfSummer = df.Filter(fnSummer, {
"Month"});
158 auto dfFall = df.Filter(fnFall, {
"Month"});
161 auto winterCount = dfWinter.Count();
162 auto springCount = dfSpring.Count();
163 auto summerCount = dfSummer.Count();
164 auto fallCount = dfFall.Count();
167 auto fn1993_to_2002 = [](
int year) {
return year >= 1993 && year <= 2002; };
168 auto fn2003_to_2013 = [](
int year) {
return year >= 2003 && year <= 2013; };
171 auto df1993_to_2002 = df.Filter(fn1993_to_2002, {
"Year"});
172 auto df2003_to_2013 = df.Filter(fn2003_to_2013, {
"Year"});
175 auto decade_1993_to_2002_Count = *df1993_to_2002.Count();
176 auto decade_2003_to_2013_Count = *df2003_to_2013.Count();
179 auto fallHistResultPtr =
180 dfFall.Histo1D({
"Fall Average Temp",
"Average Temperature by Season", 100, -40, 40},
"AverageTemperature");
181 auto winterHistResultPtr =
182 dfWinter.Histo1D({
"Winter Average Temp",
"Average Temperature by Season", 100, -40, 40},
"AverageTemperature");
183 auto springHistResultPtr =
184 dfSpring.Histo1D({
"Spring Average Temp",
"Average Temperature by Season", 100, -40, 40},
"AverageTemperature");
185 auto summerHistResultPtr =
186 dfSummer.Histo1D({
"Summer Average Temp",
"Average Temperature by Season", 100, -40, 40},
"AverageTemperature");
189 auto hist_1993_to_2002_ResultPtr = df1993_to_2002.Histo1D(
190 {
"1993_to_2002 Average Temp",
"Average Temperature: 1993_to_2002 vs. 2003_to_2013", 100, -40, 40},
191 "AverageTemperature");
192 auto hist_2003_to_2013_ResultPtr = df2003_to_2013.Histo1D(
193 {
"2003_to_2013 Average Temp",
"Average Temperature: 1993_to_2002 vs. 2003_to_2013", 100, -40, 40},
194 "AverageTemperature");
199 std::cout << std::endl <<
"The Minimum temperature is: " << *min_value << std::endl;
200 std::cout <<
"The Maximum temperature is: " << *max_value << std::endl;
203 std::cout << std::endl <<
"The count for Winter: " << *winterCount << std::endl;
204 std::cout <<
"The count for Spring: " << *springCount << std::endl;
205 std::cout <<
"The count for Summer: " << *summerCount << std::endl;
206 std::cout <<
"The count for Fall: " << *fallCount << std::endl;
209 std::cout << std::endl <<
"The count for 1993_to_2002: " << decade_1993_to_2002_Count << std::endl;
210 std::cout <<
"The count for 2003_to_2013: " << decade_2003_to_2013_Count << std::endl;
213 auto fallHist = GetDrawableHist(fallHistResultPtr);
214 auto winterHist = GetDrawableHist(winterHistResultPtr);
215 auto springHist = GetDrawableHist(springHistResultPtr);
216 auto summerHist = GetDrawableHist(summerHistResultPtr);
219 fallHist->SetLineColor(
kOrange);
220 fallHist->SetLineWidth(6);
222 winterHist->SetLineColor(
kBlue);
223 winterHist->SetLineWidth(6);
225 springHist->SetLineColor(
kGreen);
226 springHist->SetLineWidth(6);
228 summerHist->SetLineColor(
kRed);
229 summerHist->SetLineWidth(6);
232 auto hist_1993_to_2002 = GetDrawableHist(hist_1993_to_2002_ResultPtr);
233 auto hist_2003_to_2013 = GetDrawableHist(hist_2003_to_2013_ResultPtr);
236 hist_1993_to_2002->SetLineColor(
kViolet);
237 hist_1993_to_2002->SetLineWidth(6);
239 hist_2003_to_2013->SetLineColor(
kSpring);
240 hist_2003_to_2013->SetLineWidth(6);
243 auto canvas = RCanvas::Create(
"Average Temperature by Season");
250 auto legend = std::make_shared<TLegend>(0.15, 0.65, 0.53, 0.85);
251 legend->AddEntry(fallHist.get(),
"fall",
"l");
252 legend->AddEntry(winterHist.get(),
"winter",
"l");
253 legend->AddEntry(springHist.get(),
"spring",
"l");
254 legend->AddEntry(summerHist.get(),
"summer",
"l");
259 auto canvas2 = RCanvas::Create(
"Average Temperature: 1993_to_2002 vs. 2003_to_2013");
264 auto legend2 = std::make_shared<TLegend>(0.1, 0.7, 0.48, 0.9);
265 legend2->AddEntry(hist_1993_to_2002.get(),
"1993_to_2002",
"l");
266 legend2->AddEntry(hist_2003_to_2013.get(),
"2003_to_2013",
"l");
271void ntpl011_global_temperatures()
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t result
R__EXTERN TSystem * gSystem
Provides v7 drawing facilities for TObject types (TGraph, TH1, TH2, etc.).
The RRawFile provides read-only access to local and remote files.
Smart pointer for the return type of actions.
ROOT's RDataFrame offers a modern, high-level interface for analysis of data stored in TTree, CSV and other data formats, in C++ or Python.
1-D histogram with a double per channel (see TH1 documentation)
virtual Bool_t AccessPathName(const char *path, EAccessMode mode=kFileExists)
Returns FALSE if one can access a file using the specified access mode.
On construction, an ROptions parameter can customize the RRawFile behavior.
size_t fBlockSize
Read at least fBlockSize bytes at a time. A value of zero turns off I/O buffering.