25#include <unordered_set>
31 if (!
dynamic_cast<const TChain *
>(tree) && !tree->GetCurrentFile()) {
47 if (
auto ds = GetDataSource()) {
52 const auto n = fLoopManager->GetNEmptyEntries();
54 return "Empty dataframe filling 1 row";
56 return "Empty dataframe filling " + std::to_string(
n) +
" rows";
62 : fLoopManager(
lm), fColRegister(
lm.get())
100 auto tree = fLoopManager->GetTree();
106 if (
auto ds = GetDataSource()) {
108 if (s.rfind(
"R_rdf_sizeof", 0) != 0)
133 const auto col = fColRegister.ResolveAlias(column);
177 for (
const auto &
name : GetDefinedColumnNames())
181 const std::vector<std::string>
metadataProperties = {
"Columns in total",
"Columns from defines",
"Event loops run",
185 std::to_string(GetNRuns()), std::to_string(GetNSlots())};
193 std::stringstream
ss;
216 for (
auto i = 0
u; i <
nCols; i++) {
247 const auto columns = fColRegister.BuildDefineNames();
248 for (
const auto &column :
columns) {
270 return fColRegister.BuildVariationsDescription();
292 if (fLoopManager->GetTree()) {
293 const auto &
branchNames = fLoopManager->GetBranchNames();
319 return fLoopManager->GetNSlots();
338 return fLoopManager->GetNRuns();
343 std::vector<std::string>
types;
346 types.push_back(GetColumnType(column));
355 error +=
" was called with ImplicitMT enabled, but multi-thread is not supported.";
356 throw std::runtime_error(error);
379 fColRegister, *fLoopManager);
380 fColRegister.AddDefine(std::move(
slotColumn));
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows typed iteration through a TCollection.
The head node of a RDF computation graph.
A binder for user-defined columns, variations and aliases.
A DFDescription contains useful information about a given RDataFrame computation graph.
RVariationsDescription GetVariations() const
Return a descriptor for the systematic variations registered in this branch of the computation graph.
std::string GetColumnType(std::string_view column)
Return the type of a given column as a string.
RDFDescription Describe()
Return information about the dataframe.
ColumnNames_t GetColumnTypeNamesList(const ColumnNames_t &columnList)
std::shared_ptr< ROOT::Detail::RDF::RLoopManager > fLoopManager
The RLoopManager at the root of this computation graph. Never null.
unsigned int GetNRuns() const
Gets the number of event loops run.
RDataSource * GetDataSource() const
ColumnNames_t GetDefinedColumnNames()
Returns the names of the defined columns.
void CheckIMTDisabled(std::string_view callerName)
unsigned int GetNSlots() const
Gets the number of data processing slots.
RInterfaceBase(std::shared_ptr< RDFDetail::RLoopManager > lm)
bool HasColumn(std::string_view columnName)
Checks if a column is present in the dataset.
std::string DescribeDataset() const
ColumnNames_t GetColumnNames()
Returns the names of the available columns.
A descriptor for the systematic variations known to a given RDataFrame node.
const_iterator begin() const
const_iterator end() const
A chain is a collection of files containing TTree objects.
std::vector< std::string > GetBranchNames(TTree &t, bool allowDuplicates=true)
Get all the branch names, including those of the friend trees.
unsigned int GetColumnWidth(const std::vector< std::string > &names, const unsigned int minColumnSpace=8u)
Get the optimal column width for printing a table, given the names and the desired minimal space between columns.
std::string DescribeDataset(ROOT::RDF::RDataSource &ds)
std::string ColumnName2ColumnTypeName(const std::string &colName, TTree *, RDataSource *, RDefineBase *, bool vector2RVec=true)
Return a string containing the type of the given branch.
bool IsInternalColumn(std::string_view colName)
Whether the custom column named colName is an "internal" column such as rdfentry_ or rdfslot_.
const std::vector< std::string > & GetColumnNamesNoDuplicates(const ROOT::RDF::RDataSource &ds)
std::vector< std::string > GetFileNamesFromTree(const TTree &tree)
std::vector< std::string > ColumnNames_t
tbb::task_arena is an alias of tbb::interface7::task_arena, which makes it impossible to forward-declare tbb::task_arena without also forward-declaring tbb::interface7.
Bool_t IsImplicitMTEnabled()
Returns true if the implicit multi-threading in ROOT is enabled.