Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
RNTupleDescriptor.cxx
Go to the documentation of this file.
1/// \file RNTupleDescriptor.cxx
2/// \author Jakob Blomer <jblomer@cern.ch>
3/// \author Javier Lopez-Gomez <javier.lopez.gomez@cern.ch>
4/// \date 2018-10-04
5
6/*************************************************************************
7 * Copyright (C) 1995-2019, Rene Brun and Fons Rademakers. *
8 * All rights reserved. *
9 * *
10 * For the licensing terms see $ROOTSYS/LICENSE. *
11 * For the list of contributors see $ROOTSYS/README/CREDITS. *
12 *************************************************************************/
13
14#include <ROOT/RError.hxx>
15#include <ROOT/RFieldBase.hxx>
16#include <ROOT/RNTuple.hxx>
18#include <ROOT/RNTupleModel.hxx>
19#include <ROOT/RNTupleTypes.hxx>
20#include <ROOT/RNTupleUtils.hxx>
21#include <ROOT/RPage.hxx>
22#include <string_view>
23
24#include <RZip.h>
25#include <TError.h>
26
27#include <algorithm>
28#include <cstdint>
29#include <deque>
30#include <functional>
31#include <iostream>
32#include <set>
33#include <utility>
34
36{
37 return fFieldId == other.fFieldId && fFieldVersion == other.fFieldVersion && fTypeVersion == other.fTypeVersion &&
38 fFieldName == other.fFieldName && fFieldDescription == other.fFieldDescription &&
39 fTypeName == other.fTypeName && fTypeAlias == other.fTypeAlias && fNRepetitions == other.fNRepetitions &&
40 fStructure == other.fStructure && fParentId == other.fParentId &&
41 fProjectionSourceId == other.fProjectionSourceId && fLinkIds == other.fLinkIds &&
42 fLogicalColumnIds == other.fLogicalColumnIds && fTypeChecksum == other.fTypeChecksum &&
43 fIsSoACollection == other.fIsSoACollection;
44}
45
47{
48 RFieldDescriptor clone;
49 clone.fFieldId = fFieldId;
50 clone.fFieldVersion = fFieldVersion;
51 clone.fTypeVersion = fTypeVersion;
52 clone.fFieldName = fFieldName;
53 clone.fFieldDescription = fFieldDescription;
54 clone.fTypeName = fTypeName;
55 clone.fTypeAlias = fTypeAlias;
56 clone.fNRepetitions = fNRepetitions;
57 clone.fStructure = fStructure;
58 clone.fParentId = fParentId;
59 clone.fProjectionSourceId = fProjectionSourceId;
60 clone.fLinkIds = fLinkIds;
61 clone.fColumnCardinality = fColumnCardinality;
62 clone.fLogicalColumnIds = fLogicalColumnIds;
63 clone.fTypeChecksum = fTypeChecksum;
64 clone.fIsSoACollection = fIsSoACollection;
65 return clone;
66}
67
68std::unique_ptr<ROOT::RFieldBase>
70{
71 if (GetStructure() == ROOT::ENTupleStructure::kStreamer) {
72 auto streamerField = std::make_unique<ROOT::RStreamerField>(GetFieldName(), GetTypeName());
73 streamerField->SetOnDiskId(fFieldId);
74 return streamerField;
75 }
76
77 // The structure may be unknown if the descriptor comes from a deserialized field with an unknown structural role.
78 // For forward compatibility, we allow this case and return an InvalidField.
79 if (GetStructure() == ROOT::ENTupleStructure::kUnknown) {
80 if (options.GetReturnInvalidOnError()) {
81 auto invalidField = std::make_unique<ROOT::RInvalidField>(GetFieldName(), GetTypeName(), "",
83 invalidField->SetOnDiskId(fFieldId);
84 return invalidField;
85 } else {
86 throw RException(R__FAIL("unexpected on-disk field structure value for field \"" + GetFieldName() + "\""));
87 }
88 }
89
90 // Untyped records and collections
91 if (GetTypeName().empty()) {
92 switch (GetStructure()) {
94 std::vector<std::unique_ptr<ROOT::RFieldBase>> memberFields;
95 memberFields.reserve(fLinkIds.size());
96 for (auto id : fLinkIds) {
97 const auto &memberDesc = ntplDesc.GetFieldDescriptor(id);
98 auto field = memberDesc.CreateField(ntplDesc, options);
100 return field;
101 memberFields.emplace_back(std::move(field));
102 }
103 auto recordField = std::make_unique<ROOT::RRecordField>(GetFieldName(), std::move(memberFields));
104 recordField->SetOnDiskId(fFieldId);
105 return recordField;
106 }
108 if (fLinkIds.size() != 1) {
109 throw RException(R__FAIL("unsupported untyped collection for field \"" + GetFieldName() + "\""));
110 }
111 auto itemField = ntplDesc.GetFieldDescriptor(fLinkIds[0]).CreateField(ntplDesc, options);
113 return itemField;
114 auto collectionField = ROOT::RVectorField::CreateUntyped(GetFieldName(), std::move(itemField));
115 collectionField->SetOnDiskId(fFieldId);
116 return collectionField;
117 }
118 default: throw RException(R__FAIL("unsupported untyped field structure for field \"" + GetFieldName() + "\""));
119 }
120 }
121
122 try {
123 const auto &fieldName = GetFieldName();
124 const auto &typeName = GetTypeAlias().empty() ? GetTypeName() : GetTypeAlias();
125 // NOTE: Unwrap() here may throw an exception, hence the try block.
126 // If options.fReturnInvalidOnError is false we just rethrow it, otherwise we return an InvalidField wrapping the
127 // error.
128 auto field = ROOT::Internal::CallFieldBaseCreate(fieldName, typeName, options, &ntplDesc, fFieldId).Unwrap();
129 field->SetOnDiskId(fFieldId);
130
131 for (auto &subfield : *field) {
132 const auto subfieldId = ntplDesc.FindFieldId(subfield.GetFieldName(), subfield.GetParent()->GetOnDiskId());
133 subfield.SetOnDiskId(subfieldId);
135 auto &invalidField = static_cast<ROOT::RInvalidField &>(subfield);
136 // A subfield being invalid "infects" its entire ancestry.
137 return invalidField.Clone(fieldName);
138 }
139 }
140
141 return field;
142 } catch (const RException &ex) {
143 if (options.GetReturnInvalidOnError())
144 return std::make_unique<ROOT::RInvalidField>(GetFieldName(), GetTypeName(), ex.what(),
146 else
147 throw ex;
148 }
149}
150
151////////////////////////////////////////////////////////////////////////////////
152
154{
155 return fLogicalColumnId == other.fLogicalColumnId && fPhysicalColumnId == other.fPhysicalColumnId &&
156 fBitsOnStorage == other.fBitsOnStorage && fType == other.fType && fFieldId == other.fFieldId &&
157 fIndex == other.fIndex && fRepresentationIndex == other.fRepresentationIndex &&
158 fValueRange == other.fValueRange;
159}
160
162{
163 RColumnDescriptor clone;
164 clone.fLogicalColumnId = fLogicalColumnId;
165 clone.fPhysicalColumnId = fPhysicalColumnId;
166 clone.fBitsOnStorage = fBitsOnStorage;
167 clone.fType = fType;
168 clone.fFieldId = fFieldId;
169 clone.fIndex = fIndex;
170 clone.fFirstElementIndex = fFirstElementIndex;
171 clone.fRepresentationIndex = fRepresentationIndex;
172 clone.fValueRange = fValueRange;
173 return clone;
174}
175
176////////////////////////////////////////////////////////////////////////////////
177
180{
181 if (!fCumulativeNElements) {
182 // Small range, just iterate through fPageInfos
185 for (const auto &pi : fPageInfos) {
186 if (firstInPage + pi.GetNElements() > idxInCluster) {
188 }
189 pageNumber++;
190 firstInPage += pi.GetNElements();
191 }
192 R__ASSERT(false);
193 }
194
195 const auto N = fCumulativeNElements->size();
196 R__ASSERT(N > 0);
197 R__ASSERT(N == fPageInfos.size());
198
199 std::size_t left = 0;
200 std::size_t right = N - 1;
201 std::size_t midpoint = N;
202 while (left <= right) {
203 midpoint = (left + right) / 2;
204 if ((*fCumulativeNElements)[midpoint] <= idxInCluster) {
205 left = midpoint + 1;
206 continue;
207 }
208
209 if ((midpoint == 0) || ((*fCumulativeNElements)[midpoint - 1] <= idxInCluster))
210 break;
211
212 right = midpoint - 1;
213 }
215
216 auto pageInfo = fPageInfos[midpoint];
217 decltype(idxInCluster) firstInPage = (midpoint == 0) ? 0 : (*fCumulativeNElements)[midpoint - 1];
219 R__ASSERT((firstInPage + pageInfo.GetNElements()) > idxInCluster);
221}
222
223std::size_t
226 std::size_t pageSize)
227{
228 R__ASSERT(fPhysicalColumnId == columnRange.GetPhysicalColumnId());
229 R__ASSERT(!columnRange.IsSuppressed());
230
231 const auto nElements =
232 std::accumulate(fPageInfos.begin(), fPageInfos.end(), 0U,
233 [](std::size_t n, const auto &pageInfo) { return n + pageInfo.GetNElements(); });
234 const auto nElementsRequired = static_cast<std::uint64_t>(columnRange.GetNElements());
235
237 return 0U;
238 R__ASSERT((nElementsRequired > nElements) && "invalid attempt to shrink RPageRange");
239
240 std::vector<RPageInfo> pageInfos;
241 // Synthesize new `RPageInfo`s as needed
242 const std::uint64_t nElementsPerPage = pageSize / element.GetSize();
246 pageInfo.SetNElements(std::min(nElementsPerPage, nRemainingElements));
249 locator.SetNBytesOnStorage(element.GetPackedSize(pageInfo.GetNElements()));
250 pageInfo.SetLocator(locator);
251 pageInfos.emplace_back(pageInfo);
252 nRemainingElements -= pageInfo.GetNElements();
253 }
254
255 pageInfos.insert(pageInfos.end(), std::make_move_iterator(fPageInfos.begin()),
256 std::make_move_iterator(fPageInfos.end()));
257 std::swap(fPageInfos, pageInfos);
259}
260
262{
263 return fClusterId == other.fClusterId && fFirstEntryIndex == other.fFirstEntryIndex &&
264 fNEntries == other.fNEntries && fColumnRanges == other.fColumnRanges && fPageRanges == other.fPageRanges;
265}
266
268{
269 std::uint64_t nbytes = 0;
270 for (const auto &pr : fPageRanges) {
271 for (const auto &pi : pr.second.GetPageInfos()) {
272 nbytes += pi.GetLocator().GetNBytesOnStorage();
273 }
274 }
275 return nbytes;
276}
277
279{
280 RClusterDescriptor clone;
281 clone.fClusterId = fClusterId;
282 clone.fFirstEntryIndex = fFirstEntryIndex;
283 clone.fNEntries = fNEntries;
284 clone.fColumnRanges = fColumnRanges;
285 for (const auto &d : fPageRanges)
286 clone.fPageRanges.emplace(d.first, d.second.Clone());
287 return clone;
288}
289
290////////////////////////////////////////////////////////////////////////////////
291
293{
294 return fContentId == other.fContentId && fTypeName == other.fTypeName && fTypeVersion == other.fTypeVersion;
295}
296
298{
300 clone.fContentId = fContentId;
301 clone.fTypeVersion = fTypeVersion;
302 clone.fTypeName = fTypeName;
303 clone.fContent = fContent;
304 return clone;
305}
306
307////////////////////////////////////////////////////////////////////////////////
308
313
315{
316 // clang-format off
317 return fName == other.fName &&
318 fDescription == other.fDescription &&
319 fNEntries == other.fNEntries &&
320 fGeneration == other.fGeneration &&
321 fFieldZeroId == other.fFieldZeroId &&
322 fFieldDescriptors == other.fFieldDescriptors &&
323 fColumnDescriptors == other.fColumnDescriptors &&
324 fClusterGroupDescriptors == other.fClusterGroupDescriptors &&
325 fClusterDescriptors == other.fClusterDescriptors;
326 // clang-format on
327}
328
330{
332 for (const auto &cd : fClusterDescriptors) {
333 if (!cd.second.ContainsColumn(physicalColumnId))
334 continue;
335 auto columnRange = cd.second.GetColumnRange(physicalColumnId);
336 result = std::max(result, columnRange.GetFirstElementIndex() + columnRange.GetNElements());
337 }
338 return result;
339}
340
341////////////////////////////////////////////////////////////////////////////////
342/// Return the cluster boundaries for each cluster in this RNTuple.
343std::vector<ROOT::Internal::RNTupleClusterBoundaries>
345{
346 std::vector<Internal::RNTupleClusterBoundaries> boundaries;
347 boundaries.reserve(desc.GetNClusters());
348 auto clusterId = desc.FindClusterId(0, 0);
350 const auto &clusterDesc = desc.GetClusterDescriptor(clusterId);
351 R__ASSERT(clusterDesc.GetNEntries() > 0);
352 boundaries.emplace_back(ROOT::Internal::RNTupleClusterBoundaries{
353 clusterDesc.GetFirstEntryIndex(), clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries()});
355 }
356 return boundaries;
357}
358
361{
362 std::string leafName(fieldName);
363 auto posDot = leafName.find_last_of('.');
364 if (posDot != std::string::npos) {
365 auto parentName = leafName.substr(0, posDot);
366 leafName = leafName.substr(posDot + 1);
367 parentId = FindFieldId(parentName, parentId);
368 }
369 auto itrFieldDesc = fFieldDescriptors.find(parentId);
370 if (itrFieldDesc == fFieldDescriptors.end())
372 for (const auto linkId : itrFieldDesc->second.GetLinkIds()) {
373 if (fFieldDescriptors.at(linkId).GetFieldName() == leafName)
374 return linkId;
375 }
377}
378
380{
382 return "";
383
384 const auto &fieldDescriptor = fFieldDescriptors.at(fieldId);
385 auto prefix = GetQualifiedFieldName(fieldDescriptor.GetParentId());
386 if (prefix.empty())
387 return fieldDescriptor.GetFieldName();
388 return prefix + "." + fieldDescriptor.GetFieldName();
389}
390
392{
393 std::string typeName = fieldDesc.GetTypeName();
394
395 // ROOT v6.34, with spec versions before 1.0.0.1, did not properly renormalize the type name.
396 R__ASSERT(fVersionEpoch == 1);
397 if (fVersionMajor == 0 && fVersionMinor == 0 && fVersionPatch < 1) {
398 typeName = ROOT::Internal::GetRenormalizedTypeName(typeName);
399 }
400
401 return typeName;
402}
403
405{
406 return FindFieldId(fieldName, GetFieldZeroId());
407}
408
410 std::uint32_t columnIndex,
411 std::uint16_t representationIndex) const
412{
413 auto itr = fFieldDescriptors.find(fieldId);
414 if (itr == fFieldDescriptors.cend())
416 if (columnIndex >= itr->second.GetColumnCardinality())
418 const auto idx = representationIndex * itr->second.GetColumnCardinality() + columnIndex;
419 if (itr->second.GetLogicalColumnIds().size() <= idx)
421 return itr->second.GetLogicalColumnIds()[idx];
422}
423
425 std::uint32_t columnIndex,
426 std::uint16_t representationIndex) const
427{
428 auto logicalId = FindLogicalColumnId(fieldId, columnIndex, representationIndex);
431 return GetColumnDescriptor(logicalId).GetPhysicalId();
432}
433
436{
437 if (GetNClusterGroups() == 0)
439
440 // Binary search in the cluster group list, followed by a binary search in the clusters of that cluster group
441
442 std::size_t cgLeft = 0;
443 std::size_t cgRight = GetNClusterGroups() - 1;
444 while (cgLeft <= cgRight) {
445 const std::size_t cgMidpoint = (cgLeft + cgRight) / 2;
446 const auto &clusterIds = GetClusterGroupDescriptor(fSortedClusterGroupIds[cgMidpoint]).GetClusterIds();
447 R__ASSERT(!clusterIds.empty());
448
449 const auto &clusterDesc = GetClusterDescriptor(clusterIds.front());
450 // this may happen if the RNTuple has an empty schema
451 if (!clusterDesc.ContainsColumn(physicalColumnId))
453
454 const auto firstElementInGroup = clusterDesc.GetColumnRange(physicalColumnId).GetFirstElementIndex();
456 // Look into the lower half of cluster groups
458 cgRight = cgMidpoint - 1;
459 continue;
460 }
461
462 const auto &lastColumnRange = GetClusterDescriptor(clusterIds.back()).GetColumnRange(physicalColumnId);
463 if ((lastColumnRange.GetFirstElementIndex() + lastColumnRange.GetNElements()) <= index) {
464 // Look into the upper half of cluster groups
465 cgLeft = cgMidpoint + 1;
466 continue;
467 }
468
469 // Binary search in the current cluster group; since we already checked the element range boundaries,
470 // the element must be in that cluster group.
471 std::size_t clusterLeft = 0;
472 std::size_t clusterRight = clusterIds.size() - 1;
473 while (clusterLeft <= clusterRight) {
474 const std::size_t clusterMidpoint = (clusterLeft + clusterRight) / 2;
476 const auto &columnRange = GetClusterDescriptor(clusterId).GetColumnRange(physicalColumnId);
477
478 if (columnRange.Contains(index))
479 return clusterId;
480
481 if (columnRange.GetFirstElementIndex() > index) {
484 continue;
485 }
486
487 if (columnRange.GetFirstElementIndex() + columnRange.GetNElements() <= index) {
489 continue;
490 }
491 }
492 R__ASSERT(false);
493 }
495}
496
498{
499 if (GetNClusterGroups() == 0)
501
502 // Binary search in the cluster group list, followed by a binary search in the clusters of that cluster group
503
504 std::size_t cgLeft = 0;
505 std::size_t cgRight = GetNClusterGroups() - 1;
506 while (cgLeft <= cgRight) {
507 const std::size_t cgMidpoint = (cgLeft + cgRight) / 2;
508 const auto &cgDesc = GetClusterGroupDescriptor(fSortedClusterGroupIds[cgMidpoint]);
509
510 if (cgDesc.GetMinEntry() > entryIdx) {
512 cgRight = cgMidpoint - 1;
513 continue;
514 }
515
516 if (cgDesc.GetMinEntry() + cgDesc.GetEntrySpan() <= entryIdx) {
517 cgLeft = cgMidpoint + 1;
518 continue;
519 }
520
521 // Binary search in the current cluster group; since we already checked the element range boundaries,
522 // the element must be in that cluster group.
523 const auto &clusterIds = cgDesc.GetClusterIds();
524 R__ASSERT(!clusterIds.empty());
525 std::size_t clusterLeft = 0;
526 std::size_t clusterRight = clusterIds.size() - 1;
527 while (clusterLeft <= clusterRight) {
528 const std::size_t clusterMidpoint = (clusterLeft + clusterRight) / 2;
529 const auto &clusterDesc = GetClusterDescriptor(clusterIds[clusterMidpoint]);
530
531 if (clusterDesc.GetFirstEntryIndex() > entryIdx) {
534 continue;
535 }
536
537 if (clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries() <= entryIdx) {
539 continue;
540 }
541
543 }
544 R__ASSERT(false);
545 }
547}
548
550{
551 // TODO(jblomer): we may want to shortcut the common case and check if clusterId + 1 contains
552 // firstEntryInNextCluster. This shortcut would currently always trigger. We do not want, however, to depend
553 // on the linearity of the descriptor IDs, so we should only enable the shortcut if we can ensure that the
554 // binary search code path remains tested.
555 const auto &clusterDesc = GetClusterDescriptor(clusterId);
556 const auto firstEntryInNextCluster = clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries();
557 return FindClusterId(firstEntryInNextCluster);
558}
559
561{
562 // TODO(jblomer): we may want to shortcut the common case and check if clusterId - 1 contains
563 // firstEntryInNextCluster. This shortcut would currently always trigger. We do not want, however, to depend
564 // on the linearity of the descriptor IDs, so we should only enable the shortcut if we can ensure that the
565 // binary search code path remains tested.
566 const auto &clusterDesc = GetClusterDescriptor(clusterId);
567 if (clusterDesc.GetFirstEntryIndex() == 0)
569 return FindClusterId(clusterDesc.GetFirstEntryIndex() - 1);
570}
571
572std::vector<ROOT::DescriptorId_t>
574{
575 std::vector<ROOT::DescriptorId_t> fields;
576 for (const auto fieldId : fFieldIdsOrder) {
577 if (fFieldIdsLookup.count(desc.GetFieldDescriptor(fieldId).GetParentId()) == 0)
578 fields.emplace_back(fieldId);
579 }
580 return fields;
581}
582
588
590 : fNTuple(ntuple)
591{
592 std::deque<ROOT::DescriptorId_t> fieldIdQueue{ntuple.GetFieldZeroId()};
593
594 while (!fieldIdQueue.empty()) {
595 auto currFieldId = fieldIdQueue.front();
596 fieldIdQueue.pop_front();
597
598 const auto &columns = ntuple.GetFieldDescriptor(currFieldId).GetLogicalColumnIds();
599 fColumns.insert(fColumns.end(), columns.begin(), columns.end());
600
601 for (const auto &field : ntuple.GetFieldIterable(currFieldId)) {
602 auto fieldId = field.GetId();
603 fieldIdQueue.push_back(fieldId);
604 }
605 }
606}
607
608std::vector<std::uint64_t> ROOT::RNTupleDescriptor::GetFeatureFlags() const
609{
610 std::vector<std::uint64_t> result;
611 unsigned int base = 0;
612 std::uint64_t flags = 0;
613 for (auto f : fFeatureFlags) {
614 if ((f > 0) && ((f % 64) == 0))
615 throw RException(R__FAIL("invalid feature flag: " + std::to_string(f)));
616 while (f > base + 64) {
617 result.emplace_back(flags);
618 flags = 0;
619 base += 64;
620 }
621 f -= base;
622 flags |= std::uint64_t(1) << f;
623 }
624 result.emplace_back(flags);
625 return result;
626}
627
629 std::vector<RClusterDescriptor> &clusterDescs)
630{
632 if (iter == fClusterGroupDescriptors.end())
633 return R__FAIL("invalid attempt to add details of unknown cluster group");
634 if (iter->second.HasClusterDetails())
635 return R__FAIL("invalid attempt to re-populate cluster group details");
636 if (iter->second.GetNClusters() != clusterDescs.size())
637 return R__FAIL("mismatch of number of clusters");
638
639 std::vector<ROOT::DescriptorId_t> clusterIds;
640 for (unsigned i = 0; i < clusterDescs.size(); ++i) {
641 clusterIds.emplace_back(clusterDescs[i].GetId());
642 auto [_, success] = fClusterDescriptors.emplace(clusterIds.back(), std::move(clusterDescs[i]));
643 if (!success) {
644 return R__FAIL("invalid attempt to re-populate existing cluster");
645 }
646 }
648 return fClusterDescriptors[a].GetFirstEntryIndex() < fClusterDescriptors[b].GetFirstEntryIndex();
649 });
651 cgBuilder.AddSortedClusters(clusterIds);
652 iter->second = cgBuilder.MoveDescriptor().Unwrap();
653 return RResult<void>::Success();
654}
655
657{
659 if (iter == fClusterGroupDescriptors.end())
660 return R__FAIL("invalid attempt to drop cluster details of unknown cluster group");
661 if (!iter->second.HasClusterDetails())
662 return R__FAIL("invalid attempt to drop details of cluster group summary");
663
664 for (auto clusterId : iter->second.GetClusterIds())
666 iter->second = iter->second.CloneSummary();
667 return RResult<void>::Success();
668}
669
670std::unique_ptr<ROOT::RNTupleModel> ROOT::RNTupleDescriptor::CreateModel(const RCreateModelOptions &options) const
671{
672 // Collect all top-level fields that have invalid columns (recursively): by default if we find any we throw an
673 // exception; if we are in ForwardCompatible mode, we proceed but skip of all those top-level fields.
674 std::unordered_set<ROOT::DescriptorId_t> invalidFields;
675 for (const auto &colDesc : GetColumnIterable()) {
677 auto fieldId = colDesc.GetFieldId();
678 while (1) {
679 const auto &field = GetFieldDescriptor(fieldId);
680 if (field.GetParentId() == GetFieldZeroId())
681 break;
682 fieldId = field.GetParentId();
683 }
684 invalidFields.insert(fieldId);
685
686 // No need to look for all invalid fields if we're gonna error out anyway
687 if (!options.GetForwardCompatible())
688 break;
689 }
690 }
691
692 if (!options.GetForwardCompatible() && !invalidFields.empty())
694 "cannot create Model: descriptor contains unknown column types. Use 'SetForwardCompatible(true)' on the "
695 "RCreateModelOptions to create a partial model containing only the fields made up by known columns."));
696
697 auto fieldZero = std::make_unique<ROOT::RFieldZero>();
698 fieldZero->SetOnDiskId(GetFieldZeroId());
699 auto model = options.GetCreateBare() ? RNTupleModel::CreateBare(std::move(fieldZero))
700 : RNTupleModel::Create(std::move(fieldZero));
702 createFieldOpts.SetReturnInvalidOnError(options.GetForwardCompatible());
703 createFieldOpts.SetEmulateUnknownTypes(options.GetEmulateUnknownTypes());
704 for (const auto &topDesc : GetTopLevelFields()) {
705 if (invalidFields.count(topDesc.GetId()) > 0) {
706 // Field contains invalid columns: skip it
707 continue;
708 }
709
710 auto field = topDesc.CreateField(*this, createFieldOpts);
711
712 // If we got an InvalidField here, figure out if it's a hard error or if the field must simply be skipped.
713 // The only case where it's not a hard error is if the field has an unknown structure, as that case is
714 // covered by the ForwardCompatible flag (note that if the flag is off we would not get here
715 // in the first place, so we don't need to check for that flag again).
716 if (field->GetTraits() & ROOT::RFieldBase::kTraitInvalidField) {
717 const auto &invalid = static_cast<const RInvalidField &>(*field);
718 const auto cat = invalid.GetCategory();
720 if (mustThrow)
721 throw RException(R__FAIL(invalid.GetError()));
722
723 // Not a hard error: skip the field and go on.
724 continue;
725 }
726
727 if (options.GetReconstructProjections() && topDesc.IsProjectedField()) {
728 model->AddProjectedField(std::move(field), [this](const std::string &targetName) -> std::string {
729 return GetQualifiedFieldName(GetFieldDescriptor(FindFieldId(targetName)).GetProjectionSourceId());
730 });
731 } else {
732 model->AddField(std::move(field));
733 }
734 }
735 model->Freeze();
736 return model;
737}
738
740{
741 RNTupleDescriptor clone;
742 clone.fName = fName;
747 // OnDiskHeaderSize, OnDiskHeaderXxHash3 not copied because they may come from a merged header + extension header
748 // and therefore not represent the actual sources's header.
749 // OnDiskFooterSize not copied because it contains information beyond the schema, for example the clustering.
750
751 for (const auto &d : fFieldDescriptors)
752 clone.fFieldDescriptors.emplace(d.first, d.second.Clone());
753 for (const auto &d : fColumnDescriptors)
754 clone.fColumnDescriptors.emplace(d.first, d.second.Clone());
755
756 for (const auto &d : fExtraTypeInfoDescriptors)
757 clone.fExtraTypeInfoDescriptors.emplace_back(d.Clone());
759 clone.fHeaderExtension = std::make_unique<RHeaderExtension>(*fHeaderExtension);
760
761 return clone;
762}
763
765{
767
772
776 clone.fNEntries = fNEntries;
777 clone.fNClusters = fNClusters;
778 clone.fGeneration = fGeneration;
779 for (const auto &d : fClusterGroupDescriptors)
780 clone.fClusterGroupDescriptors.emplace(d.first, d.second.Clone());
782 for (const auto &d : fClusterDescriptors)
783 clone.fClusterDescriptors.emplace(d.first, d.second.Clone());
784 for (const auto &d : fAttributeSets)
785 clone.fAttributeSets.emplace_back(d.Clone());
786 return clone;
787}
788
789////////////////////////////////////////////////////////////////////////////////
790
792{
793 return fClusterGroupId == other.fClusterGroupId && fClusterIds == other.fClusterIds &&
794 fMinEntry == other.fMinEntry && fEntrySpan == other.fEntrySpan && fNClusters == other.fNClusters;
795}
796
798{
800 clone.fClusterGroupId = fClusterGroupId;
801 clone.fPageListLocator = fPageListLocator;
802 clone.fPageListLength = fPageListLength;
803 clone.fMinEntry = fMinEntry;
804 clone.fEntrySpan = fEntrySpan;
805 clone.fNClusters = fNClusters;
806 return clone;
807}
808
810{
811 RClusterGroupDescriptor clone = CloneSummary();
812 clone.fClusterIds = fClusterIds;
813 return clone;
814}
815
816////////////////////////////////////////////////////////////////////////////////
817
820 std::uint64_t firstElementIndex,
821 std::uint32_t compressionSettings,
823{
824 if (physicalId != pageRange.fPhysicalColumnId)
825 return R__FAIL("column ID mismatch");
826 if (fCluster.fColumnRanges.count(physicalId) > 0)
827 return R__FAIL("column ID conflict");
829 for (const auto &pi : pageRange.fPageInfos) {
830 columnRange.IncrementNElements(pi.GetNElements());
831 }
832 fCluster.fPageRanges[physicalId] = pageRange.Clone();
833 fCluster.fColumnRanges[physicalId] = columnRange;
834 return RResult<void>::Success();
835}
836
839{
840 if (fCluster.fColumnRanges.count(physicalId) > 0)
841 return R__FAIL("column ID conflict");
842
844 columnRange.SetPhysicalColumnId(physicalId);
845 columnRange.SetIsSuppressed(true);
846 fCluster.fColumnRanges[physicalId] = columnRange;
847 return RResult<void>::Success();
848}
849
852{
853 for (auto &[_, columnRange] : fCluster.fColumnRanges) {
854 if (!columnRange.IsSuppressed())
855 continue;
856 R__ASSERT(columnRange.GetFirstElementIndex() == ROOT::kInvalidNTupleIndex);
857
858 const auto &columnDesc = desc.GetColumnDescriptor(columnRange.GetPhysicalColumnId());
859 const auto &fieldDesc = desc.GetFieldDescriptor(columnDesc.GetFieldId());
860 // We expect only few columns and column representations per field, so we do a linear search
861 for (const auto otherColumnLogicalId : fieldDesc.GetLogicalColumnIds()) {
863 if (otherColumnDesc.GetRepresentationIndex() == columnDesc.GetRepresentationIndex())
864 continue;
865 if (otherColumnDesc.GetIndex() != columnDesc.GetIndex())
866 continue;
867
868 // Found corresponding column of a different column representation
869 const auto &otherColumnRange = fCluster.GetColumnRange(otherColumnDesc.GetPhysicalId());
870 if (otherColumnRange.IsSuppressed())
871 continue;
872
873 columnRange.SetFirstElementIndex(otherColumnRange.GetFirstElementIndex());
874 columnRange.SetNElements(otherColumnRange.GetNElements());
875 break;
876 }
877
878 if (columnRange.GetFirstElementIndex() == ROOT::kInvalidNTupleIndex) {
879 return R__FAIL(std::string("cannot find non-suppressed column for column ID ") +
880 std::to_string(columnRange.GetPhysicalColumnId()) +
881 ", cluster ID: " + std::to_string(fCluster.GetId()));
882 }
883 }
884 return RResult<void>::Success();
885}
886
889{
890 /// Carries out a depth-first traversal of a field subtree rooted at `rootFieldId`. For each field, `visitField` is
891 /// called passing the field ID and the number of overall repetitions, taking into account the repetitions of each
892 /// parent field in the hierarchy.
894 const auto &visitField, const auto &enterSubtree) -> void {
896 for (const auto &f : desc.GetFieldIterable(rootFieldId)) {
897 const std::uint64_t nRepetitions = std::max(f.GetNRepetitions(), std::uint64_t{1U}) * nRepetitionsAtThisLevel;
899 }
900 };
901
902 // Extended columns can only be part of the header extension
903 if (!desc.GetHeaderExtension())
904 return *this;
905
906 // Ensure that all columns in the header extension have their associated `R(Column|Page)Range`
907 // Extended columns can be attached both to fields of the regular header and to fields of the extension header
908 for (const auto &topLevelField : desc.GetTopLevelFields()) {
910 topLevelField.GetId(), std::max(topLevelField.GetNRepetitions(), std::uint64_t{1U}),
911 [&](ROOT::DescriptorId_t fieldId, std::uint64_t nRepetitions) {
912 for (const auto &c : desc.GetColumnIterable(fieldId)) {
913 const ROOT::DescriptorId_t physicalId = c.GetPhysicalId();
914 auto &columnRange = fCluster.fColumnRanges[physicalId];
915
916 // Initialize a RColumnRange for `physicalId` if it was not there. Columns that were created during model
917 // extension won't have on-disk metadata for the clusters that were already committed before the model
918 // was extended. Therefore, these need to be synthetically initialized upon reading.
919 if (columnRange.GetPhysicalColumnId() == ROOT::kInvalidDescriptorId) {
920 columnRange.SetPhysicalColumnId(physicalId);
921 columnRange.SetFirstElementIndex(0);
922 columnRange.SetNElements(0);
923 columnRange.SetIsSuppressed(c.IsSuppressedDeferredColumn());
924 }
925 // Fixup the RColumnRange and RPageRange in deferred columns. We know what the first element index and
926 // number of elements should have been if the column was not deferred; fix those and let
927 // `ExtendToFitColumnRange()` synthesize RPageInfos accordingly.
928 // Note that a deferred column (i.e, whose first element index is > 0) already met the criteria of
929 // `ROOT::RFieldBase::EntryToColumnElementIndex()`, i.e. it is a principal column reachable from the
930 // field zero excluding subfields of collection and variant fields.
931 if (c.IsDeferredColumn()) {
932 if (c.GetRepresentationIndex() == 0) {
933 columnRange.SetFirstElementIndex(fCluster.GetFirstEntryIndex() * nRepetitions);
934 columnRange.SetNElements(fCluster.GetNEntries() * nRepetitions);
935 } else {
936 // Deferred representations which are not the first cannot count on the number of elements being
937 // equal to Entries * nRepetitions because they might have been added in a later cluster. But they
938 // can rely on the first representation having the correct FirstElement/NElements (by definition
939 // the first representation cannot be an "extended" one), therefore they can just copy the value
940 // from it.
941 const auto &field = desc.GetFieldDescriptor(fieldId);
942 const auto firstReprColumnId = field.GetLogicalColumnIds()[c.GetIndex()];
943 const auto &firstReprColumnRange = fCluster.fColumnRanges[firstReprColumnId];
944 columnRange.SetFirstElementIndex(firstReprColumnRange.GetFirstElementIndex());
945 columnRange.SetNElements(firstReprColumnRange.GetNElements());
946 }
947 if (!columnRange.IsSuppressed()) {
948 auto &pageRange = fCluster.fPageRanges[physicalId];
949 pageRange.fPhysicalColumnId = physicalId;
950 const auto element = ROOT::Internal::RColumnElementBase::Generate<void>(c.GetType());
951 pageRange.ExtendToFitColumnRange(columnRange, *element, ROOT::Internal::RPage::kPageZeroSize);
952 }
953 } else if (!columnRange.IsSuppressed()) {
954 fCluster.fPageRanges[physicalId].fPhysicalColumnId = physicalId;
955 }
956 }
957 },
959 }
960 return *this;
961}
962
964{
965 if (fCluster.fClusterId == ROOT::kInvalidDescriptorId)
966 return R__FAIL("unset cluster ID");
967 if (fCluster.fNEntries == 0)
968 return R__FAIL("empty cluster");
969 for (auto &pr : fCluster.fPageRanges) {
970 if (fCluster.fColumnRanges.count(pr.first) == 0) {
971 return R__FAIL("missing column range");
972 }
973 pr.second.fCumulativeNElements.reset();
974 const auto nPages = pr.second.fPageInfos.size();
976 pr.second.fCumulativeNElements = std::make_unique<std::vector<NTupleSize_t>>();
977 pr.second.fCumulativeNElements->reserve(nPages);
979 for (const auto &pi : pr.second.fPageInfos) {
980 sum += pi.GetNElements();
981 pr.second.fCumulativeNElements->emplace_back(sum);
982 }
983 }
984 }
986 std::swap(result, fCluster);
987 return result;
988}
989
990////////////////////////////////////////////////////////////////////////////////
991
994{
996 builder.ClusterGroupId(clusterGroupDesc.GetId())
997 .PageListLocator(clusterGroupDesc.GetPageListLocator())
998 .PageListLength(clusterGroupDesc.GetPageListLength())
999 .MinEntry(clusterGroupDesc.GetMinEntry())
1000 .EntrySpan(clusterGroupDesc.GetEntrySpan())
1001 .NClusters(clusterGroupDesc.GetNClusters());
1002 return builder;
1003}
1004
1006{
1007 if (fClusterGroup.fClusterGroupId == ROOT::kInvalidDescriptorId)
1008 return R__FAIL("unset cluster group ID");
1010 std::swap(result, fClusterGroup);
1011 return result;
1012}
1013
1014////////////////////////////////////////////////////////////////////////////////
1015
1017{
1018 if (fExtraTypeInfo.fContentId == EExtraTypeInfoIds::kInvalid)
1019 throw RException(R__FAIL("invalid extra type info content id"));
1021 std::swap(result, fExtraTypeInfo);
1022 return result;
1023}
1024
1025////////////////////////////////////////////////////////////////////////////////
1026
1028{
1029 if (fDescriptor.fFieldDescriptors.count(fieldId) == 0)
1030 return R__FAIL("field with id '" + std::to_string(fieldId) + "' doesn't exist");
1031 return RResult<void>::Success();
1032}
1033
1035{
1036 if (fDescriptor.fVersionEpoch != RNTuple::kVersionEpoch) {
1037 return R__FAIL("unset or unsupported RNTuple epoch version");
1038 }
1039
1040 // Reuse field name validity check
1041 auto validName = ROOT::Internal::EnsureValidNameForRNTuple(fDescriptor.GetName(), "Field");
1042 if (!validName) {
1044 }
1045
1046 for (const auto &[fieldId, fieldDesc] : fDescriptor.fFieldDescriptors) {
1047 // parent not properly set?
1048 if (fieldId != fDescriptor.GetFieldZeroId() && fieldDesc.GetParentId() == ROOT::kInvalidDescriptorId) {
1049 return R__FAIL("field with id '" + std::to_string(fieldId) + "' has an invalid parent id");
1050 }
1051
1052 // Same number of columns in every column representation?
1053 const auto columnCardinality = fieldDesc.GetColumnCardinality();
1054 if (columnCardinality == 0)
1055 continue;
1056
1057 // In AddColumn, we already checked that all but the last representation are complete.
1058 // Check that the last column representation is complete, i.e. has all columns.
1059 const auto &logicalColumnIds = fieldDesc.GetLogicalColumnIds();
1060 const auto nColumns = logicalColumnIds.size();
1061 // If we have only a single column representation, the following condition is true by construction
1062 if ((nColumns + 1) == columnCardinality)
1063 continue;
1064
1065 const auto &lastColumn = fDescriptor.GetColumnDescriptor(logicalColumnIds.back());
1066 if (lastColumn.GetIndex() + 1 != columnCardinality)
1067 return R__FAIL("field with id '" + std::to_string(fieldId) + "' has incomplete column representations");
1068 }
1069
1070 return RResult<void>::Success();
1071}
1072
1074{
1075 EnsureValidDescriptor().ThrowOnError();
1076 fDescriptor.fSortedClusterGroupIds.reserve(fDescriptor.fClusterGroupDescriptors.size());
1077 for (const auto &[id, _] : fDescriptor.fClusterGroupDescriptors)
1078 fDescriptor.fSortedClusterGroupIds.emplace_back(id);
1079 std::sort(fDescriptor.fSortedClusterGroupIds.begin(), fDescriptor.fSortedClusterGroupIds.end(),
1081 return fDescriptor.fClusterGroupDescriptors[a].GetMinEntry() <
1082 fDescriptor.fClusterGroupDescriptors[b].GetMinEntry();
1083 });
1085 std::swap(result, fDescriptor);
1086 return result;
1087}
1088
1090 std::uint16_t versionMinor, std::uint16_t versionPatch)
1091{
1093 throw RException(R__FAIL("unsupported RNTuple epoch version: " + std::to_string(versionEpoch)));
1094 }
1095 fDescriptor.fVersionEpoch = versionEpoch;
1096 fDescriptor.fVersionMajor = versionMajor;
1097 fDescriptor.fVersionMinor = versionMinor;
1098 fDescriptor.fVersionPatch = versionPatch;
1099}
1100
1102{
1103 fDescriptor.fVersionEpoch = RNTuple::kVersionEpoch;
1104 fDescriptor.fVersionMajor = RNTuple::kVersionMajor;
1105 fDescriptor.fVersionMinor = RNTuple::kVersionMinor;
1106 fDescriptor.fVersionPatch = RNTuple::kVersionPatch;
1107}
1108
1110{
1111 fDescriptor.fName = std::string(name);
1112 fDescriptor.fDescription = std::string(description);
1113}
1114
1116{
1117 if (flag > 0 && flag % 64 == 0)
1118 throw RException(R__FAIL("invalid feature flag: " + std::to_string(flag)));
1119 fDescriptor.fFeatureFlags.insert(flag);
1120}
1121
1124{
1125 if (fDesc.fName.empty())
1126 return R__FAIL("attribute set name cannot be empty");
1127 if (fDesc.fAnchorLength == 0)
1128 return R__FAIL("invalid anchor length");
1129 if (fDesc.fAnchorLocator.GetType() == RNTupleLocator::kTypeUnknown)
1130 return R__FAIL("invalid locator type");
1131
1132 return std::move(fDesc);
1133}
1134
1136{
1137 if (fColumn.GetLogicalId() == ROOT::kInvalidDescriptorId)
1138 return R__FAIL("invalid logical column id");
1139 if (fColumn.GetPhysicalId() == ROOT::kInvalidDescriptorId)
1140 return R__FAIL("invalid physical column id");
1141 if (fColumn.GetFieldId() == ROOT::kInvalidDescriptorId)
1142 return R__FAIL("invalid field id, dangling column");
1143
1144 // NOTE: if the column type is unknown we don't want to fail, as we might be reading an RNTuple
1145 // created with a future version of ROOT. In this case we just skip the valid bit range check,
1146 // as we have no idea what the valid range is.
1147 // In general, reading the metadata of an unknown column is fine, it becomes an error only when
1148 // we try to read the actual data contained in it.
1149 if (fColumn.GetType() != ENTupleColumnType::kUnknown) {
1150 const auto [minBits, maxBits] = ROOT::Internal::RColumnElementBase::GetValidBitRange(fColumn.GetType());
1151 if (fColumn.GetBitsOnStorage() < minBits || fColumn.GetBitsOnStorage() > maxBits)
1152 return R__FAIL("invalid column bit width");
1153 }
1154
1155 return fColumn.Clone();
1156}
1157
1160{
1162 fieldDesc.FieldVersion(field.GetFieldVersion())
1163 .TypeVersion(field.GetTypeVersion())
1164 .FieldName(field.GetFieldName())
1165 .FieldDescription(field.GetDescription())
1166 .TypeName(field.GetTypeName())
1167 .TypeAlias(field.GetTypeAlias())
1168 .Structure(field.GetStructure())
1169 .NRepetitions(field.GetNRepetitions());
1171 fieldDesc.TypeChecksum(field.GetTypeChecksum());
1172 if (field.GetTraits() & ROOT::RFieldBase::kTraitSoACollection) {
1173 assert(field.GetStructure() == ENTupleStructure::kCollection);
1174 fieldDesc.IsSoACollection(true);
1175 }
1176 return fieldDesc;
1177}
1178
1180{
1181 if (fField.GetId() == ROOT::kInvalidDescriptorId) {
1182 return R__FAIL("invalid field id");
1183 }
1184 if (fField.GetStructure() == ROOT::ENTupleStructure::kInvalid) {
1185 return R__FAIL("invalid field structure");
1186 }
1187 if (fField.IsSoACollection() && (fField.GetStructure() != ROOT::ENTupleStructure::kCollection)) {
1188 return R__FAIL("invalid SoA flag on non-collection field");
1189 }
1190 // FieldZero is usually named "" and would be a false positive here
1191 if (fField.GetParentId() != ROOT::kInvalidDescriptorId) {
1192 auto validName = ROOT::Internal::EnsureValidNameForRNTuple(fField.GetFieldName(), "Field");
1193 if (!validName) {
1195 }
1196 if (fField.GetFieldName().empty()) {
1197 return R__FAIL("name cannot be empty string \"\"");
1198 }
1199 }
1200 return fField.Clone();
1201}
1202
1204{
1205 fDescriptor.fFieldDescriptors.emplace(fieldDesc.GetId(), fieldDesc.Clone());
1206 if (fDescriptor.fHeaderExtension)
1207 fDescriptor.fHeaderExtension->MarkExtendedField(fieldDesc);
1208 if (fieldDesc.GetFieldName().empty() && fieldDesc.GetParentId() == ROOT::kInvalidDescriptorId) {
1209 fDescriptor.fFieldZeroId = fieldDesc.GetId();
1210 }
1211}
1212
1215{
1217 if (!(fieldExists = EnsureFieldExists(fieldId)))
1219 if (!(fieldExists = EnsureFieldExists(linkId)))
1220 return R__FAIL("child field with id '" + std::to_string(linkId) + "' doesn't exist in NTuple");
1221
1222 if (linkId == fDescriptor.GetFieldZeroId()) {
1223 return R__FAIL("cannot make FieldZero a child field");
1224 }
1225 // fail if field already has another valid parent
1226 auto parentId = fDescriptor.fFieldDescriptors.at(linkId).GetParentId();
1228 return R__FAIL("field '" + std::to_string(linkId) + "' already has a parent ('" + std::to_string(parentId) + ")");
1229 }
1230 if (fieldId == linkId) {
1231 return R__FAIL("cannot make field '" + std::to_string(fieldId) + "' a child of itself");
1232 }
1233 fDescriptor.fFieldDescriptors.at(linkId).fParentId = fieldId;
1234 fDescriptor.fFieldDescriptors.at(fieldId).fLinkIds.push_back(linkId);
1235 return RResult<void>::Success();
1236}
1237
1240{
1242 if (!(fieldExists = EnsureFieldExists(sourceId)))
1244 if (!(fieldExists = EnsureFieldExists(targetId)))
1245 return R__FAIL("projected field with id '" + std::to_string(targetId) + "' doesn't exist in NTuple");
1246
1247 if (targetId == fDescriptor.GetFieldZeroId()) {
1248 return R__FAIL("cannot make FieldZero a projected field");
1249 }
1250 if (sourceId == targetId) {
1251 return R__FAIL("cannot make field '" + std::to_string(targetId) + "' a projection of itself");
1252 }
1253 if (fDescriptor.fFieldDescriptors.at(sourceId).IsProjectedField()) {
1254 return R__FAIL("cannot make field '" + std::to_string(targetId) + "' a projection of an already projected field");
1255 }
1256 // fail if target field already has another valid projection source
1257 auto &targetDesc = fDescriptor.fFieldDescriptors.at(targetId);
1258 if (targetDesc.IsProjectedField() && targetDesc.GetProjectionSourceId() != sourceId) {
1259 return R__FAIL("field '" + std::to_string(targetId) + "' has already a projection source ('" +
1260 std::to_string(targetDesc.GetProjectionSourceId()) + ")");
1261 }
1262 fDescriptor.fFieldDescriptors.at(targetId).fProjectionSourceId = sourceId;
1263 return RResult<void>::Success();
1264}
1265
1267{
1268 const auto fieldId = columnDesc.GetFieldId();
1269 const auto columnIndex = columnDesc.GetIndex();
1270 const auto representationIndex = columnDesc.GetRepresentationIndex();
1271
1272 auto fieldExists = EnsureFieldExists(fieldId);
1273 if (!fieldExists) {
1275 }
1276 auto &fieldDesc = fDescriptor.fFieldDescriptors.find(fieldId)->second;
1277
1278 if (columnDesc.IsAliasColumn()) {
1279 if (columnDesc.GetType() != fDescriptor.GetColumnDescriptor(columnDesc.GetPhysicalId()).GetType())
1280 return R__FAIL("alias column type mismatch");
1281 }
1282 if (fDescriptor.FindLogicalColumnId(fieldId, columnIndex, representationIndex) != ROOT::kInvalidDescriptorId) {
1283 return R__FAIL("column index clash");
1284 }
1285 if (columnIndex > 0) {
1286 if (fDescriptor.FindLogicalColumnId(fieldId, columnIndex - 1, representationIndex) == ROOT::kInvalidDescriptorId)
1287 return R__FAIL("out of bounds column index");
1288 }
1289 if (representationIndex > 0) {
1290 if (fDescriptor.FindLogicalColumnId(fieldId, 0, representationIndex - 1) == ROOT::kInvalidDescriptorId) {
1291 return R__FAIL("out of bounds representation index");
1292 }
1293 if (columnIndex == 0) {
1294 assert(fieldDesc.fColumnCardinality > 0);
1295 if (fDescriptor.FindLogicalColumnId(fieldId, fieldDesc.fColumnCardinality - 1, representationIndex - 1) ==
1297 return R__FAIL("incomplete column representations");
1298 }
1299 } else {
1300 if (columnIndex >= fieldDesc.fColumnCardinality)
1301 return R__FAIL("irregular column representations");
1302 }
1303 } else {
1304 // This will set the column cardinality to the number of columns of the first representation
1305 fieldDesc.fColumnCardinality = columnIndex + 1;
1306 }
1307
1308 const auto logicalId = columnDesc.GetLogicalId();
1309 fieldDesc.fLogicalColumnIds.emplace_back(logicalId);
1310
1311 if (!columnDesc.IsAliasColumn())
1312 fDescriptor.fNPhysicalColumns++;
1313 if (fDescriptor.fHeaderExtension)
1314 fDescriptor.fHeaderExtension->MarkExtendedColumn(columnDesc);
1315 fDescriptor.fColumnDescriptors.emplace(logicalId, std::move(columnDesc));
1316
1317 return RResult<void>::Success();
1318}
1319
1321{
1322 const auto id = clusterGroup.GetId();
1323 if (fDescriptor.fClusterGroupDescriptors.count(id) > 0)
1324 return R__FAIL("cluster group id clash");
1325 fDescriptor.fNEntries = std::max(fDescriptor.fNEntries, clusterGroup.GetMinEntry() + clusterGroup.GetEntrySpan());
1326 fDescriptor.fNClusters += clusterGroup.GetNClusters();
1327 fDescriptor.fClusterGroupDescriptors.emplace(id, std::move(clusterGroup));
1328 return RResult<void>::Success();
1329}
1330
1335
1337{
1338 if (!fDescriptor.fHeaderExtension)
1339 fDescriptor.fHeaderExtension = std::make_unique<RNTupleDescriptor::RHeaderExtension>();
1340}
1341
1343{
1344 if (fDescriptor.GetNLogicalColumns() == 0)
1345 return;
1346 R__ASSERT(fDescriptor.GetNPhysicalColumns() > 0);
1347
1348 for (ROOT::DescriptorId_t id = fDescriptor.GetNLogicalColumns() - 1; id >= fDescriptor.GetNPhysicalColumns(); --id) {
1349 auto c = fDescriptor.fColumnDescriptors[id].Clone();
1350 R__ASSERT(c.IsAliasColumn());
1351 R__ASSERT(id == c.GetLogicalId());
1352 fDescriptor.fColumnDescriptors.erase(id);
1353 for (auto &link : fDescriptor.fFieldDescriptors[c.fFieldId].fLogicalColumnIds) {
1354 if (link == c.fLogicalColumnId) {
1355 link += offset;
1356 break;
1357 }
1358 }
1359 c.fLogicalColumnId += offset;
1360 R__ASSERT(fDescriptor.fColumnDescriptors.count(c.fLogicalColumnId) == 0);
1361 fDescriptor.fColumnDescriptors.emplace(c.fLogicalColumnId, std::move(c));
1362 }
1363
1364 // Patch up column ids in the header extension
1365 if (auto &xHeader = fDescriptor.fHeaderExtension) {
1366 for (auto &columnId : xHeader->fExtendedColumnRepresentations) {
1367 if (columnId >= fDescriptor.GetNPhysicalColumns())
1368 columnId += offset;
1369 }
1370 }
1371}
1372
1374{
1375 auto clusterId = clusterDesc.GetId();
1376 if (fDescriptor.fClusterDescriptors.count(clusterId) > 0)
1377 return R__FAIL("cluster id clash");
1378 fDescriptor.fClusterDescriptors.emplace(clusterId, std::move(clusterDesc));
1379 return RResult<void>::Success();
1380}
1381
1384{
1385 // Make sure we have no duplicates
1386 if (std::find(fDescriptor.fExtraTypeInfoDescriptors.begin(), fDescriptor.fExtraTypeInfoDescriptors.end(),
1387 extraTypeInfoDesc) != fDescriptor.fExtraTypeInfoDescriptors.end()) {
1388 return R__FAIL("extra type info duplicates");
1389 }
1390 fDescriptor.fExtraTypeInfoDescriptors.emplace_back(std::move(extraTypeInfoDesc));
1391 return RResult<void>::Success();
1392}
1393
1395{
1396 auto it = std::find(fDescriptor.fExtraTypeInfoDescriptors.begin(), fDescriptor.fExtraTypeInfoDescriptors.end(),
1398 if (it != fDescriptor.fExtraTypeInfoDescriptors.end())
1399 *it = std::move(extraTypeInfoDesc);
1400 else
1401 fDescriptor.fExtraTypeInfoDescriptors.emplace_back(std::move(extraTypeInfoDesc));
1402}
1403
1406{
1407 auto &attrSets = fDescriptor.fAttributeSets;
1408 if (std::find_if(attrSets.begin(), attrSets.end(), [&name = attrSetDesc.GetName()](const auto &desc) {
1409 return desc.GetName() == name;
1410 }) != attrSets.end()) {
1411 return R__FAIL("attribute sets with duplicate names");
1412 }
1413 attrSets.push_back(std::move(attrSetDesc));
1414 return RResult<void>::Success();
1415}
1416
1421
1427
1434
1440
1447
1452
1458
1463
1469
1475
1480
1485
1490
1495
1497{
1498 return fAnchorLength == other.fAnchorLength && fSchemaVersionMajor == other.fSchemaVersionMajor &&
1499 fSchemaVersionMinor == other.fSchemaVersionMinor && fAnchorLocator == other.fAnchorLocator &&
1500 fName == other.fName;
1501};
1502
1504{
1506 desc.fAnchorLength = fAnchorLength;
1507 desc.fSchemaVersionMajor = fSchemaVersionMajor;
1508 desc.fSchemaVersionMinor = fSchemaVersionMinor;
1509 desc.fAnchorLocator = fAnchorLocator;
1510 desc.fName = fName;
1511 return desc;
1512}
1513
1515{
1516 if (fieldDesc.GetStructure() != ROOT::ENTupleStructure::kPlain)
1517 return false;
1518 if (fieldDesc.GetTypeName().rfind("std::", 0) == 0)
1519 return false;
1520
1521 auto subFieldId = desc.FindFieldId("_0", fieldDesc.GetId());
1523 return false;
1524
1525 static const std::string gIntTypeNames[] = {"bool", "char", "std::int8_t", "std::uint8_t",
1526 "std::int16_t", "std::uint16_t", "std::int32_t", "std::uint32_t",
1527 "std::int64_t", "std::uint64_t"};
1528 return std::find(std::begin(gIntTypeNames), std::end(gIntTypeNames),
1529 desc.GetFieldDescriptor(subFieldId).GetTypeName()) != std::end(gIntTypeNames);
1530}
1531
1533{
1534 if (fieldDesc.GetStructure() != ROOT::ENTupleStructure::kPlain)
1535 return false;
1536 return (fieldDesc.GetTypeName().rfind("std::atomic<", 0) == 0);
1537}
#define R__FORWARD_ERROR(res)
Short-hand to return an RResult<T> in an error state (i.e. after checking)
Definition RError.hxx:326
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
Definition RError.hxx:322
#define d(i)
Definition RSha256.hxx:102
#define b(i)
Definition RSha256.hxx:100
#define f(i)
Definition RSha256.hxx:104
#define c(i)
Definition RSha256.hxx:101
#define a(i)
Definition RSha256.hxx:99
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
#define R__ASSERT(e)
Checks condition e and reports a fatal error if it's false.
Definition TError.h:125
#define N
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h offset
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t result
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t index
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize id
char name[80]
Definition TGX11.cxx:148
#define _(A, B)
Definition cfortran.h:108
RResult< ROOT::Experimental::RNTupleAttrSetDescriptor > MoveDescriptor()
Attempt to make an AttributeSet descriptor.
Used to loop over all the Attribute Sets linked to an RNTuple.
Metadata stored for every Attribute Set linked to an RNTuple.
bool operator==(const RNTupleAttrSetDescriptor &other) const
std::uint32_t fAnchorLength
uncompressed size of the linked anchor
A helper class for piece-wise construction of an RClusterDescriptor.
RResult< void > MarkSuppressedColumnRange(ROOT::DescriptorId_t physicalId)
Books the given column ID as being suppressed in this cluster.
RResult< void > CommitColumnRange(ROOT::DescriptorId_t physicalId, std::uint64_t firstElementIndex, std::uint32_t compressionSettings, const RClusterDescriptor::RPageRange &pageRange)
RClusterDescriptorBuilder & AddExtendedColumnRanges(const RNTupleDescriptor &desc)
Add column and page ranges for columns created during late model extension missing in this cluster.
RResult< void > CommitSuppressedColumnRanges(const RNTupleDescriptor &desc)
Sets the first element index and number of elements for all the suppressed column ranges.
RResult< RClusterDescriptor > MoveDescriptor()
Move out the full cluster descriptor including page locations.
A helper class for piece-wise construction of an RClusterGroupDescriptor.
RClusterGroupDescriptorBuilder & EntrySpan(std::uint64_t entrySpan)
RClusterGroupDescriptorBuilder & PageListLocator(const RNTupleLocator &pageListLocator)
static RClusterGroupDescriptorBuilder FromSummary(const RClusterGroupDescriptor &clusterGroupDesc)
RClusterGroupDescriptorBuilder & PageListLength(std::uint64_t pageListLength)
RClusterGroupDescriptorBuilder & MinEntry(std::uint64_t minEntry)
RResult< RClusterGroupDescriptor > MoveDescriptor()
RClusterGroupDescriptorBuilder & ClusterGroupId(ROOT::DescriptorId_t clusterGroupId)
RClusterGroupDescriptorBuilder & NClusters(std::uint32_t nClusters)
RResult< RColumnDescriptor > MakeDescriptor() const
Attempt to make a column descriptor.
A column element encapsulates the translation between basic C++ types and their column representation...
static std::pair< std::uint16_t, std::uint16_t > GetValidBitRange(ROOT::ENTupleColumnType type)
Most types have a fixed on-disk bit width.
RResult< RExtraTypeInfoDescriptor > MoveDescriptor()
A helper class for piece-wise construction of an RFieldDescriptor.
RResult< RFieldDescriptor > MakeDescriptor() const
Attempt to make a field descriptor.
static RFieldDescriptorBuilder FromField(const ROOT::RFieldBase &field)
Make a new RFieldDescriptorBuilder based off a live RNTuple field.
void SetNTuple(std::string_view name, std::string_view description)
void SetSchemaFromExisting(const RNTupleDescriptor &descriptor)
Copies the "schema" part of descriptor into the builder's descriptor.
RResult< void > AddColumn(RColumnDescriptor &&columnDesc)
RResult< void > AddAttributeSet(Experimental::RNTupleAttrSetDescriptor &&attrSetDesc)
RResult< void > AddFieldProjection(ROOT::DescriptorId_t sourceId, ROOT::DescriptorId_t targetId)
void ReplaceExtraTypeInfo(RExtraTypeInfoDescriptor &&extraTypeInfoDesc)
RResult< void > AddExtraTypeInfo(RExtraTypeInfoDescriptor &&extraTypeInfoDesc)
void ShiftAliasColumns(std::uint32_t offset)
Shift column IDs of alias columns by offset
void SetVersion(std::uint16_t versionEpoch, std::uint16_t versionMajor, std::uint16_t versionMinor, std::uint16_t versionPatch)
void BeginHeaderExtension()
Mark the beginning of the header extension; any fields and columns added after a call to this functio...
RResult< void > AddCluster(RClusterDescriptor &&clusterDesc)
RResult< void > EnsureValidDescriptor() const
Checks whether invariants hold:
RResult< void > AddFieldLink(ROOT::DescriptorId_t fieldId, ROOT::DescriptorId_t linkId)
void AddField(const RFieldDescriptor &fieldDesc)
RResult< void > AddClusterGroup(RClusterGroupDescriptor &&clusterGroup)
RResult< void > EnsureFieldExists(ROOT::DescriptorId_t fieldId) const
void SetFeature(unsigned int flag)
Sets the flag-th bit of the feature flag to 1.
The window of element indexes of a particular column in a particular cluster.
Records the partition of data into pages for a particular column in a particular cluster.
static constexpr std::size_t kLargeRangeThreshold
Create the fCumulativeNElements only when its needed, i.e. when there are many pages to search throug...
RPageInfoExtended Find(ROOT::NTupleSize_t idxInCluster) const
Find the page in the RPageRange that contains the given element. The element must exist.
std::size_t ExtendToFitColumnRange(const RColumnRange &columnRange, const ROOT::Internal::RColumnElementBase &element, std::size_t pageSize)
Extend this RPageRange to fit the given RColumnRange.
Metadata for RNTuple clusters.
ROOT::NTupleSize_t fFirstEntryIndex
Clusters can be swapped by adjusting the entry offsets of the cluster and all ranges.
std::unordered_map< ROOT::DescriptorId_t, RColumnRange > fColumnRanges
ROOT::DescriptorId_t fClusterId
RClusterDescriptor Clone() const
bool operator==(const RClusterDescriptor &other) const
RColumnRangeIterable GetColumnRangeIterable() const
Returns an iterator over pairs { columnId, columnRange }. The iteration order is unspecified.
std::unordered_map< ROOT::DescriptorId_t, RPageRange > fPageRanges
std::uint64_t GetNBytesOnStorage() const
Clusters are bundled in cluster groups.
RNTupleLocator fPageListLocator
The page list that corresponds to the cluster group.
RClusterGroupDescriptor Clone() const
std::vector< ROOT::DescriptorId_t > fClusterIds
The cluster IDs can be empty if the corresponding page list is not loaded.
std::uint64_t fMinEntry
The minimum first entry number of the clusters in the cluster group.
std::uint32_t fNClusters
Number of clusters is always known even if the cluster IDs are not (yet) populated.
std::uint64_t fPageListLength
Uncompressed size of the page list.
std::uint64_t fEntrySpan
Number of entries that are (partially for sharded clusters) covered by this cluster group.
bool operator==(const RClusterGroupDescriptor &other) const
RClusterGroupDescriptor CloneSummary() const
Creates a clone without the cluster IDs.
Metadata stored for every column of an RNTuple.
ROOT::DescriptorId_t fPhysicalColumnId
Usually identical to the logical column ID, except for alias columns where it references the shadowed...
bool operator==(const RColumnDescriptor &other) const
ROOT::DescriptorId_t fLogicalColumnId
The actual column identifier, which is the link to the corresponding field.
ROOT::DescriptorId_t fFieldId
Every column belongs to one and only one field.
std::int64_t fFirstElementIndex
The absolute value specifies the index for the first stored element for this column.
std::uint32_t fIndex
A field can be serialized into several columns, which are numbered from zero to $n$.
std::uint16_t fBitsOnStorage
The size in bits of elements of this column.
std::uint16_t fRepresentationIndex
A field may use multiple column representations, which are numbered from zero to $m$.
ROOT::ENTupleColumnType fType
The on-disk column type.
std::optional< RValueRange > fValueRange
Optional value range (used e.g. by quantized real fields)
RColumnDescriptor Clone() const
Get a copy of the descriptor.
Base class for all ROOT issued exceptions.
Definition RError.hxx:78
Field specific extra type information from the header / extenstion header.
bool operator==(const RExtraTypeInfoDescriptor &other) const
RExtraTypeInfoDescriptor Clone() const
EExtraTypeInfoIds fContentId
Specifies the meaning of the extra information.
std::string fTypeName
The type name the extra information refers to; empty for RNTuple-wide extra information.
std::string fContent
The content format depends on the content ID and may be binary.
std::uint32_t fTypeVersion
Type version the extra type information is bound to.
A field translates read and write calls from/to underlying columns to/from tree values.
@ kTraitSoACollection
The field represents a collection in SoA layout.
@ kTraitInvalidField
This field is an instance of RInvalidField and can be safely static_cast to it.
@ kTraitTypeChecksum
The TClass checksum is set and valid.
Metadata stored for every field of an RNTuple.
std::unique_ptr< ROOT::RFieldBase > CreateField(const RNTupleDescriptor &ntplDesc, const ROOT::RCreateFieldOptions &options={}) const
In general, we create a field simply from the C++ type name.
std::uint32_t fFieldVersion
The version of the C++-type-to-column translation mechanics.
ROOT::DescriptorId_t fFieldId
RFieldDescriptor Clone() const
Get a copy of the descriptor.
std::uint64_t fNRepetitions
The number of elements per entry for fixed-size arrays.
std::uint32_t fColumnCardinality
The number of columns in the column representations of the field.
ROOT::DescriptorId_t fProjectionSourceId
For projected fields, the source field ID.
bool operator==(const RFieldDescriptor &other) const
std::string fFieldDescription
Free text set by the user.
ROOT::DescriptorId_t fParentId
Establishes sub field relationships, such as classes and collections.
std::string fTypeAlias
A typedef or using directive that resolved to the type name during field creation.
ROOT::ENTupleStructure fStructure
The structural information carried by this field in the data model tree.
std::vector< ROOT::DescriptorId_t > fLinkIds
The pointers in the other direction from parent to children.
std::string fFieldName
The leaf name, not including parent fields.
bool fIsSoACollection
Indicates if this is a collection that should be represented in memory by a SoA layout.
std::uint32_t fTypeVersion
The version of the C++ type itself.
std::string fTypeName
The C++ type that was used when writing the field.
std::vector< ROOT::DescriptorId_t > fLogicalColumnIds
The ordered list of columns attached to this field: first by representation index then by column inde...
std::optional< std::uint32_t > fTypeChecksum
For custom classes, we store the ROOT TClass reported checksum to facilitate the use of I/O rules tha...
Used in RFieldBase::Check() to record field creation failures.
Definition RField.hxx:96
@ kGeneric
Generic unrecoverable error.
@ kUnknownStructure
The field could not be created because its descriptor had an unknown structural role.
Used to loop over all the clusters of an RNTuple (in unspecified order)
Used to loop over all the cluster groups of an RNTuple (in unspecified order)
Used to loop over a field's associated columns.
std::vector< ROOT::DescriptorId_t > fColumns
The descriptor ids of the columns ordered by field, representation, and column index.
RColumnDescriptorIterable(const RNTupleDescriptor &ntuple, const RFieldDescriptor &fieldDesc)
Used to loop over all the extra type info record of an RNTuple (in unspecified order)
Used to loop over a field's child fields.
std::vector< ROOT::DescriptorId_t > GetTopMostFields(const RNTupleDescriptor &desc) const
Return a vector containing the IDs of the top-level fields defined in the extension header,...
The on-storage metadata of an RNTuple.
const RColumnDescriptor & GetColumnDescriptor(ROOT::DescriptorId_t columnId) const
ROOT::DescriptorId_t FindNextClusterId(ROOT::DescriptorId_t clusterId) const
RFieldDescriptorIterable GetFieldIterable(const RFieldDescriptor &fieldDesc) const
std::set< unsigned int > fFeatureFlags
std::unordered_map< ROOT::DescriptorId_t, RClusterGroupDescriptor > fClusterGroupDescriptors
const RFieldDescriptor & GetFieldDescriptor(ROOT::DescriptorId_t fieldId) const
std::uint64_t fNPhysicalColumns
Updated by the descriptor builder when columns are added.
std::vector< Experimental::RNTupleAttrSetDescriptor > fAttributeSets
List of AttributeSets linked to this RNTuple.
ROOT::DescriptorId_t fFieldZeroId
Set by the descriptor builder.
std::uint64_t fNEntries
Updated by the descriptor builder when the cluster groups are added.
RClusterGroupDescriptorIterable GetClusterGroupIterable() const
RColumnDescriptorIterable GetColumnIterable() const
bool operator==(const RNTupleDescriptor &other) const
std::uint64_t fOnDiskFooterSize
Like fOnDiskHeaderSize, contains both cluster summaries and page locations.
std::uint16_t fVersionMinor
Set by the descriptor builder when deserialized.
ROOT::DescriptorId_t FindClusterId(ROOT::NTupleSize_t entryIdx) const
std::vector< std::uint64_t > GetFeatureFlags() const
ROOT::DescriptorId_t GetFieldZeroId() const
Returns the logical parent of all top-level RNTuple data fields.
std::unique_ptr< ROOT::RNTupleModel > CreateModel(const RCreateModelOptions &options=RCreateModelOptions()) const
Re-create the C++ model from the stored metadata.
std::string GetTypeNameForComparison(const RFieldDescriptor &fieldDesc) const
Adjust the type name of the passed RFieldDescriptor for comparison with another renormalized type nam...
std::unordered_map< ROOT::DescriptorId_t, RClusterDescriptor > fClusterDescriptors
Potentially a subset of all the available clusters.
std::size_t GetNClusters() const
ROOT::DescriptorId_t FindPhysicalColumnId(ROOT::DescriptorId_t fieldId, std::uint32_t columnIndex, std::uint16_t representationIndex) const
RExtraTypeInfoDescriptorIterable GetExtraTypeInfoIterable() const
const RHeaderExtension * GetHeaderExtension() const
Return header extension information; if the descriptor does not have a header extension,...
std::uint64_t fNClusters
Updated by the descriptor builder when the cluster groups are added.
std::uint64_t fOnDiskHeaderXxHash3
Set by the descriptor builder when deserialized.
const RClusterDescriptor & GetClusterDescriptor(ROOT::DescriptorId_t clusterId) const
ROOT::DescriptorId_t FindFieldId(std::string_view fieldName, ROOT::DescriptorId_t parentId) const
std::string fName
The RNTuple name needs to be unique in a given storage location (file)
std::uint64_t fOnDiskHeaderSize
Set by the descriptor builder when deserialized.
RResult< void > DropClusterGroupDetails(ROOT::DescriptorId_t clusterGroupId)
std::uint16_t fVersionMajor
Set by the descriptor builder when deserialized.
std::vector< ROOT::DescriptorId_t > fSortedClusterGroupIds
References cluster groups sorted by entry range and thus allows for binary search.
std::unordered_map< ROOT::DescriptorId_t, RColumnDescriptor > fColumnDescriptors
ROOT::DescriptorId_t FindLogicalColumnId(ROOT::DescriptorId_t fieldId, std::uint32_t columnIndex, std::uint16_t representationIndex) const
std::unordered_map< ROOT::DescriptorId_t, RFieldDescriptor > fFieldDescriptors
ROOT::NTupleSize_t GetNElements(ROOT::DescriptorId_t physicalColumnId) const
RResult< void > AddClusterGroupDetails(ROOT::DescriptorId_t clusterGroupId, std::vector< RClusterDescriptor > &clusterDescs)
Methods to load and drop cluster group details (cluster IDs and page locations)
std::uint16_t fVersionPatch
Set by the descriptor builder when deserialized.
std::string fDescription
Free text from the user.
ROOT::Experimental::RNTupleAttrSetDescriptorIterable GetAttrSetIterable() const
RFieldDescriptorIterable GetTopLevelFields() const
std::uint16_t fVersionEpoch
Set by the descriptor builder when deserialized.
std::vector< RExtraTypeInfoDescriptor > fExtraTypeInfoDescriptors
RNTupleDescriptor Clone() const
std::string GetQualifiedFieldName(ROOT::DescriptorId_t fieldId) const
Walks up the parents of the field ID and returns a field name of the form a.b.c.d In case of invalid ...
RClusterDescriptorIterable GetClusterIterable() const
RNTupleDescriptor CloneSchema() const
Creates a descriptor containing only the schema information about this RNTuple, i....
std::uint64_t fGeneration
The generation of the descriptor.
ROOT::DescriptorId_t FindPrevClusterId(ROOT::DescriptorId_t clusterId) const
std::unique_ptr< RHeaderExtension > fHeaderExtension
Generic information about the physical location of data.
static std::unique_ptr< RNTupleModel > Create()
static std::unique_ptr< RNTupleModel > CreateBare()
Creates a "bare model", i.e. an RNTupleModel with no default entry.
static constexpr std::uint16_t kVersionPatch
Definition RNTuple.hxx:81
static constexpr std::uint16_t kVersionMajor
Definition RNTuple.hxx:79
static constexpr std::uint16_t kVersionEpoch
Definition RNTuple.hxx:78
static constexpr std::uint16_t kVersionMinor
Definition RNTuple.hxx:80
const_iterator begin() const
const_iterator end() const
The class is used as a return type for operations that can fail; wraps a value of type T or an RError...
Definition RError.hxx:222
static std::unique_ptr< RVectorField > CreateUntyped(std::string_view fieldName, std::unique_ptr< RFieldBase > itemField)
const Int_t n
Definition legend1.C:16
Double_t ex[n]
Definition legend1.C:17
ROOT::DescriptorId_t CallFindClusterIdOn(const ROOT::RNTupleDescriptor &desc, ROOT::NTupleSize_t entryIdx)
RResult< void > EnsureValidNameForRNTuple(std::string_view name, std::string_view where)
Check whether a given string is a valid name according to the RNTuple specification.
ROOT::RResult< std::unique_ptr< ROOT::RFieldBase > > CallFieldBaseCreate(const std::string &fieldName, const std::string &typeName, const ROOT::RCreateFieldOptions &options, const ROOT::RNTupleDescriptor *desc, ROOT::DescriptorId_t fieldId)
bool IsCustomEnumFieldDesc(const RNTupleDescriptor &desc, const RFieldDescriptor &fieldDesc)
Tells if the field describes a user-defined enum type.
std::vector< ROOT::Internal::RNTupleClusterBoundaries > GetClusterBoundaries(const RNTupleDescriptor &desc)
Return the cluster boundaries for each cluster in this RNTuple.
std::string GetRenormalizedTypeName(const std::string &metaNormalizedName)
Given a type name normalized by ROOT meta, renormalize it for RNTuple. E.g., insert std::prefix.
bool IsStdAtomicFieldDesc(const RFieldDescriptor &fieldDesc)
Tells if the field describes a std::atomic<T> type.
std::uint64_t DescriptorId_t
Distriniguishes elements of the same type within a descriptor, e.g. different fields.
constexpr NTupleSize_t kInvalidNTupleIndex
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
constexpr DescriptorId_t kInvalidDescriptorId
Additional information about a page in an in-memory RPageRange.
Information about a single page in the context of a cluster's page range.
static uint64_t sum(uint64_t i)
Definition Factory.cxx:2338