70std::unique_ptr<ROOT::RFieldBase>
75 streamerField->SetOnDiskId(
fFieldId);
96 std::vector<std::unique_ptr<ROOT::RFieldBase>> memberFields;
97 memberFields.reserve(
fLinkIds.size());
100 auto field = memberDesc.
CreateField(ntplDesc, options);
103 memberFields.emplace_back(std::move(field));
105 auto recordField = std::make_unique<ROOT::RRecordField>(
GetFieldName(), std::move(memberFields));
117 collectionField->SetOnDiskId(
fFieldId);
118 return collectionField;
133 for (
auto &subfield : *field) {
134 const auto subfieldId = ntplDesc.
FindFieldId(subfield.GetFieldName(), subfield.GetParent()->GetOnDiskId());
135 subfield.SetOnDiskId(subfieldId);
139 return invalidField.
Clone(fieldName);
188 if (firstInPage + pi.GetNElements() > idxInCluster) {
192 firstInPage += pi.GetNElements();
201 std::size_t left = 0;
202 std::size_t right =
N - 1;
203 std::size_t midpoint =
N;
204 while (left <= right) {
205 midpoint = (left + right) / 2;
214 right = midpoint - 1;
219 decltype(idxInCluster) firstInPage = (midpoint == 0) ? 0 : (*fCumulativeNElements)[midpoint - 1];
221 R__ASSERT((firstInPage + pageInfo.GetNElements()) > idxInCluster);
228 std::size_t pageSize)
233 const auto nElements =
235 [](std::size_t
n,
const auto &pageInfo) { return n + pageInfo.GetNElements(); });
236 const auto nElementsRequired =
static_cast<std::uint64_t
>(columnRange.
GetNElements());
238 if (nElementsRequired == nElements)
240 R__ASSERT((nElementsRequired > nElements) &&
"invalid attempt to shrink RPageRange");
242 std::vector<RPageInfo> pageInfos;
244 const std::uint64_t nElementsPerPage = pageSize / element.
GetSize();
246 for (
auto nRemainingElements = nElementsRequired - nElements; nRemainingElements > 0;) {
248 pageInfo.
SetNElements(std::min(nElementsPerPage, nRemainingElements));
253 pageInfos.emplace_back(pageInfo);
257 pageInfos.insert(pageInfos.end(), std::make_move_iterator(
fPageInfos.begin()),
260 return nElementsRequired - nElements;
271 std::uint64_t nbytes = 0;
273 for (
const auto &pi : pr.second.GetPageInfos()) {
274 nbytes += pi.GetLocator().GetNBytesOnStorage();
335 if (!cd.second.ContainsColumn(physicalColumnId))
337 auto columnRange = cd.second.GetColumnRange(physicalColumnId);
338 result = std::max(result, columnRange.GetFirstElementIndex() + columnRange.GetNElements());
345std::vector<ROOT::Internal::RNTupleClusterBoundaries>
348 std::vector<Internal::RNTupleClusterBoundaries> boundaries;
353 R__ASSERT(clusterDesc.GetNEntries() > 0);
355 clusterDesc.GetFirstEntryIndex(), clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries()});
364 std::string leafName(fieldName);
365 auto posDot = leafName.find_last_of(
'.');
366 if (posDot != std::string::npos) {
367 auto parentName = leafName.substr(0, posDot);
368 leafName = leafName.substr(posDot + 1);
374 for (
const auto linkId : itrFieldDesc->second.GetLinkIds()) {
389 return fieldDescriptor.GetFieldName();
390 return prefix +
"." + fieldDescriptor.GetFieldName();
412 std::uint32_t columnIndex,
413 std::uint16_t representationIndex)
const
418 if (columnIndex >= itr->second.GetColumnCardinality())
420 const auto idx = representationIndex * itr->second.GetColumnCardinality() + columnIndex;
421 if (itr->second.GetLogicalColumnIds().size() <= idx)
423 return itr->second.GetLogicalColumnIds()[idx];
427 std::uint32_t columnIndex,
428 std::uint16_t representationIndex)
const
444 std::size_t cgLeft = 0;
446 while (cgLeft <= cgRight) {
447 const std::size_t cgMidpoint = (cgLeft + cgRight) / 2;
453 if (!clusterDesc.ContainsColumn(physicalColumnId))
456 const auto firstElementInGroup = clusterDesc.GetColumnRange(physicalColumnId).GetFirstElementIndex();
457 if (firstElementInGroup > index) {
460 cgRight = cgMidpoint - 1;
464 const auto &lastColumnRange =
GetClusterDescriptor(clusterIds.back()).GetColumnRange(physicalColumnId);
465 if ((lastColumnRange.GetFirstElementIndex() + lastColumnRange.GetNElements()) <= index) {
467 cgLeft = cgMidpoint + 1;
473 std::size_t clusterLeft = 0;
474 std::size_t clusterRight = clusterIds.size() - 1;
475 while (clusterLeft <= clusterRight) {
476 const std::size_t clusterMidpoint = (clusterLeft + clusterRight) / 2;
477 const auto clusterId = clusterIds[clusterMidpoint];
480 if (columnRange.Contains(index))
483 if (columnRange.GetFirstElementIndex() > index) {
485 clusterRight = clusterMidpoint - 1;
489 if (columnRange.GetFirstElementIndex() + columnRange.GetNElements() <= index) {
490 clusterLeft = clusterMidpoint + 1;
506 std::size_t cgLeft = 0;
508 while (cgLeft <= cgRight) {
509 const std::size_t cgMidpoint = (cgLeft + cgRight) / 2;
512 if (cgDesc.GetMinEntry() > entryIdx) {
514 cgRight = cgMidpoint - 1;
518 if (cgDesc.GetMinEntry() + cgDesc.GetEntrySpan() <= entryIdx) {
519 cgLeft = cgMidpoint + 1;
525 const auto &clusterIds = cgDesc.GetClusterIds();
527 std::size_t clusterLeft = 0;
528 std::size_t clusterRight = clusterIds.size() - 1;
529 while (clusterLeft <= clusterRight) {
530 const std::size_t clusterMidpoint = (clusterLeft + clusterRight) / 2;
533 if (clusterDesc.GetFirstEntryIndex() > entryIdx) {
535 clusterRight = clusterMidpoint - 1;
539 if (clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries() <= entryIdx) {
540 clusterLeft = clusterMidpoint + 1;
544 return clusterIds[clusterMidpoint];
558 const auto firstEntryInNextCluster = clusterDesc.GetFirstEntryIndex() + clusterDesc.GetNEntries();
569 if (clusterDesc.GetFirstEntryIndex() == 0)
574std::vector<ROOT::DescriptorId_t>
577 std::vector<ROOT::DescriptorId_t> fields;
580 fields.emplace_back(fieldId);
594 std::deque<ROOT::DescriptorId_t> fieldIdQueue{ntuple.GetFieldZeroId()};
596 while (!fieldIdQueue.empty()) {
597 auto currFieldId = fieldIdQueue.front();
598 fieldIdQueue.pop_front();
600 const auto &columns = ntuple.GetFieldDescriptor(currFieldId).GetLogicalColumnIds();
601 fColumns.insert(fColumns.end(), columns.begin(), columns.end());
603 for (const auto &field : ntuple.GetFieldIterable(currFieldId)) {
604 auto fieldId = field.GetId();
605 fieldIdQueue.push_back(fieldId);
612 std::vector<std::uint64_t> result;
613 unsigned int base = 0;
614 std::uint64_t flags = 0;
616 if ((
f > 0) && ((
f % 64) == 0))
618 while (
f > base + 64) {
619 result.emplace_back(flags);
624 flags |= std::uint64_t(1) <<
f;
626 result.emplace_back(flags);
631 std::vector<RClusterDescriptor> &clusterDescs)
635 return R__FAIL(
"invalid attempt to add details of unknown cluster group");
636 if (iter->second.HasClusterDetails())
637 return R__FAIL(
"invalid attempt to re-populate cluster group details");
638 if (iter->second.GetNClusters() != clusterDescs.size())
639 return R__FAIL(
"mismatch of number of clusters");
641 std::vector<ROOT::DescriptorId_t> clusterIds;
642 for (
unsigned i = 0; i < clusterDescs.size(); ++i) {
643 clusterIds.emplace_back(clusterDescs[i].GetId());
646 return R__FAIL(
"invalid attempt to re-populate existing cluster");
650 return fClusterDescriptors[a].GetFirstEntryIndex() < fClusterDescriptors[b].GetFirstEntryIndex();
653 cgBuilder.AddSortedClusters(clusterIds);
654 iter->second = cgBuilder.MoveDescriptor().Unwrap();
662 return R__FAIL(
"invalid attempt to drop cluster details of unknown cluster group");
663 if (!iter->second.HasClusterDetails())
664 return R__FAIL(
"invalid attempt to drop details of cluster group summary");
666 for (
auto clusterId : iter->second.GetClusterIds())
668 iter->second = iter->second.CloneSummary();
676 std::unordered_set<ROOT::DescriptorId_t> invalidFields;
679 auto fieldId = colDesc.GetFieldId();
684 fieldId = field.GetParentId();
686 invalidFields.insert(fieldId);
696 "cannot create Model: descriptor contains unknown column types. Use 'SetForwardCompatible(true)' on the "
697 "RCreateModelOptions to create a partial model containing only the fields made up by known columns."));
699 auto fieldZero = std::make_unique<ROOT::RFieldZero>();
707 if (invalidFields.count(topDesc.GetId()) > 0) {
712 auto field = topDesc.CreateField(*
this, createFieldOpts);
719 const auto &invalid =
static_cast<const RInvalidField &
>(*field);
723 throw invalid.GetError();
730 model->AddProjectedField(std::move(field), [
this](
const std::string &targetName) -> std::string {
734 model->AddField(std::move(field));
822 std::uint64_t firstElementIndex,
823 std::uint32_t compressionSettings,
827 return R__FAIL(
"column ID mismatch");
828 if (
fCluster.fColumnRanges.count(physicalId) > 0)
829 return R__FAIL(
"column ID conflict");
835 fCluster.fColumnRanges[physicalId] = columnRange;
842 if (
fCluster.fColumnRanges.count(physicalId) > 0)
843 return R__FAIL(
"column ID conflict");
848 fCluster.fColumnRanges[physicalId] = columnRange;
855 for (
auto &[
_, columnRange] :
fCluster.fColumnRanges) {
856 if (!columnRange.IsSuppressed())
863 for (
const auto otherColumnLogicalId : fieldDesc.GetLogicalColumnIds()) {
865 if (otherColumnDesc.GetRepresentationIndex() == columnDesc.GetRepresentationIndex())
867 if (otherColumnDesc.GetIndex() != columnDesc.GetIndex())
871 const auto &otherColumnRange =
fCluster.GetColumnRange(otherColumnDesc.GetPhysicalId());
872 if (otherColumnRange.IsSuppressed())
875 columnRange.SetFirstElementIndex(otherColumnRange.GetFirstElementIndex());
876 columnRange.SetNElements(otherColumnRange.GetNElements());
881 return R__FAIL(std::string(
"cannot find non-suppressed column for column ID ") +
882 std::to_string(columnRange.GetPhysicalColumnId()) +
883 ", cluster ID: " + std::to_string(
fCluster.GetId()));
895 auto fnTraverseSubtree = [&](
ROOT::DescriptorId_t rootFieldId, std::uint64_t nRepetitionsAtThisLevel,
896 const auto &visitField,
const auto &enterSubtree) ->
void {
897 visitField(rootFieldId, nRepetitionsAtThisLevel);
899 const std::uint64_t nRepetitions = std::max(
f.GetNRepetitions(), std::uint64_t{1U}) * nRepetitionsAtThisLevel;
900 enterSubtree(
f.GetId(), nRepetitions, visitField, enterSubtree);
912 topLevelField.GetId(), std::max(topLevelField.GetNRepetitions(), std::uint64_t{1U}),
914 for (const auto &c : desc.GetColumnIterable(fieldId)) {
915 const ROOT::DescriptorId_t physicalId = c.GetPhysicalId();
916 auto &columnRange = fCluster.fColumnRanges[physicalId];
921 if (columnRange.GetPhysicalColumnId() == ROOT::kInvalidDescriptorId) {
922 columnRange.SetPhysicalColumnId(physicalId);
923 columnRange.SetFirstElementIndex(0);
924 columnRange.SetNElements(0);
925 columnRange.SetIsSuppressed(c.IsSuppressedDeferredColumn());
933 if (c.IsDeferredColumn()) {
934 columnRange.SetFirstElementIndex(fCluster.GetFirstEntryIndex() * nRepetitions);
935 columnRange.SetNElements(fCluster.GetNEntries() * nRepetitions);
936 if (!columnRange.IsSuppressed()) {
937 auto &pageRange = fCluster.fPageRanges[physicalId];
938 pageRange.fPhysicalColumnId = physicalId;
939 const auto element = ROOT::Internal::RColumnElementBase::Generate<void>(c.GetType());
940 pageRange.ExtendToFitColumnRange(columnRange, *element, ROOT::Internal::RPage::kPageZeroSize);
942 } else if (!columnRange.IsSuppressed()) {
943 fCluster.fPageRanges[physicalId].fPhysicalColumnId = physicalId;
955 return R__FAIL(
"unset cluster ID");
957 return R__FAIL(
"empty cluster");
958 for (
auto &pr :
fCluster.fPageRanges) {
959 if (
fCluster.fColumnRanges.count(pr.first) == 0) {
960 return R__FAIL(
"missing column range");
962 pr.second.fCumulativeNElements.reset();
963 const auto nPages = pr.second.fPageInfos.size();
965 pr.second.fCumulativeNElements = std::make_unique<std::vector<NTupleSize_t>>();
966 pr.second.fCumulativeNElements->reserve(nPages);
968 for (
const auto &pi : pr.second.fPageInfos) {
969 sum += pi.GetNElements();
970 pr.second.fCumulativeNElements->emplace_back(
sum);
997 return R__FAIL(
"unset cluster group ID");
1018 if (
fDescriptor.fFieldDescriptors.count(fieldId) == 0)
1019 return R__FAIL(
"field with id '" + std::to_string(fieldId) +
"' doesn't exist");
1026 return R__FAIL(
"unset or unsupported RNTuple epoch version");
1035 for (
const auto &[fieldId, fieldDesc] :
fDescriptor.fFieldDescriptors) {
1038 return R__FAIL(
"field with id '" + std::to_string(fieldId) +
"' has an invalid parent id");
1042 const auto columnCardinality = fieldDesc.GetColumnCardinality();
1043 if (columnCardinality == 0)
1048 const auto &logicalColumnIds = fieldDesc.GetLogicalColumnIds();
1049 const auto nColumns = logicalColumnIds.size();
1051 if ((nColumns + 1) == columnCardinality)
1054 const auto &lastColumn =
fDescriptor.GetColumnDescriptor(logicalColumnIds.back());
1055 if (lastColumn.GetIndex() + 1 != columnCardinality)
1056 return R__FAIL(
"field with id '" + std::to_string(fieldId) +
"' has incomplete column representations");
1066 for (
const auto &[
id,
_] :
fDescriptor.fClusterGroupDescriptors)
1067 fDescriptor.fSortedClusterGroupIds.emplace_back(
id);
1070 return fDescriptor.fClusterGroupDescriptors[a].GetMinEntry() <
1071 fDescriptor.fClusterGroupDescriptors[b].GetMinEntry();
1079 std::uint16_t versionMinor, std::uint16_t versionPatch)
1082 throw RException(
R__FAIL(
"unsupported RNTuple epoch version: " + std::to_string(versionEpoch)));
1099 const std::string_view description)
1102 fDescriptor.fDescription = std::string(description);
1107 if (flag > 0 && flag % 64 == 0)
1115 if (
fDesc.fName.empty())
1116 return R__FAIL(
"attribute set name cannot be empty");
1117 if (
fDesc.fAnchorLength == 0)
1118 return R__FAIL(
"invalid anchor length");
1120 return R__FAIL(
"invalid locator type");
1122 return std::move(
fDesc);
1128 return R__FAIL(
"invalid logical column id");
1130 return R__FAIL(
"invalid physical column id");
1132 return R__FAIL(
"invalid field id, dangling column");
1141 if (
fColumn.GetBitsOnStorage() < minBits ||
fColumn.GetBitsOnStorage() > maxBits)
1142 return R__FAIL(
"invalid column bit width");
1172 return R__FAIL(
"invalid field id");
1175 return R__FAIL(
"invalid field structure");
1178 return R__FAIL(
"invalid SoA flag on non-collection field");
1186 if (
fField.GetFieldName().empty()) {
1187 return R__FAIL(
"name cannot be empty string \"\"");
1197 fDescriptor.fHeaderExtension->MarkExtendedField(fieldDesc);
1210 return R__FAIL(
"child field with id '" + std::to_string(linkId) +
"' doesn't exist in NTuple");
1213 return R__FAIL(
"cannot make FieldZero a child field");
1216 auto parentId =
fDescriptor.fFieldDescriptors.at(linkId).GetParentId();
1218 return R__FAIL(
"field '" + std::to_string(linkId) +
"' already has a parent ('" + std::to_string(parentId) +
")");
1220 if (fieldId == linkId) {
1221 return R__FAIL(
"cannot make field '" + std::to_string(fieldId) +
"' a child of itself");
1223 fDescriptor.fFieldDescriptors.at(linkId).fParentId = fieldId;
1224 fDescriptor.fFieldDescriptors.at(fieldId).fLinkIds.push_back(linkId);
1235 return R__FAIL(
"projected field with id '" + std::to_string(targetId) +
"' doesn't exist in NTuple");
1238 return R__FAIL(
"cannot make FieldZero a projected field");
1240 if (sourceId == targetId) {
1241 return R__FAIL(
"cannot make field '" + std::to_string(targetId) +
"' a projection of itself");
1243 if (
fDescriptor.fFieldDescriptors.at(sourceId).IsProjectedField()) {
1244 return R__FAIL(
"cannot make field '" + std::to_string(targetId) +
"' a projection of an already projected field");
1247 auto &targetDesc =
fDescriptor.fFieldDescriptors.at(targetId);
1248 if (targetDesc.IsProjectedField() && targetDesc.GetProjectionSourceId() != sourceId) {
1249 return R__FAIL(
"field '" + std::to_string(targetId) +
"' has already a projection source ('" +
1250 std::to_string(targetDesc.GetProjectionSourceId()) +
")");
1252 fDescriptor.fFieldDescriptors.at(targetId).fProjectionSourceId = sourceId;
1258 const auto fieldId = columnDesc.GetFieldId();
1259 const auto columnIndex = columnDesc.GetIndex();
1260 const auto representationIndex = columnDesc.GetRepresentationIndex();
1266 auto &fieldDesc =
fDescriptor.fFieldDescriptors.find(fieldId)->second;
1268 if (columnDesc.IsAliasColumn()) {
1269 if (columnDesc.GetType() !=
fDescriptor.GetColumnDescriptor(columnDesc.GetPhysicalId()).GetType())
1270 return R__FAIL(
"alias column type mismatch");
1273 return R__FAIL(
"column index clash");
1275 if (columnIndex > 0) {
1277 return R__FAIL(
"out of bounds column index");
1279 if (representationIndex > 0) {
1281 return R__FAIL(
"out of bounds representation index");
1283 if (columnIndex == 0) {
1284 assert(fieldDesc.fColumnCardinality > 0);
1285 if (
fDescriptor.FindLogicalColumnId(fieldId, fieldDesc.fColumnCardinality - 1, representationIndex - 1) ==
1287 return R__FAIL(
"incomplete column representations");
1290 if (columnIndex >= fieldDesc.fColumnCardinality)
1291 return R__FAIL(
"irregular column representations");
1295 fieldDesc.fColumnCardinality = columnIndex + 1;
1298 const auto logicalId = columnDesc.GetLogicalId();
1299 fieldDesc.fLogicalColumnIds.emplace_back(logicalId);
1301 if (!columnDesc.IsAliasColumn())
1303 fDescriptor.fColumnDescriptors.emplace(logicalId, std::move(columnDesc));
1305 fDescriptor.fHeaderExtension->MarkExtendedColumn(columnDesc);
1312 const auto id = clusterGroup.GetId();
1313 if (
fDescriptor.fClusterGroupDescriptors.count(
id) > 0)
1314 return R__FAIL(
"cluster group id clash");
1315 fDescriptor.fNEntries = std::max(
fDescriptor.fNEntries, clusterGroup.GetMinEntry() + clusterGroup.GetEntrySpan());
1316 fDescriptor.fNClusters += clusterGroup.GetNClusters();
1317 fDescriptor.fClusterGroupDescriptors.emplace(
id, std::move(clusterGroup));
1329 fDescriptor.fHeaderExtension = std::make_unique<RNTupleDescriptor::RHeaderExtension>();
1343 for (
auto &link :
fDescriptor.fFieldDescriptors[
c.fFieldId].fLogicalColumnIds) {
1344 if (link ==
c.fLogicalColumnId) {
1349 c.fLogicalColumnId += offset;
1351 fDescriptor.fColumnDescriptors.emplace(
c.fLogicalColumnId, std::move(
c));
1357 auto clusterId = clusterDesc.GetId();
1358 if (
fDescriptor.fClusterDescriptors.count(clusterId) > 0)
1359 return R__FAIL(
"cluster id clash");
1360 fDescriptor.fClusterDescriptors.emplace(clusterId, std::move(clusterDesc));
1368 if (std::find(
fDescriptor.fExtraTypeInfoDescriptors.begin(),
fDescriptor.fExtraTypeInfoDescriptors.end(),
1369 extraTypeInfoDesc) !=
fDescriptor.fExtraTypeInfoDescriptors.end()) {
1370 return R__FAIL(
"extra type info duplicates");
1372 fDescriptor.fExtraTypeInfoDescriptors.emplace_back(std::move(extraTypeInfoDesc));
1378 auto it = std::find(
fDescriptor.fExtraTypeInfoDescriptors.begin(),
fDescriptor.fExtraTypeInfoDescriptors.end(),
1380 if (it !=
fDescriptor.fExtraTypeInfoDescriptors.end())
1381 *it = std::move(extraTypeInfoDesc);
1383 fDescriptor.fExtraTypeInfoDescriptors.emplace_back(std::move(extraTypeInfoDesc));
1390 if (std::find_if(attrSets.begin(), attrSets.end(), [&
name = attrSetDesc.GetName()](
const auto &desc) {
1391 return desc.GetName() == name;
1392 }) != attrSets.end()) {
1393 return R__FAIL(
"attribute sets with duplicate names");
1395 attrSets.push_back(std::move(attrSetDesc));
1500 if (fieldDesc.
GetTypeName().rfind(
"std::", 0) == 0)
1507 static const std::string gIntTypeNames[] = {
"bool",
"char",
"std::int8_t",
"std::uint8_t",
1508 "std::int16_t",
"std::uint16_t",
"std::int32_t",
"std::uint32_t",
1509 "std::int64_t",
"std::uint64_t"};
1510 return std::find(std::begin(gIntTypeNames), std::end(gIntTypeNames),
1518 return (fieldDesc.
GetTypeName().rfind(
"std::atomic<", 0) == 0);
#define R__FORWARD_ERROR(res)
Short-hand to return an RResult<T> in an error state (i.e. after checking).
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
#define R__ASSERT(e)
Checks condition e and reports a fatal error if it's false.
ROOT::Experimental::RNTupleAttrSetDescriptor fDesc
RResult< ROOT::Experimental::RNTupleAttrSetDescriptor > MoveDescriptor()
Attempt to make an AttributeSet descriptor.
Used to loop over all the Attribute Sets linked to an RNTuple.
Metadata stored for every Attribute Set linked to an RNTuple.
bool operator==(const RNTupleAttrSetDescriptor &other) const
RNTupleAttrSetDescriptor()=default
std::uint16_t fSchemaVersionMajor
RNTupleAttrSetDescriptor Clone() const
std::uint32_t fAnchorLength
uncompressed size of the linked anchor
RNTupleLocator fAnchorLocator
std::uint16_t fSchemaVersionMinor
A helper class for piece-wise construction of an RClusterDescriptor.
RClusterDescriptor fCluster
RResult< void > MarkSuppressedColumnRange(ROOT::DescriptorId_t physicalId)
Books the given column ID as being suppressed in this cluster.
RResult< void > CommitColumnRange(ROOT::DescriptorId_t physicalId, std::uint64_t firstElementIndex, std::uint32_t compressionSettings, const RClusterDescriptor::RPageRange &pageRange)
RClusterDescriptorBuilder & AddExtendedColumnRanges(const RNTupleDescriptor &desc)
Add column and page ranges for columns created during late model extension missing in this cluster.
RResult< void > CommitSuppressedColumnRanges(const RNTupleDescriptor &desc)
Sets the first element index and number of elements for all the suppressed column ranges.
RResult< RClusterDescriptor > MoveDescriptor()
Move out the full cluster descriptor including page locations.
A helper class for piece-wise construction of an RClusterGroupDescriptor.
RClusterGroupDescriptorBuilder & EntrySpan(std::uint64_t entrySpan)
RClusterGroupDescriptorBuilder & PageListLocator(const RNTupleLocator &pageListLocator)
RClusterGroupDescriptorBuilder()=default
static RClusterGroupDescriptorBuilder FromSummary(const RClusterGroupDescriptor &clusterGroupDesc)
RClusterGroupDescriptorBuilder & PageListLength(std::uint64_t pageListLength)
RClusterGroupDescriptorBuilder & MinEntry(std::uint64_t minEntry)
RClusterGroupDescriptor fClusterGroup
RResult< RClusterGroupDescriptor > MoveDescriptor()
RClusterGroupDescriptorBuilder & ClusterGroupId(ROOT::DescriptorId_t clusterGroupId)
RClusterGroupDescriptorBuilder & NClusters(std::uint32_t nClusters)
RResult< RColumnDescriptor > MakeDescriptor() const
Attempt to make a column descriptor.
RColumnDescriptor fColumn
A column element encapsulates the translation between basic C++ types and their column representation...
static std::pair< std::uint16_t, std::uint16_t > GetValidBitRange(ROOT::ENTupleColumnType type)
Most types have a fixed on-disk bit width.
std::size_t GetSize() const
std::size_t GetPackedSize(std::size_t nElements=1U) const
A helper class for piece-wise construction of an RFieldDescriptor.
RFieldDescriptorBuilder & NRepetitions(std::uint64_t nRepetitions)
RFieldDescriptorBuilder & Structure(const ROOT::ENTupleStructure &structure)
RFieldDescriptorBuilder()=default
Make an empty dangling field descriptor.
RFieldDescriptorBuilder & TypeAlias(const std::string &typeAlias)
RFieldDescriptorBuilder & TypeVersion(std::uint32_t typeVersion)
RFieldDescriptorBuilder & IsSoACollection(bool val)
RFieldDescriptorBuilder & TypeChecksum(const std::optional< std::uint32_t > typeChecksum)
RResult< RFieldDescriptor > MakeDescriptor() const
Attempt to make a field descriptor.
static RFieldDescriptorBuilder FromField(const ROOT::RFieldBase &field)
Make a new RFieldDescriptorBuilder based off a live RNTuple field.
RFieldDescriptorBuilder & FieldDescription(const std::string &fieldDescription)
RFieldDescriptorBuilder & FieldVersion(std::uint32_t fieldVersion)
RFieldDescriptorBuilder & FieldName(const std::string &fieldName)
RFieldDescriptorBuilder & TypeName(const std::string &typeName)
void SetNTuple(const std::string_view name, const std::string_view description)
void SetSchemaFromExisting(const RNTupleDescriptor &descriptor)
Copies the "schema" part of descriptor into the builder's descriptor.
void SetVersionForWriting()
RResult< void > AddColumn(RColumnDescriptor &&columnDesc)
RResult< void > AddAttributeSet(Experimental::RNTupleAttrSetDescriptor &&attrSetDesc)
RResult< void > AddFieldProjection(ROOT::DescriptorId_t sourceId, ROOT::DescriptorId_t targetId)
void ReplaceExtraTypeInfo(RExtraTypeInfoDescriptor &&extraTypeInfoDesc)
RResult< void > AddExtraTypeInfo(RExtraTypeInfoDescriptor &&extraTypeInfoDesc)
void ShiftAliasColumns(std::uint32_t offset)
Shift column IDs of alias columns by offset.
void SetVersion(std::uint16_t versionEpoch, std::uint16_t versionMajor, std::uint16_t versionMinor, std::uint16_t versionPatch)
RNTupleDescriptor MoveDescriptor()
void BeginHeaderExtension()
Mark the beginning of the header extension; any fields and columns added after a call to this functio...
RResult< void > AddCluster(RClusterDescriptor &&clusterDesc)
RResult< void > EnsureValidDescriptor() const
Checks whether invariants hold:
RResult< void > AddFieldLink(ROOT::DescriptorId_t fieldId, ROOT::DescriptorId_t linkId)
void AddField(const RFieldDescriptor &fieldDesc)
RResult< void > AddClusterGroup(RClusterGroupDescriptor &&clusterGroup)
RResult< void > EnsureFieldExists(ROOT::DescriptorId_t fieldId) const
void SetFeature(unsigned int flag)
Sets the flag-th bit of the feature flag to 1.
RNTupleDescriptor fDescriptor
A helper class for serializing and deserialization of the RNTuple binary format.
The window of element indexes of a particular column in a particular cluster.
bool IsSuppressed() const
void SetPhysicalColumnId(ROOT::DescriptorId_t id)
ROOT::DescriptorId_t GetPhysicalColumnId() const
void SetIsSuppressed(bool suppressed)
ROOT::NTupleSize_t GetNElements() const
void IncrementNElements(ROOT::NTupleSize_t by)
Metadata for RNTuple clusters.
ROOT::NTupleSize_t fFirstEntryIndex
Clusters can be swapped by adjusting the entry offsets of the cluster and all ranges.
RClusterDescriptor()=default
std::unordered_map< ROOT::DescriptorId_t, RColumnRange > fColumnRanges
ROOT::NTupleSize_t fNEntries
ROOT::DescriptorId_t fClusterId
RClusterDescriptor Clone() const
bool operator==(const RClusterDescriptor &other) const
RColumnRangeIterable GetColumnRangeIterable() const
Returns an iterator over pairs { columnId, columnRange }. The iteration order is unspecified.
std::unordered_map< ROOT::DescriptorId_t, RPageRange > fPageRanges
std::uint64_t GetNBytesOnStorage() const
Clusters are bundled in cluster groups.
RNTupleLocator fPageListLocator
The page list that corresponds to the cluster group.
RClusterGroupDescriptor Clone() const
std::vector< ROOT::DescriptorId_t > fClusterIds
The cluster IDs can be empty if the corresponding page list is not loaded.
ROOT::DescriptorId_t GetId() const
std::uint64_t fMinEntry
The minimum first entry number of the clusters in the cluster group.
std::uint32_t fNClusters
Number of clusters is always known even if the cluster IDs are not (yet) populated.
std::uint32_t GetNClusters() const
std::uint64_t fPageListLength
Uncompressed size of the page list.
std::uint64_t GetPageListLength() const
std::uint64_t GetMinEntry() const
std::uint64_t GetEntrySpan() const
RClusterGroupDescriptor()=default
RNTupleLocator GetPageListLocator() const
ROOT::DescriptorId_t fClusterGroupId
std::uint64_t fEntrySpan
Number of entries that are (partially for sharded clusters) covered by this cluster group.
bool operator==(const RClusterGroupDescriptor &other) const
RClusterGroupDescriptor CloneSummary() const
Creates a clone without the cluster IDs.
Metadata stored for every column of an RNTuple.
ROOT::DescriptorId_t fPhysicalColumnId
Usually identical to the logical column ID, except for alias columns where it references the shadowed...
bool operator==(const RColumnDescriptor &other) const
RColumnDescriptor()=default
ROOT::DescriptorId_t fLogicalColumnId
The actual column identifier, which is the link to the corresponding field.
ROOT::DescriptorId_t fFieldId
Every column belongs to one and only one field.
std::int64_t fFirstElementIndex
The absolute value specifies the index for the first stored element for this column.
std::uint32_t fIndex
A field can be serialized into several columns, which are numbered from zero to $n$.
std::uint16_t fBitsOnStorage
The size in bits of elements of this column.
std::uint16_t fRepresentationIndex
A field may use multiple column representations, which are numbered from zero to $m$.
ROOT::ENTupleColumnType fType
The on-disk column type.
std::optional< RValueRange > fValueRange
Optional value range (used e.g. by quantized real fields).
RColumnDescriptor Clone() const
Get a copy of the descriptor.
Base class for all ROOT issued exceptions.
A field translates read and write calls from/to underlying columns to/from tree values.
ROOT::ENTupleStructure GetStructure() const
@ kTraitSoACollection
The field represents a collection in SoA layout.
@ kTraitInvalidField
This field is an instance of RInvalidField and can be safely static_cast to it.
@ kTraitTypeChecksum
The TClass checksum is set and valid.
const std::string & GetFieldName() const
const std::string & GetTypeAlias() const
const std::string & GetDescription() const
Get the field's description.
virtual std::uint32_t GetFieldVersion() const
Indicates an evolution of the mapping scheme from C++ type to columns.
virtual std::uint32_t GetTypeChecksum() const
Return the current TClass reported checksum of this class. Only valid if kTraitTypeChecksum is set.
std::uint32_t GetTraits() const
std::size_t GetNRepetitions() const
const std::string & GetTypeName() const
std::unique_ptr< RFieldBase > Clone(std::string_view newName) const
Copies the field and its subfields using a possibly new name and a new, unconnected set of columns.
virtual std::uint32_t GetTypeVersion() const
Indicates an evolution of the C++ type itself.
Metadata stored for every field of an RNTuple.
const std::string & GetTypeAlias() const
std::unique_ptr< ROOT::RFieldBase > CreateField(const RNTupleDescriptor &ntplDesc, const ROOT::RCreateFieldOptions &options={}) const
In general, we create a field simply from the C++ type name.
std::uint32_t fFieldVersion
The version of the C++-type-to-column translation mechanics.
ROOT::DescriptorId_t fFieldId
RFieldDescriptor Clone() const
Get a copy of the descriptor.
ROOT::DescriptorId_t GetId() const
std::uint64_t fNRepetitions
The number of elements per entry for fixed-size arrays.
std::uint32_t fColumnCardinality
The number of columns in the column representations of the field.
ROOT::DescriptorId_t fProjectionSourceId
For projected fields, the source field ID.
ROOT::ENTupleStructure GetStructure() const
bool operator==(const RFieldDescriptor &other) const
std::string fFieldDescription
Free text set by the user.
ROOT::DescriptorId_t fParentId
Establishes sub field relationships, such as classes and collections.
ROOT::DescriptorId_t GetParentId() const
std::string fTypeAlias
A typedef or using directive that resolved to the type name during field creation.
ROOT::ENTupleStructure fStructure
The structural information carried by this field in the data model tree.
std::vector< ROOT::DescriptorId_t > fLinkIds
The pointers in the other direction from parent to children.
std::string fFieldName
The leaf name, not including parent fields.
bool fIsSoACollection
Indicates if this is a collection that should be represented in memory by a SoA layout.
std::uint32_t fTypeVersion
The version of the C++ type itself.
std::string fTypeName
The C++ type that was used when writing the field.
const std::string & GetFieldName() const
RFieldDescriptor()=default
std::vector< ROOT::DescriptorId_t > fLogicalColumnIds
The ordered list of columns attached to this field: first by representation index then by column inde...
const std::string & GetTypeName() const
std::optional< std::uint32_t > fTypeChecksum
For custom classes, we store the ROOT TClass reported checksum to facilitate the use of I/O rules tha...
Used in RFieldBase::Check() to record field creation failures.
@ kGeneric
Generic unrecoverable error.
@ kUnknownStructure
The field could not be created because its descriptor had an unknown structural role.
ECategory GetCategory() const
Used to loop over all the clusters of an RNTuple (in unspecified order).
Used to loop over all the cluster groups of an RNTuple (in unspecified order).
Used to loop over a field's associated columns.
const RNTupleDescriptor & fNTuple
The associated RNTuple for this range.
std::vector< ROOT::DescriptorId_t > fColumns
The descriptor ids of the columns ordered by field, representation, and column index.
RColumnDescriptorIterable(const RNTupleDescriptor &ntuple, const RFieldDescriptor &fieldDesc)
Used to loop over a field's child fields.
The on-storage metadata of an RNTuple.
const RClusterGroupDescriptor & GetClusterGroupDescriptor(ROOT::DescriptorId_t clusterGroupId) const
const RColumnDescriptor & GetColumnDescriptor(ROOT::DescriptorId_t columnId) const
ROOT::DescriptorId_t FindNextClusterId(ROOT::DescriptorId_t clusterId) const
RFieldDescriptorIterable GetFieldIterable(const RFieldDescriptor &fieldDesc) const
std::set< unsigned int > fFeatureFlags
std::unordered_map< ROOT::DescriptorId_t, RClusterGroupDescriptor > fClusterGroupDescriptors
const RFieldDescriptor & GetFieldDescriptor(ROOT::DescriptorId_t fieldId) const
std::uint64_t fNPhysicalColumns
Updated by the descriptor builder when columns are added.
std::vector< Experimental::RNTupleAttrSetDescriptor > fAttributeSets
List of AttributeSets linked to this RNTuple.
ROOT::DescriptorId_t fFieldZeroId
Set by the descriptor builder.
std::uint64_t fNEntries
Updated by the descriptor builder when the cluster groups are added.
RClusterGroupDescriptorIterable GetClusterGroupIterable() const
RColumnDescriptorIterable GetColumnIterable() const
bool operator==(const RNTupleDescriptor &other) const
std::uint64_t fOnDiskFooterSize
Like fOnDiskHeaderSize, contains both cluster summaries and page locations.
std::uint16_t fVersionMinor
Set by the descriptor builder when deserialized.
ROOT::DescriptorId_t FindClusterId(ROOT::NTupleSize_t entryIdx) const
std::vector< std::uint64_t > GetFeatureFlags() const
ROOT::DescriptorId_t GetFieldZeroId() const
Returns the logical parent of all top-level RNTuple data fields.
std::unique_ptr< ROOT::RNTupleModel > CreateModel(const RCreateModelOptions &options=RCreateModelOptions()) const
Re-create the C++ model from the stored metadata.
std::string GetTypeNameForComparison(const RFieldDescriptor &fieldDesc) const
Adjust the type name of the passed RFieldDescriptor for comparison with another renormalized type nam...
std::unordered_map< ROOT::DescriptorId_t, RClusterDescriptor > fClusterDescriptors
Potentially a subset of all the available clusters.
std::size_t GetNClusters() const
ROOT::DescriptorId_t FindPhysicalColumnId(ROOT::DescriptorId_t fieldId, std::uint32_t columnIndex, std::uint16_t representationIndex) const
RExtraTypeInfoDescriptorIterable GetExtraTypeInfoIterable() const
const RHeaderExtension * GetHeaderExtension() const
Return header extension information; if the descriptor does not have a header extension,...
std::uint64_t fNClusters
Updated by the descriptor builder when the cluster groups are added.
std::uint64_t fOnDiskHeaderXxHash3
Set by the descriptor builder when deserialized.
const RClusterDescriptor & GetClusterDescriptor(ROOT::DescriptorId_t clusterId) const
ROOT::DescriptorId_t FindFieldId(std::string_view fieldName, ROOT::DescriptorId_t parentId) const
std::string fName
The RNTuple name needs to be unique in a given storage location (file).
std::uint64_t fOnDiskHeaderSize
Set by the descriptor builder when deserialized.
RNTupleDescriptor()=default
RResult< void > DropClusterGroupDetails(ROOT::DescriptorId_t clusterGroupId)
std::uint16_t fVersionMajor
Set by the descriptor builder when deserialized.
std::vector< ROOT::DescriptorId_t > fSortedClusterGroupIds
References cluster groups sorted by entry range and thus allows for binary search.
std::unordered_map< ROOT::DescriptorId_t, RColumnDescriptor > fColumnDescriptors
ROOT::DescriptorId_t FindLogicalColumnId(ROOT::DescriptorId_t fieldId, std::uint32_t columnIndex, std::uint16_t representationIndex) const
std::unordered_map< ROOT::DescriptorId_t, RFieldDescriptor > fFieldDescriptors
ROOT::NTupleSize_t GetNElements(ROOT::DescriptorId_t physicalColumnId) const
RResult< void > AddClusterGroupDetails(ROOT::DescriptorId_t clusterGroupId, std::vector< RClusterDescriptor > &clusterDescs)
Methods to load and drop cluster group details (cluster IDs and page locations).
std::uint16_t fVersionPatch
Set by the descriptor builder when deserialized.
std::string fDescription
Free text from the user.
ROOT::Experimental::RNTupleAttrSetDescriptorIterable GetAttrSetIterable() const
RFieldDescriptorIterable GetTopLevelFields() const
std::uint16_t fVersionEpoch
Set by the descriptor builder when deserialized.
std::vector< RExtraTypeInfoDescriptor > fExtraTypeInfoDescriptors
RNTupleDescriptor Clone() const
std::size_t GetNClusterGroups() const
std::string GetQualifiedFieldName(ROOT::DescriptorId_t fieldId) const
Walks up the parents of the field ID and returns a field name of the form a.b.c.d. In case of invalid ...
RClusterDescriptorIterable GetClusterIterable() const
RNTupleDescriptor CloneSchema() const
Creates a descriptor containing only the schema information about this RNTuple, i....
std::uint64_t fGeneration
The generation of the descriptor.
ROOT::DescriptorId_t FindPrevClusterId(ROOT::DescriptorId_t clusterId) const
std::unique_ptr< RHeaderExtension > fHeaderExtension
Generic information about the physical location of data.
void SetType(ELocatorType type)
void SetNBytesOnStorage(std::uint64_t nBytesOnStorage)
static std::unique_ptr< RNTupleModel > Create()
static std::unique_ptr< RNTupleModel > CreateBare()
Creates a "bare model", i.e. an RNTupleModel with no default entry.
static constexpr std::uint16_t kVersionPatch
static constexpr std::uint16_t kVersionMajor
static constexpr std::uint16_t kVersionEpoch
static constexpr std::uint16_t kVersionMinor
The class is used as a return type for operations that can fail; wraps a value of type T or an RError...
static std::unique_ptr< RVectorField > CreateUntyped(std::string_view fieldName, std::unique_ptr< RFieldBase > itemField)
ROOT::DescriptorId_t CallFindClusterIdOn(const ROOT::RNTupleDescriptor &desc, ROOT::NTupleSize_t entryIdx)
RResult< void > EnsureValidNameForRNTuple(std::string_view name, std::string_view where)
Check whether a given string is a valid name according to the RNTuple specification.
ROOT::RResult< std::unique_ptr< ROOT::RFieldBase > > CallFieldBaseCreate(const std::string &fieldName, const std::string &typeName, const ROOT::RCreateFieldOptions &options, const ROOT::RNTupleDescriptor *desc, ROOT::DescriptorId_t fieldId)
bool IsCustomEnumFieldDesc(const RNTupleDescriptor &desc, const RFieldDescriptor &fieldDesc)
Tells if the field describes a user-defined enum type.
std::vector< ROOT::Internal::RNTupleClusterBoundaries > GetClusterBoundaries(const RNTupleDescriptor &desc)
Return the cluster boundaries for each cluster in this RNTuple.
std::string GetRenormalizedTypeName(const std::string &metaNormalizedName)
Given a type name normalized by ROOT meta, renormalize it for RNTuple. E.g., insert the std:: prefix.
bool IsStdAtomicFieldDesc(const RFieldDescriptor &fieldDesc)
Tells if the field describes a std::atomic<T> type.
std::uint64_t DescriptorId_t
Distinguishes elements of the same type within a descriptor, e.g. different fields.
constexpr NTupleSize_t kInvalidNTupleIndex
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
constexpr DescriptorId_t kInvalidDescriptorId
Additional information about a page in an in-memory RPageRange.
Information about a single page in the context of a cluster's page range.
void SetLocator(const RNTupleLocator &locator)
std::uint32_t GetNElements() const
void SetNElements(std::uint32_t n)
void SetEmulateUnknownTypes(bool v)
void SetReturnInvalidOnError(bool v)
bool GetReturnInvalidOnError() const
Modifiers passed to CreateModel().
bool GetCreateBare() const
bool GetEmulateUnknownTypes() const
bool GetReconstructProjections() const
bool GetForwardCompatible() const
static uint64_t sum(uint64_t i)