41#include <unordered_map>
91 return R__FAIL(
"page checksum verification failed, data corruption detected");
98 return R__FAIL(
"invalid attempt to extract non-existing page checksum");
100 assert(fBufferSize >= kNBytesPageChecksum);
103 reinterpret_cast<const unsigned char *
>(
fBuffer) + fBufferSize - kNBytesPageChecksum,
checksum);
127 for (std::size_t i = 0; i <
itr->second.size(); ++i) {
131 itr->second[i].fRefCounter--;
132 if (
itr->second[i].fRefCounter == 0) {
134 if (
itr->second.empty()) {
135 fColumnInfos.erase(
itr);
161 if (
clusterDesc.GetFirstEntryIndex() >= (fFirstEntry + fNEntries))
176std::unique_ptr<ROOT::Internal::RPageSource>
183 if (location.empty()) {
186 if (location.find(
"daos://") == 0)
188 return std::make_unique<ROOT::Experimental::Internal::RPageSourceDaos>(
ntupleName, location, options);
193 return std::make_unique<ROOT::Internal::RPageSourceFile>(
ntupleName, location, options);
214 if ((
range.fFirstEntry +
range.fNEntries) > GetNEntries()) {
224 fHasStructure =
true;
231 GetExclDescriptorGuard().MoveIn(AttachImpl(
mode));
237 auto clone = CloneImpl();
239 clone->GetExclDescriptorGuard().MoveIn(GetSharedDescriptorGuard()->Clone());
240 clone->fHasStructure =
true;
241 clone->fIsAttached =
true;
248 return GetSharedDescriptorGuard()->GetNEntries();
253 return GetSharedDescriptorGuard()->GetNElements(
columnHandle.fPhysicalId);
264 RNTupleAtomicTimer
timer(fCounters->fTimeWallUnzip, fCounters->fTimeCpuUnzip);
274 std::vector<std::unique_ptr<RColumnElementBase>>
allElements;
280 if (!fActivePhysicalColumns.HasColumnInfos(
columnId))
291 for (
const auto &pi :
pageRange.GetPageInfos()) {
296 sealedPage.SetBufferSize(pi.GetLocator().GetNBytesOnStorage() + pi.HasChecksum() * kNBytesPageChecksum);
323 fCounters->fNPageUnsealed.Add(
pageNo);
327 fTaskScheduler->Wait();
330 throw RException(
R__FAIL(
"page checksum verification failed, data corruption detected"));
352 pageInfo.GetLocator().GetNBytesOnStorage()));
367 GetSharedDescriptorGuard()->GetClusterDescriptor(
clusterId).GetFirstEntryIndex();
368 auto itr = fPreloadedClusters.
begin();
370 if (fPinnedClusters.count(
itr->second) > 0) {
373 fPagePool.Evict(
itr->second);
374 itr = fPreloadedClusters.erase(
itr);
378 while ((
itr != fPreloadedClusters.
end()) &&
383 while (
itr != fPreloadedClusters.
end()) {
384 if (fPinnedClusters.count(
itr->second) > 0) {
387 fPagePool.Evict(
itr->second);
388 itr = fPreloadedClusters.erase(
itr);
417 sealedPage.VerifyChecksumIfEnabled().ThrowOnError();
468 fCounters->fNPageRead.Inc();
469 fCounters->fNRead.Inc();
470 fCounters->fSzReadPayload.Add(
sealedPage.GetBufferSize());
472 if (!fCurrentCluster || (fCurrentCluster->GetId() !=
clusterId) || !fCurrentCluster->ContainsColumn(
columnId))
473 fCurrentCluster = fClusterPool.GetCluster(
clusterId, fActivePhysicalColumns.ToColumnSet());
483 auto onDiskPage = fCurrentCluster->GetOnDiskPage(key);
490 RNTupleAtomicTimer
timer(fCounters->fTimeWallUnzip, fCounters->fTimeCpuUnzip);
497 fCounters->fNPageUnsealed.Inc();
510 UpdateLastUsedCluster(
cachedPageRef.Get().GetClusterInfo().GetId());
570 fMetrics.ObserveMetrics(fClusterPool.GetMetrics());
571 fMetrics.ObserveMetrics(fPagePool.GetMetrics());
572 fCounters = std::make_unique<RCounters>(
RCounters{
575 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"szReadPayload",
"B",
"volume read from storage (required)"),
576 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"szReadOverhead",
"B",
"volume read from storage (overhead)"),
579 "number of partial clusters preloaded from storage"),
580 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"nPageRead",
"",
"number of pages read from storage"),
581 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"nPageUnsealed",
"",
"number of pages unzipped and decoded"),
582 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"timeWallRead",
"ns",
"wall clock time spent reading"),
583 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"timeWallUnzip",
"ns",
"wall clock time spent decompressing"),
586 "CPU time spent decompressing"),
588 "bwRead",
"MB/s",
"bandwidth compressed bytes read per second", fMetrics,
605 "bwReadUnzip",
"MB/s",
"bandwidth uncompressed bytes read per second", fMetrics,
619 "bwUnzip",
"MB/s",
"decompression bandwidth of uncompressed bytes per second", fMetrics,
633 "rtReadEfficiency",
"",
"ratio of payload over all bytes read", fMetrics,
639 return {
true, 1. / (1. + (1. *
szReadOverhead->GetValueAsInt()) / payload)};
645 *fMetrics.MakeCounter<
RNTupleCalcPerf *>(
"rtCompression",
"",
"ratio of compressed bytes / uncompressed bytes",
648 metrics.GetLocalCounter(
"szReadPayload")) {
706 if (fHasStreamerInfosRegistered)
709 for (
const auto &
extraTypeInfo : fDescriptor.GetExtraTypeInfoIterable()) {
717 fHasStreamerInfosRegistered =
true;
725 if (fCurrentPageSize ==
other.fCurrentPageSize)
726 return fColumn->GetOnDiskId() >
other.fColumn->GetOnDiskId();
727 return fCurrentPageSize >
other.fCurrentPageSize;
735 auto itr = fColumnsSortedByPageSize.
begin();
736 while (
itr != fColumnsSortedByPageSize.
end()) {
739 if (
itr->fCurrentPageSize ==
itr->fInitialPageSize) {
748 if (
itr != fColumnsSortedByPageSize.
end())
757 itr = fColumnsSortedByPageSize.find(next);
766 auto itr = fColumnsSortedByPageSize.find(key);
767 if (
itr == fColumnsSortedByPageSize.
end()) {
781 fColumnsSortedByPageSize.erase(
itr);
787 fColumnsSortedByPageSize.insert(
elem);
796 fColumnsSortedByPageSize.insert(
elem);
801 fColumnsSortedByPageSize.insert(
elem);
808 :
RPageStorage(
name), fOptions(options.Clone()), fWritePageMemoryManager(options.GetPageBufferBudget())
821 unsigned char *
pageBuf =
reinterpret_cast<unsigned char *
>(config.
fPage->GetBuffer());
826 if (!config.
fElement->IsMappable()) {
855 const auto nBytes =
page.GetNBytes() + GetWriteOptions().GetEnablePageChecksums() * kNBytesPageChecksum;
856 if (fSealPageBuffer.size() <
nBytes)
857 fSealPageBuffer.resize(
nBytes);
863 config.
fWriteChecksum = GetWriteOptions().GetEnablePageChecksums();
865 config.
fBuffer = fSealPageBuffer.data();
867 return SealPage(config);
872 for (
const auto &
cb : fOnDatasetCommitCallbacks)
874 return CommitDatasetImpl();
889std::unique_ptr<ROOT::Internal::RPageSink>
896 if (location.empty()) {
899 if (location.find(
"daos://") == 0) {
901 return std::make_unique<ROOT::Experimental::Internal::RPageSinkDaos>(
ntupleName, location, options);
908 return std::make_unique<ROOT::Internal::RPageSinkFile>(
ntupleName, location, options);
922 auto columnId = fDescriptorBuilder.GetDescriptor().GetNPhysicalColumns();
937 fDescriptorBuilder.AddColumn(
columnBuilder.MakeDescriptor().Unwrap());
944 if (fIsInitialized) {
952 const auto &
descriptor = fDescriptorBuilder.GetDescriptor();
958 const auto &
reps =
f.GetColumnRepresentatives();
961 return reps.size() *
reps[0].size();
975 fDescriptorBuilder.AddFieldLink(
f.GetParent()->GetOnDiskId(),
fieldId);
984 fDescriptorBuilder.AddFieldLink(
f.GetParent()->GetOnDiskId(),
fieldId);
991 .PhysicalColumnId(
source.GetLogicalId())
993 .BitsOnStorage(
source.GetBitsOnStorage())
994 .ValueRange(
source.GetValueRange())
997 .RepresentationIndex(
source.GetRepresentationIndex());
998 fDescriptorBuilder.AddColumn(
columnBuilder.MakeDescriptor().Unwrap());
1009 for (
auto f :
changeset.fAddedProjectedFields) {
1026 columnRange.SetCompressionSettings(GetWriteOptions().GetCompression());
1030 fOpenPageRanges.emplace_back(std::move(
pageRange));
1035 if (fSerializationContext.GetHeaderSize() > 0)
1036 fSerializationContext.MapSchema(
descriptor,
true);
1042 throw RException(
R__FAIL(
"ROOT bug: unexpected type extra info in UpdateExtraTypeInfo()"));
1049 fDescriptorBuilder.SetNTuple(fNTupleName, model.
GetDescription());
1050 const auto &
descriptor = fDescriptorBuilder.GetDescriptor();
1060 for (
auto f :
fieldZero.GetMutableSubfields())
1070 InitImpl(buffer.get(), fSerializationContext.GetHeaderSize());
1072 fDescriptorBuilder.BeginHeaderExtension();
1075std::unique_ptr<ROOT::RNTupleModel>
1080 const auto &
descriptor = fDescriptorBuilder.GetDescriptor();
1084 R__ASSERT(fOpenColumnRanges.empty() && fOpenPageRanges.empty());
1085 fOpenColumnRanges.reserve(
nColumns);
1088 const auto &column =
descriptor.GetColumnDescriptor(i);
1091 columnRange.SetFirstElementIndex(column.GetFirstElementIndex());
1093 columnRange.SetCompressionSettings(GetWriteOptions().GetCompression());
1097 fOpenPageRanges.emplace_back(std::move(
pageRange));
1106 for (
unsigned int i = 0; i < fOpenColumnRanges.size(); ++i) {
1107 R__ASSERT(fOpenColumnRanges[i].GetPhysicalColumnId() == i);
1108 if (!
cluster.ContainsColumn(i))
1113 fOpenColumnRanges[i].IncrementFirstElementIndex(
columnRange.GetNElements());
1115 fDescriptorBuilder.AddCluster(
cluster.Clone());
1124 modelOpts.SetReconstructProjections(
true);
1130 projectedFields.GetFieldZero().SetOnDiskId(model->GetConstFieldZero().GetOnDiskId());
1137 InitImpl(buffer.get(), fSerializationContext.GetHeaderSize());
1139 fDescriptorBuilder.BeginHeaderExtension();
1142 fIsInitialized =
true;
1149 fOpenColumnRanges.at(
columnHandle.fPhysicalId).SetIsSuppressed(
true);
1154 fOpenColumnRanges.at(
columnHandle.fPhysicalId).IncrementNElements(
page.GetNElements());
1159 pageInfo.SetHasChecksum(GetWriteOptions().GetEnablePageChecksums());
1175std::vector<ROOT::RNTupleLocator>
1177 const std::vector<bool> &
mask)
1179 std::vector<ROOT::RNTupleLocator>
locators;
1182 for (
auto &
range : ranges) {
1200 std::vector<bool>
mask;
1204 std::unordered_map<std::uint64_t, RSealedPageLink>
originalPages;
1206 for (
auto &
range : ranges) {
1212 if (!fFeatures.fCanMergePages || !fOptions->GetEnableSamePageMerging()) {
1213 mask.emplace_back(
true);
1224 mask.emplace_back(
true);
1229 const auto *
p =
itr->second.fSealedPage;
1232 mask.emplace_back(
true);
1237 mask.emplace_back(
false);
1241 mask.shrink_to_fit();
1248 for (
auto &
range : ranges) {
1250 fOpenColumnRanges.at(
range.fPhysicalColumnId).IncrementNElements(
sealedPageIt->GetNElements());
1256 fOpenPageRanges.at(
range.fPhysicalColumnId).GetPageInfos().emplace_back(
pageInfo);
1268 for (
unsigned int i = 0; i < fOpenColumnRanges.size(); ++i) {
1270 columnInfo.fCompressionSettings = fOpenColumnRanges[i].GetCompressionSettings().value();
1271 if (fOpenColumnRanges[i].IsSuppressed()) {
1272 assert(fOpenPageRanges[i].GetPageInfos().empty());
1273 columnInfo.fPageRange.SetPhysicalColumnId(i);
1276 fOpenColumnRanges[i].SetNElements(0);
1277 fOpenColumnRanges[i].SetIsSuppressed(
false);
1279 std::swap(
columnInfo.fPageRange, fOpenPageRanges[i]);
1280 fOpenPageRanges[i].SetPhysicalColumnId(i);
1282 columnInfo.fNElements = fOpenColumnRanges[i].GetNElements();
1283 fOpenColumnRanges[i].SetNElements(0);
1295 clusterBuilder.ClusterId(fDescriptorBuilder.GetDescriptor().GetNActiveClusters())
1296 .FirstEntryIndex(fPrevClusterNEntries)
1306 fOpenColumnRanges[
colId].IncrementFirstElementIndex(
columnInfo.fNElements);
1310 clusterBuilder.CommitSuppressedColumnRanges(fDescriptorBuilder.GetDescriptor()).ThrowOnError();
1323 fDescriptorBuilder.AddCluster(
clusterBuilder.MoveDescriptor().Unwrap());
1324 fPrevClusterNEntries +=
cluster.fNEntries;
1330 const auto &
descriptor = fDescriptorBuilder.GetDescriptor();
1335 for (
auto i = fNextClusterInGroup; i <
nClusters; ++i) {
1336 physClusterIDs.emplace_back(fSerializationContext.MapClusterId(i));
1349 cgBuilder.MinEntry(0).EntrySpan(0).NClusters(0);
1356 .NClusters(
nClusters - fNextClusterInGroup);
1358 std::vector<ROOT::DescriptorId_t>
clusterIds;
1360 for (
auto i = fNextClusterInGroup; i <
nClusters; ++i) {
1364 fDescriptorBuilder.AddClusterGroup(
cgBuilder.MoveDescriptor().Unwrap());
1382 fDescriptorBuilder.AddAttributeSet(std::move(
attrSetDesc)).ThrowOnError();
1387 if (!fInfosOfStreamerFields.empty()) {
1390 for (
const auto &
etDesc : fDescriptorBuilder.GetDescriptor().GetExtraTypeInfoIterable()) {
1397 fInfosOfStreamerFields.merge(
etInfo);
1404 fDescriptorBuilder.ReplaceExtraTypeInfo(
extraInfoBuilder.MoveDescriptor().Unwrap());
1407 const auto &
descriptor = fDescriptorBuilder.GetDescriptor();
1419 fCounters = std::make_unique<RCounters>(
RCounters{
1420 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"nPageCommitted",
"",
"number of pages committed to storage"),
1421 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"szWritePayload",
"B",
"volume written for committed pages"),
1423 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"timeWallWrite",
"ns",
"wall clock time spent writing"),
1424 *fMetrics.MakeCounter<
RNTupleAtomicCounter *>(
"timeWallZip",
"ns",
"wall clock time spent compressing"),
1427 "CPU time spent compressing")});
#define R__FORWARD_ERROR(res)
Short-hand to return an RResult<T> in an error state (i.e. after checking)
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
#define R__ASSERT(e)
Checks condition e and reports a fatal error if it's false.
winID h TVirtualViewer3D TVirtualGLPainter p
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t mask
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t result
Option_t Option_t TPoint TPoint const char mode
A thread-safe integral performance counter.
A metric element that computes its floating point value from other counters.
A collection of Counter objects with a name, a unit, and a description.
A helper class for piece-wise construction of an RClusterDescriptor.
A helper class for piece-wise construction of an RClusterGroupDescriptor.
An in-memory subset of the packed and compressed pages of a cluster.
std::unordered_set< ROOT::DescriptorId_t > ColumnSet_t
A helper class for piece-wise construction of an RColumnDescriptor.
A column element encapsulates the translation between basic C++ types and their column representation...
virtual RIdentifier GetIdentifier() const =0
A column is a storage-backed array of a simple, fixed-size type, from which pages can be mapped into ...
std::optional< std::pair< double, double > > GetValueRange() const
std::uint16_t GetRepresentationIndex() const
ROOT::Internal::RColumnElementBase * GetElement() const
ROOT::ENTupleColumnType GetType() const
ROOT::NTupleSize_t GetFirstElementIndex() const
std::size_t GetWritePageCapacity() const
std::uint16_t GetBitsOnStorage() const
std::uint32_t GetIndex() const
A helper class for piece-wise construction of an RFieldDescriptor.
static RFieldDescriptorBuilder FromField(const ROOT::RFieldBase &field)
Make a new RFieldDescriptorBuilder based off a live RNTuple field.
static std::size_t Zip(const void *from, std::size_t nbytes, int compression, void *to)
Returns the size of the compressed data, written into the provided output buffer.
static void Unzip(const void *from, size_t nbytes, size_t dataLen, void *to)
The nbytes parameter provides the size ls of the from buffer.
static unsigned int GetClusterBunchSize(const RNTupleReadOptions &options)
A helper class for serializing and deserialization of the RNTuple binary format.
static std::uint32_t SerializeXxHash3(const unsigned char *data, std::uint64_t length, std::uint64_t &xxhash3, void *buffer)
Writes a XxHash-3 64bit checksum of the byte range given by data and length.
static RResult< StreamerInfoMap_t > DeserializeStreamerInfos(const std::string &extraTypeInfoContent)
static RResult< void > VerifyXxHash3(const unsigned char *data, std::uint64_t length, std::uint64_t &xxhash3)
Expects an xxhash3 checksum in the 8 bytes following data + length and verifies it.
EDescriptorDeserializeMode
static RResult< std::uint32_t > SerializePageList(void *buffer, const RNTupleDescriptor &desc, std::span< ROOT::DescriptorId_t > physClusterIDs, const RContext &context)
static RResult< std::uint32_t > SerializeFooter(void *buffer, const RNTupleDescriptor &desc, const RContext &context)
static std::uint32_t DeserializeUInt64(const void *buffer, std::uint64_t &val)
static RResult< RContext > SerializeHeader(void *buffer, const RNTupleDescriptor &desc)
static std::string SerializeStreamerInfos(const StreamerInfoMap_t &infos)
A memory region that contains packed and compressed pages.
A page as being stored on disk, that is packed and compressed.
Uses standard C++ memory allocation for the column data pages.
Abstract interface to allocate and release pages.
RStagedCluster StageCluster(ROOT::NTupleSize_t nNewEntries) final
Stage the current cluster and create a new one for the following data.
void UpdateSchema(const ROOT::Internal::RNTupleModelChangeset &changeset, ROOT::NTupleSize_t firstEntry) override
Incorporate incremental changes to the model into the ntuple descriptor.
void CommitSealedPage(ROOT::DescriptorId_t physicalColumnId, const RPageStorage::RSealedPage &sealedPage) final
Write a preprocessed page to storage. The column must have been added before.
std::unique_ptr< RNTupleModel > InitFromDescriptor(const ROOT::RNTupleDescriptor &descriptor, bool copyClusters)
Initialize sink based on an existing descriptor and fill into the descriptor builder,...
void UpdateExtraTypeInfo(const ROOT::RExtraTypeInfoDescriptor &extraTypeInfo) final
Adds an extra type information record to schema.
void CommitAttributeSet(std::string_view attrSetName, const RNTupleLink &attrAnchorInfo) final
Adds the given anchor information (name + locator) into the main RNTuple's descriptor as an attribute...
ColumnHandle_t AddColumn(ROOT::DescriptorId_t fieldId, ROOT::Internal::RColumn &column) final
Register a new column.
virtual std::vector< RNTupleLocator > CommitSealedPageVImpl(std::span< RPageStorage::RSealedPageGroup > ranges, const std::vector< bool > &mask)
Vector commit of preprocessed pages.
RPagePersistentSink(std::string_view ntupleName, const ROOT::RNTupleWriteOptions &options)
void CommitSuppressedColumn(ColumnHandle_t columnHandle) final
Commits a suppressed column for the current cluster.
void CommitStagedClusters(std::span< RStagedCluster > clusters) final
Commit staged clusters, logically appending them to the ntuple descriptor.
static std::unique_ptr< RPageSink > Create(std::string_view ntupleName, std::string_view location, const ROOT::RNTupleWriteOptions &options=ROOT::RNTupleWriteOptions())
Guess the concrete derived page source from the location.
void CommitPage(ColumnHandle_t columnHandle, const ROOT::Internal::RPage &page) final
Write a page to the storage. The column must have been added before.
RNTupleLink CommitDatasetImpl() final
~RPagePersistentSink() override
virtual void InitImpl(unsigned char *serializedHeader, std::uint32_t length)=0
void CommitClusterGroup() final
Write out the page locations (page list envelope) for all the committed clusters since the last call ...
void CommitSealedPageV(std::span< RPageStorage::RSealedPageGroup > ranges) final
Write a vector of preprocessed pages to storage. The corresponding columns must have been added befor...
void EnableDefaultMetrics(const std::string &prefix)
Enables the default set of metrics provided by RPageSink.
Abstract interface to write data into an ntuple.
RNTupleLink CommitDataset()
Run the registered callbacks and finalize the current cluster and the entrire data set.
virtual ROOT::Internal::RPage ReservePage(ColumnHandle_t columnHandle, std::size_t nElements)
Get a new, empty page for the given column that can be filled with up to nElements; nElements must be...
RSealedPage SealPage(const ROOT::Internal::RPage &page, const ROOT::Internal::RColumnElementBase &element)
Helper for streaming a page.
RPageSink(std::string_view ntupleName, const ROOT::RNTupleWriteOptions &options)
void Insert(ROOT::DescriptorId_t physicalColumnId, ROOT::Internal::RColumnElementBase::RIdentifier elementId)
ROOT::Internal::RCluster::ColumnSet_t ToColumnSet() const
void Erase(ROOT::DescriptorId_t physicalColumnId, ROOT::Internal::RColumnElementBase::RIdentifier elementId)
void LoadStructure()
Loads header and footer without decompressing or deserializing them.
virtual ROOT::Internal::RPageRef LoadPage(ColumnHandle_t columnHandle, ROOT::NTupleSize_t globalIndex)
Allocates and fills a page that contains the index-th element.
void RegisterStreamerInfos()
Builds the streamer info records from the descriptor's extra type info section.
void Attach(ROOT::Internal::RNTupleSerializer::EDescriptorDeserializeMode mode=ROOT::Internal::RNTupleSerializer::EDescriptorDeserializeMode::kForReading)
Open the physical storage container and deserialize header and footer.
ColumnHandle_t AddColumn(ROOT::DescriptorId_t fieldId, ROOT::Internal::RColumn &column) override
Register a new column.
void UnzipCluster(ROOT::Internal::RCluster *cluster)
Parallel decompression and unpacking of the pages in the given cluster.
void PrepareLoadCluster(const ROOT::Internal::RCluster::RKey &clusterKey, ROOT::Internal::ROnDiskPageMap &pageZeroMap, std::function< void(ROOT::DescriptorId_t, ROOT::NTupleSize_t, const ROOT::RClusterDescriptor::RPageInfo &)> perPageFunc)
Prepare a page range read for the column set in clusterKey.
void EnableDefaultMetrics(const std::string &prefix)
Enables the default set of metrics provided by RPageSource.
ROOT::NTupleSize_t GetNEntries()
ROOT::Internal::RPageRef LoadZeroPage(ColumnHandle_t columnHandle, const RPageSummary &pageSummary)
void UpdateLastUsedCluster(ROOT::DescriptorId_t clusterId)
Does nothing if fLastUsedCluster == clusterId.
ROOT::NTupleSize_t GetNElements(ColumnHandle_t columnHandle)
ROOT::Internal::RPageRef LoadPageFromSummary(ColumnHandle_t columnHandle, const RPageSummary &pageSummary)
void DropColumn(ColumnHandle_t columnHandle) override
Unregisters a column.
void LoadSealedPage(ROOT::DescriptorId_t physicalColumnId, RNTupleLocalIndex localIndex, RSealedPage &sealedPage)
Read the packed and compressed bytes of a page into the memory buffer provided by sealedPage.
virtual void UnzipClusterImpl(ROOT::Internal::RCluster *cluster)
RPageSource(std::string_view ntupleName, const ROOT::RNTupleReadOptions &fOptions)
void SetEntryRange(const REntryRange &range)
Promise to only read from the given entry range.
std::unique_ptr< RPageSource > Clone() const
Open the same storage multiple time, e.g.
static std::unique_ptr< RPageSource > Create(std::string_view ntupleName, std::string_view location, const ROOT::RNTupleReadOptions &options=ROOT::RNTupleReadOptions())
Guess the concrete derived page source from the file name (location)
static RResult< ROOT::Internal::RPage > UnsealPage(const RSealedPage &sealedPage, const ROOT::Internal::RColumnElementBase &element, ROOT::Internal::RPageAllocator &pageAlloc)
Helper for unstreaming a page.
Common functionality of an ntuple storage for both reading and writing.
RPageStorage(std::string_view name)
Stores information about the cluster in which this page resides.
A page is a slice of a column that is mapped into memory.
static const void * GetPageZeroBuffer()
Return a pointer to the page zero buffer used if there is no on-disk data for a particular deferred c...
const ROOT::RFieldBase * GetSourceField(const ROOT::RFieldBase *target) const
bool TryEvict(std::size_t targetAvailableSize, std::size_t pageSizeLimit)
Flush columns in order of allocated write page size until the sum of all write page allocations leave...
bool TryUpdate(ROOT::Internal::RColumn &column, std::size_t newWritePageSize)
Try to register the new write page size for the given column.
The window of element indexes of a particular column in a particular cluster.
Metadata for RNTuple clusters.
Base class for all ROOT issued exceptions.
A field translates read and write calls from/to underlying columns to/from tree values.
The on-storage metadata of an RNTuple.
Addresses a column element or field item relative to a particular cluster, instead of a global NTuple...
The RNTupleModel encapulates the schema of an RNTuple.
const std::string & GetDescription() const
Common user-tunable settings for reading RNTuples.
Common user-tunable settings for storing RNTuples.
const_iterator begin() const
const_iterator end() const
void ThrowOnError()
Short-hand method to throw an exception in the case of errors.
The class is used as a return type for operations that can fail; wraps a value of type T or an RError...
ROOT::RFieldZero & GetFieldZeroOfModel(RNTupleModel &model)
RResult< void > EnsureValidNameForRNTuple(std::string_view name, std::string_view where)
Check whether a given string is a valid name according to the RNTuple specification.
std::unique_ptr< T[]> MakeUninitArray(std::size_t size)
Make an array of default-initialized elements.
RProjectedFields & GetProjectedFieldsOfModel(RNTupleModel &model)
std::unique_ptr< RColumnElementBase > GenerateColumnElement(std::type_index inMemoryType, ROOT::ENTupleColumnType onDiskType)
void CallConnectPageSinkOnField(RFieldBase &, ROOT::Internal::RPageSink &, ROOT::NTupleSize_t firstEntry=0)
std::uint64_t DescriptorId_t
Distriniguishes elements of the same type within a descriptor, e.g. different fields.
constexpr NTupleSize_t kInvalidNTupleIndex
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
constexpr DescriptorId_t kInvalidDescriptorId
The identifiers that specifies the content of a (partial) cluster.
Every concrete RColumnElement type is identified by its on-disk type (column type) and the in-memory ...
The incremental changes to a RNTupleModel
On-disk pages within a page source are identified by the column and page number.
Default I/O performance counters that get registered in fMetrics.
Parameters for the SealPage() method.
bool fWriteChecksum
Adds a 8 byte little-endian xxhash3 checksum to the page payload.
std::uint32_t fCompressionSettings
Compression algorithm and level to apply.
void * fBuffer
Location for sealed output. The memory buffer has to be large enough.
const ROOT::Internal::RPage * fPage
Input page to be sealed.
bool fAllowAlias
If false, the output buffer must not point to the input page buffer, which would otherwise be an opti...
const ROOT::Internal::RColumnElementBase * fElement
Corresponds to the page's elements, for size calculation etc.
Cluster that was staged, but not yet logically appended to the RNTuple.
Default I/O performance counters that get registered in fMetrics
Used in SetEntryRange / GetEntryRange.
bool IntersectsWith(const ROOT::RClusterDescriptor &clusterDesc) const
Returns true if the given cluster has entries within the entry range.
Summarizes meta-data necessary to load a certain page. Used by LoadPageFromSummary().
A sealed page contains the bytes of a page as written to storage (packed & compressed).
RResult< void > VerifyChecksumIfEnabled() const
RResult< std::uint64_t > GetChecksum() const
Returns a failure if the sealed page has no checksum.
ROOT::Internal::RColumn * fColumn
bool operator>(const RColumnInfo &other) const
Information about a single page in the context of a cluster's page range.
Modifiers passed to CreateModel()