47enum EDaosMapping { kOidPerCluster, kOidPerPage };
51 DistributionKey_t fDkey;
59static constexpr DistributionKey_t kDistributionKeyDefault = 0x5a3c69f0cafe4a11;
60static constexpr AttributeKey_t kAttributeKeyDefault = 0x4243544b53444229;
61static constexpr AttributeKey_t kAttributeKeyAnchor = 0x4243544b5344422a;
62static constexpr AttributeKey_t kAttributeKeyHeader = 0x4243544b5344422b;
63static constexpr AttributeKey_t kAttributeKeyFooter = 0x4243544b5344422c;
71static constexpr EDaosMapping kDefaultDaosMapping = kOidPerCluster;
73template <EDaosMapping mapping>
75 long unsigned columnId,
long unsigned pageCount)
77 if constexpr (mapping == kOidPerCluster) {
80 static_cast<DistributionKey_t
>(columnId),
static_cast<AttributeKey_t
>(pageCount)};
81 }
else if constexpr (mapping == kOidPerPage) {
84 kDistributionKeyDefault, kAttributeKeyDefault};
90 std::string fPoolLabel;
92 std::string fContainerLabel;
98RDaosURI ParseDaosURI(std::string_view uri)
100 std::regex re(
"daos://([^/]+)/(.+)");
102 if (!std::regex_match(uri.data(),
m, re))
114 if (buffer !=
nullptr) {
115 auto bytes =
reinterpret_cast<unsigned char *
>(buffer);
123 return RNTupleSerializer::SerializeString(
fObjClass,
nullptr) + 20;
130 return R__FAIL(
"DAOS anchor too short");
133 auto bytes =
reinterpret_cast<const unsigned char *
>(buffer);
134 bytes += RNTupleSerializer::DeserializeUInt32(
bytes, fVersion);
135 bytes += RNTupleSerializer::DeserializeUInt32(
bytes, fNBytesHeader);
136 bytes += RNTupleSerializer::DeserializeUInt32(
bytes, fLenHeader);
137 bytes += RNTupleSerializer::DeserializeUInt32(
bytes, fNBytesFooter);
138 bytes += RNTupleSerializer::DeserializeUInt32(
bytes, fLenFooter);
139 auto result = RNTupleSerializer::DeserializeString(
bytes, bufSize - 20, fObjClass);
142 return result.Unwrap() + 20;
155 std::unique_ptr<unsigned char[]> buffer, zipBuffer;
156 auto &anchor = fAnchor.emplace();
162 buffer = std::make_unique<unsigned char[]>(anchorSize);
163 if ((err = cont.
ReadSingleAkey(buffer.get(), anchorSize, oidMetadata, kDistributionKeyDefault, kAttributeKeyAnchor,
167 anchor.Deserialize(buffer.get(), anchorSize).Unwrap();
170 buffer = std::make_unique<unsigned char[]>(anchor.fLenHeader);
171 zipBuffer = std::make_unique<unsigned char[]>(anchor.fNBytesHeader);
172 if ((err = cont.
ReadSingleAkey(zipBuffer.get(), anchor.fNBytesHeader, oidMetadata, kDistributionKeyDefault,
173 kAttributeKeyHeader, kCidMetadata)))
175 decompressor.
Unzip(zipBuffer.get(), anchor.fNBytesHeader, anchor.fLenHeader, buffer.get());
179 buffer = std::make_unique<unsigned char[]>(anchor.fLenFooter);
180 zipBuffer = std::make_unique<unsigned char[]>(anchor.fNBytesFooter);
181 if ((err = cont.
ReadSingleAkey(zipBuffer.get(), anchor.fNBytesFooter, oidMetadata, kDistributionKeyDefault,
182 kAttributeKeyFooter, kCidMetadata)))
184 decompressor.
Unzip(zipBuffer.get(), anchor.fNBytesFooter, anchor.fLenFooter, buffer.get());
190std::pair<ROOT::Experimental::Detail::RDaosContainerNTupleLocator, ROOT::Experimental::RNTupleDescriptorBuilder>
192 const std::string &ntupleName,
198 auto &builder =
result.second;
200 if (
int err = loc.InitNTupleDescriptorBuilder(cont, decompressor, builder); !err) {
201 if (ntupleName.empty() || ntupleName != builder.GetDescriptor().GetName()) {
204 R__FAIL(
"LocateNTuple: ntuple name '" + ntupleName +
"' unavailable in this container."));
217 <<
"Do not store real data with this version of RNTuple!";
218 fCompressor = std::make_unique<RNTupleCompressor>();
225 unsigned char *serializedHeader, std::uint32_t
length)
230 if (oclass.IsUnknown())
233 auto args = ParseDaosURI(fURI);
234 auto pool = std::make_shared<RDaosPool>(args.fPoolLabel);
235 fDaosContainer = std::make_unique<RDaosContainer>(pool, args.fContainerLabel,
true);
236 fDaosContainer->SetDefaultObjectClass(oclass);
240 fNTupleIndex = locator.GetIndex();
242 auto zipBuffer = std::make_unique<unsigned char[]>(
length);
243 auto szZipHeader = fCompressor->Zip(serializedHeader,
length, GetWriteOptions().GetCompression(),
245 WriteNTupleHeader(zipBuffer.get(), szZipHeader,
length);
255 sealedPage = SealPage(page, *element, GetWriteOptions().GetCompression());
259 return CommitSealedPageImpl(columnHandle.
fId, sealedPage);
266 auto offsetData = fPageId.fetch_add(1);
267 DescriptorId_t clusterId = fDescriptorBuilder.GetDescriptor().GetNClusters();
271 RDaosKey daosKey = GetPageDaosKey<kDefaultDaosMapping>(fNTupleIndex, clusterId, columnId, offsetData);
272 fDaosContainer->WriteSingleAkey(sealedPage.
fBuffer, sealedPage.
fSize, daosKey.fOid, daosKey.fDkey, daosKey.fAkey);
276 result.fPosition = offsetData;
278 fCounters->fNPageCommitted.Inc();
279 fCounters->fSzWritePayload.Add(sealedPage.
fSize);
280 fNBytesCurrentCluster += sealedPage.
fSize;
284std::vector<ROOT::Experimental::RNTupleLocator>
288 std::vector<ROOT::Experimental::RNTupleLocator> locators;
291 return c + std::distance(r.fFirst, r.fLast);
293 locators.reserve(nPages);
295 DescriptorId_t clusterId = fDescriptorBuilder.GetDescriptor().GetNClusters();
296 std::size_t szPayload = 0;
299 for (
auto &range : ranges) {
300 for (
auto sealedPageIt = range.fFirst; sealedPageIt != range.fLast; ++sealedPageIt) {
304 auto offsetData = fPageId.fetch_add(1);
306 RDaosKey daosKey = GetPageDaosKey<kDefaultDaosMapping>(fNTupleIndex, clusterId, range.fColumnId, offsetData);
309 it->second.insert(daosKey.fAkey, pageIov);
314 locators.push_back(locator);
316 szPayload += s.
fSize;
319 fNBytesCurrentCluster += szPayload;
323 if (
int err = fDaosContainer->WriteV(writeRequests))
327 fCounters->fNPageCommitted.Add(nPages);
328 fCounters->fSzWritePayload.Add(szPayload);
336 return std::exchange(fNBytesCurrentCluster, 0);
343 auto bufPageListZip = std::make_unique<unsigned char[]>(
length);
344 auto szPageListZip = fCompressor->Zip(serializedPageList,
length, GetWriteOptions().GetCompression(),
347 auto offsetData = fClusterGroupId.fetch_add(1);
348 fDaosContainer->WriteSingleAkey(
349 bufPageListZip.get(), szPageListZip,
350 daos_obj_id_t{kOidLowPageList, static_cast<decltype(daos_obj_id_t::hi)>(fNTupleIndex)}, kDistributionKeyDefault,
351 offsetData, kCidMetadata);
353 result.fPosition = offsetData;
354 result.fBytesOnStorage = szPageListZip;
355 fCounters->fSzWritePayload.Add(szPageListZip);
361 auto bufFooterZip = std::make_unique<unsigned char[]>(
length);
362 auto szFooterZip = fCompressor->Zip(serializedFooter,
length, GetWriteOptions().GetCompression(),
364 WriteNTupleFooter(bufFooterZip.get(), szFooterZip,
length);
370 fDaosContainer->WriteSingleAkey(
372 kDistributionKeyDefault, kAttributeKeyHeader, kCidMetadata);
373 fNTupleAnchor.fLenHeader = lenHeader;
374 fNTupleAnchor.fNBytesHeader = nbytes;
379 fDaosContainer->WriteSingleAkey(
381 kDistributionKeyDefault, kAttributeKeyFooter, kCidMetadata);
382 fNTupleAnchor.fLenFooter = lenFooter;
383 fNTupleAnchor.fNBytesFooter = nbytes;
389 auto buffer = std::make_unique<unsigned char[]>(ntplSize);
390 fNTupleAnchor.Serialize(buffer.get());
391 fDaosContainer->WriteSingleAkey(
392 buffer.get(), ntplSize,
daos_obj_id_t{kOidLowMetadata, static_cast<decltype(daos_obj_id_t::hi)>(fNTupleIndex)},
393 kDistributionKeyDefault, kAttributeKeyAnchor, kCidMetadata);
402 return fPageAllocator->NewPage(columnHandle.
fId, elementSize, nElements);
407 fPageAllocator->DeletePage(page);
414 std::size_t nElements)
416 RPage newPage(columnId, mem, elementSize, nElements);
425 delete[]
reinterpret_cast<unsigned char *
>(page.
GetBuffer());
433 fPagePool(std::make_shared<
RPagePool>()), fURI(uri),
434 fClusterPool(std::make_unique<
RClusterPool>(*this, options.GetClusterBunchSize()))
439 auto args = ParseDaosURI(uri);
440 auto pool = std::make_shared<RDaosPool>(args.fPoolLabel);
441 fDaosContainer = std::make_unique<RDaosContainer>(pool, args.fContainerLabel);
449 std::unique_ptr<unsigned char[]> buffer, zipBuffer;
451 auto [locator, descBuilder] =
453 if (!locator.IsValid())
455 R__FAIL(
"Attach: requested ntuple '" + fNTupleName +
"' is not present in DAOS container."));
458 if (oclass.IsUnknown())
461 fDaosContainer->SetDefaultObjectClass(oclass);
462 fNTupleIndex = locator.GetIndex();
464 ntplDesc = descBuilder.MoveDescriptor();
468 buffer = std::make_unique<unsigned char[]>(cgDesc.GetPageListLength());
469 zipBuffer = std::make_unique<unsigned char[]>(cgDesc.GetPageListLocator().fBytesOnStorage);
470 fDaosContainer->ReadSingleAkey(zipBuffer.get(), cgDesc.GetPageListLocator().fBytesOnStorage, oidPageList,
471 kDistributionKeyDefault, cgDesc.GetPageListLocator().GetPosition<std::uint64_t>(),
473 fDecompressor->Unzip(zipBuffer.get(), cgDesc.GetPageListLocator().fBytesOnStorage, cgDesc.GetPageListLength(),
478 for (std::size_t i = 0; i < clusters.size(); ++i) {
488 return fDaosContainer->GetDefaultObjectClass().ToString();
499 auto descriptorGuard = GetSharedDescriptorGuard();
500 const auto &clusterDescriptor = descriptorGuard->GetClusterDescriptor(clusterId);
501 pageInfo = clusterDescriptor.GetPageRange(columnId).Find(clusterIndex.
GetIndex());
505 sealedPage.
fSize = bytesOnStorage;
508 RDaosKey daosKey = GetPageDaosKey<kDefaultDaosMapping>(fNTupleIndex, clusterId, columnId,
510 fDaosContainer->ReadSingleAkey(
const_cast<void *
>(sealedPage.
fBuffer), bytesOnStorage, daosKey.fOid,
511 daosKey.fDkey, daosKey.fAkey);
520 const auto columnId = columnHandle.
fId;
521 const auto clusterId = clusterInfo.
fClusterId;
522 const auto &pageInfo = clusterInfo.
fPageInfo;
525 const auto elementSize = element->
GetSize();
526 const auto bytesOnStorage = pageInfo.fLocator.fBytesOnStorage;
528 const void *sealedPageBuffer =
nullptr;
529 std::unique_ptr<unsigned char[]> directReadBuffer;
532 directReadBuffer = std::make_unique<unsigned char[]>(bytesOnStorage);
533 RDaosKey daosKey = GetPageDaosKey<kDefaultDaosMapping>(fNTupleIndex, clusterId, columnId,
534 pageInfo.fLocator.GetPosition<std::uint64_t>());
535 fDaosContainer->ReadSingleAkey(directReadBuffer.get(), bytesOnStorage, daosKey.fOid, daosKey.fDkey,
537 fCounters->fNPageLoaded.Inc();
538 fCounters->fNRead.Inc();
539 fCounters->fSzReadPayload.Add(bytesOnStorage);
540 sealedPageBuffer = directReadBuffer.get();
542 if (!fCurrentCluster || (fCurrentCluster->GetId() != clusterId) || !fCurrentCluster->ContainsColumn(columnId))
543 fCurrentCluster = fClusterPool->GetCluster(clusterId, fActiveColumns);
544 R__ASSERT(fCurrentCluster->ContainsColumn(columnId));
546 auto cachedPage = fPagePool->GetPage(columnId,
RClusterIndex(clusterId, idxInCluster));
547 if (!cachedPage.IsNull())
551 auto onDiskPage = fCurrentCluster->GetOnDiskPage(key);
552 R__ASSERT(onDiskPage && (bytesOnStorage == onDiskPage->GetSize()));
553 sealedPageBuffer = onDiskPage->GetAddress();
556 std::unique_ptr<unsigned char[]> pageBuffer;
559 pageBuffer = UnsealPage({sealedPageBuffer, bytesOnStorage, pageInfo.fNElements}, *element);
560 fCounters->fSzUnzip.Add(elementSize * pageInfo.fNElements);
563 auto newPage = fPageAllocator->NewPage(columnId, pageBuffer.release(), elementSize, pageInfo.fNElements);
564 newPage.SetWindow(clusterInfo.
fColumnOffset + pageInfo.fFirstInPage,
566 fPagePool->RegisterPage(
569 fCounters->fNPagePopulated.Inc();
576 const auto columnId = columnHandle.
fId;
577 auto cachedPage = fPagePool->GetPage(columnId, globalIndex);
578 if (!cachedPage.IsNull())
581 std::uint64_t idxInCluster;
584 auto descriptorGuard = GetSharedDescriptorGuard();
585 clusterInfo.
fClusterId = descriptorGuard->FindClusterId(columnId, globalIndex);
588 const auto &clusterDescriptor = descriptorGuard->GetClusterDescriptor(clusterInfo.
fClusterId);
589 clusterInfo.
fColumnOffset = clusterDescriptor.GetColumnRange(columnId).fFirstElementIndex;
592 clusterInfo.
fPageInfo = clusterDescriptor.GetPageRange(columnId).Find(idxInCluster);
594 return PopulatePageFromCluster(columnHandle, clusterInfo, idxInCluster);
602 const auto idxInCluster = clusterIndex.
GetIndex();
603 const auto columnId = columnHandle.
fId;
604 auto cachedPage = fPagePool->GetPage(columnId, clusterIndex);
605 if (!cachedPage.IsNull())
611 auto descriptorGuard = GetSharedDescriptorGuard();
612 const auto &clusterDescriptor = descriptorGuard->GetClusterDescriptor(clusterId);
614 clusterInfo.
fColumnOffset = clusterDescriptor.GetColumnRange(columnId).fFirstElementIndex;
615 clusterInfo.
fPageInfo = clusterDescriptor.GetPageRange(columnId).Find(idxInCluster);
618 return PopulatePageFromCluster(columnHandle, clusterInfo, idxInCluster);
623 fPagePool->ReturnPage(page);
629 return std::unique_ptr<RPageSourceDaos>(clone);
632std::vector<std::unique_ptr<ROOT::Experimental::Detail::RCluster>>
635 std::vector<std::unique_ptr<ROOT::Experimental::Detail::RCluster>>
result;
637 struct RDaosSealedPageLocator {
638 RDaosSealedPageLocator() =
default;
641 : fClusterId(cl), fColumnId(co), fPageNo(
p), fObjectId(o),
fSize(s), fBufPos(
b)
647 std::uint64_t fObjectId = 0;
648 std::uint64_t
fSize = 0;
649 std::size_t fBufPos = 0;
652 std::vector<unsigned char *> clusterBuffers(clusterKeys.size());
653 std::vector<std::unique_ptr<ROnDiskPageMapHeap>> pageMaps(clusterKeys.size());
656 std::size_t szPayload = 0;
659 for (
unsigned i = 0; i < clusterKeys.size(); ++i) {
660 const auto &clusterKey = clusterKeys[i];
661 auto clusterId = clusterKey.fClusterId;
662 std::vector<RDaosSealedPageLocator> onDiskClusterPages;
664 unsigned clusterBufSz = 0;
665 fCounters->fNClusterLoaded.Inc();
667 auto descriptorGuard = GetSharedDescriptorGuard();
668 const auto &clusterDesc = descriptorGuard->GetClusterDescriptor(clusterId);
671 for (
auto columnId : clusterKey.fColumnSet) {
672 const auto &pageRange = clusterDesc.GetPageRange(columnId);
674 for (
const auto &pageInfo : pageRange.fPageInfos) {
675 const auto &pageLocator = pageInfo.fLocator;
676 onDiskClusterPages.push_back(RDaosSealedPageLocator(clusterId, columnId, columnPageCount,
677 pageLocator.GetPosition<std::uint64_t>(),
678 pageLocator.fBytesOnStorage, clusterBufSz));
680 clusterBufSz += pageLocator.fBytesOnStorage;
682 nPages += columnPageCount;
685 szPayload += clusterBufSz;
687 clusterBuffers[i] =
new unsigned char[clusterBufSz];
688 pageMaps[i] = std::make_unique<ROnDiskPageMapHeap>(std::unique_ptr<
unsigned char[]>(clusterBuffers[i]));
691 for (
const auto &s : onDiskClusterPages) {
694 pageMaps[i]->Register(key,
ROnDiskPage(clusterBuffers[i] + s.fBufPos, s.fSize));
698 d_iov_set(&iov, clusterBuffers[i] + s.fBufPos, s.fSize);
700 RDaosKey daosKey = GetPageDaosKey<kDefaultDaosMapping>(fNTupleIndex, s.fClusterId, s.fColumnId, s.fObjectId);
703 it->second.insert(daosKey.fAkey, iov);
706 fCounters->fNPageLoaded.Add(nPages);
707 fCounters->fSzReadPayload.Add(szPayload);
711 if (
int err = fDaosContainer->ReadV(readRequests))
714 fCounters->fNReadV.Inc();
715 fCounters->fNRead.Add(nPages);
718 for (
unsigned i = 0; i < clusterKeys.size(); ++i) {
719 auto cluster = std::make_unique<RCluster>(clusterKeys[i].fClusterId);
720 cluster->Adopt(std::move(pageMaps[i]));
721 for (
auto colId : clusterKeys[i].fColumnSet)
722 cluster->SetColumnAvailable(colId);
724 result.emplace_back(std::move(cluster));
732 fTaskScheduler->Reset();
734 const auto clusterId = cluster->
GetId();
735 auto descriptorGuard = GetSharedDescriptorGuard();
736 const auto &clusterDescriptor = descriptorGuard->GetClusterDescriptor(clusterId);
738 std::vector<std::unique_ptr<RColumnElementBase>> allElements;
741 for (
const auto columnId : columnsInCluster) {
742 const auto &columnDesc = descriptorGuard->GetColumnDescriptor(columnId);
746 const auto &pageRange = clusterDescriptor.GetPageRange(columnId);
747 std::uint64_t pageNo = 0;
748 std::uint64_t firstInPage = 0;
749 for (
const auto &pi : pageRange.fPageInfos) {
752 R__ASSERT(onDiskPage && (onDiskPage->GetSize() == pi.fLocator.fBytesOnStorage));
754 auto taskFunc = [
this, columnId, clusterId, firstInPage, onDiskPage, element = allElements.back().get(),
755 nElements = pi.fNElements,
756 indexOffset = clusterDescriptor.GetColumnRange(columnId).fFirstElementIndex]() {
757 auto pageBuffer = UnsealPage({onDiskPage->GetAddress(), onDiskPage->GetSize(), nElements}, *element);
758 fCounters->fSzUnzip.Add(element->GetSize() * nElements);
760 auto newPage = fPageAllocator->NewPage(columnId, pageBuffer.release(), element->GetSize(), nElements);
762 fPagePool->PreloadPage(
768 fTaskScheduler->AddTask(taskFunc);
770 firstInPage += pi.fNElements;
777 fTaskScheduler->Wait();
#define R__FORWARD_ERROR(res)
Short-hand to return an RResult<T> in an error state (i.e. after checking)
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
#define R__LOG_WARNING(...)
winID h TVirtualViewer3D TVirtualGLPainter p
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void data
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t r
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t result
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h length
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h Atom_t Int_t ULong_t ULong_t bytes
Managed a set of clusters containing compressed and packed pages.
An in-memory subset of the packed and compressed pages of a cluster.
const ColumnSet_t & GetAvailColumns() const
size_t GetNOnDiskPages() const
DescriptorId_t GetId() const
const ROnDiskPage * GetOnDiskPage(const ROnDiskPage::Key &key) const
static std::unique_ptr< RColumnElementBase > Generate(EColumnType type)
std::size_t GetSize() const
RColumnElementBase * GetElement() const
A RDaosContainer provides read/write access to objects in a given container.
std::unordered_map< ROidDkeyPair, RWOperation, ROidDkeyPair::Hash > MultiObjectRWOperation_t
int ReadSingleAkey(void *buffer, std::size_t length, daos_obj_id_t oid, DistributionKey_t dkey, AttributeKey_t akey, ObjClassId_t cid)
Read data from a single object attribute key to the given buffer.
RDaosObject::DistributionKey_t DistributionKey_t
RDaosObject::AttributeKey_t AttributeKey_t
static Writer_t MakeMemCopyWriter(unsigned char *dest)
Helper class to uncompress data blocks in the ROOT compression frame format.
void Unzip(const void *from, size_t nbytes, size_t dataLen, void *to)
The nbytes parameter provides the size ls of the from buffer.
Record wall time and CPU time between construction and destruction.
A page as being stored on disk, that is packed and compressed.
Manages pages read from a DAOS container.
static RPage NewPage(ColumnId_t columnId, void *mem, std::size_t elementSize, std::size_t nElements)
static void DeletePage(const RPage &page)
Uses standard C++ memory allocation for the column data pages.
A closure that can free the memory associated with a mapped page.
A thread-safe cache of column pages.
void ReleasePage(RPage &page) final
Every page store needs to be able to free pages it handed out.
RPageSinkDaos(std::string_view ntupleName, std::string_view uri, const RNTupleWriteOptions &options)
RNTupleLocator CommitSealedPageImpl(DescriptorId_t columnId, const RPageStorage::RSealedPage &sealedPage) final
void WriteNTupleFooter(const void *data, size_t nbytes, size_t lenFooter)
void WriteNTupleHeader(const void *data, size_t nbytes, size_t lenHeader)
RNTupleLocator CommitClusterGroupImpl(unsigned char *serializedPageList, std::uint32_t length) final
Returns the locator of the page list envelope of the given buffer that contains the serialized page l...
std::uint64_t CommitClusterImpl(NTupleSize_t nEntries) final
Returns the number of bytes written to storage (excluding metadata)
void CommitDatasetImpl(unsigned char *serializedFooter, std::uint32_t length) final
RNTupleLocator CommitPageImpl(ColumnHandle_t columnHandle, const RPage &page) final
~RPageSinkDaos() override
void CreateImpl(const RNTupleModel &model, unsigned char *serializedHeader, std::uint32_t length) final
std::vector< RNTupleLocator > CommitSealedPageVImpl(std::span< RPageStorage::RSealedPageGroup > ranges) final
Vector commit of preprocessed pages.
RPage ReservePage(ColumnHandle_t columnHandle, std::size_t nElements) final
Get a new, empty page for the given column that can be filled with up to nElements.
Abstract interface to write data into an ntuple.
void EnableDefaultMetrics(const std::string &prefix)
Enables the default set of metrics provided by RPageSink.
std::unique_ptr< RNTupleCompressor > fCompressor
Helper to zip pages and header/footer; includes a 16MB (kMAXZIPBUF) zip buffer.
Storage provider that reads ntuple pages from a DAOS container.
std::unique_ptr< RDaosContainer > fDaosContainer
A container that stores object data (header/footer, pages, etc.)
void LoadSealedPage(DescriptorId_t columnId, const RClusterIndex &clusterIndex, RSealedPage &sealedPage) final
Read the packed and compressed bytes of a page into the memory buffer provided by selaedPage.
RPageSourceDaos(std::string_view ntupleName, std::string_view uri, const RNTupleReadOptions &options)
~RPageSourceDaos() override
void ReleasePage(RPage &page) final
Every page store needs to be able to free pages it handed out.
void UnzipClusterImpl(RCluster *cluster) final
std::vector< std::unique_ptr< RCluster > > LoadClusters(std::span< RCluster::RKey > clusterKeys) final
Populates all the pages of the given cluster ids and columns; it is possible that some columns do not...
RPage PopulatePage(ColumnHandle_t columnHandle, NTupleSize_t globalIndex) final
Allocates and fills a page that contains the index-th element.
RPage PopulatePageFromCluster(ColumnHandle_t columnHandle, const RClusterInfo &clusterInfo, ClusterSize_t::ValueType idxInCluster)
std::string GetObjectClass() const
Return the object class used for user data OIDs in this ntuple.
RNTupleDescriptor AttachImpl() final
std::unique_ptr< RPageSource > Clone() const final
The cloned page source creates a new connection to the pool/container.
Abstract interface to read data from an ntuple.
void EnableDefaultMetrics(const std::string &prefix)
Enables the default set of metrics provided by RPageSource.
std::unique_ptr< RNTupleDecompressor > fDecompressor
Helper to unzip pages and header/footer; comprises a 16MB (kMAXZIPBUF) unzip buffer.
Stores information about the cluster in which this page resides.
A page is a slice of a column that is mapped into memory.
ClusterSize_t::ValueType GetNBytes() const
The space taken by column elements in the buffer.
void * GrowUnchecked(ClusterSize_t::ValueType nElements)
Called during writing: returns a pointer after the last element and increases the element counter in ...
A helper class for serializing and deserialization of the RNTuple binary format.
static RResult< void > DeserializePageListV1(const void *buffer, std::uint32_t bufSize, std::vector< RClusterDescriptorBuilder > &clusters)
static RResult< void > DeserializeFooterV1(const void *buffer, std::uint32_t bufSize, RNTupleDescriptorBuilder &descBuilder)
static RResult< void > DeserializeHeaderV1(const void *buffer, std::uint32_t bufSize, RNTupleDescriptorBuilder &descBuilder)
static std::vector< RClusterDescriptorBuilder > GetClusterSummaries(const RNTupleDescriptor &ntplDesc, DescriptorId_t clusterGroupId)
Used to prepare the cluster descriptor builders when loading the page locations for a certain cluster...
Addresses a column element or field item relative to a particular cluster, instead of a global NTuple...
DescriptorId_t GetClusterId() const
ClusterSize_t::ValueType GetIndex() const
Base class for all ROOT issued exceptions.
A helper class for piece-wise construction of an RNTupleDescriptor.
void AddToOnDiskFooterSize(std::uint64_t size)
The real footer size also include the page list envelopes.
void SetOnDiskHeaderSize(std::uint64_t size)
The on-storage meta-data of an ntuple.
RClusterGroupDescriptorIterable GetClusterGroupIterable() const
RResult< void > AddClusterDetails(RClusterDescriptor &&clusterDesc)
Methods to load and drop cluster details.
The RNTupleModel encapulates the schema of an ntuple.
Common user-tunable settings for reading ntuples.
DAOS-specific user-tunable settings for storing ntuples.
const std::string & GetObjectClass() const
Common user-tunable settings for storing ntuples.
The class is used as a return type for operations that can fail; wraps a value of type T or an RError...
const char * d_errstr(int rc)
static void d_iov_set(d_iov_t *iov, void *buf, size_t size)
uint16_t daos_oclass_id_t
std::uint32_t ntuple_index_t
RLogChannel & NTupleLog()
Log channel for RNTuple diagnostics.
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
std::uint64_t DescriptorId_t
Distriniguishes elements of the same type within a descriptor, e.g. different fields.
std::int64_t ColumnId_t
Uniquely identifies a physical column within the scope of the current process, used to tag pages.
constexpr DescriptorId_t kInvalidDescriptorId
Helper structure concentrating the functionality required to locate an ntuple within a DAOS container...
int InitNTupleDescriptorBuilder(RDaosContainer &cont, RNTupleDecompressor &decompressor, RNTupleDescriptorBuilder &builder)
static std::pair< RDaosContainerNTupleLocator, RNTupleDescriptorBuilder > LocateNTuple(RDaosContainer &cont, const std::string &ntupleName, RNTupleDecompressor &decompressor)
A pair of <object ID, distribution key> that can be used to issue a fetch/update request for multiple...
Describes a read/write operation on multiple objects; see the ReadV/WriteV functions.
Entry point for an RNTuple in a DAOS container.
std::uint32_t fNBytesFooter
The size of the compressed ntuple footer.
std::uint32_t fNBytesHeader
The size of the compressed ntuple header.
std::string fObjClass
The object class for user data OIDs, e.g. SX
std::uint32_t fVersion
Allows for evolving the struct in future versions.
RResult< std::uint32_t > Deserialize(const void *buffer, std::uint32_t bufSize)
std::uint32_t fLenHeader
The size of the uncompressed ntuple header.
static std::uint32_t GetSize()
std::uint32_t Serialize(void *buffer) const
std::uint32_t fLenFooter
The size of the uncompressed ntuple footer.
Wrap around a daos_oclass_id_t.
static constexpr std::size_t kOCNameMaxLength
This limit is currently not defined in any header and any call to daos_oclass_id2name() within DAOS u...
On-disk pages within a page source are identified by the column and page number.
Summarizes cluster-level information that are necessary to populate a certain page.
RClusterDescriptor::RPageRange::RPageInfoExtended fPageInfo
Location of the page on disk.
std::uint64_t fColumnOffset
The first element number of the page's column in the given cluster.
DescriptorId_t fClusterId
A range of sealed pages referring to the same column that can be used for vector commit.
A sealed page contains the bytes of a page as written to storage (packed & compressed).
Generic information about the physical location of data.
std::uint32_t fBytesOnStorage
std::variant< std::uint64_t, std::string, RNTupleLocatorObject64 > fPosition
Simple on-disk locators consisting of a 64-bit offset use variant type uint64_t; extended locators ha...
const T & GetPosition() const