Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
RPageSinkBuf.cxx
Go to the documentation of this file.
1/// \file RPageSinkBuf.cxx
2/// \ingroup NTuple ROOT7
3/// \author Jakob Blomer <jblomer@cern.ch>
4/// \author Max Orok <maxwellorok@gmail.com>
5/// \author Javier Lopez-Gomez <javier.lopez.gomez@cern.ch>
6/// \date 2021-03-17
7/// \warning This is part of the ROOT 7 prototype! It will change without notice. It might trigger earthquakes. Feedback
8/// is welcome!
9
10/*************************************************************************
11 * Copyright (C) 1995-2021, Rene Brun and Fons Rademakers. *
12 * All rights reserved. *
13 * *
14 * For the licensing terms see $ROOTSYS/LICENSE. *
15 * For the list of contributors see $ROOTSYS/README/CREDITS. *
16 *************************************************************************/
17
18#include <ROOT/RNTupleModel.hxx>
20#include <ROOT/RNTupleZip.hxx>
21#include <ROOT/RPageSinkBuf.hxx>
22
23#include <algorithm>
24#include <memory>
25
27{
28 fBufferedPages.clear();
29 // Each RSealedPage points to the same region as `fBuf` for some element in `fBufferedPages`; thus, no further
30 // clean-up is required
31 fSealedPages.clear();
32}
33
35 : RPageSink(inner->GetNTupleName(), inner->GetWriteOptions()), fInnerSink(std::move(inner))
36{
37 fMetrics = Detail::RNTupleMetrics("RPageSinkBuf");
38 fCounters = std::make_unique<RCounters>(RCounters{
39 *fMetrics.MakeCounter<Detail::RNTuplePlainCounter *>("ParallelZip", "", "compressing pages in parallel"),
40 *fMetrics.MakeCounter<Detail::RNTuplePlainCounter *>("timeWallCriticalSection", "ns",
41 "wall clock time spent in critical sections"),
43 "timeCpuCriticalSection", "ns", "CPU time spent in critical section")});
44 fMetrics.ObserveMetrics(fInnerSink->GetMetrics());
45}
46
48{
49 // Wait for unterminated tasks, if any, as they may still hold a reference to `this`.
50 // This cannot be moved to the base class destructor, given non-static members have been destroyed by the time the
51 // base class destructor is invoked.
52 WaitForAllTasks();
53}
54
57{
58 return ColumnHandle_t{fNColumns++, &column};
59}
60
61void ROOT::Experimental::Internal::RPageSinkBuf::ConnectFields(const std::vector<RFieldBase *> &fields,
62 NTupleSize_t firstEntry)
63{
64 auto connectField = [&](RFieldBase &f) {
65 // Field Zero would have id 0.
66 ++fNFields;
67 f.SetOnDiskId(fNFields);
68 CallConnectPageSinkOnField(f, *this, firstEntry); // issues in turn calls to `AddColumn()`
69 };
70 for (auto *f : fields) {
71 connectField(*f);
72 for (auto &descendant : *f) {
73 connectField(descendant);
74 }
75 }
76 fBufferedColumns.resize(fNColumns);
77}
78
80{
81 return fInnerSink->GetDescriptor();
82}
83
85{
86 ConnectFields(model.GetFieldZero().GetSubFields(), 0U);
87
88 fInnerModel = model.Clone();
89 fInnerSink->Init(*fInnerModel);
90}
91
93 NTupleSize_t firstEntry)
94{
95 ConnectFields(changeset.fAddedFields, firstEntry);
96
97 // The buffered page sink maintains a copy of the RNTupleModel for the inner sink; replicate the changes there
98 // TODO(jalopezg): we should be able, in general, to simplify the buffered sink.
99 auto cloneAddField = [&](const RFieldBase *field) {
100 auto cloned = field->Clone(field->GetFieldName());
101 auto p = &(*cloned);
102 fInnerModel->AddField(std::move(cloned));
103 return p;
104 };
105 auto cloneAddProjectedField = [&](RFieldBase *field) {
106 auto cloned = field->Clone(field->GetFieldName());
107 auto p = &(*cloned);
108 auto &projectedFields = changeset.fModel.GetProjectedFields();
110 fieldMap[p] = projectedFields.GetSourceField(field);
111 auto targetIt = cloned->begin();
112 for (auto &f : *field)
113 fieldMap[&(*targetIt++)] = projectedFields.GetSourceField(&f);
114 const_cast<RNTupleModel::RProjectedFields &>(fInnerModel->GetProjectedFields()).Add(std::move(cloned), fieldMap);
115 return p;
116 };
117 RNTupleModelChangeset innerChangeset{*fInnerModel};
118 fInnerModel->Unfreeze();
119 std::transform(changeset.fAddedFields.cbegin(), changeset.fAddedFields.cend(),
120 std::back_inserter(innerChangeset.fAddedFields), cloneAddField);
121 std::transform(changeset.fAddedProjectedFields.cbegin(), changeset.fAddedProjectedFields.cend(),
122 std::back_inserter(innerChangeset.fAddedProjectedFields), cloneAddProjectedField);
123 fInnerModel->Freeze();
124 fInnerSink->UpdateSchema(innerChangeset, firstEntry);
125}
126
128{
129 RPageSink::RSinkGuard g(fInnerSink->GetSinkGuard());
130 Detail::RNTuplePlainTimer timer(fCounters->fTimeWallCriticalSection, fCounters->fTimeCpuCriticalSection);
131 fInnerSink->UpdateExtraTypeInfo(extraTypeInfo);
132}
133
135{
136 fSuppressedColumns.emplace_back(columnHandle);
137}
138
140{
141 auto colId = columnHandle.fPhysicalId;
142 const auto &element = *columnHandle.fColumn->GetElement();
143
144 // Safety: References are guaranteed to be valid until the
145 // element is destroyed. In other words, all buffered page elements are
146 // valid until the return value of DrainBufferedPages() goes out of scope in
147 // CommitCluster().
148 auto &zipItem = fBufferedColumns.at(colId).BufferPage(columnHandle);
149 zipItem.AllocateSealedPageBuf(page.GetNBytes() + GetWriteOptions().GetEnablePageChecksums() * kNBytesPageChecksum);
150 R__ASSERT(zipItem.fBuf);
151 auto &sealedPage = fBufferedColumns.at(colId).RegisterSealedPage();
152
153 if (!fTaskScheduler) {
154 // Seal the page right now, avoiding the allocation and copy, but making sure that the page buffer is not aliased.
155 RSealPageConfig config;
156 config.fPage = &page;
157 config.fElement = &element;
158 config.fCompressionSetting = GetWriteOptions().GetCompression();
159 config.fWriteChecksum = GetWriteOptions().GetEnablePageChecksums();
160 config.fAllowAlias = false;
161 config.fBuffer = zipItem.fBuf.get();
162 sealedPage = SealPage(config);
163 zipItem.fSealedPage = &sealedPage;
164 return;
165 }
166
167 // TODO avoid frequent (de)allocations by holding on to allocated buffers in RColumnBuf
168 zipItem.fPage = fPageAllocator->NewPage(columnHandle.fPhysicalId, page.GetElementSize(), page.GetNElements());
169 // make sure the page is aware of how many elements it will have
170 zipItem.fPage.GrowUnchecked(page.GetNElements());
171 memcpy(zipItem.fPage.GetBuffer(), page.GetBuffer(), page.GetNBytes());
172
173 fCounters->fParallelZip.SetValue(1);
174 // Thread safety: Each thread works on a distinct zipItem which owns its
175 // compression buffer.
176 fTaskScheduler->AddTask([this, &zipItem, &sealedPage, &element] {
177 RSealPageConfig config;
178 config.fPage = &zipItem.fPage;
179 config.fElement = &element;
180 config.fCompressionSetting = GetWriteOptions().GetCompression();
181 config.fWriteChecksum = GetWriteOptions().GetEnablePageChecksums();
182 config.fAllowAlias = true;
183 config.fBuffer = zipItem.fBuf.get();
184 sealedPage = SealPage(config);
185 zipItem.fSealedPage = &sealedPage;
186 });
187}
188
190 const RSealedPage & /*sealedPage*/)
191{
192 throw RException(R__FAIL("should never commit sealed pages to RPageSinkBuf"));
193}
194
195void ROOT::Experimental::Internal::RPageSinkBuf::CommitSealedPageV(std::span<RPageStorage::RSealedPageGroup> /*ranges*/)
196{
197 throw RException(R__FAIL("should never commit sealed pages to RPageSinkBuf"));
198}
199
201{
202 WaitForAllTasks();
203
204 std::vector<RSealedPageGroup> toCommit;
205 toCommit.reserve(fBufferedColumns.size());
206 for (auto &bufColumn : fBufferedColumns) {
207 R__ASSERT(bufColumn.HasSealedPagesOnly());
208 const auto &sealedPages = bufColumn.GetSealedPages();
209 toCommit.emplace_back(bufColumn.GetHandle().fPhysicalId, sealedPages.cbegin(), sealedPages.cend());
210 }
211
212 std::uint64_t nbytes;
213 {
214 RPageSink::RSinkGuard g(fInnerSink->GetSinkGuard());
215 Detail::RNTuplePlainTimer timer(fCounters->fTimeWallCriticalSection, fCounters->fTimeCpuCriticalSection);
216 fInnerSink->CommitSealedPageV(toCommit);
217
218 for (auto handle : fSuppressedColumns)
219 fInnerSink->CommitSuppressedColumn(handle);
220 fSuppressedColumns.clear();
221
222 nbytes = fInnerSink->CommitCluster(nNewEntries);
223 }
224
225 for (auto &bufColumn : fBufferedColumns)
226 bufColumn.DropBufferedPages();
227 return nbytes;
228}
229
231{
232 RPageSink::RSinkGuard g(fInnerSink->GetSinkGuard());
233 Detail::RNTuplePlainTimer timer(fCounters->fTimeWallCriticalSection, fCounters->fTimeCpuCriticalSection);
234 fInnerSink->CommitClusterGroup();
235}
236
238{
239 RPageSink::RSinkGuard g(fInnerSink->GetSinkGuard());
240 Detail::RNTuplePlainTimer timer(fCounters->fTimeWallCriticalSection, fCounters->fTimeCpuCriticalSection);
241 fInnerSink->CommitDataset();
242}
243
246{
247 return fInnerSink->ReservePage(columnHandle, nElements);
248}
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
Definition RError.hxx:290
#define f(i)
Definition RSha256.hxx:104
#define g(i)
Definition RSha256.hxx:105
#define R__ASSERT(e)
Checks condition e and reports a fatal error if it's false.
Definition TError.h:125
winID h TVirtualViewer3D TVirtualGLPainter p
A collection of Counter objects with a name, a unit, and a description.
void ObserveMetrics(RNTupleMetrics &observee)
CounterPtrT MakeCounter(const std::string &name, Args &&... args)
A non thread-safe integral performance counter.
An either thread-safe or non thread safe counter for CPU ticks.
Record wall time and CPU time between construction and destruction.
A column is a storage-backed array of a simple, fixed-size type, from which pages can be mapped into ...
Definition RColumn.hxx:42
RColumnElementBase * GetElement() const
Definition RColumn.hxx:356
RPageStorage::SealedPageSequence_t fSealedPages
Pages that have been already sealed by a concurrent task.
std::deque< RPageZipItem > fBufferedPages
Using a deque guarantees that element iterators are never invalidated by appends to the end of the it...
std::uint64_t CommitCluster(NTupleSize_t nNewEntries) final
Finalize the current cluster and create a new one for the following data.
std::unique_ptr< RPageSink > fInnerSink
The inner sink, responsible for actually performing I/O.
RPage ReservePage(ColumnHandle_t columnHandle, std::size_t nElements) final
Get a new, empty page for the given column that can be filled with up to nElements; nElements must be...
void CommitSealedPageV(std::span< RPageStorage::RSealedPageGroup > ranges) final
Write a vector of preprocessed pages to storage. The corresponding columns must have been added befor...
void UpdateSchema(const RNTupleModelChangeset &changeset, NTupleSize_t firstEntry) final
Incorporate incremental changes to the model into the ntuple descriptor.
RPageSinkBuf(std::unique_ptr< RPageSink > inner)
const RNTupleDescriptor & GetDescriptor() const final
Return the RNTupleDescriptor being constructed.
std::unique_ptr< RCounters > fCounters
ColumnHandle_t AddColumn(DescriptorId_t fieldId, const RColumn &column) final
Register a new column.
void InitImpl(RNTupleModel &model) final
void CommitPage(ColumnHandle_t columnHandle, const RPage &page) final
Write a page to the storage. The column must have been added before.
void ConnectFields(const std::vector< RFieldBase * > &fields, NTupleSize_t firstEntry)
void CommitSealedPage(DescriptorId_t physicalColumnId, const RSealedPage &sealedPage) final
Write a preprocessed page to storage. The column must have been added before.
void CommitClusterGroup() final
Write out the page locations (page list envelope) for all the committed clusters since the last call ...
void UpdateExtraTypeInfo(const RExtraTypeInfoDescriptor &extraTypeInfo) final
Adds an extra type information record to schema.
void CommitSuppressedColumn(ColumnHandle_t columnHandle) final
Commits a suppressed column for the current cluster.
An RAII wrapper used to synchronize a page sink. See GetSinkGuard().
Abstract interface to write data into an ntuple.
const RNTupleWriteOptions & GetWriteOptions() const
Returns the sink's write options.
const std::string & GetNTupleName() const
Returns the NTuple name.
A page is a slice of a column that is mapped into memory.
Definition RPage.hxx:46
std::uint32_t GetNBytes() const
The space taken by column elements in the buffer.
Definition RPage.hxx:122
std::uint32_t GetElementSize() const
Definition RPage.hxx:123
std::uint32_t GetNElements() const
Definition RPage.hxx:124
Base class for all ROOT issued exceptions.
Definition RError.hxx:78
Field-specific extra type information from the header / extension header.
A field translates read and write calls from/to underlying columns to/from tree values.
std::vector< RFieldBase * > GetSubFields()
Definition RField.cxx:1007
The on-storage meta-data of an ntuple.
Projected fields are fields whose columns are reused from existing fields.
std::unordered_map< const RFieldBase *, const RFieldBase * > FieldMap_t
The map keys are the projected target fields, the map values are the backing source fields Note that ...
const RFieldBase * GetSourceField(const RFieldBase *target) const
The RNTupleModel encapsulates the schema of an ntuple.
std::unique_ptr< RNTupleModel > Clone() const
const RProjectedFields & GetProjectedFields() const
RFieldZero & GetFieldZero()
Non-const access to the root field is used to commit clusters during writing, and to make adjustments...
virtual TObject * Clone(const char *newname="") const
Make a clone of an object using the Streamer facility.
Definition TObject.cxx:223
void CallConnectPageSinkOnField(RFieldBase &, RPageSink &, NTupleSize_t firstEntry=0)
Definition RField.cxx:415
void Add(RHist< DIMENSIONS, PRECISION, STAT_TO... > &to, const RHist< DIMENSIONS, PRECISION, STAT_FROM... > &from)
Add two histograms.
Definition RHist.hxx:342
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
std::uint64_t DescriptorId_t
Distinguishes elements of the same type within a descriptor, e.g. different fields.
The incremental changes to a RNTupleModel
std::vector< RFieldBase * > fAddedProjectedFields
Points to the projected fields in fModel that were added as part of an updater transaction.
std::vector< RFieldBase * > fAddedFields
Points to the fields in fModel that were added as part of an updater transaction.
I/O performance counters that get registered in fMetrics.
const RColumnElementBase * fElement
Corresponds to the page's elements, for size calculation etc.
void * fBuffer
Location for sealed output. The memory buffer has to be large enough.
bool fAllowAlias
If false, the output buffer must not point to the input page buffer, which would otherwise be an opti...
int fCompressionSetting
Compression algorithm and level to apply.
bool fWriteChecksum
Adds a 8 byte little-endian xxhash3 checksum to the page payload.
A sealed page contains the bytes of a page as written to storage (packed & compressed).