Logo ROOT  
Reference Guide
 
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Properties Friends Macros Modules Pages
Loading...
Searching...
No Matches
RColumn.hxx
Go to the documentation of this file.
1/// \file ROOT/RColumn.hxx
2/// \ingroup NTuple ROOT7
3/// \author Jakob Blomer <jblomer@cern.ch>
4/// \date 2018-10-09
5/// \warning This is part of the ROOT 7 prototype! It will change without notice. It might trigger earthquakes. Feedback
6/// is welcome!
7
8/*************************************************************************
9 * Copyright (C) 1995-2019, Rene Brun and Fons Rademakers. *
10 * All rights reserved. *
11 * *
12 * For the licensing terms see $ROOTSYS/LICENSE. *
13 * For the list of contributors see $ROOTSYS/README/CREDITS. *
14 *************************************************************************/
15
16#ifndef ROOT7_RColumn
17#define ROOT7_RColumn
18
19#include <ROOT/RConfig.hxx> // for R__likely
21#include <ROOT/RNTupleUtil.hxx>
22#include <ROOT/RPage.hxx>
23#include <ROOT/RPageStorage.hxx>
24
25#include <TError.h>
26
27#include <cstring> // for memcpy
28#include <memory>
29#include <utility>
30
31namespace ROOT::Internal {
32
33// clang-format off
34/**
35\class ROOT::Internal::RColumn
36\ingroup NTuple
37\brief A column is a storage-backed array of a simple, fixed-size type, from which pages can be mapped into memory.
38*/
39// clang-format on
40class RColumn {
41private:
43 /// Columns belonging to the same field are distinguished by their order. E.g. for an std::string field, there is
44 /// the offset column with index 0 and the character value column with index 1.
45 std::uint32_t fIndex;
46 /// Fields can have multiple column representations, distinguished by representation index
47 std::uint16_t fRepresentationIndex;
52 /// The page into which new elements are being written. The page will initially be small
53 /// (RNTupleWriteOptions::fInitialUnzippedPageSize, which corresponds to fInitialElements) and expand as needed and
54 /// as memory for page buffers is still available (RNTupleWriteOptions::fPageBufferBudget) or the maximum page
55 /// size is reached (RNTupleWriteOptions::fMaxUnzippedPageSize).
57 /// The initial number of elements in a page
59 /// The number of elements written resp. available in the column
61 /// The currently mapped page for reading
63 /// The column id in the column descriptor, once connected to a sink or source
65 /// Global index of the first element in this column; usually == 0, unless it is a deferred column
67 /// Used to pack and unpack pages on writing/reading
68 std::unique_ptr<ROOT::Internal::RColumnElementBase> fElement;
69 /// The column team is a set of columns that serve the same column index for different representation IDs.
70 /// Initially, the team has only one member, the very column it belongs to. Through MergeTeams(), two columns
71 /// can join forces. The team is used to react on suppressed columns: if the current team member has a suppressed
72 /// column for a MapPage() call, it get the page from the active column in the corresponding cluster.
73 std::vector<RColumn *> fTeam;
74 /// Points into fTeam to the column that successfully returned the last page.
75 std::size_t fLastGoodTeamIdx = 0;
76
78
79 /// Used when trying to append to a full write page. If possible, expand the page. Otherwise, flush and reset
80 /// to the minimal size.
82 {
84 if (newMaxElements * fElement->GetSize() > fPageSink->GetWriteOptions().GetMaxUnzippedPageSize()) {
85 newMaxElements = fPageSink->GetWriteOptions().GetMaxUnzippedPageSize() / fElement->GetSize();
86 }
87
89 // Maximum page size reached, flush and reset
90 Flush();
91 } else {
93 if (expandedPage.IsNull()) {
94 Flush();
95 } else {
98 expandedPage.GrowUnchecked(fWritePage.GetNElements());
99 fWritePage = std::move(expandedPage);
100 }
101 }
102
104 }
105
106public:
107 template <typename CppT>
108 static std::unique_ptr<RColumn>
110 {
111 auto column = std::unique_ptr<RColumn>(new RColumn(type, columnIdx, representationIdx));
112 column->fElement = ROOT::Internal::RColumnElementBase::Generate<CppT>(type);
113 return column;
114 }
115
116 RColumn(const RColumn &) = delete;
117 RColumn &operator=(const RColumn &) = delete;
118 ~RColumn();
119
120 /// Connect the column to a page sink. `firstElementIndex` can be used to specify the first column element index
121 /// with backing storage for this column. On read back, elements before `firstElementIndex` will cause the zero page
122 /// to be mapped.
125 /// Connect the column to a page source.
127
128 void Append(const void *from)
129 {
132 }
133
134 void *dst = fWritePage.GrowUnchecked(1);
135
136 std::memcpy(dst, from, fElement->GetSize());
137 fNElements++;
138 }
139
140 void AppendV(const void *from, std::size_t count)
141 {
142 auto src = reinterpret_cast<const unsigned char *>(from);
143 // TODO(jblomer): A future optimization should grow the page in one go, up to the maximum unzipped page size
144 while (count > 0) {
146 if (nElementsRemaining == 0) {
149 }
150
152 auto nBatch = std::min(count, nElementsRemaining);
153
155 std::memcpy(dst, src, nBatch * fElement->GetSize());
156 src += nBatch * fElement->GetSize();
157 count -= nBatch;
159 }
160 }
161
162 void Read(const ROOT::NTupleSize_t globalIndex, void *to)
163 {
164 if (!fReadPageRef.Get().Contains(globalIndex)) {
166 }
167 const auto elemSize = fElement->GetSize();
168 void *from = static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) +
169 (globalIndex - fReadPageRef.Get().GetGlobalRangeFirst()) * elemSize;
170 std::memcpy(to, from, elemSize);
171 }
172
174 {
175 if (!fReadPageRef.Get().Contains(localIndex)) {
177 }
178 const auto elemSize = fElement->GetSize();
179 void *from = static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) +
180 (localIndex.GetIndexInCluster() - fReadPageRef.Get().GetLocalRangeFirst()) * elemSize;
181 std::memcpy(to, from, elemSize);
182 }
183
185 {
186 const auto elemSize = fElement->GetSize();
187 auto tail = static_cast<unsigned char *>(to);
188
189 while (count > 0) {
190 if (!fReadPageRef.Get().Contains(globalIndex)) {
192 }
193 const ROOT::NTupleSize_t idxInPage = globalIndex - fReadPageRef.Get().GetGlobalRangeFirst();
194
195 const void *from = static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) + idxInPage * elemSize;
196 const ROOT::NTupleSize_t nBatch = std::min(fReadPageRef.Get().GetNElements() - idxInPage, count);
197
198 std::memcpy(tail, from, elemSize * nBatch);
199
200 tail += nBatch * elemSize;
201 count -= nBatch;
203 }
204 }
205
207 {
208 const auto elemSize = fElement->GetSize();
209 auto tail = static_cast<unsigned char *>(to);
210
211 while (count > 0) {
212 if (!fReadPageRef.Get().Contains(localIndex)) {
214 }
215 ROOT::NTupleSize_t idxInPage = localIndex.GetIndexInCluster() - fReadPageRef.Get().GetLocalRangeFirst();
216
217 const void *from = static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) + idxInPage * elemSize;
218 const ROOT::NTupleSize_t nBatch = std::min(count, fReadPageRef.Get().GetNElements() - idxInPage);
219
220 std::memcpy(tail, from, elemSize * nBatch);
221
222 tail += nBatch * elemSize;
223 count -= nBatch;
224 localIndex = RNTupleLocalIndex(localIndex.GetClusterId(), localIndex.GetIndexInCluster() + nBatch);
225 }
226 }
227
228 template <typename CppT>
234
235 template <typename CppT>
241
242 template <typename CppT>
244 {
245 if (R__unlikely(!fReadPageRef.Get().Contains(globalIndex))) {
247 }
248 // +1 to go from 0-based indexing to 1-based number of items
249 nItems = fReadPageRef.Get().GetGlobalRangeLast() - globalIndex + 1;
250 return reinterpret_cast<CppT *>(static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) +
251 (globalIndex - fReadPageRef.Get().GetGlobalRangeFirst()) * sizeof(CppT));
252 }
253
254 template <typename CppT>
256 {
257 if (!fReadPageRef.Get().Contains(localIndex)) {
259 }
260 // +1 to go from 0-based indexing to 1-based number of items
261 nItems = fReadPageRef.Get().GetLocalRangeLast() - localIndex.GetIndexInCluster() + 1;
262 return reinterpret_cast<CppT *>(static_cast<unsigned char *>(fReadPageRef.Get().GetBuffer()) +
263 (localIndex.GetIndexInCluster() - fReadPageRef.Get().GetLocalRangeFirst()) *
264 sizeof(CppT));
265 }
266
268 {
269 if (!fReadPageRef.Get().Contains(clusterIndex)) {
271 }
272 return fReadPageRef.Get().GetClusterInfo().GetIndexOffset() + clusterIndex.GetIndexInCluster();
273 }
274
276 {
277 if (!fReadPageRef.Get().Contains(globalIndex)) {
279 }
280 return RNTupleLocalIndex(fReadPageRef.Get().GetClusterInfo().GetId(),
281 globalIndex - fReadPageRef.Get().GetClusterInfo().GetIndexOffset());
282 }
283
284 /// For offset columns only, look at the two adjacent values that define a collection's coordinates
287 {
290 // Try to avoid jumping back to the previous page and jumping back to the previous cluster
291 if (R__likely(globalIndex > 0)) {
292 if (R__likely(fReadPageRef.Get().Contains(globalIndex - 1))) {
295 if (R__unlikely(fReadPageRef.Get().GetClusterInfo().GetIndexOffset() == globalIndex))
296 idxStart = 0;
297 } else {
299 auto selfOffset = fReadPageRef.Get().GetClusterInfo().GetIndexOffset();
301 }
302 } else {
304 }
306 *collectionStart = RNTupleLocalIndex(fReadPageRef.Get().GetClusterInfo().GetId(), idxStart);
307 }
308
318
319 /// Get the currently active cluster id
321 {
323 *varIndex = RNTupleLocalIndex(fReadPageRef.Get().GetClusterInfo().GetId(), varSwitch->GetIndex());
324 *tag = varSwitch->GetTag();
325 }
326
327 void Flush();
328 void CommitSuppressed();
329
334
337
338 void MergeTeams(RColumn &other);
339
343 std::uint16_t GetBitsOnStorage() const
344 {
346 return static_cast<std::uint16_t>(fElement->GetBitsOnStorage());
347 }
348 std::optional<std::pair<double, double>> GetValueRange() const
349 {
351 return fElement->GetValueRange();
352 }
353 std::uint32_t GetIndex() const { return fIndex; }
354 std::uint16_t GetRepresentationIndex() const { return fRepresentationIndex; }
361
362 void SetBitsOnStorage(std::size_t bits) { fElement->SetBitsOnStorage(bits); }
363 std::size_t GetWritePageCapacity() const { return fWritePage.GetCapacity(); }
364 void SetValueRange(double min, double max) { fElement->SetValueRange(min, max); }
365}; // class RColumn
366
367} // namespace ROOT::Internal
368
369#endif
#define R__likely(expr)
Definition RConfig.hxx:603
#define R__unlikely(expr)
Definition RConfig.hxx:602
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
#define R__ASSERT(e)
Checks condition e and reports a fatal error if it's false.
Definition TError.h:125
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t index
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t src
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void char Point_t Rectangle_t WindowAttributes_t Float_t Float_t Float_t Int_t Int_t UInt_t UInt_t Rectangle_t Int_t Int_t Window_t TString Int_t GCValues_t GetPrimarySelectionOwner GetDisplay GetScreen GetColormap GetNativeEvent const char const char dpyName wid window const char font_name cursor keysym reg const char only_if_exist regb h Point_t winding char text const char depth char const char Int_t count const char ColorStruct_t color const char Pixmap_t Pixmap_t PictureAttributes_t attr const char char ret_data h unsigned char height h Atom_t Int_t ULong_t ULong_t unsigned char prop_list Atom_t Atom_t Atom_t Time_t type
The available trivial, native content types of a column.
Abstract interface to write data into an ntuple.
const ROOT::RNTupleWriteOptions & GetWriteOptions() const
Returns the sink's write options.
virtual ROOT::Internal::RPage ReservePage(ColumnHandle_t columnHandle, std::size_t nElements)
Get a new, empty page for the given column that can be filled with up to nElements; nElements must be...
Abstract interface to read data from an ntuple.
A column element encapsulates the translation between basic C++ types and their column representation...
A column is a storage-backed array of a simple, fixed-size type, from which pages can be mapped into ...
Definition RColumn.hxx:40
void GetSwitchInfo(ROOT::NTupleSize_t globalIndex, RNTupleLocalIndex *varIndex, std::uint32_t *tag)
Get the currently active cluster id.
Definition RColumn.hxx:320
void GetCollectionInfo(RNTupleLocalIndex localIndex, RNTupleLocalIndex *collectionStart, ROOT::NTupleSize_t *collectionSize)
Definition RColumn.hxx:309
void Read(RNTupleLocalIndex localIndex, void *to)
Definition RColumn.hxx:173
static std::unique_ptr< RColumn > Create(ROOT::ENTupleColumnType type, std::uint32_t columnIdx, std::uint16_t representationIdx)
Definition RColumn.hxx:109
ROOT::Experimental::Internal::RPageSink * GetPageSink() const
Definition RColumn.hxx:358
RColumn(ROOT::ENTupleColumnType type, std::uint32_t columnIndex, std::uint16_t representationIndex)
ROOT::NTupleSize_t GetGlobalIndex(RNTupleLocalIndex clusterIndex)
Definition RColumn.hxx:267
void HandleWritePageIfFull()
Used when trying to append to a full write page.
Definition RColumn.hxx:81
std::optional< std::pair< double, double > > GetValueRange() const
Definition RColumn.hxx:348
void MergeTeams(RColumn &other)
Definition RColumn.cxx:117
RColumn & operator=(const RColumn &)=delete
void ReadV(RNTupleLocalIndex localIndex, ROOT::NTupleSize_t count, void *to)
Definition RColumn.hxx:206
std::vector< RColumn * > fTeam
The column team is a set of columns that serve the same column index for different representation IDs...
Definition RColumn.hxx:73
std::uint16_t GetRepresentationIndex() const
Definition RColumn.hxx:354
bool ReadPageContains(ROOT::NTupleSize_t globalIndex) const
Definition RColumn.hxx:335
std::size_t fLastGoodTeamIdx
Points into fTeam to the column that successfully returned the last page.
Definition RColumn.hxx:75
CppT * Map(const ROOT::NTupleSize_t globalIndex)
Definition RColumn.hxx:229
CppT * MapV(RNTupleLocalIndex localIndex, ROOT::NTupleSize_t &nItems)
Definition RColumn.hxx:255
ROOT::Experimental::Internal::RPageStorage::ColumnHandle_t fHandleSink
Definition RColumn.hxx:50
void ConnectPageSource(ROOT::DescriptorId_t fieldId, ROOT::Experimental::Internal::RPageSource &pageSource)
Connect the column to a page source.
Definition RColumn.cxx:59
RNTupleLocalIndex GetClusterIndex(ROOT::NTupleSize_t globalIndex)
Definition RColumn.hxx:275
RColumn(const RColumn &)=delete
std::uint16_t fRepresentationIndex
Fields can have multiple column representations, distinguished by representation index.
Definition RColumn.hxx:47
ROOT::Internal::RColumnElementBase * GetElement() const
Definition RColumn.hxx:341
ROOT::Experimental::Internal::RPageSink * fPageSink
Definition RColumn.hxx:48
void SetBitsOnStorage(std::size_t bits)
Definition RColumn.hxx:362
void Read(const ROOT::NTupleSize_t globalIndex, void *to)
Definition RColumn.hxx:162
CppT * Map(RNTupleLocalIndex localIndex)
Definition RColumn.hxx:236
ROOT::ENTupleColumnType GetType() const
Definition RColumn.hxx:342
ROOT::Experimental::Internal::RPageStorage::ColumnHandle_t fHandleSource
Definition RColumn.hxx:51
ROOT::NTupleSize_t GetFirstElementIndex() const
Definition RColumn.hxx:356
bool ReadPageContains(RNTupleLocalIndex localIndex) const
Definition RColumn.hxx:336
void GetCollectionInfo(const ROOT::NTupleSize_t globalIndex, RNTupleLocalIndex *collectionStart, ROOT::NTupleSize_t *collectionSize)
For offset columns only, look at the two adjacent values that define a collection's coordinates.
Definition RColumn.hxx:285
void AppendV(const void *from, std::size_t count)
Definition RColumn.hxx:140
void ReadV(ROOT::NTupleSize_t globalIndex, ROOT::NTupleSize_t count, void *to)
Definition RColumn.hxx:184
std::size_t GetWritePageCapacity() const
Definition RColumn.hxx:363
ROOT::NTupleSize_t GetNElements() const
Definition RColumn.hxx:340
void SetValueRange(double min, double max)
Definition RColumn.hxx:364
ROOT::DescriptorId_t GetOnDiskId() const
Definition RColumn.hxx:355
ROOT::Internal::RPageRef fReadPageRef
The currently mapped page for reading.
Definition RColumn.hxx:62
ROOT::Internal::RPage fWritePage
The page into which new elements are being written.
Definition RColumn.hxx:56
ROOT::Experimental::Internal::RPageSource * fPageSource
Definition RColumn.hxx:49
ROOT::Experimental::Internal::RPageSource * GetPageSource() const
Definition RColumn.hxx:357
CppT * MapV(const ROOT::NTupleSize_t globalIndex, ROOT::NTupleSize_t &nItems)
Definition RColumn.hxx:243
ROOT::Experimental::Internal::RPageStorage::ColumnHandle_t GetHandleSource() const
Definition RColumn.hxx:359
ROOT::DescriptorId_t fOnDiskId
The column id in the column descriptor, once connected to a sink or source.
Definition RColumn.hxx:64
std::uint32_t fIndex
Columns belonging to the same field are distinguished by their order.
Definition RColumn.hxx:45
bool TryMapPage(ROOT::NTupleSize_t globalIndex)
Definition RColumn.cxx:87
ROOT::Experimental::Internal::RPageStorage::ColumnHandle_t GetHandleSink() const
Definition RColumn.hxx:360
ROOT::NTupleSize_t fFirstElementIndex
Global index of the first element in this column; usually == 0, unless it is a deferred column.
Definition RColumn.hxx:66
ROOT::NTupleSize_t fNElements
The number of elements written resp. available in the column.
Definition RColumn.hxx:60
void MapPage(ROOT::NTupleSize_t globalIndex)
Definition RColumn.hxx:330
std::uint16_t GetBitsOnStorage() const
Definition RColumn.hxx:343
std::uint32_t GetIndex() const
Definition RColumn.hxx:353
void Append(const void *from)
Definition RColumn.hxx:128
std::unique_ptr< ROOT::Internal::RColumnElementBase > fElement
Used to pack and unpack pages on writing/reading.
Definition RColumn.hxx:68
void ConnectPageSink(ROOT::DescriptorId_t fieldId, ROOT::Experimental::Internal::RPageSink &pageSink, ROOT::NTupleSize_t firstElementIndex=0U)
Connect the column to a page sink.
Definition RColumn.cxx:42
void MapPage(RNTupleLocalIndex localIndex)
Definition RColumn.hxx:331
ROOT::ENTupleColumnType fType
Definition RColumn.hxx:42
ROOT::NTupleSize_t fInitialNElements
The initial number of elements in a page.
Definition RColumn.hxx:58
Reference to a page stored in the page pool.
const RPage & Get() const
A page is a slice of a column that is mapped into memory.
Definition RPage.hxx:46
std::uint32_t GetNElements() const
Definition RPage.hxx:123
std::size_t GetNBytes() const
The space taken by column elements in the buffer.
Definition RPage.hxx:114
void * GrowUnchecked(std::uint32_t nElements)
Increases the number elements in the page.
Definition RPage.hxx:152
void * GetBuffer() const
Definition RPage.hxx:145
std::uint32_t GetMaxElements() const
Definition RPage.hxx:124
std::size_t GetCapacity() const
Definition RPage.hxx:118
Addresses a column element or field item relative to a particular cluster, instead of a global NTuple...
std::uint64_t DescriptorId_t
Distriniguishes elements of the same type within a descriptor, e.g. different fields.
std::uint64_t NTupleSize_t
Integer type long enough to hold the maximum number of entries in a column.
constexpr DescriptorId_t kInvalidDescriptorId