Logo ROOT  
Reference Guide
 
Loading...
Searching...
No Matches
RNTupleJoinTable.cxx
Go to the documentation of this file.
1/// \file RNTupleJoinTable.cxx
2/// \ingroup NTuple
3/// \author Florine de Geus <florine.de.geus@cern.ch>
4/// \date 2024-04-02
5/// \warning This is part of the ROOT 7 prototype! It will change without notice. It might trigger earthquakes. Feedback
6/// is welcome!
7
8/*************************************************************************
9 * Copyright (C) 1995-2024, Rene Brun and Fons Rademakers. *
10 * All rights reserved. *
11 * *
12 * For the licensing terms see $ROOTSYS/LICENSE. *
13 * For the list of contributors see $ROOTSYS/README/CREDITS. *
14 *************************************************************************/
15
17
18namespace {
20{
22
23 switch (fieldValueSize) {
24 case 1: value = *reinterpret_cast<std::uint8_t *>(valuePtr); break;
25 case 2: value = *reinterpret_cast<std::uint16_t *>(valuePtr); break;
26 case 4: value = *reinterpret_cast<std::uint32_t *>(valuePtr); break;
27 case 8: value = *reinterpret_cast<std::uint64_t *>(valuePtr); break;
28 default: throw ROOT::RException(R__FAIL("value size not supported"));
29 }
30
31 return value;
32}
33} // anonymous namespace
34
36 ROOT::Internal::RPageSource &pageSource, const std::vector<std::string> &joinFieldNames)
37 : fJoinFieldNames(joinFieldNames)
38{
39 static const std::unordered_set<std::string> allowedTypes = {"std::int8_t", "std::int16_t", "std::int32_t",
40 "std::int64_t", "std::uint8_t", "std::uint16_t",
41 "std::uint32_t", "std::uint64_t"};
42
43 pageSource.Attach();
44 auto desc = pageSource.GetSharedDescriptorGuard();
45
46 std::vector<std::unique_ptr<ROOT::RFieldBase>> fields;
47 std::vector<ROOT::RFieldBase::RValue> fieldValues;
48 fieldValues.reserve(fJoinFieldNames.size());
49
50 for (const auto &fieldName : fJoinFieldNames) {
51 auto fieldId = desc->FindFieldId(fieldName);
53 throw RException(R__FAIL("could not find join field \"" + std::string(fieldName) + "\" in RNTuple \"" +
54 pageSource.GetNTupleName() + "\""));
55
56 const auto &fieldDesc = desc->GetFieldDescriptor(fieldId);
57
58 if (allowedTypes.find(fieldDesc.GetTypeName()) == allowedTypes.end()) {
59 throw RException(R__FAIL("cannot use field \"" + fieldName + "\" with type \"" + fieldDesc.GetTypeName() +
60 "\" in join table: only integral types are allowed"));
61 }
62
63 auto field = fieldDesc.CreateField(desc.GetRef());
65
66 fieldValues.emplace_back(field->CreateValue());
67 fJoinFieldValueSizes.emplace_back(field->GetValueSize());
68 fields.emplace_back(std::move(field));
69 }
70
71 std::vector<JoinValue_t> castJoinValues;
72 castJoinValues.reserve(fJoinFieldNames.size());
73
74 for (unsigned i = 0; i < pageSource.GetNEntries(); ++i) {
75 castJoinValues.clear();
76
77 for (auto &fieldValue : fieldValues) {
78 // TODO(fdegeus): use bulk reading
79 fieldValue.Read(i);
80
81 auto valuePtr = fieldValue.GetPtr<void>();
82 castJoinValues.push_back(CastValuePtr(valuePtr.get(), fieldValue.GetField().GetValueSize()));
83 }
84
86 }
87}
88
89const std::vector<ROOT::NTupleSize_t> *
90ROOT ::Experimental::Internal::RNTupleJoinTable::REntryMapping::GetEntryIndexes(std::vector<void *> valuePtrs) const
91{
92 if (valuePtrs.size() != fJoinFieldNames.size())
93 throw RException(R__FAIL("number of value pointers must match number of join fields"));
94
95 std::vector<JoinValue_t> castJoinValues;
96 castJoinValues.reserve(valuePtrs.size());
97
98 for (unsigned i = 0; i < valuePtrs.size(); ++i) {
99 castJoinValues.push_back(CastValuePtr(valuePtrs[i], fJoinFieldValueSizes[i]));
100 }
101
102 if (const auto &entries = fMapping.find(RCombinedJoinFieldValue(castJoinValues)); entries != fMapping.end()) {
103 return &entries->second;
104 }
105
106 return nullptr;
107}
108
109//------------------------------------------------------------------------------
110
111std::unique_ptr<ROOT::Experimental::Internal::RNTupleJoinTable>
113{
114 return std::unique_ptr<RNTupleJoinTable>(new RNTupleJoinTable(fieldNames));
115}
116
126
127std::vector<ROOT::NTupleSize_t>
130{
132 if (partition == fPartitions.end())
133 return {};
134
135 std::vector<ROOT::NTupleSize_t> entryIdxs{};
136
137 for (const auto &joinMapping : partition->second) {
138 auto entriesForMapping = joinMapping->GetEntryIndexes(valuePtrs);
141 }
142
143 return entryIdxs;
144}
145
146std::unordered_map<ROOT::Experimental::Internal::RNTupleJoinTable::PartitionKey_t, std::vector<ROOT::NTupleSize_t>>
148 const std::vector<void *> &valuePtrs, const std::vector<PartitionKey_t> &partitionKeys) const
149{
150 std::unordered_map<PartitionKey_t, std::vector<ROOT::NTupleSize_t>> entryIdxs{};
151
152 for (const auto &partitionKey : partitionKeys) {
154 if (!entriesForPartition.empty()) {
157 }
158 }
159
160 return entryIdxs;
161}
162
163std::unordered_map<ROOT::Experimental::Internal::RNTupleJoinTable::PartitionKey_t, std::vector<ROOT::NTupleSize_t>>
165{
166 std::unordered_map<PartitionKey_t, std::vector<ROOT::NTupleSize_t>> entryIdxs{};
167
168 for (const auto &partition : fPartitions) {
169 for (const auto &joinMapping : partition.second) {
170 auto entriesForMapping = joinMapping->GetEntryIndexes(valuePtrs);
171 if (entriesForMapping) {
174 }
175 }
176 }
177
178 return entryIdxs;
179}
#define R__FAIL(msg)
Short-hand to return an RResult<T> in an error state; the RError is implicitly converted into RResult...
Definition RError.hxx:299
ROOT::Detail::TRangeCast< T, true > TRangeDynCast
TRangeDynCast is an adapter class that allows the typed iteration through a TCollection.
Option_t Option_t TPoint TPoint const char GetTextMagnitude GetFillStyle GetLineColor GetLineWidth GetMarkerStyle GetTextAlign GetTextColor GetTextSize void value
Provides a mapping from one or several join field values to an entry index.
std::vector< std::size_t > fJoinFieldValueSizes
The size (in bytes) for each join field, corresponding to fJoinFieldNames.
std::vector< std::string > fJoinFieldNames
Names of the join fields used for the mapping to their respective entry indexes.
REntryMapping(ROOT::Internal::RPageSource &pageSource, const std::vector< std::string > &joinFieldNames)
Create a new entry mapping.
std::unordered_map< RCombinedJoinFieldValue, std::vector< ROOT::NTupleSize_t >, RCombinedJoinFieldValueHash > fMapping
The mapping itself.
Builds a join table on one or several fields of an RNTuple so it can be joined onto other RNTuples.
std::unordered_map< PartitionKey_t, std::vector< ROOT::NTupleSize_t > > GetPartitionedEntryIndexes(const std::vector< void * > &valuePtrs, const std::vector< PartitionKey_t > &partitionKeys) const
Get all entry indexes for the given join field value(s) for a specific set of partitions.
std::vector< ROOT::NTupleSize_t > GetEntryIndexes(const std::vector< void * > &valuePtrs, PartitionKey_t partitionKey=kDefaultPartitionKey) const
Get all entry indexes for the given join field value(s) within a partition.
RNTupleJoinTable & Add(ROOT::Internal::RPageSource &pageSource, PartitionKey_t partitionKey=kDefaultPartitionKey)
Add an entry mapping to the join table.
static std::unique_ptr< RNTupleJoinTable > Create(const std::vector< std::string > &joinFieldNames)
Create an RNTupleJoinTable from an existing RNTuple.
std::vector< std::string > fJoinFieldNames
Names of the join fields used for the mapping to their respective entry indexes.
RNTupleJoinTable(const std::vector< std::string > &joinFieldNames)
Create an a new RNTupleJoinTable for the RNTuple represented by the provided page source.
std::unordered_map< PartitionKey_t, std::vector< std::unique_ptr< REntryMapping > > > fPartitions
Partitions of one or multiple entry mappings.
Abstract interface to read data from an ntuple.
Base class for all ROOT issued exceptions.
Definition RError.hxx:79
const_iterator begin() const
const_iterator end() const
void CallConnectPageSourceOnField(RFieldBase &, ROOT::Internal::RPageSource &)
constexpr DescriptorId_t kInvalidDescriptorId