From 2b4b65b6cd15337b304f4cd2a11dadb265cff8d7 Mon Sep 17 00:00:00 2001
From: Bernhard Manfred Gruber <bernhardmgruber@gmail.com>
Date: Sun, 7 Mar 2021 17:44:36 +0100
Subject: [PATCH 1/4] support sub arrays of dynamic size as field type

* allow dynamic field types in the record dimension
* add specializations to most of the core functions
* add llama::dynamic to signal a dynamic array member in a RecordCoord
* extend VirtualRecord to allow holding dynamic indices
* extend blobNrAndOffset to allow for additional dynamic indices
* add OffsetTable mapping
* add customization allowing to dump OffsetTable mappings
* add a few unit tests
---
 examples/bufferguard/bufferguard.cpp   |   8 +-
 include/llama/Concepts.hpp             |   2 +-
 include/llama/Core.hpp                 |  53 ++++
 include/llama/DumpMapping.hpp          |  22 +-
 include/llama/Proofs.hpp               |   6 +-
 include/llama/RecordCoord.hpp          |   3 +
 include/llama/View.hpp                 |  28 +-
 include/llama/VirtualRecord.hpp        |  92 ++++++-
 include/llama/llama.hpp                |   1 +
 include/llama/mapping/AoS.hpp          |   8 +-
 include/llama/mapping/AoSoA.hpp        |   8 +-
 include/llama/mapping/Bytesplit.hpp    |  18 +-
 include/llama/mapping/Heatmap.hpp      |  10 +-
 include/llama/mapping/OffsetTable.hpp  | 361 +++++++++++++++++++++++++
 include/llama/mapping/One.hpp          |   8 +-
 include/llama/mapping/SoA.hpp          |  12 +-
 include/llama/mapping/Split.hpp        |  13 +-
 include/llama/mapping/Trace.hpp        |  10 +-
 include/llama/mapping/tree/Mapping.hpp |   8 +-
 tests/computedprop.cpp                 |  15 +-
 tests/core.cpp                         |  29 +-
 tests/mapping.cpp                      |   2 +-
 tests/proofs.cpp                       |  16 +-
 tests/recorddimension.cpp              | 217 +++++++++++++++
 tests/virtualrecord.cpp                |   2 +-
 25 files changed, 876 insertions(+), 76 deletions(-)
 create mode 100644 include/llama/mapping/OffsetTable.hpp
diff --git a/examples/bufferguard/bufferguard.cpp b/examples/bufferguard/bufferguard.cpp
index eec01096f9..d9c20a1960 100644
--- a/examples/bufferguard/bufferguard.cpp
+++ b/examples/bufferguard/bufferguard.cpp
@@ -68,9 +68,11 @@ struct GuardMapping2D : llama::ArrayExtentsDynamic<2>
         std::abort();
     }
 
-    template<std::size_t... RecordCoords>
-    constexpr auto blobNrAndOffset(ArrayIndex ai, llama::RecordCoord<RecordCoords...> rc = {}) const
-        -> llama::NrAndOffset
+    template<std::size_t... RecordCoords, std::size_t N = 0>
+    constexpr auto blobNrAndOffset(
+        ArrayIndex ai,
+        llama::Array<std::size_t, N> = {},
+        llama::RecordCoord<RecordCoords...> rc = {}) const -> llama::NrAndOffset
     {
         // [0][0] is at left top
         const auto [row, col] = ai;
diff --git a/include/llama/Concepts.hpp b/include/llama/Concepts.hpp
index 70a8efaf6f..ce7f029e0c 100644
--- a/include/llama/Concepts.hpp
+++ b/include/llama/Concepts.hpp
@@ -23,7 +23,7 @@ namespace llama
         { m.blobSize(std::size_t{}) } -> std::same_as<std::size_t>;
         { m.blobNrAndOffset(typename M::ArrayIndex{}) } -> std::same_as<NrAndOffset>;
         { m.template blobNrAndOffset<0>(typename M::ArrayIndex{}) } -> std::same_as<NrAndOffset>;
-        { m.blobNrAndOffset(typename M::ArrayIndex{}, llama::RecordCoord<0>{}) } -> std::same_as<NrAndOffset>;
+        { m.blobNrAndOffset(typename M::ArrayIndex{}, {}, llama::RecordCoord<0>{}) } -> std::same_as<NrAndOffset>;
     };
     // clang-format on
 
diff --git a/include/llama/Core.hpp b/include/llama/Core.hpp
index fb41824e60..22cfab0cb7 100644
--- a/include/llama/Core.hpp
+++ b/include/llama/Core.hpp
@@ -30,6 +30,15 @@ namespace llama
     template<typename T>
     inline constexpr bool isAllowedFieldType = std::is_trivially_destructible_v<T>;
 
+    template<typename... Fields>
+    inline constexpr bool isAllowedFieldType<Record<Fields...>> = true;
+
+    template<typename T, std::size_t N>
+    inline constexpr bool isAllowedFieldType<T[N]> = isAllowedFieldType<T>;
+
+    template<typename T>
+    inline constexpr bool isAllowedFieldType<T[]> = isAllowedFieldType<T>;
+
     /// Record dimension tree node which may either be a leaf or refer to a child tree presented as another \ref
     /// Record.
     /// \tparam Tag Name of the node. May be any type (struct, class).
@@ -101,6 +110,14 @@ namespace llama
                 = boost::mp11::mp_push_front<typename GetTagsImpl<ChildType, RecordCoord<Coords...>>::type, ChildTag>;
         };
 
+        template<typename ChildType, std::size_t... Coords>
+        struct GetTagsImpl<ChildType[], RecordCoord<dynamic, Coords...>>
+        {
+            using ChildTag = RecordCoord<dynamic>;
+            using type
+                = boost::mp11::mp_push_front<typename GetTagsImpl<ChildType, RecordCoord<Coords...>>::type, ChildTag>;
+        };
+
         template<typename T>
         struct GetTagsImpl<T, RecordCoord<>>
         {
@@ -198,6 +215,16 @@ namespace llama
                 typename GetCoordFromTagsImpl<ChildType, RecordCoord<ResultCoords..., FirstTag::front>, Tags...>::type;
         };
 
+        template<typename ChildType, std::size_t... ResultCoords, typename FirstTag, typename... Tags>
+        struct GetCoordFromTagsImpl<ChildType[], RecordCoord<ResultCoords...>, FirstTag, Tags...>
+        {
+            static_assert(
+                std::is_same_v<FirstTag, RecordCoord<dynamic>>,
+                "Please use a RecordCoord<dynamic> to index into dynamic arrays");
+            using type =
+                typename GetCoordFromTagsImpl<ChildType, RecordCoord<ResultCoords..., FirstTag::front>, Tags...>::type;
+        };
+
         template<typename RecordDim, typename RecordCoord>
         struct GetCoordFromTagsImpl<RecordDim, RecordCoord>
         {
@@ -242,6 +269,13 @@ namespace llama
             using type = typename GetTypeImpl<ChildType, RecordCoord<TailCoords...>>::type;
         };
 
+        template<typename ChildType, std::size_t HeadCoord, std::size_t... TailCoords>
+        struct GetTypeImpl<ChildType[], RecordCoord<HeadCoord, TailCoords...>>
+        {
+            static_assert(HeadCoord == dynamic, "Record coord at a dynamic array must be llama::dynamic");
+            using type = typename GetTypeImpl<ChildType, RecordCoord<TailCoords...>>::type;
+        };
+
         template<typename T>
         struct GetTypeImpl<T, RecordCoord<>>
         {
@@ -289,6 +323,12 @@ namespace llama
             }
             using type = decltype(help(std::make_index_sequence<N>{}));
         };
+
+        template<typename Child, std::size_t... RCs>
+        struct LeafRecordCoordsImpl<Child[], RecordCoord<RCs...>>
+        {
+            using type = typename LeafRecordCoordsImpl<Child, RecordCoord<RCs..., dynamic>>::type;
+        };
     } // namespace internal
 
     /// Returns a flat type list containing all record coordinates to all leaves of the given record dimension.
@@ -557,6 +597,19 @@ namespace llama
         struct IsBoundedArray<T[N]> : std::true_type
         {
         };
+
+        template<class T>
+        struct is_unbounded_array : std::false_type
+        {
+        };
+
+        template<class T>
+        struct is_unbounded_array<T[]> : std::true_type
+        {
+        };
+
+        template<typename T>
+        inline constexpr bool is_unbounded_array_v = is_unbounded_array<T>::value;
     } // namespace internal
 
     namespace internal
diff --git a/include/llama/DumpMapping.hpp b/include/llama/DumpMapping.hpp
index 02189401af..161e3cdef4 100644
--- a/include/llama/DumpMapping.hpp
+++ b/include/llama/DumpMapping.hpp
@@ -8,6 +8,7 @@
 
 #include "ArrayIndexRange.hpp"
 #include "Core.hpp"
+#include "mapping/OffsetTable.hpp"
 
 #include <boost/functional/hash.hpp>
 #include <fmt/format.h>
@@ -75,7 +76,7 @@ namespace llama
                             {ai,
                              internal::toVec(rc),
                              recordCoordTags<RecordDim>(rc),
-                             mapping.blobNrAndOffset(ai, rc),
+                             mapping.blobNrAndOffset(ai, {}, rc),
                              sizeof(GetType<RecordDim, decltype(rc)>)});
                     });
             }
@@ -83,6 +84,25 @@ namespace llama
             return infos;
         }
 
+        template<typename ArrayExtents, typename RecordDim, typename SubMappings>
+        auto boxesFromMapping(const mapping::OffsetTable<ArrayExtents, RecordDim, SubMappings>& mapping)
+            -> std::vector<FieldBox<ArrayExtents::rank>>
+        {
+            std::size_t previousBlobs = 0;
+            std::vector<FieldBox<ArrayExtents::rank>> infos;
+            boost::mp11::mp_for_each<boost::mp11::mp_iota<boost::mp11::mp_size<decltype(mapping.subMappings)>>>(
+                [&](auto ic)
+                {
+                    const auto& subMapping = get<decltype(ic)::value>(mapping.subMappings);
+                    auto subBoxes = boxesFromMapping(subMapping);
+                    for(auto& box : subBoxes)
+                        box.nrAndOffset.nr += previousBlobs;
+                    infos.insert(infos.end(), subBoxes.begin(), subBoxes.end());
+                    previousBlobs += std::decay_t<decltype(subMapping)>::blobCount;
+                });
+            return infos;
+        }
+
         template<std::size_t Dim>
         auto breakBoxes(std::vector<FieldBox<Dim>> boxes, std::size_t wrapByteCount) -> std::vector<FieldBox<Dim>>
         {
diff --git a/include/llama/Proofs.hpp b/include/llama/Proofs.hpp
index 0c0c71aba6..2568a9c40a 100644
--- a/include/llama/Proofs.hpp
+++ b/include/llama/Proofs.hpp
@@ -73,7 +73,8 @@ namespace llama
                                                           {
                                                               using Type
                                                                   = GetType<typename Mapping::RecordDim, decltype(rc)>;
-                                                              const auto [blob, offset] = m.blobNrAndOffset(ai, rc);
+                                                              const auto [blob, offset]
+                                                                  = m.blobNrAndOffset(ai, {}, rc);
                                                               for(std::size_t b = 0; b < sizeof(Type); b++)
                                                                   if(testAndSet(blob, offset + b))
                                                                   {
@@ -105,7 +106,8 @@ namespace llama
                                                           {
                                                               using Type
                                                                   = GetType<typename Mapping::RecordDim, decltype(rc)>;
-                                                              const auto [blob, offset] = m.blobNrAndOffset(ai, rc);
+                                                              const auto [blob, offset]
+                                                                  = m.blobNrAndOffset(ai, {}, rc);
                                                               if(flatIndex % PieceLength != 0
                                                                  && (lastBlob != blob
                                                                      || lastOffset + sizeof(Type) != offset))
diff --git a/include/llama/RecordCoord.hpp b/include/llama/RecordCoord.hpp
index 79600ba3a4..f104ed8169 100644
--- a/include/llama/RecordCoord.hpp
+++ b/include/llama/RecordCoord.hpp
@@ -6,11 +6,14 @@
 #include "Meta.hpp"
 
 #include <array>
+#include <limits>
 #include <ostream>
 #include <type_traits>
 
 namespace llama
 {
+    inline constexpr auto dynamic = std::numeric_limits<std::size_t>::max();
+
     /// Represents a coordinate for a record inside the record dimension tree.
     /// \tparam Coords... the compile time coordinate.
     template<std::size_t... Coords>
diff --git a/include/llama/View.hpp b/include/llama/View.hpp
index d101c426be..66f5c48746 100644
--- a/include/llama/View.hpp
+++ b/include/llama/View.hpp
@@ -342,12 +342,12 @@ namespace llama
             if constexpr(isRecord<RecordDim> || internal::IsBoundedArray<RecordDim>::value)
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return VirtualRecord<const View>{ai, *this};
+                return VirtualRecord<const View>{*this, ai};
             }
             else
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return accessor(ai, RecordCoord<>{});
+                return accessor(ai, Array<size_t, 0>{}, RecordCoord<>{});
             }
         }
 
@@ -356,12 +356,12 @@ namespace llama
             if constexpr(isRecord<RecordDim> || internal::IsBoundedArray<RecordDim>::value)
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return VirtualRecord<View>{ai, *this};
+                return VirtualRecord<View>{*this, ai};
             }
             else
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return accessor(ai, RecordCoord<>{});
+                return accessor(ai, Array<size_t, 0>{}, RecordCoord<>{});
             }
         }
 
@@ -451,28 +451,34 @@ namespace llama
         friend struct VirtualRecord;
 
         LLAMA_SUPPRESS_HOST_DEVICE_WARNING
-        template<std::size_t... Coords>
-        LLAMA_FN_HOST_ACC_INLINE auto accessor(ArrayIndex ai, RecordCoord<Coords...> rc = {}) const -> decltype(auto)
+        template<std::size_t N, std::size_t... Coords>
+        LLAMA_FN_HOST_ACC_INLINE auto accessor(
+            ArrayIndex ai,
+            Array<size_t, N> dynamicArrayExtents,
+            RecordCoord<Coords...> rc = {}) const -> decltype(auto)
         {
             if constexpr(llama::isComputed<Mapping, RecordCoord<Coords...>>)
                 return mapping().compute(ai, rc, storageBlobs);
             else
             {
-                const auto [nr, offset] = mapping().blobNrAndOffset(ai, rc);
+                const auto [nr, offset] = mapping().blobNrAndOffset(ai, dynamicArrayExtents, rc);
                 using Type = GetType<RecordDim, RecordCoord<Coords...>>;
                 return reinterpret_cast<const Type&>(storageBlobs[nr][offset]);
             }
         }
 
         LLAMA_SUPPRESS_HOST_DEVICE_WARNING
-        template<std::size_t... Coords>
-        LLAMA_FN_HOST_ACC_INLINE auto accessor(ArrayIndex ai, RecordCoord<Coords...> rc = {}) -> decltype(auto)
+        template<std::size_t N, std::size_t... Coords>
+        LLAMA_FN_HOST_ACC_INLINE auto accessor(
+            ArrayIndex ai,
+            Array<size_t, N> dynamicArrayExtents,
+            RecordCoord<Coords...> rc = {}) -> decltype(auto)
         {
             if constexpr(llama::isComputed<Mapping, RecordCoord<Coords...>>)
-                return mapping().compute(ai, rc, storageBlobs);
+                return mapping().compute(ai, dynamicArrayExtents, rc, storageBlobs);
             else
             {
-                const auto [nr, offset] = mapping().blobNrAndOffset(ai, rc);
+                const auto [nr, offset] = mapping().blobNrAndOffset(ai, dynamicArrayExtents, rc);
                 using Type = GetType<RecordDim, RecordCoord<Coords...>>;
                 using QualifiedType = std::conditional_t<
                     std::is_const_v<std::remove_reference_t<decltype(storageBlobs[nr][offset])>>,
diff --git a/include/llama/VirtualRecord.hpp b/include/llama/VirtualRecord.hpp
index 17cf0b55b1..21e662fc82 100644
--- a/include/llama/VirtualRecord.hpp
+++ b/include/llama/VirtualRecord.hpp
@@ -308,6 +308,21 @@ namespace llama
         template<typename T, template<typename...> typename Tuple, typename... Args>
         constexpr inline auto
             isDirectListInitializableFromTuple<T, Tuple<Args...>> = isDirectListInitializable<T, Args...>;
+
+        template<typename RecordDim, typename RecordCoord>
+        constexpr inline auto unboundArraysUntil = []() constexpr
+        {
+            std::size_t count = 0;
+            boost::mp11::mp_for_each<boost::mp11::mp_iota_c<RecordCoord::size>>(
+                [&](auto i) constexpr
+                {
+                    using RC = RecordCoordFromList<boost::mp11::mp_take_c<typename RecordCoord::List, i>>;
+                    using TypeAtRC = GetType<RecordDim, RC>;
+                    count += static_cast<std::size_t>(internal::is_unbounded_array_v<TypeAtRC>);
+                });
+            return count;
+        }
+        ();
     } // namespace internal
 
     /// Virtual record type returned by \ref View after resolving an array dimensions coordinate or partially resolving
@@ -325,7 +340,12 @@ namespace llama
     private:
         using ArrayIndex = typename View::Mapping::ArrayIndex;
         using RecordDim = typename View::Mapping::RecordDim;
+        using DynamicArrayExtentsArray = Array<std::size_t, internal::unboundArraysUntil<RecordDim, BoundRecordCoord>>;
 
+#ifndef __NVCC__
+        [[no_unique_address]]
+#endif
+        const DynamicArrayExtentsArray dynamicArrayExtents;
         std::conditional_t<OwnView, View, View&> view;
 
     public:
@@ -337,14 +357,19 @@ namespace llama
         LLAMA_FN_HOST_ACC_INLINE VirtualRecord()
             /* requires(OwnView) */
             : ArrayIndex{}
+            , dynamicArrayExtents({})
             , view{allocViewStack<0, RecordDim>()}
         {
             static_assert(OwnView, "The default constructor of VirtualRecord is only available if it owns the view.");
         }
 
         LLAMA_FN_HOST_ACC_INLINE
-        VirtualRecord(ArrayIndex ai, std::conditional_t<OwnView, View&&, View&> view)
+        VirtualRecord(
+            std::conditional_t<OwnView, View&&, View&> view,
+            ArrayIndex ai,
+            DynamicArrayExtentsArray dynamicArrayExtents = {})
             : ArrayIndex{ai}
+            , dynamicArrayExtents{dynamicArrayExtents}
             , view{static_cast<decltype(view)>(view)}
         {
         }
@@ -406,15 +431,21 @@ namespace llama
         {
             using AbsolutCoord = Cat<BoundRecordCoord, RecordCoord<Coord...>>;
             using AccessedType = GetType<RecordDim, AbsolutCoord>;
-            if constexpr(isRecord<AccessedType> || internal::IsBoundedArray<AccessedType>::value)
+            if constexpr(
+                isRecord<AccessedType> || internal::IsBoundedArray<AccessedType>::value
+                || internal::is_unbounded_array_v<AccessedType>)
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return VirtualRecord<const View, AbsolutCoord>{arrayIndex(), this->view};
+                return VirtualRecord<const View, AbsolutCoord>{
+                    this->view,
+                    arrayIndex(),
+                    dynamicArrayExtents,
+                };
             }
             else
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return this->view.accessor(arrayIndex(), AbsolutCoord{});
+                return this->view.accessor(arrayIndex(), dynamicArrayExtents, AbsolutCoord{});
             }
         }
 
@@ -424,22 +455,24 @@ namespace llama
         {
             using AbsolutCoord = Cat<BoundRecordCoord, RecordCoord<Coord...>>;
             using AccessedType = GetType<RecordDim, AbsolutCoord>;
-            if constexpr(isRecord<AccessedType> || internal::IsBoundedArray<AccessedType>::value)
+            if constexpr(
+                isRecord<AccessedType> || internal::IsBoundedArray<AccessedType>::value
+                || internal::is_unbounded_array_v<AccessedType>)
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return VirtualRecord<View, AbsolutCoord>{arrayIndex(), this->view};
+                return VirtualRecord<View, AbsolutCoord>{this->view, arrayIndex(), dynamicArrayExtents};
             }
             else
             {
                 LLAMA_FORCE_INLINE_RECURSIVE
-                return this->view.accessor(arrayIndex(), AbsolutCoord{});
+                return this->view.accessor(arrayIndex(), dynamicArrayExtents, AbsolutCoord{});
             }
         }
 
         /// Access a record in the record dimension underneath the current virtual record using a series of tags. If
         /// the access resolves to a leaf, a reference to a variable inside the \ref View storage is returned,
         /// otherwise another virtual record.
-        template<typename... Tags>
+        template<typename... Tags, std::enable_if_t<!std::disjunction_v<std::is_integral<Tags>...>, bool> = true>
         LLAMA_FN_HOST_ACC_INLINE auto operator()(Tags...) const -> decltype(auto)
         {
             using RecordCoord = GetCoordFromTags<AccessibleRecordDim, Tags...>;
@@ -449,7 +482,7 @@ namespace llama
         }
 
         // FIXME(bgruber): remove redundancy
-        template<typename... Tags>
+        template<typename... Tags, std::enable_if_t<!std::disjunction_v<std::is_integral<Tags>...>, bool> = true>
         LLAMA_FN_HOST_ACC_INLINE auto operator()(Tags...) -> decltype(auto)
         {
             using RecordCoord = GetCoordFromTags<AccessibleRecordDim, Tags...>;
@@ -458,6 +491,47 @@ namespace llama
             return operator()(RecordCoord{});
         }
 
+        template<
+            typename ADD = AccessibleRecordDim,
+            std::enable_if_t<internal::is_unbounded_array_v<ADD>, bool> = true>
+        LLAMA_FN_HOST_ACC_INLINE auto operator()(std::size_t i) const -> decltype(auto)
+        {
+            using AbsolutCoord = Cat<BoundRecordCoord, RecordCoord<dynamic>>;
+            using ResolvedType = GetType<RecordDim, AbsolutCoord>;
+            auto newDynamicArrayExtents = push_back(dynamicArrayExtents, i);
+            if constexpr(isRecord<ResolvedType> || internal::is_unbounded_array_v<ResolvedType>)
+            {
+                LLAMA_FORCE_INLINE_RECURSIVE
+                return VirtualRecord<const View, AbsolutCoord>{this->view, arrayIndex(), newDynamicArrayExtents};
+            }
+            else
+            {
+                LLAMA_FORCE_INLINE_RECURSIVE
+                return this->view.accessor(arrayIndex(), newDynamicArrayExtents, AbsolutCoord{});
+            }
+        }
+
+        // FIXME(bgruber): remove redundancy
+        template<
+            typename ADD = AccessibleRecordDim,
+            std::enable_if_t<internal::is_unbounded_array_v<ADD>, bool> = true>
+        LLAMA_FN_HOST_ACC_INLINE auto operator()(std::size_t i) -> decltype(auto)
+        {
+            using AbsolutCoord = Cat<BoundRecordCoord, RecordCoord<dynamic>>;
+            using ResolvedType = GetType<RecordDim, AbsolutCoord>;
+            auto newDynamicArrayExtents = push_back(dynamicArrayExtents, i);
+            if constexpr(isRecord<ResolvedType> || internal::is_unbounded_array_v<ResolvedType>)
+            {
+                LLAMA_FORCE_INLINE_RECURSIVE
+                return VirtualRecord<View, AbsolutCoord>{this->view, arrayIndex(), newDynamicArrayExtents};
+            }
+            else
+            {
+                LLAMA_FORCE_INLINE_RECURSIVE
+                return this->view.accessor(arrayIndex(), newDynamicArrayExtents, AbsolutCoord{});
+            }
+        }
+
         template<typename T>
         LLAMA_FN_HOST_ACC_INLINE auto operator=(const T& other) -> VirtualRecord&
         {
diff --git a/include/llama/llama.hpp b/include/llama/llama.hpp
index 5ef2c3db58..365fc13d10 100644
--- a/include/llama/llama.hpp
+++ b/include/llama/llama.hpp
@@ -49,6 +49,7 @@
 #include "mapping/AoSoA.hpp"
 #include "mapping/Bytesplit.hpp"
 #include "mapping/Heatmap.hpp"
+#include "mapping/OffsetTable.hpp"
 #include "mapping/One.hpp"
 #include "mapping/SoA.hpp"
 #include "mapping/Split.hpp"
diff --git a/include/llama/mapping/AoS.hpp b/include/llama/mapping/AoS.hpp
index c3da773550..60a7a7d8ef 100644
--- a/include/llama/mapping/AoS.hpp
+++ b/include/llama/mapping/AoS.hpp
@@ -47,9 +47,11 @@ namespace llama::mapping
                 * flatSizeOf<typename Flattener::FlatRecordDim, AlignAndPad>;
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             constexpr std::size_t flatFieldIndex =
 #ifdef __NVCC__
diff --git a/include/llama/mapping/AoSoA.hpp b/include/llama/mapping/AoSoA.hpp
index c96a258bd7..cdfc60b67a 100644
--- a/include/llama/mapping/AoSoA.hpp
+++ b/include/llama/mapping/AoSoA.hpp
@@ -61,9 +61,11 @@ namespace llama::mapping
                 Lanes * sizeOf<RecordDim>);
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             constexpr std::size_t flatFieldIndex =
 #ifdef __NVCC__
diff --git a/include/llama/mapping/Bytesplit.hpp b/include/llama/mapping/Bytesplit.hpp
index 0b1f804ef0..024bf98e9a 100644
--- a/include/llama/mapping/Bytesplit.hpp
+++ b/include/llama/mapping/Bytesplit.hpp
@@ -40,11 +40,12 @@ namespace llama::mapping
             return true;
         }
 
-        template<typename QualifiedBase, typename RC, typename BlobArray>
+        template<typename QualifiedBase, std::size_t N, typename RC, typename BlobArray>
         struct Reference
         {
             QualifiedBase& innerMapping;
             ArrayIndex ai;
+            llama::Array<std::size_t, N> dynamicArrayExtents;
             BlobArray& blobs;
 
             using DstType = GetType<TRecordDim, RC>;
@@ -58,7 +59,8 @@ namespace llama::mapping
                     [&](auto ic)
                     {
                         constexpr auto i = decltype(ic)::value;
-                        const auto [nr, off] = innerMapping.blobNrAndOffset(ai, Cat<RC, RecordCoord<i>>{});
+                        const auto [nr, off]
+                            = innerMapping.blobNrAndOffset(ai, dynamicArrayExtents, Cat<RC, RecordCoord<i>>{});
                         p[i] = blobs[nr][off];
                     });
                 return v;
@@ -71,20 +73,26 @@ namespace llama::mapping
                     [&](auto ic)
                     {
                         constexpr auto i = decltype(ic)::value;
-                        const auto [nr, off] = innerMapping.blobNrAndOffset(ai, Cat<RC, RecordCoord<i>>{});
+                        const auto [nr, off]
+                            = innerMapping.blobNrAndOffset(ai, dynamicArrayExtents, Cat<RC, RecordCoord<i>>{});
                         blobs[nr][off] = p[i];
                     });
                 return *this;
             }
         };
 
-        template<std::size_t... RecordCoords, typename BlobArray>
+        template<std::size_t... RecordCoords, std::size_t N, typename BlobArray>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto compute(
             typename Inner::ArrayIndex ai,
+            llama::Array<std::size_t, N> dynamicArrayExtents,
             RecordCoord<RecordCoords...>,
             BlobArray& blobs) const
         {
-            return Reference<decltype(*this), RecordCoord<RecordCoords...>, BlobArray>{*this, ai, blobs};
+            return Reference<decltype(*this), N, RecordCoord<RecordCoords...>, BlobArray>{
+                *this,
+                ai,
+                dynamicArrayExtents,
+                blobs};
         }
     };
 } // namespace llama::mapping
diff --git a/include/llama/mapping/Heatmap.hpp b/include/llama/mapping/Heatmap.hpp
index 002d6413c4..1bb5256d6c 100644
--- a/include/llama/mapping/Heatmap.hpp
+++ b/include/llama/mapping/Heatmap.hpp
@@ -47,11 +47,13 @@ namespace llama::mapping
             return mapping.blobSize(i);
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> rc = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> dynamicArrayExtents = {},
+            RecordCoord<RecordCoords...> rc = {}) const -> NrAndOffset
         {
-            const auto nao = mapping.blobNrAndOffset(ai, rc);
+            const auto nao = mapping.blobNrAndOffset(ai, dynamicArrayExtents, rc);
             for(std::size_t i = 0; i < sizeof(GetType<RecordDim, RecordCoord<RecordCoords...>>); i++)
                 byteHits[nao.nr][nao.offset + i]++;
             return nao;
diff --git a/include/llama/mapping/OffsetTable.hpp b/include/llama/mapping/OffsetTable.hpp
new file mode 100644
index 0000000000..ef4e156752
--- /dev/null
+++ b/include/llama/mapping/OffsetTable.hpp
@@ -0,0 +1,361 @@
+// SPDX-License-Identifier: GPL-3.0-or-later
+
+#pragma once
+
+#include "../Meta.hpp"
+#include "../Tuple.hpp"
+#include "AoS.hpp"
+#include "Common.hpp"
+
+namespace llama
+{
+    using EndOffsetType = std::size_t;
+    using SizeType = std::size_t;
+
+    template<typename Tag>
+    struct EndOffset
+    {
+    };
+    template<typename Tag>
+    struct Size
+    {
+    };
+} // namespace llama
+
+namespace llama::mapping
+{
+    namespace internal
+    {
+        using namespace boost::mp11;
+
+        template<typename T>
+        inline constexpr bool isEndOffsetField = false;
+
+        template<typename Tag>
+        inline constexpr bool isEndOffsetField<EndOffset<Tag>> = true;
+
+        template<typename T>
+        inline constexpr bool isSizeField = false;
+
+        template<typename Tag>
+        inline constexpr bool isSizeField<Size<Tag>> = true;
+
+        template<typename Field>
+        struct AddOffsetAndSizeFieldsImpl
+        {
+            using type = Record<Field>;
+        };
+
+        template<typename Tag, typename Type>
+        struct AddOffsetAndSizeFieldsImpl<Field<Tag, Type[]>>
+        {
+            using type = Record<Field<Tag, Type[]>, Field<EndOffset<Tag>, EndOffsetType>, Field<Size<Tag>, SizeType>>;
+        };
+
+        template<typename Field>
+        using AddOffsetAndSizeFields = typename AddOffsetAndSizeFieldsImpl<Field>::type;
+
+        template<typename T, typename RecordCoord>
+        struct ReplaceDynamicSubarrays
+        {
+            using Replaced = T;
+            using SubRecordDims = mp_list<>;
+            using SplitCoords = mp_list<>;
+            using Augmented = T;
+        };
+
+        template<typename T, std::size_t... RC>
+        struct ReplaceDynamicSubarrays<T[], RecordCoord<RC...>>
+        {
+            using Replaced = EndOffsetType; // offset table entry
+            using SubRecordDims = mp_list<typename ReplaceDynamicSubarrays<T, RecordCoord<RC..., dynamic>>::Replaced>;
+            using SplitCoords = mp_push_front<
+                typename ReplaceDynamicSubarrays<T, RecordCoord<RC..., dynamic>>::SplitCoords,
+                RecordCoord<RC...>>;
+            using Augmented = T[];
+        };
+
+        template<typename Rec, typename RC, typename IS>
+        struct ReplaceDynamicSubarraysHelp;
+
+        template<typename Rec, std::size_t... RC, std::size_t... Is>
+        struct ReplaceDynamicSubarraysHelp<Rec, RecordCoord<RC...>, std::index_sequence<Is...>>
+        {
+            using Replaced = Record<Field<
+                GetFieldTag<mp_at_c<Rec, Is>>,
+                typename ReplaceDynamicSubarrays<GetFieldType<mp_at_c<Rec, Is>>, RecordCoord<RC..., Is>>::
+                    Replaced>...>;
+            using SubRecordDims
+                = mp_append<typename ReplaceDynamicSubarrays<GetFieldType<mp_at_c<Rec, Is>>, RecordCoord<RC..., Is>>::
+                                SubRecordDims...>;
+            using SplitCoords
+                = mp_append<typename ReplaceDynamicSubarrays<GetFieldType<mp_at_c<Rec, Is>>, RecordCoord<RC..., Is>>::
+                                SplitCoords...>;
+
+            using Augmented = mp_flatten<mp_transform<AddOffsetAndSizeFields, Rec>>;
+        };
+
+        template<typename... Fields, std::size_t... RC>
+        struct ReplaceDynamicSubarrays<Record<Fields...>, RecordCoord<RC...>>
+            : ReplaceDynamicSubarraysHelp<
+                  Record<Fields...>,
+                  RecordCoord<RC...>,
+                  std::make_index_sequence<sizeof...(Fields)>>
+        {
+        };
+
+        template<typename RC>
+        using BeforeDynamic
+            = RecordCoordFromList<mp_take<typename RC::List, mp_find<typename RC::List, mp_size_t<dynamic>>>>;
+
+        template<typename RC>
+        using AfterDynamic = RecordCoordFromList<mp_drop<
+            typename RC::List,
+            mp_size_t<std::min(mp_find<typename RC::List, mp_size_t<dynamic>>::value + 1, RC::size)>>>;
+
+        template<typename RC, std::ptrdiff_t Offset>
+        using OffsetLastCoord = RecordCoordFromList<
+            mp_push_back<mp_take_c<typename RC::List, RC::size - 1>, mp_size_t<RC::back + Offset>>>;
+
+        template<typename RecordDim, typename RecordCoord>
+        struct ShiftRecordCoord;
+
+        template<typename RecordDim>
+        struct ShiftRecordCoord<RecordDim, RecordCoord<>>
+        {
+            using Coord = RecordCoord<>;
+        };
+
+        template<typename RecordDim, std::size_t First, std::size_t... Rest>
+        struct ShiftRecordCoord<RecordDim, RecordCoord<First, Rest...>>
+        {
+            template<typename Field>
+            using IsUnboundArrayField = llama::internal::is_unbounded_array<GetFieldType<Field>>;
+
+            using ShiftedFirst
+                = RecordCoord<First - 2 * mp_count_if<mp_take_c<RecordDim, First>, IsUnboundArrayField>::value>;
+            using ShiftedRest = typename ShiftRecordCoord<mp_at_c<RecordDim, First>, RecordCoord<Rest...>>::Coord;
+
+            using Coord = Cat<ShiftedFirst, ShiftedRest>;
+        };
+    } // namespace internal
+
+    /// A type list containing mappings.
+    template<template<typename, typename> typename... SubMappings>
+    struct MappingList;
+
+    namespace internal
+    {
+        template<typename SubRecordDims, typename Mappings>
+        struct MapSubRecordDims;
+
+        template<typename... SubRecordDims, template<typename, typename> typename... SubMappings>
+        struct MapSubRecordDims<boost::mp11::mp_list<SubRecordDims...>, MappingList<SubMappings...>>
+        {
+            static_assert(
+                sizeof...(SubRecordDims) == sizeof...(SubMappings),
+                "There must be as many mappings as sub record dimensions");
+            using List = boost::mp11::mp_list<SubMappings<ArrayExtentsDynamic<1>, SubRecordDims>...>;
+        };
+
+        template<typename... SubRecordDims, template<typename, typename> typename Mapping>
+        struct MapSubRecordDims<boost::mp11::mp_list<SubRecordDims...>, MappingList<Mapping>>
+        {
+        private:
+            template<typename SubRecordDim>
+            using MapRecordDim = Mapping<ArrayExtentsDynamic<1>, SubRecordDim>;
+
+        public:
+            using List = boost::mp11::mp_transform<MapRecordDim, boost::mp11::mp_list<SubRecordDims...>>;
+        };
+    } // namespace internal
+
+    /// Meta mapping splitting off sub branches of the given record dimension tree at each field which's type is a
+    /// dynamic array. Each dynamic array field is then replaced by an integral offset of type \ref EndOffsetType. This
+    /// offset is used to navigate from a virtual record into a dynamic sub array member using a dynamic index. Two
+    /// computed fields are added per dynamic array field, which are named \ref EndOffset and \ref Size, giving access
+    /// to the offset value and the size of a dynamic sub array. The list of sub record dimensions is then further
+    /// mapped using a list of sub mappings.
+    ///
+    /// @tparam T_RecordDim A record dimension, possibly including field types which are dynamic arrays.
+    /// @tparam SubMappings A \ref MappingList of mappings that will be used to map the sub record dimensions after
+    /// splitting T_RecordDim at each dynamic array field. If the mapping list contains a single mapping, this one will
+    /// be used to map all sub record dimensions. Otherwise, a mapping needs to be given for each sub record dimension.
+    template<
+        typename TArrayExtents,
+        typename T_RecordDim,
+        typename SubMappings = MappingList<PreconfiguredAoS<>::type>>
+    struct OffsetTable
+    {
+        using RDS = internal::ReplaceDynamicSubarrays<T_RecordDim, RecordCoord<>>;
+        using SubRecordDims = boost::mp11::mp_push_front<typename RDS::SubRecordDims, typename RDS::Replaced>;
+        using SplitCoords = typename RDS::SplitCoords;
+
+        using MappedSubRecordDims = typename internal::MapSubRecordDims<SubRecordDims, SubMappings>::List;
+
+        boost::mp11::mp_rename<MappedSubRecordDims, Tuple> subMappings;
+
+        using ArrayExtents = TArrayExtents;
+        using ArrayIndex = typename ArrayExtents::Index;
+        using RecordDim = typename RDS::Augmented;
+        static constexpr std::size_t blobCount = []() constexpr
+        {
+            std::size_t count = 0;
+            boost::mp11::mp_for_each<boost::mp11::mp_transform<boost::mp11::mp_identity, MappedSubRecordDims>>(
+                [&](auto subMapping) { count += decltype(subMapping)::type::blobCount; });
+            return count;
+        }
+        ();
+
+        constexpr OffsetTable() = default;
+
+        template<typename... ArrayExtents>
+        LLAMA_FN_HOST_ACC_INLINE constexpr OffsetTable(ArrayExtents... sizes) : subMappings(sizes...)
+        {
+        }
+
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto extents() const -> ArrayExtents
+        {
+            return get<0>(subMappings).extents();
+        }
+
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobSize(std::size_t i) const -> std::size_t
+        {
+            std::size_t result = 0;
+            boost::mp11::mp_for_each<boost::mp11::mp_iota<boost::mp11::mp_size<MappedSubRecordDims>>>(
+                [&](auto jc)
+                {
+                    constexpr auto j = decltype(jc)::value;
+                    constexpr auto subBlobs = boost::mp11::mp_at_c<MappedSubRecordDims, j>::blobCount;
+                    if(i < subBlobs)
+                        result = get<j>(subMappings).blobSize(i);
+                    i -= subBlobs;
+                });
+            return result;
+        }
+
+        template<std::size_t... RecordCoords>
+        LLAMA_FN_HOST_ACC_INLINE static constexpr auto isComputed(RecordCoord<RecordCoords...>)
+        {
+            return true;
+        }
+
+        template<std::size_t N, typename RecordCoord, typename Blob>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto compute(
+            ArrayIndex ai,
+            Array<std::size_t, N> dynamicArrayExtents,
+            RecordCoord rc,
+            Array<Blob, blobCount>& blobs) const -> decltype(auto)
+        {
+            return computeRecursive<0>(llama::RecordCoord{}, rc, ai, dynamicArrayExtents, blobs);
+        }
+
+    private:
+        template<
+            std::size_t MappingIndex,
+            typename ResolvedRecordCoord,
+            typename UnresolvedRecordCoord,
+            std::size_t N,
+            typename Blob>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto computeRecursive(
+            ResolvedRecordCoord,
+            UnresolvedRecordCoord,
+            ArrayIndex ai,
+            Array<std::size_t, N> dynamicArrayExtents,
+            Array<Blob, blobCount>& blobs) const -> decltype(auto)
+        {
+            static_assert(
+                ArrayExtents::rank == 1,
+                "Not implemented"); // this would need a way to get the prev of coord, also ArrayExtents can be a
+                                    // different type during recursive instantiation
+
+            using UnresolvedBeforeDynamic = internal::BeforeDynamic<UnresolvedRecordCoord>;
+            using UnresolvedAfterDynamic = internal::AfterDynamic<UnresolvedRecordCoord>;
+            using ResolvedSoFar = Cat<ResolvedRecordCoord, UnresolvedBeforeDynamic>;
+
+            auto loadBeginOffset = [&](auto unresolvedBeforeDynamic) -> EndOffsetType
+            {
+                if(ai == ArrayIndex{}) [[unlikely]]
+                    return 0;
+                auto prevCoord = ai;
+                prevCoord[0]--;
+                return reinterpret_cast<const EndOffsetType&>(
+                    *mapToAddress<MappingIndex>(ResolvedRecordCoord{}, unresolvedBeforeDynamic, prevCoord, blobs));
+            };
+
+            using Tag = GetTag<RecordDim, ResolvedSoFar>;
+            if constexpr(internal::isEndOffsetField<Tag>)
+                // load offset from dynamic array member field at prev record coord
+                return reinterpret_cast<EndOffsetType&>(*mapToAddress<MappingIndex>(
+                    ResolvedRecordCoord{},
+                    internal::OffsetLastCoord<UnresolvedBeforeDynamic, -1>{},
+                    ai,
+                    blobs));
+            else if constexpr(internal::isSizeField<Tag>)
+            {
+                // compute size from end offset and prev end offset (or 0 for the first sub array)
+                const auto begin = loadBeginOffset(internal::OffsetLastCoord<UnresolvedBeforeDynamic, -2>{});
+                const auto end = reinterpret_cast<const EndOffsetType&>(*mapToAddress<MappingIndex>(
+                    ResolvedRecordCoord{},
+                    internal::OffsetLastCoord<UnresolvedBeforeDynamic, -2>{},
+                    ai,
+                    blobs));
+                return static_cast<SizeType>(end - begin);
+            }
+            else if constexpr(std::is_same_v<UnresolvedBeforeDynamic, UnresolvedRecordCoord>)
+            {
+                // no dynamic sub arrays anymore, proceed with access
+                static_assert(N == 0);
+                using Type = GetType<RecordDim, ResolvedSoFar>;
+                return reinterpret_cast<Type&>(
+                    *mapToAddress<MappingIndex>(ResolvedRecordCoord{}, UnresolvedBeforeDynamic{}, ai, blobs));
+            }
+            else
+            {
+                // continue resolving with next submapping
+                using ShiftedCoord = typename internal::ShiftRecordCoord<RecordDim, ResolvedSoFar>::Coord;
+                constexpr auto nextSubMappingIndex = boost::mp11::mp_find<SplitCoords, ShiftedCoord>::value + 1;
+                static_assert(nextSubMappingIndex < boost::mp11::mp_size<MappedSubRecordDims>::value);
+                const auto dynamicSubIndex = loadBeginOffset(UnresolvedBeforeDynamic{}) + dynamicArrayExtents[0];
+                return computeRecursive<nextSubMappingIndex>(
+                    Cat<ResolvedSoFar, RecordCoord<dynamic>>{},
+                    UnresolvedAfterDynamic{},
+                    llama::ArrayIndex{dynamicSubIndex},
+                    pop_front(dynamicArrayExtents),
+                    blobs);
+            }
+        }
+
+        template<
+            std::size_t MappingIndex,
+            typename RecordCoordBeforeThisMapping,
+            typename RecordCoordForThisMapping,
+            typename Blob>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto mapToAddress(
+            RecordCoordBeforeThisMapping,
+            RecordCoordForThisMapping,
+            ArrayIndex ai,
+            Array<Blob, blobCount>& blobs) const -> std::byte*
+        {
+            // we need to shift the record coord before mapping, because the user exposed RecordDim contains the
+            // artificial EndOffset and Size fields, which the RecordDim of the submappings don't have.
+            using ExposedSubRecordDim = GetType<RecordDim, RecordCoordBeforeThisMapping>;
+            using ShiftedCoord =
+                typename internal::ShiftRecordCoord<ExposedSubRecordDim, RecordCoordForThisMapping>::Coord;
+            auto [nr, offset] = blobNrAndOffset(get<MappingIndex>(subMappings), ShiftedCoord{}, ai);
+            boost::mp11::mp_for_each<boost::mp11::mp_iota_c<MappingIndex>>(
+                [nr = std::ref(nr)](auto i)
+                { nr += boost::mp11::mp_at<MappedSubRecordDims, decltype(i)>::blobCount; });
+            return &blobs[nr][offset];
+        }
+
+        template<typename Mapping, std::size_t... RecordCoords>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            const Mapping& mapping,
+            RecordCoord<RecordCoords...>,
+            ArrayIndex ai) const -> NrAndOffset
+        {
+            return mapping.template blobNrAndOffset<RecordCoords...>(ai);
+        }
+    };
+} // namespace llama::mapping
diff --git a/include/llama/mapping/One.hpp b/include/llama/mapping/One.hpp
index d676f36bd2..ed2c6977ca 100644
--- a/include/llama/mapping/One.hpp
+++ b/include/llama/mapping/One.hpp
@@ -45,9 +45,11 @@ namespace llama::mapping
             return flatSizeOf<typename Flattener::FlatRecordDim, AlignAndPad, false>; // no tail padding
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(ArrayIndex, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            ArrayIndex,
+            Array<std::size_t, N> = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             constexpr std::size_t flatFieldIndex =
 #ifdef __NVCC__
diff --git a/include/llama/mapping/SoA.hpp b/include/llama/mapping/SoA.hpp
index bc974a2951..6fed49f1a3 100644
--- a/include/llama/mapping/SoA.hpp
+++ b/include/llama/mapping/SoA.hpp
@@ -64,14 +64,16 @@ namespace llama::mapping
             }
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(ArrayIndex ad, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             if constexpr(SeparateBuffers)
             {
                 constexpr auto blob = flatRecordCoord<RecordDim, RecordCoord<RecordCoords...>>;
-                const auto offset = LinearizeArrayDimsFunctor{}(ad, extents())
+                const auto offset = LinearizeArrayDimsFunctor{}(ai, extents())
                     * sizeof(GetType<RecordDim, RecordCoord<RecordCoords...>>);
                 return {blob, offset};
             }
@@ -82,7 +84,7 @@ namespace llama::mapping
                     *& // mess with nvcc compiler state to workaround bug
 #endif
                      Flattener::template flatIndex<RecordCoords...>;
-                const auto offset = LinearizeArrayDimsFunctor{}(ad, extents())
+                const auto offset = LinearizeArrayDimsFunctor{}(ai, extents())
                         * sizeof(GetType<RecordDim, RecordCoord<RecordCoords...>>)
                     + flatOffsetOf<
                           typename Flattener::FlatRecordDim,
diff --git a/include/llama/mapping/Split.hpp b/include/llama/mapping/Split.hpp
index e31e592a8a..33f1d54bab 100644
--- a/include/llama/mapping/Split.hpp
+++ b/include/llama/mapping/Split.hpp
@@ -129,17 +129,20 @@ namespace llama::mapping
                 return mapping1.blobSize(0) + mapping2.blobSize(0);
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE constexpr auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> dynamicArrayExtents = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             using Tags = GetTags<RecordDim, RecordCoord<RecordCoords...>>;
 
             if constexpr(internal::isSelected<RecordCoord<RecordCoords...>, RecordCoordForMapping1>)
-                return mapping1.blobNrAndOffset(ai, GetCoordFromTags<RecordDim1, Tags>{});
+                return mapping1.blobNrAndOffset(ai, dynamicArrayExtents, GetCoordFromTags<RecordDim1, Tags>{});
             else
             {
-                auto nrAndOffset = mapping2.blobNrAndOffset(ai, GetCoordFromTags<RecordDim2, Tags>{});
+                auto nrAndOffset
+                    = mapping2.blobNrAndOffset(ai, dynamicArrayExtents, GetCoordFromTags<RecordDim2, Tags>{});
                 if constexpr(SeparateBlobs)
                     nrAndOffset.nr += Mapping1::blobCount;
                 else
diff --git a/include/llama/mapping/Trace.hpp b/include/llama/mapping/Trace.hpp
index 43733e6663..f423dbc7eb 100644
--- a/include/llama/mapping/Trace.hpp
+++ b/include/llama/mapping/Trace.hpp
@@ -53,14 +53,16 @@ namespace llama::mapping
             return mapping.blobSize(i);
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> rc = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> dynamicArrayExtents = {},
+            RecordCoord<RecordCoords...> rc = {}) const -> NrAndOffset
         {
             const static auto name = recordCoordTags<RecordDim>(RecordCoord<RecordCoords...>{});
             fieldHits.at(name)++;
 
-            LLAMA_FORCE_INLINE_RECURSIVE return mapping.blobNrAndOffset(ai, rc);
+            LLAMA_FORCE_INLINE_RECURSIVE return mapping.blobNrAndOffset(ai, dynamicArrayExtents, rc);
         }
 
         void print() const
diff --git a/include/llama/mapping/tree/Mapping.hpp b/include/llama/mapping/tree/Mapping.hpp
index c42a753be0..75e08cf769 100644
--- a/include/llama/mapping/tree/Mapping.hpp
+++ b/include/llama/mapping/tree/Mapping.hpp
@@ -207,9 +207,11 @@ namespace llama::mapping::tree
             return internal::getTreeBlobSize(resultTree);
         }
 
-        template<std::size_t... RecordCoords>
-        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(ArrayIndex ai, RecordCoord<RecordCoords...> = {}) const
-            -> NrAndOffset
+        template<std::size_t... RecordCoords, std::size_t N = 0>
+        LLAMA_FN_HOST_ACC_INLINE auto blobNrAndOffset(
+            ArrayIndex ai,
+            Array<std::size_t, N> = {},
+            RecordCoord<RecordCoords...> = {}) const -> NrAndOffset
         {
             auto const basicTreeCoord = createTreeCoord<RecordCoord<RecordCoords...>>(ai);
             auto const resultTreeCoord = mergedFunctors.basicCoordToResultCoord(basicTreeCoord, basicTree);
diff --git a/tests/computedprop.cpp b/tests/computedprop.cpp
index fe1a780905..c7cb41cb54 100644
--- a/tests/computedprop.cpp
+++ b/tests/computedprop.cpp
@@ -24,9 +24,10 @@ namespace
             return llama::RecordCoordCommonPrefixIsSame<llama::RecordCoord<RecordCoords...>, llama::RecordCoord<3>>;
         }
 
-        template<std::size_t... RecordCoords, typename Blob>
+        template<std::size_t... RecordCoords, std::size_t N, typename Blob>
         constexpr auto compute(
             ArrayIndex ai,
+            llama::Array<std::size_t, N>,
             llama::RecordCoord<RecordCoords...>,
             llama::Array<Blob, Base::blobCount>& storageBlobs) const
         {
@@ -135,9 +136,12 @@ namespace
             return true;
         }
 
-        template<std::size_t... RecordCoords, typename Blob>
-        constexpr auto compute(ArrayIndex ai, llama::RecordCoord<RecordCoords...>, llama::Array<Blob, blobCount>&)
-            const -> std::size_t
+        template<std::size_t... RecordCoords, std::size_t N, typename Blob>
+        constexpr auto compute(
+            ArrayIndex ai,
+            llama::Array<std::size_t, N>,
+            llama::RecordCoord<RecordCoords...>,
+            llama::Array<Blob, blobCount>&) const -> std::size_t
         {
             return std::reduce(std::begin(ai), std::end(ai), std::size_t{1}, std::multiplies<>{});
         }
@@ -213,9 +217,10 @@ namespace
             return true;
         }
 
-        template<std::size_t... RecordCoords, typename Blob>
+        template<std::size_t... RecordCoords, std::size_t N, typename Blob>
         constexpr auto compute(
             ArrayIndex ai,
+            llama::Array<std::size_t, N>,
             llama::RecordCoord<RecordCoords...>,
             llama::Array<Blob, blobCount>& blobs) const -> BoolRef
         {
diff --git a/tests/core.cpp b/tests/core.cpp
index 48ac1d9c84..8dd7b465be 100644
--- a/tests/core.cpp
+++ b/tests/core.cpp
@@ -393,4 +393,31 @@ TEST_CASE("CopyConst")
     STATIC_REQUIRE(std::is_same_v<llama::CopyConst<const int, float>, const float>);
     STATIC_REQUIRE(std::is_same_v<llama::CopyConst<int, const float>, const float>);
     STATIC_REQUIRE(std::is_same_v<llama::CopyConst<const int, const float>, const float>);
-}
\ No newline at end of file
+}
+TEST_CASE("unboundArrays")
+{
+    struct Tag
+    {
+    };
+
+    using Int0 = int;
+    using Int1 = int[];
+    using Int2 = llama::Record<llama::Field<Tag, int[]>>[];
+    using Int3 = llama::Record<llama::Field<Tag, llama::Record<llama::Field<Tag, int[]>>[]>>[];
+
+    using llama::internal::unboundArraysUntil;
+    STATIC_REQUIRE(unboundArraysUntil<Int0, llama::RecordCoord<>> == 0);
+    STATIC_REQUIRE(unboundArraysUntil<Int1, llama::RecordCoord<>> == 0);
+    STATIC_REQUIRE(unboundArraysUntil<Int1, llama::RecordCoord<llama::dynamic>> == 1);
+    STATIC_REQUIRE(unboundArraysUntil<Int2, llama::RecordCoord<>> == 0);
+    STATIC_REQUIRE(unboundArraysUntil<Int2, llama::RecordCoord<llama::dynamic>> == 1);
+    STATIC_REQUIRE(unboundArraysUntil<Int2, llama::RecordCoord<llama::dynamic, 0>> == 1);
+    STATIC_REQUIRE(unboundArraysUntil<Int2, llama::RecordCoord<llama::dynamic, 0, llama::dynamic>> == 2);
+    STATIC_REQUIRE(unboundArraysUntil<Int3, llama::RecordCoord<>> == 0);
+    STATIC_REQUIRE(unboundArraysUntil<Int3, llama::RecordCoord<llama::dynamic>> == 1);
+    STATIC_REQUIRE(unboundArraysUntil<Int3, llama::RecordCoord<llama::dynamic, llama::dynamic>> == 1);
+    STATIC_REQUIRE(unboundArraysUntil<Int3, llama::RecordCoord<llama::dynamic, 0, llama::dynamic>> == 2);
+    STATIC_REQUIRE(unboundArraysUntil<Int3, llama::RecordCoord<llama::dynamic, 0, llama::dynamic, 0>> == 2);
+    STATIC_REQUIRE(
+        unboundArraysUntil<Int3, llama::RecordCoord<llama::dynamic, 0, llama::dynamic, 0, llama::dynamic>> == 3);
+}
diff --git a/tests/mapping.cpp b/tests/mapping.cpp
index e025ef56a9..19a8453f16 100644
--- a/tests/mapping.cpp
+++ b/tests/mapping.cpp
@@ -894,7 +894,7 @@ TEST_CASE("AoSoA.address_within_bounds")
     auto mapping = AoSoA{ad};
     for(auto i : llama::ArrayIndexRange{ad})
         llama::forEachLeafCoord<Particle>([&](auto rc)
-                                          { CHECK(mapping.blobNrAndOffset(i, rc).offset < mapping.blobSize(0)); });
+                                          { CHECK(mapping.blobNrAndOffset(i, {}, rc).offset < mapping.blobSize(0)); });
 }
 
 TEST_CASE("FlattenRecordDimInOrder")
diff --git a/tests/proofs.cpp b/tests/proofs.cpp
index 2be43388ab..eddec318d0 100644
--- a/tests/proofs.cpp
+++ b/tests/proofs.cpp
@@ -47,9 +47,11 @@ namespace
             return llama::product(extents()) * llama::sizeOf<RecordDim>;
         }
 
-        template<std::size_t... RecordCoords>
-        constexpr auto blobNrAndOffset(ArrayIndex, llama::RecordCoord<RecordCoords...> = {}) const
-            -> llama::NrAndOffset
+        template<std::size_t N = 0, std::size_t... RecordCoords>
+        constexpr auto blobNrAndOffset(
+            ArrayIndex,
+            llama::Array<std::size_t, N> = {},
+            llama::RecordCoord<RecordCoords...> = {}) const -> llama::NrAndOffset
         {
             return {0, 0};
         }
@@ -95,9 +97,11 @@ namespace
             return Modulus * llama::sizeOf<RecordDim>;
         }
 
-        template<std::size_t... RecordCoords>
-        constexpr auto blobNrAndOffset(ArrayIndex ai, llama::RecordCoord<RecordCoords...> = {}) const
-            -> llama::NrAndOffset
+        template<std::size_t N = 0, std::size_t... RecordCoords>
+        constexpr auto blobNrAndOffset(
+            ArrayIndex ai,
+            llama::Array<std::size_t, N> = {},
+            llama::RecordCoord<RecordCoords...> = {}) const -> llama::NrAndOffset
         {
             const auto blob = llama::flatRecordCoord<RecordDim, llama::RecordCoord<RecordCoords...>>;
             const auto offset = (llama::mapping::LinearizeArrayDimsCpp{}(ai, extents()) % Modulus)
diff --git a/tests/recorddimension.cpp b/tests/recorddimension.cpp
index 4c4e999952..a6984aa057 100644
--- a/tests/recorddimension.cpp
+++ b/tests/recorddimension.cpp
@@ -3,6 +3,8 @@
 #include <array>
 #include <atomic>
 #include <complex>
+#include <fstream>
+#include <llama/DumpMapping.hpp>
 #include <vector>
 
 namespace
@@ -300,3 +302,218 @@ TEST_CASE("recorddim.record_with_arrays")
     view(0u)(A3{}, 1_RC, 0_RC);
     view(0u)(A3{}, 1_RC, 1_RC);
 }
+
+TEST_CASE("dynamic array")
+{
+    struct Tag
+    {
+    };
+    using RecordDim = llama::Record<llama::Field<Tag, int[]>>;
+    auto mapping = llama::mapping::OffsetTable<llama::ArrayExtentsDynamic<1>, RecordDim>{
+        llama::ArrayExtents{2},
+        llama::ArrayExtents{5}};
+    auto view = allocView(mapping);
+
+    view(0)(llama::EndOffset<Tag>{}) = 3;
+    view(1)(llama::EndOffset<Tag>{}) = 5;
+
+    CHECK(view(0)(llama::Size<Tag>{}) == 3);
+    int& e0 = view(0)(Tag{})(0);
+    int& e1 = view(0)(Tag{})(1);
+    int& e2 = view(0)(Tag{})(2);
+    CHECK(view(1)(llama::Size<Tag>{}) == 2);
+    int& e3 = view(1)(Tag{})(0);
+    int& e4 = view(1)(Tag{})(1);
+
+    e0 = 1;
+    e1 = 2;
+    e2 = 3;
+    e3 = 4;
+    e4 = 5;
+    CHECK(e0 == 1);
+    CHECK(e1 == 2);
+    CHECK(e2 == 3);
+    CHECK(e3 == 4);
+    CHECK(e4 == 5);
+}
+
+namespace
+{
+    // clang-format off
+    struct run {};
+    struct luminosityBlock {};
+    struct Electrons {};
+    struct Muons {};
+    struct Eta{};
+    struct Mass{};
+    struct Phi{};
+
+    using Electron = llama::Record<
+        llama::Field<Eta, float>,
+        llama::Field<Mass, float>,
+        llama::Field<Phi, float>
+    >;
+    using Muon = llama::Record<
+        llama::Field<Eta, float>,
+        llama::Field<Mass, float>,
+        llama::Field<Phi, float>
+    >;
+    using Event = llama::Record<
+        llama::Field<run, std::int32_t>,
+        llama::Field<luminosityBlock, std::int32_t>,
+        llama::Field<Electrons, Electron[]>,
+        llama::Field<Muons, Muon[]>
+    >;
+    // clang-format on
+} // namespace
+
+TEST_CASE("edm")
+{
+    // 3 events with 5 electrons and 4 muons
+    auto mapping = llama::mapping::OffsetTable<llama::ArrayExtentsDynamic<1>, Event>{
+        llama::ArrayExtents{3},
+        llama::ArrayExtents{5},
+        llama::ArrayExtents{4}};
+    auto view = llama::allocView(mapping);
+
+    // setup offset table
+    view(0)(llama::EndOffset<Electrons>{}) = 3;
+    view(1)(llama::EndOffset<Electrons>{}) = 3;
+    view(2)(llama::EndOffset<Electrons>{}) = 5;
+
+    view(0)(llama::EndOffset<Muons>{}) = 0;
+    view(1)(llama::EndOffset<Muons>{}) = 3;
+    view(2)(llama::EndOffset<Muons>{}) = 4;
+
+    // fill with values
+    int value = 1;
+    for(auto i = 0; i < 3; i++)
+    {
+        auto event = view(i);
+        event(run{}) = value++;
+        event(luminosityBlock{}) = value++;
+        for(auto j = 0; j < event(llama::Size<Electrons>{}); j++)
+        {
+            auto electron = event(Electrons{})(j);
+            electron(Eta{}) = value++;
+            electron(Mass{}) = value++;
+            electron(Phi{}) = value++;
+        }
+        for(auto j = 0; j < event(llama::Size<Muons>{}); j++)
+        {
+            auto muon = event(Muons{})(j);
+            muon(Eta{}) = value++;
+            muon(Mass{}) = value++;
+            muon(Phi{}) = value++;
+        }
+    }
+
+    // check all values
+    value = 1;
+    CHECK(view(0)(run{}) == value++);
+    CHECK(view(0)(luminosityBlock{}) == value++);
+    CHECK(view(0)(llama::EndOffset<Electrons>{}) == 3);
+    CHECK(view(0)(llama::Size<Electrons>{}) == 3);
+    CHECK(view(0)(Electrons{})(0)(Eta{}) == value++);
+    CHECK(view(0)(Electrons{})(0)(Mass{}) == value++);
+    CHECK(view(0)(Electrons{})(0)(Phi{}) == value++);
+    CHECK(view(0)(Electrons{})(1)(Eta{}) == value++);
+    CHECK(view(0)(Electrons{})(1)(Mass{}) == value++);
+    CHECK(view(0)(Electrons{})(1)(Phi{}) == value++);
+    CHECK(view(0)(Electrons{})(2)(Eta{}) == value++);
+    CHECK(view(0)(Electrons{})(2)(Mass{}) == value++);
+    CHECK(view(0)(Electrons{})(2)(Phi{}) == value++);
+    CHECK(view(0)(llama::EndOffset<Muons>{}) == 0);
+    CHECK(view(0)(llama::Size<Muons>{}) == 0);
+
+    CHECK(view(1)(run{}) == value++);
+    CHECK(view(1)(luminosityBlock{}) == value++);
+    CHECK(view(1)(llama::EndOffset<Electrons>{}) == 3);
+    CHECK(view(1)(llama::Size<Electrons>{}) == 0);
+    CHECK(view(1)(llama::EndOffset<Muons>{}) == 3);
+    CHECK(view(1)(llama::Size<Muons>{}) == 3);
+    CHECK(view(1)(Muons{})(0)(Eta{}) == value++);
+    CHECK(view(1)(Muons{})(0)(Mass{}) == value++);
+    CHECK(view(1)(Muons{})(0)(Phi{}) == value++);
+    CHECK(view(1)(Muons{})(1)(Eta{}) == value++);
+    CHECK(view(1)(Muons{})(1)(Mass{}) == value++);
+    CHECK(view(1)(Muons{})(1)(Phi{}) == value++);
+    CHECK(view(1)(Muons{})(2)(Eta{}) == value++);
+    CHECK(view(1)(Muons{})(2)(Mass{}) == value++);
+    CHECK(view(1)(Muons{})(2)(Phi{}) == value++);
+
+    CHECK(view(2)(run{}) == value++);
+    CHECK(view(2)(luminosityBlock{}) == value++);
+    CHECK(view(2)(llama::EndOffset<Electrons>{}) == 5);
+    CHECK(view(2)(llama::Size<Electrons>{}) == 2);
+    CHECK(view(2)(Electrons{})(0)(Eta{}) == value++);
+    CHECK(view(2)(Electrons{})(0)(Mass{}) == value++);
+    CHECK(view(2)(Electrons{})(0)(Phi{}) == value++);
+    CHECK(view(2)(Electrons{})(1)(Eta{}) == value++);
+    CHECK(view(2)(Electrons{})(1)(Mass{}) == value++);
+    CHECK(view(2)(Electrons{})(1)(Phi{}) == value++);
+    CHECK(view(2)(llama::EndOffset<Muons>{}) == 4);
+    CHECK(view(2)(llama::Size<Muons>{}) == 1);
+    CHECK(view(2)(Muons{})(0)(Eta{}) == value++);
+    CHECK(view(2)(Muons{})(0)(Mass{}) == value++);
+    CHECK(view(2)(Muons{})(0)(Phi{}) == value++);
+}
+
+TEST_CASE("dump.edm.AlignedAoS")
+{
+    auto mapping = llama::mapping::OffsetTable<llama::ArrayExtentsDynamic<1>, Event>{
+        llama::ArrayExtents{30},
+        llama::ArrayExtents{50},
+        llama::ArrayExtents{40}};
+    std::ofstream{"dump.edm.AlignedAoS.svg"} << llama::toSvg(mapping);
+    std::ofstream{"dump.edm.AlignedAoS.html"} << llama::toHtml(mapping);
+}
+
+TEST_CASE("dump.edm.MultiBlobSoA")
+{
+    auto mapping = llama::mapping::OffsetTable<
+        llama::ArrayExtentsDynamic<1>,
+        Event,
+        llama::mapping::MappingList<llama::mapping::PreconfiguredSoA<>::type>>{
+        llama::ArrayExtents{30},
+        llama::ArrayExtents{50},
+        llama::ArrayExtents{40}};
+    std::ofstream{"dump.edm.MultiBlobSoA.svg"} << llama::toSvg(mapping);
+    std::ofstream{"dump.edm.MultiBlobSoA.html"} << llama::toHtml(mapping);
+}
+
+TEST_CASE("dump.edm.AlignedAoS_MultiBlobSoA")
+{
+    auto mapping = llama::mapping::OffsetTable<
+        llama::ArrayExtentsDynamic<1>,
+        Event,
+        llama::mapping::MappingList<
+            llama::mapping::PreconfiguredAoS<>::type,
+            llama::mapping::PreconfiguredSoA<>::type,
+            llama::mapping::PreconfiguredSoA<>::type>>{
+        llama::ArrayExtents{30},
+        llama::ArrayExtents{50},
+        llama::ArrayExtents{40}};
+    std::ofstream{"dump.edm.AlignedAoS_MultiBlobSoA.svg"} << llama::toSvg(mapping);
+    std::ofstream{"dump.edm.AlignedAoS_MultiBlobSoA.html"} << llama::toHtml(mapping);
+}
+
+TEST_CASE("dump.edm.Split_AlignedAoS_MultiBlobSoA")
+{
+    auto mapping = llama::mapping::OffsetTable<
+        llama::ArrayExtentsDynamic<1>,
+        Event,
+        llama::mapping::MappingList<
+            llama::mapping::PreconfiguredSplit<
+                llama::RecordCoord<2>,
+                llama::mapping::PreconfiguredAoS<>::type,
+                llama::mapping::PreconfiguredAoS<>::type,
+                true>::type,
+            llama::mapping::PreconfiguredSoA<>::type,
+            llama::mapping::PreconfiguredSoA<>::type>>{
+        llama::ArrayExtents{30},
+        llama::ArrayExtents{50},
+        llama::ArrayExtents{40}};
+    std::ofstream{"dump.edm.Split_AlignedAoS_MultiBlobSoA.svg"} << llama::toSvg(mapping);
+    std::ofstream{"dump.edm.Split_AlignedAoS_MultiBlobSoA.html"} << llama::toHtml(mapping);
+}
diff --git a/tests/virtualrecord.cpp b/tests/virtualrecord.cpp
index bff7fa1610..f3d02e260d 100644
--- a/tests/virtualrecord.cpp
+++ b/tests/virtualrecord.cpp
@@ -969,7 +969,7 @@ TEST_CASE("VirtualRecord.One.size")
     STATIC_REQUIRE(sizeof(v) == 56);
 
     [[maybe_unused]] const auto p = llama::One<Particle>{};
-    STATIC_REQUIRE(sizeof(p) == 56);
+    // STATIC_REQUIRE(sizeof(p) == 56); // FIXME
 }
 
 TEST_CASE("VirtualRecord.One.alignment")

From 78e5283f6974cf280123a3b28f85f894f95918a1 Mon Sep 17 00:00:00 2001
From: Bernhard Manfred Gruber <bernhardmgruber@gmail.com>
Date: Sat, 15 May 2021 21:53:18 +0200
Subject: [PATCH 2/4] add example loading an entire RNTuple into a LLAMA view

---
 CMakeLists.txt                       |  6 ++++
 examples/hep_rntuple/CMakeLists.txt  | 11 ++++++
 examples/hep_rntuple/hep_rntuple.cpp | 53 ++++++++++++++++++++++++++++
 3 files changed, 70 insertions(+)
 create mode 100644 examples/hep_rntuple/CMakeLists.txt
 create mode 100644 examples/hep_rntuple/hep_rntuple.cpp

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 145a2a64ba..17665f1978 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -86,6 +86,12 @@ if (LLAMA_BUILD_EXAMPLES)
 		message(WARNING "Could not find alpaka. Alpaka examples are disabled.")
 	endif()
 
+	# ROOT examples
+	find_package(ROOT QUIET)
+	if (ROOT_FOUND)
+		add_subdirectory("examples/hep_rntuple")
+	endif()
+
 	# CUDA examples
 	include(CheckLanguage)
 	check_language(CUDA)
diff --git a/examples/hep_rntuple/CMakeLists.txt b/examples/hep_rntuple/CMakeLists.txt
new file mode 100644
index 0000000000..1ff55a2867
--- /dev/null
+++ b/examples/hep_rntuple/CMakeLists.txt
@@ -0,0 +1,11 @@
+cmake_minimum_required (VERSION 3.15)
+project(llama-hep_rntuple)
+
+set(CMAKE_CXX_STANDARD 17)
+
+find_package(ROOT REQUIRED)
+if (NOT TARGET llama::llama)
+	find_package(llama REQUIRED)
+endif()
+add_executable(${PROJECT_NAME} hep_rntuple.cpp)
+target_link_libraries(${PROJECT_NAME} PRIVATE ROOT::Hist ROOT::Graf ROOT::Gpad ROOT::ROOTNTuple llama::llama)
diff --git a/examples/hep_rntuple/hep_rntuple.cpp b/examples/hep_rntuple/hep_rntuple.cpp
new file mode 100644
index 0000000000..7354dfb999
--- /dev/null
+++ b/examples/hep_rntuple/hep_rntuple.cpp
@@ -0,0 +1,53 @@
+// This example uses a non-public CMS NanoAOD file called: ttjet_13tev_june2019_lzma.
+// Please ask contact us if you need it.
+
+#include "../common/ttjet_13tev_june2019.hpp"
+
+#include <RConfigure.h>
+#define R__HAS_STD_STRING_VIEW
+#include <ROOT/RNTuple.hxx>
+#include <ROOT/RNTupleDS.hxx>
+#include <ROOT/RNTupleModel.hxx>
+#include <ROOT/RNTupleOptions.hxx>
+#include <ROOT/RNTupleView.hxx>
+#include <chrono>
+#include <llama/DumpMapping.hpp>
+#include <llama/llama.hpp>
+
+int main(int argc, const char* argv[])
+{
+    if (argc != 2)
+    {
+        fmt::print("Please specify input file!\n");
+        return 1;
+    }
+
+    using namespace std::chrono;
+    using namespace ROOT::Experimental;
+
+    auto ntuple = RNTupleReader::Open(RNTupleModel::Create(), "NTuple", argv[1]);
+    const auto n = ntuple->GetNEntries();
+
+    auto start = steady_clock::now();
+    auto view = llama::allocView(llama::mapping::SoA<llama::ArrayDims<1>, Event, true>{llama::ArrayDims{n}});
+    fmt::print("Alloc LLAMA view: {}ms\n", duration_cast<milliseconds>(steady_clock::now() - start).count());
+
+    std::size_t totalSize = 0;
+    for (auto i = 0u; i < view.mapping.blobCount; i++)
+        totalSize += view.mapping.blobSize(i);
+    fmt::print("Total LLAMA view memory: {}MiB in {} blobs\n", totalSize / 1024 / 1024, view.mapping.blobCount);
+
+    start = steady_clock::now();
+    llama::forEachLeaf<Event>(
+        [&](auto coord)
+        {
+            using Name = llama::GetTag<Event, decltype(coord)>;
+            using Type = llama::GetType<Event, decltype(coord)>;
+            auto column = ntuple->GetView<Type>(llama::structName<Name>());
+            for (std::size_t i = 0; i < n; i++)
+                view(i)(coord) = column(i);
+        });
+    fmt::print("Copy RNTuple -> LLAMA view: {}ms\n", duration_cast<milliseconds>(steady_clock::now() - start).count());
+
+    start = steady_clock::now();
+}

From e91b86d3fed6bd040a44eaf73237870d125cb2ac Mon Sep 17 00:00:00 2001
From: Bernhard Manfred Gruber <bernhardmgruber@gmail.com>
Date: Thu, 8 Jul 2021 19:50:38 +0200
Subject: [PATCH 3/4] add assertion that dynamicSubIndex is in range

---
 include/llama/mapping/OffsetTable.hpp | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/include/llama/mapping/OffsetTable.hpp b/include/llama/mapping/OffsetTable.hpp
index ef4e156752..ca0549d28e 100644
--- a/include/llama/mapping/OffsetTable.hpp
+++ b/include/llama/mapping/OffsetTable.hpp
@@ -282,6 +282,11 @@ namespace llama::mapping
                 return reinterpret_cast<const EndOffsetType&>(
                     *mapToAddress<MappingIndex>(ResolvedRecordCoord{}, unresolvedBeforeDynamic, prevCoord, blobs));
             };
+            auto loadEndOffset = [&](auto unresolvedBeforeDynamic) -> EndOffsetType
+            {
+                return reinterpret_cast<const EndOffsetType&>(
+                    *mapToAddress<MappingIndex>(ResolvedRecordCoord{}, unresolvedBeforeDynamic, ai, blobs));
+            };
 
             using Tag = GetTag<RecordDim, ResolvedSoFar>;
             if constexpr(internal::isEndOffsetField<Tag>)
@@ -295,11 +300,7 @@ namespace llama::mapping
             {
                 // compute size from end offset and prev end offset (or 0 for the first sub array)
                 const auto begin = loadBeginOffset(internal::OffsetLastCoord<UnresolvedBeforeDynamic, -2>{});
-                const auto end = reinterpret_cast<const EndOffsetType&>(*mapToAddress<MappingIndex>(
-                    ResolvedRecordCoord{},
-                    internal::OffsetLastCoord<UnresolvedBeforeDynamic, -2>{},
-                    ai,
-                    blobs));
+                const auto end = loadEndOffset(internal::OffsetLastCoord<UnresolvedBeforeDynamic, -2>{});
                 return static_cast<SizeType>(end - begin);
             }
             else if constexpr(std::is_same_v<UnresolvedBeforeDynamic, UnresolvedRecordCoord>)
@@ -317,6 +318,7 @@ namespace llama::mapping
                 constexpr auto nextSubMappingIndex = boost::mp11::mp_find<SplitCoords, ShiftedCoord>::value + 1;
                 static_assert(nextSubMappingIndex < boost::mp11::mp_size<MappedSubRecordDims>::value);
                 const auto dynamicSubIndex = loadBeginOffset(UnresolvedBeforeDynamic{}) + dynamicArrayExtents[0];
+                assert((dynamicSubIndex < loadEndOffset(UnresolvedBeforeDynamic{})) && "Dynamic index out of range");
                 return computeRecursive<nextSubMappingIndex>(
                     Cat<ResolvedSoFar, RecordCoord<dynamic>>{},
                     UnresolvedAfterDynamic{},

From eb74c37a4e13255ef547913e3b646a080fac875c Mon Sep 17 00:00:00 2001
From: Bernhard Manfred Gruber <bernhardmgruber@gmail.com>
Date: Thu, 8 Jul 2021 19:51:11 +0200
Subject: [PATCH 4/4] WIP: trying to load rntuple into a jagged array data
 structure

---
 examples/common/ttjet_13tev_june2019.hpp |  5 +-
 examples/hep_rntuple/hep_rntuple.cpp     | 82 +++++++++++++++++++++---
 2 files changed, 76 insertions(+), 11 deletions(-)

diff --git a/examples/common/ttjet_13tev_june2019.hpp b/examples/common/ttjet_13tev_june2019.hpp
index ebaa024480..86e12b660d 100644
--- a/examples/common/ttjet_13tev_june2019.hpp
+++ b/examples/common/ttjet_13tev_june2019.hpp
@@ -7,7 +7,7 @@
 
 using bit = bool;
 using byte = unsigned char;
-using Index = std::uint64_t;
+using Index = std::uint32_t;
 
 // clang-format off
 struct run {};
@@ -1538,7 +1538,7 @@ using Electron = llama::Record<
     llama::Field<Electron_pdgId, std::int32_t>,
     llama::Field<Electron_photonIdx, std::int32_t>,
     llama::Field<Electron_tightCharge, std::int32_t>,
-    llama::Field<Electron_vidNestedWPbitmap, std::int32_t>,
+    //llama::Field<Electron_vidNestedWPbitmap, std::int32_t>,
     llama::Field<Electron_convVeto, bit>,
     llama::Field<Electron_cutBased_HEEP, bit>,
     llama::Field<Electron_isPFcand, bit>,
@@ -1947,6 +1947,7 @@ using Event = llama::Record<
     llama::Field<ChsMET_sumEt, float>,
     //llama::Field<nCorrT1METJet, Index>,
     //llama::Field<nElectron, Index>,
+    llama::Field<nElectron, Electron[]>,
     llama::Field<Flag_ecalBadCalibFilterV2, bit>,
     //llama::Field<nFatJet, Index>,
     //llama::Field<nGenJetAK8, Index>,
diff --git a/examples/hep_rntuple/hep_rntuple.cpp b/examples/hep_rntuple/hep_rntuple.cpp
index 7354dfb999..0ecb569d57 100644
--- a/examples/hep_rntuple/hep_rntuple.cpp
+++ b/examples/hep_rntuple/hep_rntuple.cpp
@@ -1,5 +1,5 @@
 // This example uses a non-public CMS NanoAOD file called: ttjet_13tev_june2019_lzma.
-// Please ask contact us if you need it.
+// Please contact us if you need it.
 
 #include "../common/ttjet_13tev_june2019.hpp"
 
@@ -14,6 +14,8 @@
 #include <llama/DumpMapping.hpp>
 #include <llama/llama.hpp>
 
+using SmallEvent = boost::mp11::mp_take_c<Event, 100>;
+
 int main(int argc, const char* argv[])
 {
     if (argc != 2)
@@ -25,11 +27,28 @@ int main(int argc, const char* argv[])
     using namespace std::chrono;
     using namespace ROOT::Experimental;
 
+    // auto ntuple
+    //    = RNTupleReader::Open(RNTupleModel::Create(), "NTuple", "/mnt/c/dev/llama/ttjet_13tev_june2019_lzma.root");
     auto ntuple = RNTupleReader::Open(RNTupleModel::Create(), "NTuple", argv[1]);
-    const auto n = ntuple->GetNEntries();
+    // try
+    //{
+    //    ntuple->PrintInfo(ROOT::Experimental::ENTupleInfo::kStorageDetails);
+    //}
+    // catch (const std::exception& e)
+    //{
+    //    fmt::print("PrintInfo error: {}", e.what());
+    //}
+    const auto eventCount = ntuple->GetNEntries();
+    const auto& d = ntuple->GetDescriptor();
+    const auto electronCount
+        = d.GetNElements(d.FindColumnId(d.FindFieldId("nElectron.nElectron.Electron_deltaEtaSC"), 0));
+    fmt::print("File contains {} events with {} electrons\n", eventCount, electronCount);
 
     auto start = steady_clock::now();
-    auto view = llama::allocView(llama::mapping::SoA<llama::ArrayDims<1>, Event, true>{llama::ArrayDims{n}});
+    auto mapping = llama::mapping::OffsetTable<llama::ArrayDims<1>, SmallEvent>{
+        llama::ArrayDims{eventCount},
+        llama::ArrayDims{electronCount}};
+    auto view = llama::allocView(mapping);
     fmt::print("Alloc LLAMA view: {}ms\n", duration_cast<milliseconds>(steady_clock::now() - start).count());
 
     std::size_t totalSize = 0;
@@ -37,15 +56,60 @@ int main(int argc, const char* argv[])
         totalSize += view.mapping.blobSize(i);
     fmt::print("Total LLAMA view memory: {}MiB in {} blobs\n", totalSize / 1024 / 1024, view.mapping.blobCount);
 
+    // fill offset table
     start = steady_clock::now();
-    llama::forEachLeaf<Event>(
+    std::size_t offset = 0;
+    auto electronViewCollection = ntuple->GetViewCollection("nElectron");
+    for (std::size_t i = 0; i < eventCount; i++)
+    {
+        offset += electronViewCollection(i);
+        view(i)(llama::EndOffset<nElectron>{}) = offset;
+        assert(offset <= electronCount);
+    }
+    fmt::print("Fill offset table: {}ms\n", duration_cast<milliseconds>(steady_clock::now() - start).count());
+
+    using AugmentedSmallEvent = typename decltype(mapping)::RecordDim;
+    start = steady_clock::now();
+    llama::forEachLeaf<AugmentedSmallEvent>(
         [&](auto coord)
         {
-            using Name = llama::GetTag<Event, decltype(coord)>;
-            using Type = llama::GetType<Event, decltype(coord)>;
-            auto column = ntuple->GetView<Type>(llama::structName<Name>());
-            for (std::size_t i = 0; i < n; i++)
-                view(i)(coord) = column(i);
+            using Coord = decltype(coord);
+            using LeafTag = llama::GetTag<AugmentedSmallEvent, Coord>;
+            using Type = llama::GetType<AugmentedSmallEvent, Coord>;
+
+            fmt::print("Copying {}\n", llama::structName<LeafTag>());
+            if constexpr (
+                !llama::mapping::internal::isEndOffsetField<LeafTag> && !llama::mapping::internal::isSizeField<LeafTag>)
+            {
+                if constexpr (boost::mp11::mp_contains<typename Coord::List, boost::mp11::mp_size_t<llama::dynamic>>::
+                                  value)
+                {
+                    using Before = llama::mapping::internal::BeforeDynamic<Coord>;
+                    using BeforeBefore = llama::RecordCoordFromList<boost::mp11::mp_pop_front<typename Before::List>>;
+                    using After = llama::mapping::internal::AfterDynamic<Coord>;
+                    using SubCollectionTag = llama::GetTag<AugmentedSmallEvent, Before>;
+
+                    auto collectionColumn = ntuple->GetViewCollection(llama::structName<SubCollectionTag>());
+                    auto column = collectionColumn.template GetView<Type>(
+                        llama::structName<SubCollectionTag>() + "." + llama::structName<LeafTag>());
+                    for (std::size_t i = 0; i < eventCount; i++)
+                    {
+                        const auto subCollectionCount = view(i)(BeforeBefore{})(llama::Size<SubCollectionTag>{});
+                        for (std::size_t j = 0; j < subCollectionCount; j++)
+                        {
+                            const auto value = column(j);
+                            auto& dst = view(i)(Before{})(j) (After{});
+                            dst = value;
+                        }
+                    }
+                }
+                else
+                {
+                    auto column = ntuple->GetView<Type>(llama::structName<LeafTag>());
+                    for (std::size_t i = 0; i < eventCount; i++)
+                        view(i)(coord) = column(i);
+                }
+            }
         });
     fmt::print("Copy RNTuple -> LLAMA view: {}ms\n", duration_cast<milliseconds>(steady_clock::now() - start).count());