vecmem 1.14.0
Loading...
Searching...
No Matches
aligned_multiple_placement.ipp
1/*
2 * VecMem project, part of the ACTS project (R&D line)
3 *
4 * (c) 2022-2024 CERN for the benefit of the ACTS project
5 *
6 * Mozilla Public License Version 2.0
7 */
8
9#pragma once
10
11// vecmem headers
12#include "vecmem/utils/type_traits.hpp"
13
14// Standard library headers
15#include <algorithm>
16#include <tuple>
17#include <type_traits>
18
19namespace vecmem {
20namespace details {
45template <typename T, typename... Ts, typename P, typename... Ps>
46std::tuple<std::add_pointer_t<T>, std::add_pointer_t<Ts>...>
47aligned_multiple_placement_helper(void *p, std::size_t q, P n, Ps &&... ps) {
48 /*
49 * We start out by calculating the size of the current region.
50 */
51 std::size_t size = sizeof(T) * static_cast<std::size_t>(n);
52
53 /*
54 * We will start out by having this region point to null, because it is
55 * possible to not allocate anything: this is the case if n is equal to
56 * zero, and we support this for convenience if this happens
57 * programmatically.
58 */
59 T *beg = nullptr;
60
61 /*
62 * As mentioned, we only proceed to allocation if we actually need any
63 * memory for this region.
64 */
65 if (size > 0) {
66 /*
67 * We will use `std::align` to determine the beginning of this region
68 * of memory. This function has a few side-effects. The returned
69 * pointer is aligned to the boundary of T, and:
70 *
71 * 1. The variable p is updated such that it equals beg.
72 * 2. The size is decreased to compensate for the side of the padding,
73 * but crucially NOT for the size of the allocation itself!
74 */
75 beg = static_cast<T *>(std::align(alignof(T), size, p, q));
76
77 /*
78 * If `std::align` returns a null pointer, there was insufficient
79 * memory to find an allocated pointer. This should never happen in
80 * practice, but we should check for it regardless.
81 */
82 assert(beg != nullptr);
83
84 /*
85 * Now, we will update our current pointer and remaining size (which,
86 * remember, `std::align` does not do: it only gives the start of the
87 * region and reduces the size by the padding). Essentially, this gives
88 * us the parameters for the next invocation of this function.
89 */
90 p = static_cast<void *>(static_cast<char *>(p) + size);
91 q -= size;
92 }
93
94 /*
95 * We now proceed in one of two different ways: if there are any remaining
96 * regions to reserve memory for, we call this function recursively. Note
97 * that the base case of this recursion is static and known at compile
98 * time. If we have no more types to reserve for, then we are done.
99 */
100 if constexpr (sizeof...(Ts) > 0) {
101 /*
102 * We apply here the same tuple concatenation trick that we use in
103 * aligned_multiple_placement: we concate a single-element tuple
104 * containing the start of the current region with whatever is returned
105 * by the recursive invocation of this method.
106 */
107 return std::tuple_cat(
108 /*
109 * Here we construct the single-element tuple.
110 */
111 std::make_tuple<std::add_pointer_t<T>>(std::move(beg)),
112 /*
113 * Next, we recursively call this method, but with one type
114 * argument stripped, as well as one size argument. We use the
115 * updated pointer and remaining size for this.
116 */
118 std::forward<Ps>(ps)...));
119 } else {
120 /*
121 * If we have no more types, we can return a single-element tuple. This
122 * tuple will be concatenated into a larger one by the caller.
123 */
124 return std::make_tuple<std::add_pointer_t<T>>(std::move(beg));
125 }
126#ifdef __GNUC__
127 // Certain combinations of CUDA + GCC generate a warning here, thinking
128 // that the code may reach this point in the function. So for just GCC,
129 // let's add some help here. Telling it that this part of the function is
130 // not (meant to be) reachable.
132#endif // __GNUC__
133}
134
135template <typename... Ts, typename... Ps>
136std::tuple<vecmem::unique_alloc_ptr<char[]>, std::add_pointer_t<Ts>...>
137aligned_multiple_placement(vecmem::memory_resource &r, Ps &&... ps) {
138 /*
139 * First, we will assert that we have exactly as many template arguments as
140 * we have positional arguments, barring the memory resource. This is very
141 * important, because each template type must be accompanied by a number of
142 * times that type should occur.
143 */
144 static_assert(sizeof...(Ts) == sizeof...(Ps),
145 "Number of type parameters must be equal to the number of "
146 "value parameters.");
147
148 /*
149 * Next, we want all of our positional arguments to be size types, or at
150 * least some type that is trivially convertible to it. We can't really
151 * enforce that cleanly using C++, so we just accept a parameter pack of
152 * arbitrary types and then we check that they're all size-like.
153 */
154 static_assert(std::conjunction_v<std::is_convertible<Ps, std::size_t>...>,
155 "All parameters must be of type std::size_t");
156
157 /*
158 * Calculate the maximum alignment between all of the types in the template
159 * parameter pack, which will determine the amount of additional space
160 * we need to allocate.
161 */
162 std::size_t alignment = vecmem::details::max(alignof(Ts)...);
163
164 /*
165 * Next, we pessimistically calculate the number of bytes we need. We do
166 * this by considering all the types in our parameter pack and multiplying
167 * their size by the number of times we want each type to exist. That
168 * happens using the C++ template fold expression. Then, we add some
169 * buffer, because each additional type will risk wasting some space due to
170 * alignment requirements. We do this by adding the maximum alignment once
171 * for each type, because each type introduces at _most_ that amount of
172 * wasted space. This guarantees that we never run out of space, but it can
173 * sometimes waste a little bit of space (on the order of dozens of bytes
174 * for the common case, but potentially up to a few kilobytes for severely
175 * over-aligned types).
176 */
177 const std::size_t bytes =
178 ((static_cast<std::size_t>(ps) * sizeof(Ts)) + ...) +
179 sizeof...(Ts) * alignment;
180
181 /*
182 * We can now make the allocation request with the memory resource, which
183 * in this case does not need to know anything about our alignment
184 * requirements: we are going to handle all of those ourselves.
185 */
188
189 /*
190 * We'll make a non-owning copy of this pointer, because we will need it in
191 * a moment _after_ we've moved it, so we cannot use the original version
192 * of it anymore.
193 */
194 void *p = ptr.get();
195
196 /*
197 * Now we come to the meat of the pudding. Remember that we want to return
198 * a tuple containing a unique pointer to the start of the allocation as
199 * a whole, and then one pointer for where each of our type regions starts.
200 * To accomplish this, we will concatenate two smaller tuples, namely:
201 *
202 * 1. A single-element tuple containing the unique pointer to the start of
203 * the allocated region.
204 * 2. A tuple of length equal to the number of type parameters, each
205 * element of which is a pointer representing where that type's region
206 * starts.
207 *
208 * It's a little bit silly that we need to construct a single-element tuple
209 * for the first part, but that's simply how `std::tuple_cat` works.
210 */
211 return std::tuple_cat(
212 /*
213 * Here, we construct our single-element tuple, into which we simply
214 * move the unique pointer which manages the memory that we have
215 * allocated previously.
216 */
217 std::make_tuple<vecmem::unique_alloc_ptr<char[]>>(std::move(ptr)),
218 /*
219 * And here we call a helper function, which will actually do all of
220 * the alignment. We pass it the start of our allocation, the amount of
221 * remaining space, and then the number of times we want all of our
222 * types to appear.
223 */
225 std::forward<Ps>(ps)...));
226}
227} // namespace details
228} // namespace vecmem
std::tuple< vecmem::unique_alloc_ptr< char[]>, std::add_pointer_t< Ts >... > aligned_multiple_placement(vecmem::memory_resource &r, Ps &&... ps)
Allocation of aligned arrays of given types.
Definition aligned_multiple_placement.ipp:137
auto max(T &&t)
Find the maximum of a variadic number of elements, terminal function.
Definition type_traits.hpp:101
std::tuple< std::add_pointer_t< T >, std::add_pointer_t< Ts >... > aligned_multiple_placement_helper(void *p, std::size_t q, P n, Ps &&... ps)
Helper function for aligned_multiple_placement.
Definition aligned_multiple_placement.ipp:47
Main namespace for the vecmem classes/functions.
Definition atomic_ref.hpp:16
std::vector< T, vecmem::polymorphic_allocator< T > > vector
Alias type for vectors with our polymorphic allocator.
Definition vector.hpp:35
std::unique_ptr< T, details::unique_alloc_deleter< T > > unique_alloc_ptr
A unique pointer type for trivial types.
Definition unique_ptr.hpp:69