warp-lang 1.1.0__py3-none-manylinux2014_x86_64.whl → 1.2.0__py3-none-manylinux2014_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (218) hide show
  1. warp/bin/warp-clang.so +0 -0
  2. warp/bin/warp.so +0 -0
  3. warp/build.py +10 -37
  4. warp/build_dll.py +2 -2
  5. warp/builtins.py +274 -6
  6. warp/codegen.py +51 -4
  7. warp/config.py +2 -2
  8. warp/constants.py +4 -0
  9. warp/context.py +418 -203
  10. warp/examples/benchmarks/benchmark_api.py +0 -2
  11. warp/examples/benchmarks/benchmark_cloth_warp.py +0 -1
  12. warp/examples/benchmarks/benchmark_launches.py +0 -2
  13. warp/examples/core/example_dem.py +0 -2
  14. warp/examples/core/example_fluid.py +0 -2
  15. warp/examples/core/example_graph_capture.py +0 -2
  16. warp/examples/core/example_marching_cubes.py +0 -2
  17. warp/examples/core/example_mesh.py +0 -2
  18. warp/examples/core/example_mesh_intersect.py +0 -2
  19. warp/examples/core/example_nvdb.py +0 -2
  20. warp/examples/core/example_raycast.py +0 -2
  21. warp/examples/core/example_raymarch.py +0 -2
  22. warp/examples/core/example_render_opengl.py +0 -2
  23. warp/examples/core/example_sph.py +0 -2
  24. warp/examples/core/example_torch.py +0 -3
  25. warp/examples/core/example_wave.py +0 -2
  26. warp/examples/fem/example_apic_fluid.py +140 -115
  27. warp/examples/fem/example_burgers.py +262 -0
  28. warp/examples/fem/example_convection_diffusion.py +0 -2
  29. warp/examples/fem/example_convection_diffusion_dg.py +0 -2
  30. warp/examples/fem/example_deformed_geometry.py +0 -2
  31. warp/examples/fem/example_diffusion.py +0 -2
  32. warp/examples/fem/example_diffusion_3d.py +5 -4
  33. warp/examples/fem/example_diffusion_mgpu.py +0 -2
  34. warp/examples/fem/example_mixed_elasticity.py +0 -2
  35. warp/examples/fem/example_navier_stokes.py +0 -2
  36. warp/examples/fem/example_stokes.py +0 -2
  37. warp/examples/fem/example_stokes_transfer.py +0 -2
  38. warp/examples/optim/example_bounce.py +0 -2
  39. warp/examples/optim/example_cloth_throw.py +0 -2
  40. warp/examples/optim/example_diffray.py +0 -2
  41. warp/examples/optim/example_drone.py +0 -2
  42. warp/examples/optim/example_inverse_kinematics.py +0 -2
  43. warp/examples/optim/example_inverse_kinematics_torch.py +0 -2
  44. warp/examples/optim/example_spring_cage.py +0 -2
  45. warp/examples/optim/example_trajectory.py +0 -2
  46. warp/examples/optim/example_walker.py +0 -2
  47. warp/examples/sim/example_cartpole.py +0 -2
  48. warp/examples/sim/example_cloth.py +0 -2
  49. warp/examples/sim/example_granular.py +0 -2
  50. warp/examples/sim/example_granular_collision_sdf.py +0 -2
  51. warp/examples/sim/example_jacobian_ik.py +0 -2
  52. warp/examples/sim/example_particle_chain.py +0 -2
  53. warp/examples/sim/example_quadruped.py +0 -2
  54. warp/examples/sim/example_rigid_chain.py +0 -2
  55. warp/examples/sim/example_rigid_contact.py +0 -2
  56. warp/examples/sim/example_rigid_force.py +0 -2
  57. warp/examples/sim/example_rigid_gyroscopic.py +0 -2
  58. warp/examples/sim/example_rigid_soft_contact.py +0 -2
  59. warp/examples/sim/example_soft_body.py +0 -2
  60. warp/fem/__init__.py +1 -0
  61. warp/fem/cache.py +3 -1
  62. warp/fem/geometry/__init__.py +1 -0
  63. warp/fem/geometry/element.py +4 -0
  64. warp/fem/geometry/grid_3d.py +0 -4
  65. warp/fem/geometry/nanogrid.py +455 -0
  66. warp/fem/integrate.py +63 -9
  67. warp/fem/space/__init__.py +43 -158
  68. warp/fem/space/basis_space.py +34 -0
  69. warp/fem/space/collocated_function_space.py +1 -1
  70. warp/fem/space/grid_2d_function_space.py +13 -132
  71. warp/fem/space/grid_3d_function_space.py +16 -154
  72. warp/fem/space/hexmesh_function_space.py +37 -134
  73. warp/fem/space/nanogrid_function_space.py +202 -0
  74. warp/fem/space/quadmesh_2d_function_space.py +12 -119
  75. warp/fem/space/restriction.py +4 -1
  76. warp/fem/space/shape/__init__.py +77 -0
  77. warp/fem/space/shape/cube_shape_function.py +5 -15
  78. warp/fem/space/tetmesh_function_space.py +6 -76
  79. warp/fem/space/trimesh_2d_function_space.py +6 -76
  80. warp/native/array.h +12 -3
  81. warp/native/builtin.h +48 -5
  82. warp/native/bvh.cpp +14 -10
  83. warp/native/bvh.cu +23 -15
  84. warp/native/bvh.h +1 -0
  85. warp/native/clang/clang.cpp +2 -1
  86. warp/native/crt.cpp +11 -1
  87. warp/native/crt.h +18 -1
  88. warp/native/exports.h +187 -0
  89. warp/native/mat.h +47 -0
  90. warp/native/mesh.cpp +1 -1
  91. warp/native/mesh.cu +1 -2
  92. warp/native/nanovdb/GridHandle.h +366 -0
  93. warp/native/nanovdb/HostBuffer.h +590 -0
  94. warp/native/nanovdb/NanoVDB.h +3999 -2157
  95. warp/native/nanovdb/PNanoVDB.h +936 -99
  96. warp/native/quat.h +28 -1
  97. warp/native/rand.h +5 -1
  98. warp/native/vec.h +45 -1
  99. warp/native/volume.cpp +335 -103
  100. warp/native/volume.cu +39 -13
  101. warp/native/volume.h +725 -303
  102. warp/native/volume_builder.cu +381 -360
  103. warp/native/volume_builder.h +16 -1
  104. warp/native/volume_impl.h +61 -0
  105. warp/native/warp.cu +8 -2
  106. warp/native/warp.h +15 -7
  107. warp/render/render_opengl.py +191 -52
  108. warp/sim/integrator_featherstone.py +10 -3
  109. warp/sim/integrator_xpbd.py +16 -22
  110. warp/sparse.py +89 -27
  111. warp/stubs.py +83 -0
  112. warp/tests/assets/test_index_grid.nvdb +0 -0
  113. warp/tests/aux_test_dependent.py +0 -2
  114. warp/tests/aux_test_grad_customs.py +0 -2
  115. warp/tests/aux_test_reference.py +0 -2
  116. warp/tests/aux_test_reference_reference.py +0 -2
  117. warp/tests/aux_test_square.py +0 -2
  118. warp/tests/disabled_kinematics.py +0 -2
  119. warp/tests/test_adam.py +0 -2
  120. warp/tests/test_arithmetic.py +0 -36
  121. warp/tests/test_array.py +9 -11
  122. warp/tests/test_array_reduce.py +0 -2
  123. warp/tests/test_async.py +0 -2
  124. warp/tests/test_atomic.py +0 -2
  125. warp/tests/test_bool.py +58 -50
  126. warp/tests/test_builtins_resolution.py +0 -2
  127. warp/tests/test_bvh.py +0 -2
  128. warp/tests/test_closest_point_edge_edge.py +0 -1
  129. warp/tests/test_codegen.py +0 -4
  130. warp/tests/test_compile_consts.py +130 -10
  131. warp/tests/test_conditional.py +0 -2
  132. warp/tests/test_copy.py +0 -2
  133. warp/tests/test_ctypes.py +6 -8
  134. warp/tests/test_dense.py +0 -2
  135. warp/tests/test_devices.py +0 -2
  136. warp/tests/test_dlpack.py +9 -11
  137. warp/tests/test_examples.py +42 -39
  138. warp/tests/test_fabricarray.py +0 -3
  139. warp/tests/test_fast_math.py +0 -2
  140. warp/tests/test_fem.py +75 -54
  141. warp/tests/test_fp16.py +0 -2
  142. warp/tests/test_func.py +0 -2
  143. warp/tests/test_generics.py +27 -2
  144. warp/tests/test_grad.py +147 -8
  145. warp/tests/test_grad_customs.py +0 -2
  146. warp/tests/test_hash_grid.py +1 -3
  147. warp/tests/test_import.py +0 -2
  148. warp/tests/test_indexedarray.py +0 -2
  149. warp/tests/test_intersect.py +0 -2
  150. warp/tests/test_jax.py +0 -2
  151. warp/tests/test_large.py +11 -9
  152. warp/tests/test_launch.py +0 -2
  153. warp/tests/test_lerp.py +10 -54
  154. warp/tests/test_linear_solvers.py +3 -5
  155. warp/tests/test_lvalue.py +0 -2
  156. warp/tests/test_marching_cubes.py +0 -2
  157. warp/tests/test_mat.py +0 -2
  158. warp/tests/test_mat_lite.py +0 -2
  159. warp/tests/test_mat_scalar_ops.py +0 -2
  160. warp/tests/test_math.py +0 -2
  161. warp/tests/test_matmul.py +35 -37
  162. warp/tests/test_matmul_lite.py +29 -31
  163. warp/tests/test_mempool.py +0 -2
  164. warp/tests/test_mesh.py +0 -3
  165. warp/tests/test_mesh_query_aabb.py +0 -2
  166. warp/tests/test_mesh_query_point.py +0 -2
  167. warp/tests/test_mesh_query_ray.py +0 -2
  168. warp/tests/test_mlp.py +0 -2
  169. warp/tests/test_model.py +0 -2
  170. warp/tests/test_module_hashing.py +111 -0
  171. warp/tests/test_modules_lite.py +0 -3
  172. warp/tests/test_multigpu.py +0 -2
  173. warp/tests/test_noise.py +0 -4
  174. warp/tests/test_operators.py +0 -2
  175. warp/tests/test_options.py +0 -2
  176. warp/tests/test_peer.py +0 -2
  177. warp/tests/test_pinned.py +0 -2
  178. warp/tests/test_print.py +0 -2
  179. warp/tests/test_quat.py +0 -2
  180. warp/tests/test_rand.py +41 -5
  181. warp/tests/test_reload.py +0 -10
  182. warp/tests/test_rounding.py +0 -2
  183. warp/tests/test_runlength_encode.py +0 -2
  184. warp/tests/test_sim_grad.py +0 -2
  185. warp/tests/test_sim_kinematics.py +0 -2
  186. warp/tests/test_smoothstep.py +0 -2
  187. warp/tests/test_snippet.py +0 -2
  188. warp/tests/test_sparse.py +0 -2
  189. warp/tests/test_spatial.py +0 -2
  190. warp/tests/test_special_values.py +362 -0
  191. warp/tests/test_streams.py +0 -2
  192. warp/tests/test_struct.py +0 -2
  193. warp/tests/test_tape.py +0 -2
  194. warp/tests/test_torch.py +0 -2
  195. warp/tests/test_transient_module.py +0 -2
  196. warp/tests/test_types.py +0 -2
  197. warp/tests/test_utils.py +0 -2
  198. warp/tests/test_vec.py +0 -2
  199. warp/tests/test_vec_lite.py +0 -2
  200. warp/tests/test_vec_scalar_ops.py +0 -2
  201. warp/tests/test_verify_fp.py +0 -2
  202. warp/tests/test_volume.py +237 -13
  203. warp/tests/test_volume_write.py +86 -3
  204. warp/tests/unittest_serial.py +10 -9
  205. warp/tests/unittest_suites.py +6 -2
  206. warp/tests/unittest_utils.py +2 -171
  207. warp/tests/unused_test_misc.py +0 -2
  208. warp/tests/walkthrough_debug.py +1 -1
  209. warp/thirdparty/unittest_parallel.py +37 -40
  210. warp/types.py +514 -77
  211. {warp_lang-1.1.0.dist-info → warp_lang-1.2.0.dist-info}/METADATA +57 -30
  212. warp_lang-1.2.0.dist-info/RECORD +359 -0
  213. warp/examples/fem/example_convection_diffusion_dg0.py +0 -204
  214. warp/native/nanovdb/PNanoVDBWrite.h +0 -295
  215. warp_lang-1.1.0.dist-info/RECORD +0 -352
  216. {warp_lang-1.1.0.dist-info → warp_lang-1.2.0.dist-info}/LICENSE.md +0 -0
  217. {warp_lang-1.1.0.dist-info → warp_lang-1.2.0.dist-info}/WHEEL +0 -0
  218. {warp_lang-1.1.0.dist-info → warp_lang-1.2.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,590 @@
1
+ // Copyright Contributors to the OpenVDB Project
2
+ // SPDX-License-Identifier: MPL-2.0
3
+
4
+ /*!
5
+ @file nanovdb/HostBuffer.h
6
+
7
+ @date April 20, 2021
8
+
9
+ @brief HostBuffer - a buffer that contains a shared or private bump
10
+ pool to either externally or internally managed host memory.
11
+
12
+ @details This HostBuffer can be used in multiple ways, most of which are
13
+ demonstrated in the examples below. Memory in the pool can
14
+ be managed or unmanaged (e.g. internal or external) and can
15
+ be shared between multiple buffers or belong to a single buffer.
16
+
17
+ Example that uses HostBuffer::create inside io::readGrids to create a
18
+ full self-managed buffer, i.e. not shared and without padding, per grid in the file.
19
+ @code
20
+ auto handles = nanovdb::io::readGrids("file.nvdb");
21
+ @endcode
22
+
23
+ Example that uses HostBuffer::createFull. Assuming you have a raw pointer
24
+ to a NanoVDB grid of unknown type, this example shows how to create its
25
+ GridHandle which can be used to enquire about the grid type and meta data.
26
+ @code
27
+ void *data;// pointer to a NanoVDB grid of unknown type
28
+ uint64_t size;// byte size of NanoVDB grid of unknown type
29
+ auto buffer = nanovdb::HostBuffer::createFull(size, data);
30
+ nanovdb::GridHandle<> gridHandle(std::move(buffer));
31
+ @endcode
32
+
33
+ Example that uses HostBuffer::createPool for internally managed host memory.
34
+ Suppose you want to read multiple grids in multiple files, but reuse the same
35
+ fixed sized memory buffer to both avoid memory fragmentation as well as
36
+ exceeding the fixed memory ceiling!
37
+ @code
38
+ auto pool = nanovdb::HostBuffer::createPool(1 << 30);// 1 GB memory pool
39
+ std::vector<std::string> frames;// vector of grid names
40
+ for (int i=0; i<frames.size(); ++i) {
41
+ auto handles = nanovdb::io::readGrids(frames[i], 0, pool);// throws if grids in file exceed 1 GB
42
+ ...
43
+ pool.reset();// clears all handles and resets the memory pool for reuse
44
+ }
45
+ @endcode
46
+
47
+ Example that uses HostBuffer::createPool for externally managed host memory.
48
+ Note that in this example @c handles are allowed to outlive @c pool since
49
+ they internally store a shared pointer to the memory pool. However @c data
50
+ MUST outlive @c handles since the pool does not own its memory in this example.
51
+ @code
52
+ const size_t poolSize = 1 << 30;// 1 GB
53
+ void *data = std::malloc(poolSize + NANOVDB_DATA_ALIGNMENT);// 1 GB pool with padding
54
+ void *buffer = nanovdb::alignPtr(data);// 32B aligned buffer
55
+ //void *buffer = std::aligned_alloc(NANOVDB_DATA_ALIGNMENT, poolSize);// in C++17
56
+ auto pool = nanovdb::HostBuffer::createPool(poolSize, buffer);
57
+ auto handles1 = nanovdb::io::readGrids("file1.nvdb", 0, pool);
58
+ auto handles2 = nanovdb::io::readGrids("file2.nvdb", 0, pool);
59
+ ....
60
+ std::free(data);
61
+ //std::free(buffer);
62
+ @endcode
63
+
64
+ Example that uses HostBuffer::createPool for externally managed host memory.
65
+ Note that in this example @c handles are allowed to outlive @c pool since
66
+ they internally store a shared pointer to the memory pool. However @c array
67
+ MUST outlive @c handles since the pool does not own its memory in this example.
68
+ @code
69
+ const size_t poolSize = 1 << 30;// 1 GB
70
+ std::unique_ptr<char[]> array(new char[poolSize + NANOVDB_DATA_ALIGNMENT]);// scoped pool of 1 GB with padding
71
+ void *buffer = nanovdb::alignPtr(array.get());// 32B aligned buffer
72
+ auto pool = nanovdb::HostBuffer::createPool(poolSize, buffer);
73
+ auto handles = nanovdb::io::readGrids("file.nvdb", 0, pool);
74
+ @endcode
75
+ */
76
+
77
+ #ifndef NANOVDB_HOSTBUFFER_H_HAS_BEEN_INCLUDED
78
+ #define NANOVDB_HOSTBUFFER_H_HAS_BEEN_INCLUDED
79
+
80
+ #include <nanovdb/NanoVDB.h>// for NANOVDB_DATA_ALIGNMENT;
81
+ #include <stdint.h> // for types like int32_t etc
82
+ #include <cstdio> // for fprintf
83
+ #include <cstdlib> // for std::malloc/std::realloc/std::free
84
+ #include <memory>// for std::make_shared
85
+ #include <mutex>// for std::mutex
86
+ #include <unordered_set>// for std::unordered_set
87
+ #include <cassert>// for assert
88
+ #include <sstream>// for std::stringstream
89
+ #include <cstring>// for memcpy
90
+ // Forwards (ptr, msg) plus the call site's __FILE__ and __LINE__ to ptrAssert. NOTE(review): ptrAssert is declared below as a private static member of HostBuffer, so this presumably only resolves where that member is in scope -- confirm.
91
+ #define checkPtr(ptr, msg) \
92
+ { \
93
+ ptrAssert((ptr), (msg), __FILE__, __LINE__); \
94
+ }
95
+
96
+ namespace nanovdb {
97
+ /// @brief Compile-time traits of a buffer type; this primary template reports hasDeviceDual = false for every BufferT. NOTE(review): presumably specialized elsewhere for buffers that have a device-side counterpart -- confirm.
98
+ template<typename BufferT>
99
+ struct BufferTraits
100
+ {
101
+ static constexpr bool hasDeviceDual = false;
102
+ };
103
+
104
+ // ----------------------------> HostBuffer <--------------------------------------
105
+
106
+ /// @brief This is a buffer that contains a shared or private pool
107
+ /// to either externally or internally managed host memory.
108
+ ///
109
+ /// @note Terminology:
110
+ /// Pool: 0 = buffer.size() < buffer.poolSize()
111
+ /// Buffer: 0 < buffer.size() < buffer.poolSize()
112
+ /// Full: 0 < buffer.size() = buffer.poolSize()
113
+ /// Empty: 0 = buffer.size() = buffer.poolSize()
114
+ class HostBuffer
115
+ {
116
+ struct Pool;// forward declaration of private pool struct
117
+ std::shared_ptr<Pool> mPool;
118
+ uint64_t mSize; // total number of bytes for the NanoVDB grid.
119
+ void* mData; // raw buffer for the NanoVDB grid.
120
+
121
+ #if defined(DEBUG) || defined(_DEBUG)
122
+ static inline void ptrAssert(void* ptr, const char* msg, const char* file, int line, bool abort = true)
123
+ {
124
+ if (ptr == nullptr) {
125
+ fprintf(stderr, "NULL pointer error: %s %s %d\n", msg, file, line);
126
+ if (abort)
127
+ exit(1);
128
+ }
129
+ if (uint64_t(ptr) % NANOVDB_DATA_ALIGNMENT) {
130
+ fprintf(stderr, "Alignment pointer error: %s %s %d\n", msg, file, line);
131
+ if (abort)
132
+ exit(1);
133
+ }
134
+ }
135
+ #else
136
+ static inline void ptrAssert(void*, const char*, const char*, int, bool = true)
137
+ {
138
+ }
139
+ #endif
140
+
141
+ public:
142
+ /// @brief Return a full buffer or an empty buffer
143
+ HostBuffer(uint64_t bufferSize = 0);
144
+
145
+ /// @brief Move copy-constructor
146
+ HostBuffer(HostBuffer&& other);
147
+
148
+ /// @brief Custom descructor
149
+ ~HostBuffer() { this->clear(); }
150
+
151
+ /// @brief Move copy assignment operation
152
+ HostBuffer& operator=(HostBuffer&& other);
153
+
154
+ /// @brief Disallow copy-construction
155
+ HostBuffer(const HostBuffer&) = delete;
156
+
157
+ /// @brief Disallow copy assignment operation
158
+ HostBuffer& operator=(const HostBuffer&) = delete;
159
+
160
+ /// @brief Return a pool buffer which satisfies: buffer.size == 0,
161
+ /// buffer.poolSize() == poolSize, and buffer.data() == nullptr.
162
+ /// If data==nullptr, memory for the pool will be allocated.
163
+ ///
164
+ /// @throw If poolSize is zero.
165
+ static HostBuffer createPool(uint64_t poolSize, void *data = nullptr);
166
+
167
+ /// @brief Return a full buffer which satisfies: buffer.size == bufferSize,
168
+ /// buffer.poolSize() == bufferSize, and buffer.data() == data.
169
+ /// If data==nullptr, memory for the pool will be allocated.
170
+ ///
171
+ /// @throw If bufferSize is zero.
172
+ static HostBuffer createFull(uint64_t bufferSize, void *data = nullptr);
173
+
174
+ /// @brief Return a buffer with @c bufferSize bytes managed by
175
+ /// the specified memory @c pool. If none is provided, i.e.
176
+ /// @c pool == nullptr or @c pool->poolSize() == 0, one is
177
+ /// created with size @c bufferSize, i.e. a full buffer is returned.
178
+ ///
179
+ /// @throw If the specified @c pool has insufficient memory for
180
+ /// the requested buffer size.
181
+ static HostBuffer create(uint64_t bufferSize, const HostBuffer* pool = nullptr);
182
+
183
+ /// @brief Initialize as a full buffer with the specified size. If data is NULL
184
+ /// the memory is internally allocated.
185
+ void init(uint64_t bufferSize, void *data = nullptr);
186
+
187
+ //@{
188
+ /// @brief Retuns a pointer to the raw memory buffer managed by this allocator.
189
+ ///
190
+ /// @warning Note that the pointer can be NULL if the allocator was not initialized!
191
+ const void* data() const { return mData; }
192
+ void* data() { return mData; }
193
+ //@}
194
+
195
+ //@{
196
+ /// @brief Returns the size in bytes associated with this buffer.
197
+ uint64_t bufferSize() const { return mSize; }
198
+ uint64_t size() const { return this->bufferSize(); }
199
+ //@}
200
+
201
+ /// @brief Returns the size in bytes of the memory pool shared with this instance.
202
+ uint64_t poolSize() const;
203
+
204
+ /// @brief Return true if memory is managed (using std::malloc and std:free) by the
205
+ /// shared pool in this buffer. Else memory is assumed to be managed externally.
206
+ bool isManaged() const;
207
+
208
+ //@{
209
+ /// @brief Returns true if this buffer has no memory associated with it
210
+ bool isEmpty() const { return !mPool || mSize == 0 || mData == nullptr; }
211
+ bool empty() const { return this->isEmpty(); }
212
+ //@}
213
+
214
+ /// @brief Return true if this is a pool, i.e. an empty buffer with a nonempty
215
+ /// internal pool, i.e. this->size() == 0 and this->poolSize() != 0
216
+ bool isPool() const { return mSize == 0 && this->poolSize() > 0; }
217
+
218
+ /// @brief Return true if the pool exists, is nonempty but has no more available memory
219
+ bool isFull() const;
220
+
221
+ /// @brief Clear this buffer so it is empty.
222
+ void clear();
223
+
224
+ /// @brief Clears all existing buffers that are registered against the memory pool
225
+ /// and resets the pool so it can be reused to create new buffers.
226
+ ///
227
+ /// @throw If this instance is not empty or contains no pool.
228
+ ///
229
+ /// @warning This method is not thread-safe!
230
+ void reset();
231
+
232
+ /// @brief Total number of bytes from the pool currently in use by buffers
233
+ uint64_t poolUsage() const;
234
+
235
+ /// @brief resize the pool size. It will attempt to resize the existing
236
+ /// memory block, but if that fails a deep copy is performed.
237
+ /// If @c data is not NULL it will be used as new externally
238
+ /// managed memory for the pool. All registered buffers are
239
+ /// updated so GridHandle::grid might return a new address (if
240
+ /// deep copy was performed).
241
+ ///
242
+ /// @note This method can be use to resize the memory pool and even
243
+ /// change it from internally to externally managed memory or vice versa.
244
+ ///
245
+ /// @throw if @c poolSize is less than this->poolUsage() the used memory
246
+ /// or allocations fail.
247
+ void resizePool(uint64_t poolSize, void *data = nullptr);
248
+
249
+ }; // HostBuffer class
250
+
251
+ // --------------------------> Implementation of HostBuffer::Pool <------------------------------------
252
+
253
+ // This is private struct of HostBuffer so you can safely ignore the API
254
+ struct HostBuffer::Pool
255
+ {
256
+ using HashTableT = std::unordered_set<HostBuffer*>;
257
+ std::mutex mMutex; // mutex for updating mRegister and mFree
258
+ HashTableT mRegister;
259
+ void *mData, *mFree;
260
+ uint64_t mSize, mPadding;
261
+ bool mManaged;
262
+
263
+ /// @brief External memory ctor
264
+ Pool(uint64_t size = 0, void* data = nullptr)
265
+ : mData(data)
266
+ , mFree(mData)
267
+ , mSize(size)
268
+ , mPadding(0)
269
+ , mManaged(data == nullptr)
270
+ {
271
+ if (mManaged) {
272
+ mData = Pool::alloc(mSize);
273
+ if (mData == nullptr) throw std::runtime_error("Pool::Pool malloc failed");
274
+ }
275
+ mPadding = alignmentPadding(mData);
276
+ if (!mManaged && mPadding != 0) {
277
+ throw std::runtime_error("Pool::Pool: external memory buffer is not aligned to " +
278
+ std::to_string(NANOVDB_DATA_ALIGNMENT) +
279
+ " bytes.\nHint: use nanovdb::alignPtr or std::aligned_alloc (C++17 only)");
280
+ }
281
+ mFree = util::PtrAdd(mData, mPadding);
282
+ }
283
+
284
+ /// @brief Custom destructor
285
+ ~Pool()
286
+ {
287
+ assert(mRegister.empty());
288
+ if (mManaged) std::free(mData);
289
+ }
290
+
291
+ /// @brief Disallow copy-construction
292
+ Pool(const Pool&) = delete;
293
+
294
+ /// @brief Disallow move-construction
295
+ Pool(const Pool&&) = delete;
296
+
297
+ /// @brief Disallow copy assignment operation
298
+ Pool& operator=(const Pool&) = delete;
299
+
300
+ /// @brief Disallow move assignment operation
301
+ Pool& operator=(const Pool&&) = delete;
302
+
303
+ /// @brief Return the total number of bytes used from this Pool by buffers
304
+ uint64_t usage() const { return util::PtrDiff(mFree, mData) - mPadding; }
305
+
306
+ /// @brief Allocate a buffer of the specified size and add it to the register
307
+ void add(HostBuffer* buffer, uint64_t size)
308
+ {
309
+ void *alignedFree = util::PtrAdd(mFree, alignmentPadding(mFree));
310
+
311
+ if (util::PtrAdd(alignedFree, size) > util::PtrAdd(mData, mPadding + mSize)) {
312
+ std::stringstream ss;
313
+ ss << "HostBuffer::Pool: insufficient memory\n"
314
+ << "\tA buffer requested " << size << " bytes with " << NANOVDB_DATA_ALIGNMENT
315
+ << "-bytes alignment from a pool with "
316
+ << mSize << " bytes of which\n\t" << (util::PtrDiff(alignedFree, mData) - mPadding)
317
+ << " bytes are used by " << mRegister.size() << " other buffer(s). "
318
+ << "Pool is " << (mManaged ? "internally" : "externally") << " managed.\n";
319
+ //std::cerr << ss.str();
320
+ throw std::runtime_error(ss.str());
321
+ }
322
+ buffer->mSize = size;
323
+ const std::lock_guard<std::mutex> lock(mMutex);
324
+ mRegister.insert(buffer);
325
+ buffer->mData = alignedFree;
326
+ mFree = util::PtrAdd(alignedFree, size);
327
+ }
328
+
329
+ /// @brief Remove the specified buffer from the register
330
+ void remove(HostBuffer *buffer)
331
+ {
332
+ const std::lock_guard<std::mutex> lock(mMutex);
333
+ mRegister.erase(buffer);
334
+ }
335
+
336
+ /// @brief Replaces buffer1 with buffer2 in the register
337
+ void replace(HostBuffer *buffer1, HostBuffer *buffer2)
338
+ {
339
+ const std::lock_guard<std::mutex> lock(mMutex);
340
+ mRegister.erase( buffer1);
341
+ mRegister.insert(buffer2);
342
+ }
343
+
344
+ /// @brief Reset the register and all its buffers
345
+ void reset()
346
+ {
347
+ for (HostBuffer *buffer : mRegister) {
348
+ buffer->mPool.reset();
349
+ buffer->mSize = 0;
350
+ buffer->mData = nullptr;
351
+ }
352
+ mRegister.clear();
353
+ mFree = util::PtrAdd(mData, mPadding);
354
+ }
355
+
356
+ /// @brief Resize this Pool and update registered buffers as needed. If data is no NULL
357
+ /// it is used as externally managed memory.
358
+ void resize(uint64_t size, void *data = nullptr)
359
+ {
360
+ const uint64_t memUsage = this->usage();
361
+
362
+ const bool managed = (data == nullptr);
363
+
364
+ if (!managed && alignmentPadding(data) != 0) {
365
+ throw std::runtime_error("Pool::resize: external memory buffer is not aligned to " +
366
+ std::to_string(NANOVDB_DATA_ALIGNMENT) + " bytes");
367
+ }
368
+
369
+ if (memUsage > size) {
370
+ throw std::runtime_error("Pool::resize: insufficient memory");
371
+ }
372
+
373
+ uint64_t padding = 0;
374
+ if (mManaged && managed && size != mSize) { // managed -> managed
375
+ padding = mPadding;
376
+ data = Pool::realloc(mData, memUsage, size, padding); // performs both copy and free of mData
377
+ } else if (!mManaged && managed) { // un-managed -> managed
378
+ data = Pool::alloc(size);
379
+ padding = alignmentPadding(data);
380
+ }
381
+
382
+ if (data == nullptr) {
383
+ throw std::runtime_error("Pool::resize: allocation failed");
384
+ } else if (data != mData) {
385
+ void* paddedData = util::PtrAdd(data, padding);
386
+
387
+ if (!(mManaged && managed)) { // no need to copy if managed -> managed
388
+ memcpy(paddedData, util::PtrAdd(mData, mPadding), memUsage);
389
+ }
390
+
391
+ for (HostBuffer* buffer : mRegister) { // update registered buffers
392
+ //buffer->mData = paddedData + ptrdiff_t(buffer->mData - (mData + mPadding));
393
+ buffer->mData = util::PtrAdd(paddedData, util::PtrDiff(buffer->mData, util::PtrAdd(mData, mPadding)));
394
+ }
395
+ mFree = util::PtrAdd(paddedData, memUsage); // update the free pointer
396
+ if (mManaged && !managed) {// only free if managed -> un-managed
397
+ std::free(mData);
398
+ }
399
+
400
+ mData = data;
401
+ mPadding = padding;
402
+ }
403
+ mSize = size;
404
+ mManaged = managed;
405
+ }
406
+ /// @brief Return true is all the memory in this pool is in use.
407
+ bool isFull() const
408
+ {
409
+ assert(mFree <= util::PtrAdd(mData, mPadding + mSize));
410
+ return mSize > 0 ? mFree == util::PtrAdd(mData, mPadding + mSize) : false;
411
+ }
412
+
413
+ private:
414
+
415
+ static void* alloc(uint64_t size)
416
+ {
417
+ //#if (__cplusplus >= 201703L)
418
+ // return std::aligned_alloc(NANOVDB_DATA_ALIGNMENT, size);//C++17 or newer
419
+ //#else
420
+ // make sure we alloc enough space to align the result
421
+ return std::malloc(size + NANOVDB_DATA_ALIGNMENT);
422
+ //#endif
423
+ }
424
+
425
+ static void* realloc(void* const origData,
426
+ uint64_t origSize,
427
+ uint64_t desiredSize,
428
+ uint64_t& padding)
429
+ {
430
+ // make sure we alloc enough space to align the result
431
+ void* data = std::realloc(origData, desiredSize + NANOVDB_DATA_ALIGNMENT);
432
+
433
+ if (data != nullptr && data != origData) {
434
+ uint64_t newPadding = alignmentPadding(data);
435
+ // Number of padding bytes may have changed -- move data if that's the case
436
+ if (newPadding != padding) {
437
+ // Realloc should not happen when shrinking down buffer, but let's be safe
438
+ std::memmove(util::PtrAdd(data, newPadding),
439
+ util::PtrAdd(data, padding),
440
+ math::Min(origSize, desiredSize));
441
+ padding = newPadding;
442
+ }
443
+ }
444
+
445
+ return data;
446
+ }
447
+
448
+ };// struct HostBuffer::Pool
449
+
450
+ // --------------------------> Implementation of HostBuffer <------------------------------------
451
+
452
+ inline HostBuffer::HostBuffer(uint64_t size) : mPool(nullptr), mSize(size), mData(nullptr)
453
+ {
454
+ if (size>0) {
455
+ mPool = std::make_shared<Pool>(size);
456
+ mData = mPool->mFree;
457
+ mPool->mRegister.insert(this);
458
+ mPool->mFree = util::PtrAdd(mPool->mFree, size);
459
+ }
460
+ }
461
+
462
+ inline HostBuffer::HostBuffer(HostBuffer&& other) : mPool(other.mPool), mSize(other.mSize), mData(other.mData)
463
+ {
464
+ if (mPool && mSize != 0) {
465
+ mPool->replace(&other, this);
466
+ }
467
+ other.mPool.reset();
468
+ other.mSize = 0;
469
+ other.mData = nullptr;
470
+ }
471
+
472
+ inline void HostBuffer::init(uint64_t bufferSize, void *data)
473
+ {
474
+ if (bufferSize == 0) {
475
+ throw std::runtime_error("HostBuffer: invalid buffer size");
476
+ }
477
+ if (mPool) {
478
+ mPool.reset();
479
+ }
480
+ if (!mPool || mPool->mSize != bufferSize) {
481
+ mPool = std::make_shared<Pool>(bufferSize, data);
482
+ }
483
+ mPool->add(this, bufferSize);
484
+ }
485
+
486
+ inline HostBuffer& HostBuffer::operator=(HostBuffer&& other)
487
+ {
488
+ if (mPool) {
489
+ mPool->remove(this);
490
+ }
491
+ mPool = other.mPool;
492
+ mSize = other.mSize;
493
+ mData = other.mData;
494
+ if (mPool && mSize != 0) {
495
+ mPool->replace(&other, this);
496
+ }
497
+ other.mPool.reset();
498
+ other.mSize = 0;
499
+ other.mData = nullptr;
500
+ return *this;
501
+ }
502
+
503
+ inline uint64_t HostBuffer::poolSize() const
504
+ {
505
+ return mPool ? mPool->mSize : 0u;
506
+ }
507
+
508
+ inline uint64_t HostBuffer::poolUsage() const
509
+ {
510
+ return mPool ? mPool->usage(): 0u;
511
+ }
512
+
513
+ inline bool HostBuffer::isManaged() const
514
+ {
515
+ return mPool ? mPool->mManaged : false;
516
+ }
517
+
518
+ inline bool HostBuffer::isFull() const
519
+ {
520
+ return mPool ? mPool->isFull() : false;
521
+ }
522
+
523
+ inline HostBuffer HostBuffer::createPool(uint64_t poolSize, void *data)
524
+ {
525
+ if (poolSize == 0) {
526
+ throw std::runtime_error("HostBuffer: invalid pool size");
527
+ }
528
+ HostBuffer buffer;
529
+ buffer.mPool = std::make_shared<Pool>(poolSize, data);
530
+ // note the buffer is NOT registered by its pool since it is not using its memory
531
+ buffer.mSize = 0;
532
+ buffer.mData = nullptr;
533
+ return buffer;
534
+ }
535
+
536
+ inline HostBuffer HostBuffer::createFull(uint64_t bufferSize, void *data)
537
+ {
538
+ if (bufferSize == 0) {
539
+ throw std::runtime_error("HostBuffer: invalid buffer size");
540
+ }
541
+ HostBuffer buffer;
542
+ buffer.mPool = std::make_shared<Pool>(bufferSize, data);
543
+ buffer.mPool->add(&buffer, bufferSize);
544
+ return buffer;
545
+ }
546
+
547
+ inline HostBuffer HostBuffer::create(uint64_t bufferSize, const HostBuffer* pool)
548
+ {
549
+ HostBuffer buffer;
550
+ if (pool == nullptr || !pool->mPool) {
551
+ buffer.mPool = std::make_shared<Pool>(bufferSize);
552
+ } else {
553
+ buffer.mPool = pool->mPool;
554
+ }
555
+ buffer.mPool->add(&buffer, bufferSize);
556
+ return buffer;
557
+ }
558
+
559
+ inline void HostBuffer::clear()
560
+ {
561
+ if (mPool) {// remove self from the buffer register in the pool
562
+ mPool->remove(this);
563
+ }
564
+ mPool.reset();
565
+ mSize = 0;
566
+ mData = nullptr;
567
+ }
568
+
569
+ inline void HostBuffer::reset()
570
+ {
571
+ if (this->size()>0) {
572
+ throw std::runtime_error("HostBuffer: only empty buffers can call reset");
573
+ }
574
+ if (!mPool) {
575
+ throw std::runtime_error("HostBuffer: this buffer contains no pool to reset");
576
+ }
577
+ mPool->reset();
578
+ }
579
+
580
+ inline void HostBuffer::resizePool(uint64_t size, void *data)
581
+ {
582
+ if (!mPool) {
583
+ throw std::runtime_error("HostBuffer: this buffer contains no pool to resize");
584
+ }
585
+ mPool->resize(size, data);
586
+ }
587
+
588
+ } // namespace nanovdb
589
+
590
+ #endif // end of NANOVDB_HOSTBUFFER_H_HAS_BEEN_INCLUDED