warp-lang 1.9.1__py3-none-manylinux_2_34_aarch64.whl → 1.10.0rc2__py3-none-manylinux_2_34_aarch64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of warp-lang might be problematic. Click here for more details.
- warp/__init__.py +301 -287
- warp/__init__.pyi +794 -305
- warp/_src/__init__.py +14 -0
- warp/_src/autograd.py +1075 -0
- warp/_src/build.py +618 -0
- warp/_src/build_dll.py +640 -0
- warp/{builtins.py → _src/builtins.py} +1382 -377
- warp/_src/codegen.py +4359 -0
- warp/{config.py → _src/config.py} +178 -169
- warp/_src/constants.py +57 -0
- warp/_src/context.py +8294 -0
- warp/_src/dlpack.py +462 -0
- warp/_src/fabric.py +355 -0
- warp/_src/fem/__init__.py +14 -0
- warp/_src/fem/adaptivity.py +508 -0
- warp/_src/fem/cache.py +687 -0
- warp/_src/fem/dirichlet.py +188 -0
- warp/{fem → _src/fem}/domain.py +40 -30
- warp/_src/fem/field/__init__.py +131 -0
- warp/_src/fem/field/field.py +701 -0
- warp/{fem → _src/fem}/field/nodal_field.py +30 -15
- warp/{fem → _src/fem}/field/restriction.py +1 -1
- warp/{fem → _src/fem}/field/virtual.py +53 -27
- warp/_src/fem/geometry/__init__.py +32 -0
- warp/{fem → _src/fem}/geometry/adaptive_nanogrid.py +77 -163
- warp/_src/fem/geometry/closest_point.py +97 -0
- warp/{fem → _src/fem}/geometry/deformed_geometry.py +14 -22
- warp/{fem → _src/fem}/geometry/element.py +32 -10
- warp/{fem → _src/fem}/geometry/geometry.py +48 -20
- warp/{fem → _src/fem}/geometry/grid_2d.py +12 -23
- warp/{fem → _src/fem}/geometry/grid_3d.py +12 -23
- warp/{fem → _src/fem}/geometry/hexmesh.py +40 -63
- warp/{fem → _src/fem}/geometry/nanogrid.py +255 -248
- warp/{fem → _src/fem}/geometry/partition.py +121 -63
- warp/{fem → _src/fem}/geometry/quadmesh.py +26 -45
- warp/{fem → _src/fem}/geometry/tetmesh.py +40 -63
- warp/{fem → _src/fem}/geometry/trimesh.py +26 -45
- warp/{fem → _src/fem}/integrate.py +164 -158
- warp/_src/fem/linalg.py +383 -0
- warp/_src/fem/operator.py +396 -0
- warp/_src/fem/polynomial.py +229 -0
- warp/{fem → _src/fem}/quadrature/pic_quadrature.py +15 -20
- warp/{fem → _src/fem}/quadrature/quadrature.py +95 -47
- warp/_src/fem/space/__init__.py +248 -0
- warp/{fem → _src/fem}/space/basis_function_space.py +20 -11
- warp/_src/fem/space/basis_space.py +679 -0
- warp/{fem → _src/fem}/space/dof_mapper.py +3 -3
- warp/{fem → _src/fem}/space/function_space.py +14 -13
- warp/{fem → _src/fem}/space/grid_2d_function_space.py +4 -7
- warp/{fem → _src/fem}/space/grid_3d_function_space.py +4 -4
- warp/{fem → _src/fem}/space/hexmesh_function_space.py +4 -10
- warp/{fem → _src/fem}/space/nanogrid_function_space.py +3 -9
- warp/{fem → _src/fem}/space/partition.py +117 -60
- warp/{fem → _src/fem}/space/quadmesh_function_space.py +4 -10
- warp/{fem → _src/fem}/space/restriction.py +66 -33
- warp/_src/fem/space/shape/__init__.py +152 -0
- warp/{fem → _src/fem}/space/shape/cube_shape_function.py +9 -9
- warp/{fem → _src/fem}/space/shape/shape_function.py +8 -9
- warp/{fem → _src/fem}/space/shape/square_shape_function.py +6 -6
- warp/{fem → _src/fem}/space/shape/tet_shape_function.py +3 -3
- warp/{fem → _src/fem}/space/shape/triangle_shape_function.py +3 -3
- warp/{fem → _src/fem}/space/tetmesh_function_space.py +3 -9
- warp/_src/fem/space/topology.py +459 -0
- warp/{fem → _src/fem}/space/trimesh_function_space.py +3 -9
- warp/_src/fem/types.py +112 -0
- warp/_src/fem/utils.py +486 -0
- warp/_src/jax.py +186 -0
- warp/_src/jax_experimental/__init__.py +14 -0
- warp/_src/jax_experimental/custom_call.py +387 -0
- warp/_src/jax_experimental/ffi.py +1284 -0
- warp/_src/jax_experimental/xla_ffi.py +656 -0
- warp/_src/marching_cubes.py +708 -0
- warp/_src/math.py +414 -0
- warp/_src/optim/__init__.py +14 -0
- warp/_src/optim/adam.py +163 -0
- warp/_src/optim/linear.py +1606 -0
- warp/_src/optim/sgd.py +112 -0
- warp/_src/paddle.py +406 -0
- warp/_src/render/__init__.py +14 -0
- warp/_src/render/imgui_manager.py +289 -0
- warp/_src/render/render_opengl.py +3636 -0
- warp/_src/render/render_usd.py +937 -0
- warp/_src/render/utils.py +160 -0
- warp/_src/sparse.py +2716 -0
- warp/_src/tape.py +1206 -0
- warp/{thirdparty → _src/thirdparty}/unittest_parallel.py +9 -2
- warp/_src/torch.py +391 -0
- warp/_src/types.py +5870 -0
- warp/_src/utils.py +1693 -0
- warp/autograd.py +12 -1054
- warp/bin/warp-clang.so +0 -0
- warp/bin/warp.so +0 -0
- warp/build.py +8 -588
- warp/build_dll.py +6 -721
- warp/codegen.py +6 -4251
- warp/constants.py +6 -39
- warp/context.py +12 -8062
- warp/dlpack.py +6 -444
- warp/examples/distributed/example_jacobi_mpi.py +4 -5
- warp/examples/fem/example_adaptive_grid.py +1 -1
- warp/examples/fem/example_apic_fluid.py +1 -1
- warp/examples/fem/example_burgers.py +8 -8
- warp/examples/fem/example_diffusion.py +1 -1
- warp/examples/fem/example_distortion_energy.py +1 -1
- warp/examples/fem/example_mixed_elasticity.py +2 -2
- warp/examples/fem/example_navier_stokes.py +1 -1
- warp/examples/fem/example_nonconforming_contact.py +7 -7
- warp/examples/fem/example_stokes.py +1 -1
- warp/examples/fem/example_stokes_transfer.py +1 -1
- warp/examples/fem/utils.py +2 -2
- warp/examples/interop/example_jax_callable.py +1 -1
- warp/examples/interop/example_jax_ffi_callback.py +1 -1
- warp/examples/interop/example_jax_kernel.py +1 -1
- warp/examples/tile/example_tile_mcgp.py +191 -0
- warp/fabric.py +6 -337
- warp/fem/__init__.py +159 -97
- warp/fem/adaptivity.py +7 -489
- warp/fem/cache.py +9 -648
- warp/fem/dirichlet.py +6 -184
- warp/fem/field/__init__.py +8 -109
- warp/fem/field/field.py +7 -652
- warp/fem/geometry/__init__.py +7 -18
- warp/fem/geometry/closest_point.py +11 -77
- warp/fem/linalg.py +18 -366
- warp/fem/operator.py +11 -369
- warp/fem/polynomial.py +9 -209
- warp/fem/space/__init__.py +5 -211
- warp/fem/space/basis_space.py +6 -662
- warp/fem/space/shape/__init__.py +41 -118
- warp/fem/space/topology.py +6 -437
- warp/fem/types.py +6 -81
- warp/fem/utils.py +11 -444
- warp/jax.py +8 -165
- warp/jax_experimental/__init__.py +14 -1
- warp/jax_experimental/custom_call.py +8 -365
- warp/jax_experimental/ffi.py +17 -873
- warp/jax_experimental/xla_ffi.py +5 -605
- warp/marching_cubes.py +5 -689
- warp/math.py +16 -393
- warp/native/array.h +385 -37
- warp/native/builtin.h +314 -37
- warp/native/bvh.cpp +43 -9
- warp/native/bvh.cu +62 -27
- warp/native/bvh.h +310 -309
- warp/native/clang/clang.cpp +102 -97
- warp/native/coloring.cpp +0 -1
- warp/native/crt.h +208 -0
- warp/native/exports.h +156 -0
- warp/native/hashgrid.cu +2 -0
- warp/native/intersect.h +24 -1
- warp/native/intersect_tri.h +44 -35
- warp/native/mat.h +1456 -276
- warp/native/mesh.cpp +4 -4
- warp/native/mesh.cu +4 -2
- warp/native/mesh.h +176 -61
- warp/native/quat.h +0 -52
- warp/native/scan.cu +2 -0
- warp/native/sparse.cu +7 -3
- warp/native/spatial.h +12 -0
- warp/native/tile.h +681 -89
- warp/native/tile_radix_sort.h +1 -1
- warp/native/tile_reduce.h +394 -46
- warp/native/tile_scan.h +4 -4
- warp/native/vec.h +469 -0
- warp/native/version.h +23 -0
- warp/native/volume.cpp +1 -1
- warp/native/volume.cu +1 -0
- warp/native/volume.h +1 -1
- warp/native/volume_builder.cu +2 -0
- warp/native/warp.cpp +57 -29
- warp/native/warp.cu +253 -171
- warp/native/warp.h +11 -8
- warp/optim/__init__.py +6 -3
- warp/optim/adam.py +6 -145
- warp/optim/linear.py +14 -1585
- warp/optim/sgd.py +6 -94
- warp/paddle.py +6 -388
- warp/render/__init__.py +8 -4
- warp/render/imgui_manager.py +7 -267
- warp/render/render_opengl.py +6 -3618
- warp/render/render_usd.py +6 -919
- warp/render/utils.py +6 -142
- warp/sparse.py +37 -2563
- warp/tape.py +6 -1188
- warp/tests/__main__.py +1 -1
- warp/tests/cuda/test_async.py +4 -4
- warp/tests/cuda/test_conditional_captures.py +1 -1
- warp/tests/cuda/test_multigpu.py +1 -1
- warp/tests/cuda/test_streams.py +58 -1
- warp/tests/geometry/test_bvh.py +157 -22
- warp/tests/geometry/test_marching_cubes.py +0 -1
- warp/tests/geometry/test_mesh.py +5 -3
- warp/tests/geometry/test_mesh_query_aabb.py +5 -12
- warp/tests/geometry/test_mesh_query_point.py +5 -2
- warp/tests/geometry/test_mesh_query_ray.py +15 -3
- warp/tests/geometry/test_volume_write.py +5 -5
- warp/tests/interop/test_dlpack.py +14 -14
- warp/tests/interop/test_jax.py +772 -49
- warp/tests/interop/test_paddle.py +1 -1
- warp/tests/test_adam.py +0 -1
- warp/tests/test_arithmetic.py +9 -9
- warp/tests/test_array.py +527 -100
- warp/tests/test_array_reduce.py +3 -3
- warp/tests/test_atomic.py +12 -8
- warp/tests/test_atomic_bitwise.py +209 -0
- warp/tests/test_atomic_cas.py +4 -4
- warp/tests/test_bool.py +2 -2
- warp/tests/test_builtins_resolution.py +5 -571
- warp/tests/test_codegen.py +33 -14
- warp/tests/test_conditional.py +1 -1
- warp/tests/test_context.py +6 -6
- warp/tests/test_copy.py +242 -161
- warp/tests/test_ctypes.py +3 -3
- warp/tests/test_devices.py +24 -2
- warp/tests/test_examples.py +16 -84
- warp/tests/test_fabricarray.py +35 -35
- warp/tests/test_fast_math.py +0 -2
- warp/tests/test_fem.py +56 -10
- warp/tests/test_fixedarray.py +3 -3
- warp/tests/test_func.py +8 -5
- warp/tests/test_generics.py +1 -1
- warp/tests/test_indexedarray.py +24 -24
- warp/tests/test_intersect.py +39 -9
- warp/tests/test_large.py +1 -1
- warp/tests/test_lerp.py +3 -1
- warp/tests/test_linear_solvers.py +1 -1
- warp/tests/test_map.py +35 -4
- warp/tests/test_mat.py +52 -62
- warp/tests/test_mat_constructors.py +4 -5
- warp/tests/test_mat_lite.py +1 -1
- warp/tests/test_mat_scalar_ops.py +121 -121
- warp/tests/test_math.py +34 -0
- warp/tests/test_module_aot.py +4 -4
- warp/tests/test_modules_lite.py +28 -2
- warp/tests/test_print.py +11 -11
- warp/tests/test_quat.py +93 -58
- warp/tests/test_runlength_encode.py +1 -1
- warp/tests/test_scalar_ops.py +38 -10
- warp/tests/test_smoothstep.py +1 -1
- warp/tests/test_sparse.py +126 -15
- warp/tests/test_spatial.py +105 -87
- warp/tests/test_special_values.py +6 -6
- warp/tests/test_static.py +7 -7
- warp/tests/test_struct.py +13 -2
- warp/tests/test_triangle_closest_point.py +48 -1
- warp/tests/test_types.py +27 -15
- warp/tests/test_utils.py +52 -52
- warp/tests/test_vec.py +29 -29
- warp/tests/test_vec_constructors.py +5 -5
- warp/tests/test_vec_scalar_ops.py +97 -97
- warp/tests/test_version.py +75 -0
- warp/tests/tile/test_tile.py +178 -0
- warp/tests/tile/test_tile_atomic_bitwise.py +403 -0
- warp/tests/tile/test_tile_cholesky.py +7 -4
- warp/tests/tile/test_tile_load.py +26 -2
- warp/tests/tile/test_tile_mathdx.py +3 -3
- warp/tests/tile/test_tile_matmul.py +1 -1
- warp/tests/tile/test_tile_mlp.py +2 -4
- warp/tests/tile/test_tile_reduce.py +214 -13
- warp/tests/unittest_suites.py +6 -14
- warp/tests/unittest_utils.py +10 -9
- warp/tests/walkthrough_debug.py +3 -1
- warp/torch.py +6 -373
- warp/types.py +29 -5764
- warp/utils.py +10 -1659
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/METADATA +46 -99
- warp_lang-1.10.0rc2.dist-info/RECORD +468 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/Gaia-LICENSE.txt +6 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/appdirs-LICENSE.txt +22 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/asset_pixel_jpg-LICENSE.txt +3 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/cuda-LICENSE.txt +1582 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/dlpack-LICENSE.txt +201 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/fp16-LICENSE.txt +28 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/libmathdx-LICENSE.txt +220 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/llvm-LICENSE.txt +279 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/moller-LICENSE.txt +16 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/nanovdb-LICENSE.txt +2 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/nvrtc-LICENSE.txt +1592 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/svd-LICENSE.txt +23 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/unittest_parallel-LICENSE.txt +21 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/usd-LICENSE.txt +213 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/windingnumber-LICENSE.txt +21 -0
- warp/examples/assets/cartpole.urdf +0 -110
- warp/examples/assets/crazyflie.usd +0 -0
- warp/examples/assets/nv_ant.xml +0 -92
- warp/examples/assets/nv_humanoid.xml +0 -183
- warp/examples/assets/quadruped.urdf +0 -268
- warp/examples/optim/example_bounce.py +0 -266
- warp/examples/optim/example_cloth_throw.py +0 -228
- warp/examples/optim/example_drone.py +0 -870
- warp/examples/optim/example_inverse_kinematics.py +0 -182
- warp/examples/optim/example_inverse_kinematics_torch.py +0 -191
- warp/examples/optim/example_softbody_properties.py +0 -400
- warp/examples/optim/example_spring_cage.py +0 -245
- warp/examples/optim/example_trajectory.py +0 -227
- warp/examples/sim/example_cartpole.py +0 -143
- warp/examples/sim/example_cloth.py +0 -225
- warp/examples/sim/example_cloth_self_contact.py +0 -316
- warp/examples/sim/example_granular.py +0 -130
- warp/examples/sim/example_granular_collision_sdf.py +0 -202
- warp/examples/sim/example_jacobian_ik.py +0 -244
- warp/examples/sim/example_particle_chain.py +0 -124
- warp/examples/sim/example_quadruped.py +0 -203
- warp/examples/sim/example_rigid_chain.py +0 -203
- warp/examples/sim/example_rigid_contact.py +0 -195
- warp/examples/sim/example_rigid_force.py +0 -133
- warp/examples/sim/example_rigid_gyroscopic.py +0 -115
- warp/examples/sim/example_rigid_soft_contact.py +0 -140
- warp/examples/sim/example_soft_body.py +0 -196
- warp/examples/tile/example_tile_walker.py +0 -327
- warp/sim/__init__.py +0 -74
- warp/sim/articulation.py +0 -793
- warp/sim/collide.py +0 -2570
- warp/sim/graph_coloring.py +0 -307
- warp/sim/import_mjcf.py +0 -791
- warp/sim/import_snu.py +0 -227
- warp/sim/import_urdf.py +0 -579
- warp/sim/import_usd.py +0 -898
- warp/sim/inertia.py +0 -357
- warp/sim/integrator.py +0 -245
- warp/sim/integrator_euler.py +0 -2000
- warp/sim/integrator_featherstone.py +0 -2101
- warp/sim/integrator_vbd.py +0 -2487
- warp/sim/integrator_xpbd.py +0 -3295
- warp/sim/model.py +0 -4821
- warp/sim/particles.py +0 -121
- warp/sim/render.py +0 -431
- warp/sim/utils.py +0 -431
- warp/tests/sim/disabled_kinematics.py +0 -244
- warp/tests/sim/test_cloth.py +0 -863
- warp/tests/sim/test_collision.py +0 -743
- warp/tests/sim/test_coloring.py +0 -347
- warp/tests/sim/test_inertia.py +0 -161
- warp/tests/sim/test_model.py +0 -226
- warp/tests/sim/test_sim_grad.py +0 -287
- warp/tests/sim/test_sim_grad_bounce_linear.py +0 -212
- warp/tests/sim/test_sim_kinematics.py +0 -98
- warp/thirdparty/__init__.py +0 -0
- warp_lang-1.9.1.dist-info/RECORD +0 -456
- /warp/{fem → _src/fem}/quadrature/__init__.py +0 -0
- /warp/{tests/sim → _src/thirdparty}/__init__.py +0 -0
- /warp/{thirdparty → _src/thirdparty}/appdirs.py +0 -0
- /warp/{thirdparty → _src/thirdparty}/dlpack.py +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/WHEEL +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/licenses/LICENSE.md +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/top_level.txt +0 -0
warp/_src/fem/cache.py
ADDED
|
@@ -0,0 +1,687 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import ast
|
|
17
|
+
import bisect
|
|
18
|
+
import hashlib
|
|
19
|
+
import pickle
|
|
20
|
+
import re
|
|
21
|
+
import weakref
|
|
22
|
+
from typing import Any, Callable, ClassVar, Dict, Optional, Tuple, Union
|
|
23
|
+
|
|
24
|
+
import warp as wp
|
|
25
|
+
from warp._src.codegen import Struct, StructInstance, get_annotations
|
|
26
|
+
from warp._src.fem.operator import Integrand
|
|
27
|
+
from warp._src.fem.types import Domain, Field
|
|
28
|
+
from warp._src.types import get_type_code, type_repr, type_scalar_type, type_size, type_size_in_bytes, type_to_warp
|
|
29
|
+
from warp._src.utils import warn
|
|
30
|
+
|
|
31
|
+
# Kernels created by get_kernel(), indexed by the cache key computed in _make_cache_key()
_kernel_cache = {}
|
|
32
|
+
# Structs created by get_struct(), indexed by the key computed in _make_key()
_struct_cache = {}
|
|
33
|
+
# Functions created by get_func(), indexed by the cache key computed in _make_cache_key()
_func_cache = {}
|
|
34
|
+
|
|
35
|
+
# Matches runs of characters other than ASCII letters, digits and underscore; _native_key() strips them
_key_re = re.compile("[^0-9a-zA-Z_]+")
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
def _make_key(obj, suffix: Any, options: Optional[Dict[str, Any]] = None):
|
|
39
|
+
sorted_opts = tuple(sorted(options.items())) if options is not None else ()
|
|
40
|
+
key = (
|
|
41
|
+
obj.__module__,
|
|
42
|
+
obj.__qualname__,
|
|
43
|
+
suffix,
|
|
44
|
+
sorted_opts,
|
|
45
|
+
)
|
|
46
|
+
return key
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def _native_key(obj, key: Any):
    """Derive a short name for ``obj`` made unique by a digest of ``key``.

    The pickled ``key`` is hashed with BLAKE2b using a 4-byte digest, the hex
    digest is appended to ``obj.__name__``, and every character matched by
    ``_key_re`` is removed from the result.
    """
    digest = hashlib.blake2b(pickle.dumps(key), digest_size=4)
    raw_name = f"{obj.__name__}_{digest.hexdigest()}"
    return _key_re.sub("", raw_name)
|
|
53
|
+
|
|
54
|
+
|
|
55
|
+
def _arg_type_key(arg_type):
|
|
56
|
+
if isinstance(arg_type, str):
|
|
57
|
+
return arg_type
|
|
58
|
+
if arg_type in (Field, Domain):
|
|
59
|
+
return ""
|
|
60
|
+
return get_type_code(type_to_warp(arg_type))
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
def _make_cache_key(func, key, argspec=None, allow_overloads: bool = True):
|
|
64
|
+
if not allow_overloads:
|
|
65
|
+
return key
|
|
66
|
+
|
|
67
|
+
if argspec is None:
|
|
68
|
+
annotations = get_annotations(func)
|
|
69
|
+
else:
|
|
70
|
+
annotations = argspec.annotations
|
|
71
|
+
|
|
72
|
+
sig_key = (key, *((k, _arg_type_key(v)) for k, v in annotations.items()))
|
|
73
|
+
return sig_key
|
|
74
|
+
|
|
75
|
+
|
|
76
|
+
def _register_function(
    func,
    key,
    module,
    **kwargs,
):
    """Create a ``wp.Function`` for ``func`` in ``module``, keeping earlier overloads.

    Args:
        func: Python function to wrap.
        key: Key from which the native function key is derived with ``_native_key``.
        module: Module in which the function is registered.
        **kwargs: Forwarded to the ``wp.Function`` constructor.

    Returns:
        The entry of ``module.functions`` stored under the native key.
    """
    native_key = _native_key(func, key)

    # wp.Function will override existing func for a given key, so look up the
    # previous entry before constructing the new function
    previous = module.functions.get(native_key)
    created = wp.Function(func=func, key=native_key, namespace="", module=module, **kwargs)

    if previous:
        # manually add back our overloads
        previous.add_overload(created)
        module.functions[native_key] = previous

    return module.functions[native_key]
|
|
98
|
+
|
|
99
|
+
|
|
100
|
+
def get_func(func, suffix: Any, code_transformers=None, allow_overloads=False):
    """Return the cached function built from ``func`` for ``suffix``, registering it on first use.

    Args:
        func: Python function to register.
        suffix: Discriminator making the key unique.
        code_transformers: Forwarded to the function registration.
        allow_overloads: Whether the argument types take part in the cache key.
    """
    key = _make_key(func, suffix)
    cache_key = _make_cache_key(func, key, allow_overloads=allow_overloads)

    if cache_key in _func_cache:
        return _func_cache[cache_key]

    # First request for this key: register in the module that defines `func`
    module = wp.get_module(func.__module__)
    _func_cache[cache_key] = _register_function(
        func,
        key,
        module,
        code_transformers=code_transformers,
    )
    return _func_cache[cache_key]
|
|
114
|
+
|
|
115
|
+
|
|
116
|
+
def dynamic_func(suffix: Any, code_transformers=None, allow_overloads=False):
    """Decorator form of :func:`get_func`; the arguments are forwarded unchanged."""

    def wrap_func(func: Callable):
        return get_func(
            func,
            suffix=suffix,
            code_transformers=code_transformers,
            allow_overloads=allow_overloads,
        )

    return wrap_func
|
|
121
|
+
|
|
122
|
+
|
|
123
|
+
def get_kernel(
    func,
    suffix: Any,
    kernel_options: Dict[str, Any],
    allow_overloads=False,
):
    """Return the cached kernel built from ``func``, creating it on first use.

    Args:
        func: Python function holding the kernel body.
        suffix: Discriminator making the key unique.
        kernel_options: Options that are part of the key, override the module
            options, and are passed to the kernel.
        allow_overloads: Whether the argument types take part in the cache key.
    """
    key = _make_key(func, suffix, kernel_options)
    cache_key = _make_cache_key(func, key, allow_overloads=allow_overloads)

    if cache_key in _kernel_cache:
        return _kernel_cache[cache_key]

    kernel_key = _native_key(func, key)

    # The kernel gets a module named after its own key
    module = wp.get_module(f"{func.__module__}.dyn.{kernel_key}")

    # Start from the options of the module defining `func`, then apply the overrides
    parent_options = wp.get_module(func.__module__).options
    module.options = {**parent_options, **kernel_options}

    _kernel_cache[cache_key] = wp.Kernel(func=func, key=kernel_key, module=module, options=kernel_options)
    return _kernel_cache[cache_key]
|
|
141
|
+
|
|
142
|
+
|
|
143
|
+
def dynamic_kernel(suffix: Any, kernel_options: Optional[Dict[str, Any]] = None, allow_overloads=False):
    """Decorator form of :func:`get_kernel`; missing ``kernel_options`` become an empty dict."""
    kernel_options = {} if kernel_options is None else kernel_options

    def wrap_kernel(func: Callable):
        return get_kernel(
            func,
            suffix=suffix,
            kernel_options=kernel_options,
            allow_overloads=allow_overloads,
        )

    return wrap_kernel
|
|
151
|
+
|
|
152
|
+
|
|
153
|
+
def get_struct(struct: type, suffix: Any):
    """Return the cached ``Struct`` wrapping class ``struct`` for ``suffix``, creating it on first use.

    On creation, ``struct.__qualname__`` is overwritten with the native key,
    which is also used as the key of the resulting ``Struct``.
    """
    cache_key = _make_key(struct, suffix)

    if cache_key in _struct_cache:
        return _struct_cache[cache_key]

    # used in codegen
    native_name = _native_key(struct, cache_key)
    struct.__qualname__ = native_name

    module = wp.get_module(struct.__module__)
    _struct_cache[cache_key] = Struct(key=native_name, cls=struct, module=module)
    return _struct_cache[cache_key]
|
|
168
|
+
|
|
169
|
+
|
|
170
|
+
def dynamic_struct(suffix: Any):
    """Decorator form of :func:`get_struct`."""

    def wrap_struct(struct: type):
        wrapped = get_struct(struct, suffix=suffix)
        return wrapped

    return wrap_struct
|
|
175
|
+
|
|
176
|
+
|
|
177
|
+
def get_argument_struct(arg_types: Dict[str, type]):
    """Build the struct holding one field per entry of ``arg_types``.

    A fresh ``Args`` class receives one attribute (initialized to ``None``) and
    one annotation per argument, and is then passed to :func:`get_struct` with a
    suffix made of the ``(name, type key)`` pairs of its annotations.
    """

    class Args:
        pass

    annotations = get_annotations(Args)

    for name in arg_types:
        setattr(Args, name, None)
    annotations.update(arg_types)

    try:
        Args.__annotations__ = annotations
    except AttributeError:
        # NOTE(review): fallback kept from the original; confirm it can actually succeed
        Args.__dict__.__annotations__ = annotations

    suffix = tuple((name, _arg_type_key(annotation)) for name, annotation in annotations.items())
    return get_struct(Args, suffix=suffix)
|
|
194
|
+
|
|
195
|
+
|
|
196
|
+
def populate_argument_struct(value_struct: StructInstance, values: Optional[Dict[str, Any]], func_name: str):
    """Assign user-provided values to the fields of an argument struct instance.

    Args:
        value_struct: Struct instance to fill in; its declared fields are read
            from ``value_struct._cls.vars``.
        values: Mapping from parameter name to value; ``None`` is treated as an
            empty mapping.
        func_name: Name of the function owning the parameters, only used in messages.

    Returns:
        ``value_struct``, after assignment.

    Raises:
        ValueError: If a name in ``values`` is not a declared field, or if
            assigning one of the values fails.
    """
    if values is None:
        values = {}

    Args = value_struct._cls

    try:
        for k, v in values.items():
            setattr(value_struct, k, v)
    except Exception as err:
        # `k` and `v` are the pair whose assignment failed
        if k not in Args.vars:
            raise ValueError(
                f"Passed value argument '{k}' does not match any of the function '{func_name}' parameters"
            ) from err
        raise ValueError(
            f"Passed value argument '{k}' of type '{type_repr(v)}' is incompatible with the function '{func_name}' parameter of type '{type_repr(Args.vars[k].type)}'"
        ) from err

    # List the names in the iteration order of Args.vars instead of using a set
    # difference, so the warning text is the same from one run to the next
    missing_values = [name for name in Args.vars.keys() if name not in values]
    if missing_values:
        warn(
            f"Missing values for parameter(s) '{', '.join(missing_values)}' of the function '{func_name}', will be zero-initialized"
        )

    return value_struct
|
|
221
|
+
|
|
222
|
+
|
|
223
|
+
class ExpandStarredArgumentStruct(ast.NodeTransformer):
    """AST transformer expanding starred struct arguments of calls.

    A positional argument written ``*path.to.struct`` whose dotted path is a key
    of ``structs`` is replaced by one attribute access per field of that struct.
    """

    def __init__(
        self,
        structs: Dict[str, Struct],
    ):
        # Maps the dotted source path of a starred expression to its struct
        self._structs = structs

    @staticmethod
    def _build_path(path, node):
        """Append to ``path`` the name components of an attribute chain and return ``path``."""
        # Walk from the outermost attribute down to the base, collecting names in reverse
        components = []
        while isinstance(node, ast.Attribute):
            components.append(node.attr)
            node = node.value
        if isinstance(node, ast.Name):
            components.append(node.id)

        path.extend(reversed(components))
        return path

    def _get_expanded_struct(self, arg_node):
        """Return the struct registered for a starred argument, or ``None``."""
        if not isinstance(arg_node, ast.Starred):
            return None

        components = ExpandStarredArgumentStruct._build_path([], arg_node.value)
        return self._structs.get(".".join(components), None)

    def visit_Call(self, call: ast.Call):
        """Visit the children of ``call``, then expand its starred struct arguments."""
        call = self.generic_visit(call)

        new_args = []
        for arg in call.args:
            struct = self._get_expanded_struct(arg)
            if struct is None:
                new_args.append(arg)
                continue
            new_args.extend(ast.Attribute(value=arg.value, attr=field) for field in struct.vars.keys())
        call.args = new_args

        return call
|
|
258
|
+
|
|
259
|
+
|
|
260
|
+
def get_integrand_function(
    integrand: Integrand,
    suffix: str,
    func=None,
    annotations=None,
    code_transformers=None,
):
    """Return the function cached on ``integrand`` for ``suffix``, registering it on first use.

    Args:
        integrand: Integrand providing the module, the default function and the
            ``cached_funcs`` mapping.
        suffix: Discriminator making the key unique.
        func: Function to register instead of ``integrand.func``; the key is
            always derived from ``integrand.func``.
        annotations: Forwarded to the registration as ``overloaded_annotations``.
        code_transformers: Forwarded to the registration.
    """
    key = _make_key(integrand.func, suffix)
    registry = integrand.cached_funcs

    if key not in registry:
        target = integrand.func if func is None else func
        registry[key] = _register_function(
            func=target,
            key=key,
            module=integrand.module,
            overloaded_annotations=annotations,
            code_transformers=code_transformers,
        )

    return registry[key]
|
|
279
|
+
|
|
280
|
+
|
|
281
|
+
def get_integrand_kernel(
    integrand: Integrand,
    suffix: str,
    kernel_fn: Optional[Callable] = None,
    kernel_options: Optional[Dict[str, Any]] = None,
    code_transformers=None,
    FieldStruct=None,
    ValueStruct=None,
) -> Tuple[wp.Kernel, StructInstance, StructInstance]:
    """Return the kernel cached on ``integrand`` for ``suffix`` and the merged options.

    The options are the integrand module options, overridden by the integrand
    kernel options, overridden by ``kernel_options``.

    Args:
        integrand: Integrand providing the module, options and ``cached_kernels`` mapping.
        suffix: Discriminator making the key unique.
        kernel_fn: Function to build the kernel from when there is no cached entry.
        kernel_options: Optional additional option overrides.
        code_transformers: Forwarded to the kernel constructor.
        FieldStruct: Called without arguments to create the second tuple element.
        ValueStruct: Called without arguments to create the third tuple element.

    Returns:
        The cached ``(kernel, FieldStruct(), ValueStruct())`` tuple, or
        ``(None, None, None)`` when nothing is cached and ``kernel_fn`` is ``None``.
    """
    options = dict(integrand.module.options)
    options.update(integrand.kernel_options)
    if kernel_options is not None:
        options.update(kernel_options)

    key = _make_key(integrand.func, suffix, options=options)

    if key in integrand.cached_kernels:
        return integrand.cached_kernels[key]

    if kernel_fn is None:
        return None, None, None

    kernel_key = _native_key(integrand.func, key)
    module = wp.get_module(f"{integrand.module.name}.{kernel_key}")
    module.options = options

    kernel = wp.Kernel(
        func=kernel_fn, key=kernel_key, module=module, code_transformers=code_transformers, options=options
    )
    integrand.cached_kernels[key] = (kernel, FieldStruct(), ValueStruct())

    return integrand.cached_kernels[key]
|
|
312
|
+
|
|
313
|
+
|
|
314
|
+
def pod_type_key(pod_type: type):
    """Hashable key for POD (single or sequence of scalars) types"""

    warp_type = type_to_warp(pod_type)

    # Types without a scalar type attribute are identified by name only
    if not hasattr(warp_type, "_wp_scalar_type_"):
        return warp_type.__name__

    # Use the shape when the type has one, its length otherwise
    extent = warp_type._shape_ if hasattr(warp_type, "_shape_") else warp_type._length_
    return (warp_type.__name__, extent, warp_type._wp_scalar_type_.__name__)
|
|
323
|
+
|
|
324
|
+
|
|
325
|
+
def cached_arg_value(func: Callable):
    """Decorator to be applied to member methods assembling Arg structs, so that the result gets
    automatically cached for the lifetime of the parent object

    The cache is a dict stored on the object under ``_<method name>_cache`` and
    indexed by device ordinal. The returned function exposes an
    ``invalidate(obj, device=None)`` attribute that drops the entry of one
    device, or resets the whole cache when no device is given.
    """

    cache_attr = f"_{func.__name__}_cache"

    def get_arg(obj, device):
        cache = getattr(obj, cache_attr, None)
        if cache is None:
            cache = {}
            setattr(obj, cache_attr, cache)

        device = wp.get_device(device)
        if device.ordinal not in cache:
            cache[device.ordinal] = func(obj, device)

        return cache[device.ordinal]

    def invalidate(obj, device=None):
        cache = getattr(obj, cache_attr, None)
        if device is not None and cache is not None:
            # Resolve the device the same way get_arg does, so that any
            # identifier accepted there can also be used to invalidate
            cache.pop(wp.get_device(device).ordinal, None)
        else:
            setattr(obj, cache_attr, {})

    get_arg.invalidate = invalidate

    return get_arg
|
|
355
|
+
|
|
356
|
+
|
|
357
|
+
def setup_dynamic_attributes(
    obj,
    cls: Optional[type] = None,
    constructors: Optional[Dict[str, Callable]] = None,
    key: Optional[str] = None,
):
    """Set constructor-built attributes on ``obj``, reusing values cached on the class.

    Args:
        obj: Object receiving the attributes.
        cls: Class holding the cache; defaults to ``type(obj)``.
        constructors: Mapping from attribute name to a callable taking ``obj``;
            defaults to ``cls._dynamic_attribute_constructors``.
        key: Cache key prefix; defaults to ``obj.name``.
    """
    cls = type(obj) if cls is None else cls
    key = obj.name if key is None else key
    constructors = cls._dynamic_attribute_constructors if constructors is None else constructors

    # The set of attribute names is part of the cache key
    cache_key = (key, frozenset(constructors.keys()))

    if not hasattr(cls, "_cached_dynamic_attrs"):
        cls._cached_dynamic_attrs = {}

    cached = cls._cached_dynamic_attrs.get(cache_key)
    if cached is not None:
        for attr_name, attr_value in cached.items():
            setattr(obj, attr_name, attr_value)
        return

    built = {}
    # create attributes one-by-one, as some may depend on previous ones
    for attr_name, make_attr in constructors.items():
        attr_value = make_attr(obj)
        built[attr_name] = attr_value
        setattr(obj, attr_name, attr_value)
    cls._cached_dynamic_attrs[cache_key] = built
|
|
389
|
+
|
|
390
|
+
|
|
391
|
+
# Vector types created by cached_vec_type(), indexed by (length, dtype)
_cached_vec_types = {}
|
|
392
|
+
# Matrix types created by cached_mat_type(), indexed by (*shape, dtype)
_cached_mat_types = {}
|
|
393
|
+
|
|
394
|
+
|
|
395
|
+
def cached_vec_type(length, dtype):
    """Return the ``wp.vec`` type for ``length`` and ``dtype``, creating it only once per pair."""
    key = (length, dtype)

    if key in _cached_vec_types:
        return _cached_vec_types[key]

    _cached_vec_types[key] = wp.vec(length=length, dtype=dtype)
    return _cached_vec_types[key]
|
|
401
|
+
|
|
402
|
+
|
|
403
|
+
def cached_mat_type(shape, dtype):
    """Return the ``wp.mat`` type for ``shape`` and ``dtype``, creating it only once per combination."""
    key = (*shape, dtype)

    if key in _cached_mat_types:
        return _cached_mat_types[key]

    _cached_mat_types[key] = wp.mat(shape=shape, dtype=dtype)
    return _cached_mat_types[key]
|
|
409
|
+
|
|
410
|
+
|
|
411
|
+
Temporary = wp.array
|
|
412
|
+
"""Temporary array borrowed from a :class:`TemporaryStore`.
|
|
413
|
+
|
|
414
|
+
The array will be automatically returned to the temporary pool for reuse upon destruction of this object, unless
|
|
415
|
+
the temporary is explicitly detached from the pool using :meth:`detach`.
|
|
416
|
+
The temporary may also be explicitly returned to the pool before destruction using :meth:`release`.
|
|
417
|
+
|
|
418
|
+
Note: `Temporary` is now a direct alias for `wp.array` with a custom deleter. Convenience `detach` and `release`
|
|
419
|
+
are added at borrow time, along with a self-pointing `array` attribute kept for backward compatibility.
|
|
420
|
+
"""
|
|
421
|
+
|
|
422
|
+
|
|
423
|
+
class TemporaryStore:
    """
    Pool of temporary arrays that is kept alive and recycled across calls to ``warp.fem`` functions.

    A :class:`TemporaryStore` can be handed explicitly to the ``warp.fem`` functions that take one, for instance
    :func:`.integrate.integrate`, or installed globally as the default store with :func:`set_default_temporary_store`.

    No default store is set initially, in which case temporary allocations are not persisted.
    """

    _default_store: ClassVar[Optional["TemporaryStore"]] = None

    class Pool:
        """Recyclable buffers that share one value type, one device and one pinned flag."""

        class Deleter:
            """Array deleter that hands buffers back to their pool, which it references only weakly."""

            def __init__(self, pool: "TemporaryStore.Pool"):
                self.pool = weakref.ref(pool)

            def __call__(self, ptr, size):
                """Give the buffer at `ptr` back to the pool, if the pool still exists."""
                owner = self.pool()
                if owner is None:
                    return
                owner.redeem(ptr)

            def detach(self, temporary: Temporary):
                """Ask the pool, if it still exists, to stop tracking `temporary`."""
                owner = self.pool()
                if owner is None:
                    return
                owner.detach(temporary)

        def __init__(self, dtype, device, pinned: bool):
            self.dtype = dtype
            self.device = device
            self.pinned = pinned

            # Pointers that can be borrowed right now, kept in the same order as `_pool_capacities`
            self._pool: list[int] = []
            # Byte capacities of the borrowable buffers, ascending so they can be bisected
            self._pool_capacities: list[int] = []
            # Capacity of every buffer allocated by this pool, keyed by pointer (borrowed ones included)
            self._allocs: dict[int, int] = {}

            self._dtype_size = type_size_in_bytes(dtype)
            self._allocator = device.get_allocator(pinned=pinned)
            self._deleter = TemporaryStore.Pool.Deleter(self)

        def borrow(self, shape, dtype, requires_grad: bool):
            """Return a :class:`Temporary` of the given shape, reusing a pooled buffer when one is large enough.

            Args:
                shape: a single extent or an iterable of extents
                dtype: data type given to the returned array
                requires_grad: if true, a zeroed gradient array is borrowed from this pool as well
            """
            grad = None
            if requires_grad:
                grad = self.borrow(shape=shape, dtype=dtype, requires_grad=False)
                # Zero-out gradient to mimic semantics of wp.empty()
                grad.zero_()

            # Requested size in bytes: element size multiplied by every extent
            extents = (shape,) if isinstance(shape, int) else shape
            capacity = self._dtype_size
            for extent in extents:
                capacity *= extent

            if capacity == 0:
                # Empty arrays get a null pointer and no deleter, so the pool never tracks them
                ptr, deleter = 0, None
            else:
                deleter = self._deleter
                slot = bisect.bisect_left(self._pool_capacities, capacity)
                if slot < len(self._pool):
                    # Smallest available buffer that is large enough: take it out of the pool
                    ptr = self._pool.pop(slot)
                    capacity = self._pool_capacities.pop(slot)
                else:
                    # Nothing large enough is available: allocate, over-sizing relative to the
                    # largest buffer currently available
                    if self._pool:
                        grow_factor = 1.5
                        capacity = max(int(self._pool_capacities[-1] * grow_factor), capacity)

                    ptr = self._allocator.alloc(capacity)
                    self._allocs[ptr] = capacity

            return Temporary(
                ptr=ptr,
                capacity=capacity,
                shape=shape,
                dtype=dtype,
                grad=grad,
                device=self.device,
                pinned=self.pinned,
                deleter=deleter,
            )

        def redeem(self, ptr: int):
            """Make the buffer at `ptr` available for borrowing again."""
            capacity = self._allocs[ptr]
            # Insert at the position that keeps capacities sorted
            slot = bisect.bisect_left(self._pool_capacities, capacity)
            self._pool.insert(slot, ptr)
            self._pool_capacities.insert(slot, capacity)

        def detach(self, array: Temporary):
            """Forget the buffer of `array` and give the array the allocator's own deleter instead."""
            self._allocs.pop(array.ptr)
            array.deleter = self._allocator.deleter

        def __del__(self):
            # Frees every buffer still recorded in `_allocs`, borrowed or not
            for ptr, capacity in self._allocs.items():
                self._allocator.free(ptr, capacity)

    def __init__(self):
        self.clear()

    def clear(self):
        """Drop every pool held by this store."""
        self._temporaries = {}

    def borrow(self, shape, dtype, pinned: bool = False, device=None, requires_grad: bool = False) -> Temporary:
        """Borrow a temporary array from the pool matching `dtype`, `pinned` and `device`.

        The pool is created the first time its key is requested. The returned array carries the
        `release`, `detach` and `array` attributes.
        """
        dtype = type_to_warp(dtype)
        device = wp.get_device(device)

        type_length = type_size(dtype)
        pool_key = (dtype._type_, type_length, pinned, device.ordinal)

        pool = self._temporaries.get(pool_key)
        if pool is None:
            if type_length > 1:
                value_type = cached_vec_type(length=type_length, dtype=type_scalar_type(dtype))
            else:
                value_type = dtype
            pool = TemporaryStore.Pool(value_type, device, pinned=pinned)
            self._temporaries[pool_key] = pool

        borrowed = pool.borrow(dtype=dtype, shape=shape, requires_grad=requires_grad)
        return TemporaryStore.add_temporary_convenience_methods(borrowed)

    @staticmethod
    def add_temporary_convenience_methods(temporary: wp.array) -> Temporary:
        """Attach bound `release` and `detach` methods and a self-pointing `array` attribute to `temporary`."""
        # NOTE(review): all three attributes reference the array itself, forming reference cycles;
        # confirm that reclamation through the cyclic garbage collector is acceptable here.
        temporary.release = TemporaryStore._release_temporary.__get__(temporary)
        temporary.detach = TemporaryStore._detach_temporary.__get__(temporary)
        temporary.array = temporary
        return temporary

    @staticmethod
    def _detach_temporary(temporary) -> wp.array:
        """Detaches the temporary so it is never returned to the pool"""
        # A missing deleter or a non-pool deleter leaves the array untouched
        if isinstance(temporary.deleter, TemporaryStore.Pool.Deleter):
            temporary.deleter.detach(temporary)
        return temporary

    @staticmethod
    def _release_temporary(temporary):
        """Returns the temporary array to the pool"""
        if temporary.deleter is None:
            return

        with temporary.device.context_guard:
            temporary.deleter(temporary.ptr, temporary.capacity)
        # Clearing the deleter prevents the buffer from being handed back a second time
        temporary.deleter = None
|
|
581
|
+
|
|
582
|
+
|
|
583
|
+
def set_default_temporary_store(temporary_store: Optional[TemporaryStore]):
    """Install `temporary_store` as the global default :class:`TemporaryStore` for ``warp.fem`` functions.

    Passing ``None`` removes the default: temporary allocations are then persisted only where a
    :class:`TemporaryStore` is supplied to an individual function.
    """
    TemporaryStore._default_store = temporary_store
|
|
590
|
+
|
|
591
|
+
|
|
592
|
+
def borrow_temporary(
    temporary_store: Optional[TemporaryStore],
    shape: Union[int, Tuple[int]],
    dtype: type,
    pinned: bool = False,
    requires_grad: bool = False,
    device=None,
) -> Temporary:
    """
    Borrow a temporary array with the requested attributes from a shared pool.

    A pooled array with sufficient capacity and matching attributes is reused when one is available;
    otherwise a new allocation is performed. When neither `temporary_store` nor a global default store
    is set, the array is constructed directly and is not taken from any pool.

    Args:
        temporary_store: the shared pool to borrow the temporary from. If ``None``, the global default temporary store, if set, will be used.
        shape: desired dimensions for the temporary array
        dtype: desired data type for the temporary array
        pinned: whether a pinned allocation is desired
        requires_grad: whether the temporary array should come with a gradient array
        device: device on which the memory should be allocated; if ``None``, the current device will be used.

    Returns:
        The borrowed array, carrying the `release`, `detach` and `array` convenience attributes.
    """

    store = TemporaryStore._default_store if temporary_store is None else temporary_store

    if store is not None:
        return store.borrow(shape=shape, dtype=dtype, device=device, pinned=pinned, requires_grad=requires_grad)

    # No store available: build a standalone array but keep the same convenience interface
    standalone = Temporary(shape=shape, dtype=dtype, pinned=pinned, device=device, requires_grad=requires_grad)
    return TemporaryStore.add_temporary_convenience_methods(standalone)
|
|
623
|
+
|
|
624
|
+
|
|
625
|
+
def borrow_temporary_like(
    array: Union[wp.array, Temporary],
    temporary_store: Optional[TemporaryStore],
) -> Temporary:
    """
    Borrow a temporary array whose attributes mirror those of an existing array or temporary.

    The shape, data type, pinned flag, device and ``requires_grad`` flag are read from `array`
    and forwarded to :func:`borrow_temporary`.

    Args:
        array: Warp or temporary array to read the desired attributes from
        temporary_store: the shared pool to borrow the temporary from. If ``None``, the global default temporary store, if set, will be used.
    """
    mirrored_attributes = {
        "shape": array.shape,
        "dtype": array.dtype,
        "pinned": array.pinned,
        "device": array.device,
        "requires_grad": array.requires_grad,
    }
    return borrow_temporary(temporary_store=temporary_store, **mirrored_attributes)
|
|
644
|
+
|
|
645
|
+
|
|
646
|
+
# Reusable events, stored as one list per device ordinal: `capture_event` pops events from
# these lists and `synchronize_event` appends events to them.
_device_events = {}
|
|
647
|
+
|
|
648
|
+
|
|
649
|
+
def capture_event(device=None):
    """
    Record a CUDA event on the current stream and return it, recycling a pooled event when one is available.

    Returns ``None`` when the resolved device is not a CUDA device.

    Passing the returned event to :func:`synchronize_event` puts it back into the shared
    per-device pool for future reuse.
    """

    device = wp.get_device(device)
    if not device.is_cuda:
        return None

    # Fetch this device's pool, creating an empty one on first use
    pooled_events = _device_events.setdefault(device.ordinal, [])

    with wp.ScopedDevice(device):
        if pooled_events:
            return wp.record_event(pooled_events.pop())

        return wp.record_event()
|
|
675
|
+
|
|
676
|
+
|
|
677
|
+
def synchronize_event(event: Union[wp.Event, None]):
    """
    Synchronize `event`, then return it to the per-device event pool.

    Intended for events obtained from :func:`capture_event`; once pooled, the event may be
    handed out again by a later :func:`capture_event` call on the same device.

    Args:
        event: the event to synchronize. If ``None``, do nothing.
    """

    if event is None:
        return

    wp.synchronize_event(event)

    # Create the device's pool on demand instead of assuming `capture_event` already did, so a
    # missing entry cannot raise `KeyError` once the synchronization has already completed.
    _device_events.setdefault(event.device.ordinal, []).append(event)
|