warp-lang 1.0.1__py3-none-manylinux2014_aarch64.whl → 1.1.0__py3-none-manylinux2014_aarch64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of warp-lang might be problematic. Click here for more details.
- warp/__init__.py +108 -97
- warp/__init__.pyi +1 -1
- warp/bin/warp-clang.so +0 -0
- warp/bin/warp.so +0 -0
- warp/build.py +115 -113
- warp/build_dll.py +383 -375
- warp/builtins.py +3425 -3354
- warp/codegen.py +2878 -2792
- warp/config.py +40 -36
- warp/constants.py +45 -45
- warp/context.py +5194 -5102
- warp/dlpack.py +442 -442
- warp/examples/__init__.py +16 -16
- warp/examples/assets/bear.usd +0 -0
- warp/examples/assets/bunny.usd +0 -0
- warp/examples/assets/cartpole.urdf +110 -110
- warp/examples/assets/crazyflie.usd +0 -0
- warp/examples/assets/cube.usd +0 -0
- warp/examples/assets/nv_ant.xml +92 -92
- warp/examples/assets/nv_humanoid.xml +183 -183
- warp/examples/assets/quadruped.urdf +267 -267
- warp/examples/assets/rocks.nvdb +0 -0
- warp/examples/assets/rocks.usd +0 -0
- warp/examples/assets/sphere.usd +0 -0
- warp/examples/benchmarks/benchmark_api.py +383 -383
- warp/examples/benchmarks/benchmark_cloth.py +278 -279
- warp/examples/benchmarks/benchmark_cloth_cupy.py +88 -88
- warp/examples/benchmarks/benchmark_cloth_jax.py +97 -100
- warp/examples/benchmarks/benchmark_cloth_numba.py +146 -142
- warp/examples/benchmarks/benchmark_cloth_numpy.py +77 -77
- warp/examples/benchmarks/benchmark_cloth_pytorch.py +86 -86
- warp/examples/benchmarks/benchmark_cloth_taichi.py +112 -112
- warp/examples/benchmarks/benchmark_cloth_warp.py +146 -146
- warp/examples/benchmarks/benchmark_launches.py +295 -295
- warp/examples/browse.py +29 -28
- warp/examples/core/example_dem.py +234 -221
- warp/examples/core/example_fluid.py +293 -267
- warp/examples/core/example_graph_capture.py +144 -129
- warp/examples/core/example_marching_cubes.py +188 -176
- warp/examples/core/example_mesh.py +174 -154
- warp/examples/core/example_mesh_intersect.py +205 -193
- warp/examples/core/example_nvdb.py +176 -169
- warp/examples/core/example_raycast.py +105 -89
- warp/examples/core/example_raymarch.py +199 -178
- warp/examples/core/example_render_opengl.py +185 -141
- warp/examples/core/example_sph.py +405 -389
- warp/examples/core/example_torch.py +222 -181
- warp/examples/core/example_wave.py +263 -249
- warp/examples/fem/bsr_utils.py +378 -380
- warp/examples/fem/example_apic_fluid.py +407 -391
- warp/examples/fem/example_convection_diffusion.py +182 -168
- warp/examples/fem/example_convection_diffusion_dg.py +219 -209
- warp/examples/fem/example_convection_diffusion_dg0.py +204 -194
- warp/examples/fem/example_deformed_geometry.py +177 -159
- warp/examples/fem/example_diffusion.py +201 -173
- warp/examples/fem/example_diffusion_3d.py +177 -152
- warp/examples/fem/example_diffusion_mgpu.py +221 -214
- warp/examples/fem/example_mixed_elasticity.py +244 -222
- warp/examples/fem/example_navier_stokes.py +259 -243
- warp/examples/fem/example_stokes.py +220 -192
- warp/examples/fem/example_stokes_transfer.py +265 -249
- warp/examples/fem/mesh_utils.py +133 -109
- warp/examples/fem/plot_utils.py +292 -287
- warp/examples/optim/example_bounce.py +260 -248
- warp/examples/optim/example_cloth_throw.py +222 -210
- warp/examples/optim/example_diffray.py +566 -535
- warp/examples/optim/example_drone.py +864 -835
- warp/examples/optim/example_inverse_kinematics.py +176 -169
- warp/examples/optim/example_inverse_kinematics_torch.py +185 -170
- warp/examples/optim/example_spring_cage.py +239 -234
- warp/examples/optim/example_trajectory.py +223 -201
- warp/examples/optim/example_walker.py +306 -292
- warp/examples/sim/example_cartpole.py +139 -128
- warp/examples/sim/example_cloth.py +196 -184
- warp/examples/sim/example_granular.py +124 -113
- warp/examples/sim/example_granular_collision_sdf.py +197 -185
- warp/examples/sim/example_jacobian_ik.py +236 -213
- warp/examples/sim/example_particle_chain.py +118 -106
- warp/examples/sim/example_quadruped.py +193 -179
- warp/examples/sim/example_rigid_chain.py +197 -189
- warp/examples/sim/example_rigid_contact.py +189 -176
- warp/examples/sim/example_rigid_force.py +127 -126
- warp/examples/sim/example_rigid_gyroscopic.py +109 -97
- warp/examples/sim/example_rigid_soft_contact.py +134 -124
- warp/examples/sim/example_soft_body.py +190 -178
- warp/fabric.py +337 -335
- warp/fem/__init__.py +60 -27
- warp/fem/cache.py +401 -388
- warp/fem/dirichlet.py +178 -179
- warp/fem/domain.py +262 -263
- warp/fem/field/__init__.py +100 -101
- warp/fem/field/field.py +148 -149
- warp/fem/field/nodal_field.py +298 -299
- warp/fem/field/restriction.py +22 -21
- warp/fem/field/test.py +180 -181
- warp/fem/field/trial.py +183 -183
- warp/fem/geometry/__init__.py +15 -19
- warp/fem/geometry/closest_point.py +69 -70
- warp/fem/geometry/deformed_geometry.py +270 -271
- warp/fem/geometry/element.py +744 -744
- warp/fem/geometry/geometry.py +184 -186
- warp/fem/geometry/grid_2d.py +380 -373
- warp/fem/geometry/grid_3d.py +441 -435
- warp/fem/geometry/hexmesh.py +953 -953
- warp/fem/geometry/partition.py +374 -376
- warp/fem/geometry/quadmesh_2d.py +532 -532
- warp/fem/geometry/tetmesh.py +840 -840
- warp/fem/geometry/trimesh_2d.py +577 -577
- warp/fem/integrate.py +1630 -1615
- warp/fem/operator.py +190 -191
- warp/fem/polynomial.py +214 -213
- warp/fem/quadrature/__init__.py +2 -2
- warp/fem/quadrature/pic_quadrature.py +243 -245
- warp/fem/quadrature/quadrature.py +295 -294
- warp/fem/space/__init__.py +294 -292
- warp/fem/space/basis_space.py +488 -489
- warp/fem/space/collocated_function_space.py +100 -105
- warp/fem/space/dof_mapper.py +236 -236
- warp/fem/space/function_space.py +148 -145
- warp/fem/space/grid_2d_function_space.py +267 -267
- warp/fem/space/grid_3d_function_space.py +305 -306
- warp/fem/space/hexmesh_function_space.py +350 -352
- warp/fem/space/partition.py +350 -350
- warp/fem/space/quadmesh_2d_function_space.py +368 -369
- warp/fem/space/restriction.py +158 -160
- warp/fem/space/shape/__init__.py +13 -15
- warp/fem/space/shape/cube_shape_function.py +738 -738
- warp/fem/space/shape/shape_function.py +102 -103
- warp/fem/space/shape/square_shape_function.py +611 -611
- warp/fem/space/shape/tet_shape_function.py +565 -567
- warp/fem/space/shape/triangle_shape_function.py +429 -429
- warp/fem/space/tetmesh_function_space.py +294 -292
- warp/fem/space/topology.py +297 -295
- warp/fem/space/trimesh_2d_function_space.py +223 -221
- warp/fem/types.py +77 -77
- warp/fem/utils.py +495 -495
- warp/jax.py +166 -141
- warp/jax_experimental.py +341 -339
- warp/native/array.h +1072 -1025
- warp/native/builtin.h +1560 -1560
- warp/native/bvh.cpp +398 -398
- warp/native/bvh.cu +525 -525
- warp/native/bvh.h +429 -429
- warp/native/clang/clang.cpp +495 -464
- warp/native/crt.cpp +31 -31
- warp/native/crt.h +334 -334
- warp/native/cuda_crt.h +1049 -1049
- warp/native/cuda_util.cpp +549 -540
- warp/native/cuda_util.h +288 -203
- warp/native/cutlass_gemm.cpp +34 -34
- warp/native/cutlass_gemm.cu +372 -372
- warp/native/error.cpp +66 -66
- warp/native/error.h +27 -27
- warp/native/fabric.h +228 -228
- warp/native/hashgrid.cpp +301 -278
- warp/native/hashgrid.cu +78 -77
- warp/native/hashgrid.h +227 -227
- warp/native/initializer_array.h +32 -32
- warp/native/intersect.h +1204 -1204
- warp/native/intersect_adj.h +365 -365
- warp/native/intersect_tri.h +322 -322
- warp/native/marching.cpp +2 -2
- warp/native/marching.cu +497 -497
- warp/native/marching.h +2 -2
- warp/native/mat.h +1498 -1498
- warp/native/matnn.h +333 -333
- warp/native/mesh.cpp +203 -203
- warp/native/mesh.cu +293 -293
- warp/native/mesh.h +1887 -1887
- warp/native/nanovdb/NanoVDB.h +4782 -4782
- warp/native/nanovdb/PNanoVDB.h +2553 -2553
- warp/native/nanovdb/PNanoVDBWrite.h +294 -294
- warp/native/noise.h +850 -850
- warp/native/quat.h +1084 -1084
- warp/native/rand.h +299 -299
- warp/native/range.h +108 -108
- warp/native/reduce.cpp +156 -156
- warp/native/reduce.cu +348 -348
- warp/native/runlength_encode.cpp +61 -61
- warp/native/runlength_encode.cu +46 -46
- warp/native/scan.cpp +30 -30
- warp/native/scan.cu +36 -36
- warp/native/scan.h +7 -7
- warp/native/solid_angle.h +442 -442
- warp/native/sort.cpp +94 -94
- warp/native/sort.cu +97 -97
- warp/native/sort.h +14 -14
- warp/native/sparse.cpp +337 -337
- warp/native/sparse.cu +544 -544
- warp/native/spatial.h +630 -630
- warp/native/svd.h +562 -562
- warp/native/temp_buffer.h +30 -30
- warp/native/vec.h +1132 -1132
- warp/native/volume.cpp +297 -297
- warp/native/volume.cu +32 -32
- warp/native/volume.h +538 -538
- warp/native/volume_builder.cu +425 -425
- warp/native/volume_builder.h +19 -19
- warp/native/warp.cpp +1057 -1052
- warp/native/warp.cu +2943 -2828
- warp/native/warp.h +313 -305
- warp/optim/__init__.py +9 -9
- warp/optim/adam.py +120 -120
- warp/optim/linear.py +1104 -939
- warp/optim/sgd.py +104 -92
- warp/render/__init__.py +10 -10
- warp/render/render_opengl.py +3217 -3204
- warp/render/render_usd.py +768 -749
- warp/render/utils.py +152 -150
- warp/sim/__init__.py +52 -59
- warp/sim/articulation.py +685 -685
- warp/sim/collide.py +1594 -1590
- warp/sim/import_mjcf.py +489 -481
- warp/sim/import_snu.py +220 -221
- warp/sim/import_urdf.py +536 -516
- warp/sim/import_usd.py +887 -881
- warp/sim/inertia.py +316 -317
- warp/sim/integrator.py +234 -233
- warp/sim/integrator_euler.py +1956 -1956
- warp/sim/integrator_featherstone.py +1910 -1991
- warp/sim/integrator_xpbd.py +3294 -3312
- warp/sim/model.py +4473 -4314
- warp/sim/particles.py +113 -112
- warp/sim/render.py +417 -403
- warp/sim/utils.py +413 -410
- warp/sparse.py +1227 -1227
- warp/stubs.py +2109 -2469
- warp/tape.py +1162 -225
- warp/tests/__init__.py +1 -1
- warp/tests/__main__.py +4 -4
- warp/tests/assets/torus.usda +105 -105
- warp/tests/aux_test_class_kernel.py +26 -26
- warp/tests/aux_test_compile_consts_dummy.py +10 -10
- warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -21
- warp/tests/aux_test_dependent.py +22 -22
- warp/tests/aux_test_grad_customs.py +23 -23
- warp/tests/aux_test_reference.py +11 -11
- warp/tests/aux_test_reference_reference.py +10 -10
- warp/tests/aux_test_square.py +17 -17
- warp/tests/aux_test_unresolved_func.py +14 -14
- warp/tests/aux_test_unresolved_symbol.py +14 -14
- warp/tests/disabled_kinematics.py +239 -239
- warp/tests/run_coverage_serial.py +31 -31
- warp/tests/test_adam.py +157 -157
- warp/tests/test_arithmetic.py +1124 -1124
- warp/tests/test_array.py +2417 -2326
- warp/tests/test_array_reduce.py +150 -150
- warp/tests/test_async.py +668 -656
- warp/tests/test_atomic.py +141 -141
- warp/tests/test_bool.py +204 -149
- warp/tests/test_builtins_resolution.py +1292 -1292
- warp/tests/test_bvh.py +164 -171
- warp/tests/test_closest_point_edge_edge.py +228 -228
- warp/tests/test_codegen.py +566 -553
- warp/tests/test_compile_consts.py +97 -101
- warp/tests/test_conditional.py +246 -246
- warp/tests/test_copy.py +232 -215
- warp/tests/test_ctypes.py +632 -632
- warp/tests/test_dense.py +67 -67
- warp/tests/test_devices.py +91 -98
- warp/tests/test_dlpack.py +530 -529
- warp/tests/test_examples.py +400 -378
- warp/tests/test_fabricarray.py +955 -955
- warp/tests/test_fast_math.py +62 -54
- warp/tests/test_fem.py +1277 -1278
- warp/tests/test_fp16.py +130 -130
- warp/tests/test_func.py +338 -337
- warp/tests/test_generics.py +571 -571
- warp/tests/test_grad.py +746 -640
- warp/tests/test_grad_customs.py +333 -336
- warp/tests/test_hash_grid.py +210 -164
- warp/tests/test_import.py +39 -39
- warp/tests/test_indexedarray.py +1134 -1134
- warp/tests/test_intersect.py +67 -67
- warp/tests/test_jax.py +307 -307
- warp/tests/test_large.py +167 -164
- warp/tests/test_launch.py +354 -354
- warp/tests/test_lerp.py +261 -261
- warp/tests/test_linear_solvers.py +191 -171
- warp/tests/test_lvalue.py +421 -493
- warp/tests/test_marching_cubes.py +65 -65
- warp/tests/test_mat.py +1801 -1827
- warp/tests/test_mat_lite.py +115 -115
- warp/tests/test_mat_scalar_ops.py +2907 -2889
- warp/tests/test_math.py +126 -193
- warp/tests/test_matmul.py +500 -499
- warp/tests/test_matmul_lite.py +410 -410
- warp/tests/test_mempool.py +188 -190
- warp/tests/test_mesh.py +284 -324
- warp/tests/test_mesh_query_aabb.py +228 -241
- warp/tests/test_mesh_query_point.py +692 -702
- warp/tests/test_mesh_query_ray.py +292 -303
- warp/tests/test_mlp.py +276 -276
- warp/tests/test_model.py +110 -110
- warp/tests/test_modules_lite.py +39 -39
- warp/tests/test_multigpu.py +163 -163
- warp/tests/test_noise.py +248 -248
- warp/tests/test_operators.py +250 -250
- warp/tests/test_options.py +123 -125
- warp/tests/test_peer.py +133 -137
- warp/tests/test_pinned.py +78 -78
- warp/tests/test_print.py +54 -54
- warp/tests/test_quat.py +2086 -2086
- warp/tests/test_rand.py +288 -288
- warp/tests/test_reload.py +217 -217
- warp/tests/test_rounding.py +179 -179
- warp/tests/test_runlength_encode.py +190 -190
- warp/tests/test_sim_grad.py +243 -0
- warp/tests/test_sim_kinematics.py +91 -97
- warp/tests/test_smoothstep.py +168 -168
- warp/tests/test_snippet.py +305 -266
- warp/tests/test_sparse.py +468 -460
- warp/tests/test_spatial.py +2148 -2148
- warp/tests/test_streams.py +486 -473
- warp/tests/test_struct.py +710 -675
- warp/tests/test_tape.py +173 -148
- warp/tests/test_torch.py +743 -743
- warp/tests/test_transient_module.py +87 -87
- warp/tests/test_types.py +556 -659
- warp/tests/test_utils.py +490 -499
- warp/tests/test_vec.py +1264 -1268
- warp/tests/test_vec_lite.py +73 -73
- warp/tests/test_vec_scalar_ops.py +2099 -2099
- warp/tests/test_verify_fp.py +94 -94
- warp/tests/test_volume.py +737 -736
- warp/tests/test_volume_write.py +255 -265
- warp/tests/unittest_serial.py +37 -37
- warp/tests/unittest_suites.py +363 -359
- warp/tests/unittest_utils.py +603 -578
- warp/tests/unused_test_misc.py +71 -71
- warp/tests/walkthrough_debug.py +85 -85
- warp/thirdparty/appdirs.py +598 -598
- warp/thirdparty/dlpack.py +143 -143
- warp/thirdparty/unittest_parallel.py +566 -561
- warp/torch.py +321 -295
- warp/types.py +4504 -4450
- warp/utils.py +1008 -821
- {warp_lang-1.0.1.dist-info → warp_lang-1.1.0.dist-info}/LICENSE.md +126 -126
- {warp_lang-1.0.1.dist-info → warp_lang-1.1.0.dist-info}/METADATA +338 -400
- warp_lang-1.1.0.dist-info/RECORD +352 -0
- warp/examples/assets/cube.usda +0 -42
- warp/examples/assets/sphere.usda +0 -56
- warp/examples/assets/torus.usda +0 -105
- warp_lang-1.0.1.dist-info/RECORD +0 -352
- {warp_lang-1.0.1.dist-info → warp_lang-1.1.0.dist-info}/WHEEL +0 -0
- {warp_lang-1.0.1.dist-info → warp_lang-1.1.0.dist-info}/top_level.txt +0 -0
warp/tests/test_model.py
CHANGED
|
@@ -1,110 +1,110 @@
|
|
|
1
|
-
# Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
-
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
-
# and proprietary rights in and to this software, related documentation
|
|
4
|
-
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
-
# distribution of this software and related documentation without an express
|
|
6
|
-
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
-
|
|
8
|
-
import unittest
|
|
9
|
-
|
|
10
|
-
import numpy as np
|
|
11
|
-
|
|
12
|
-
import warp as wp
|
|
13
|
-
from warp.sim import ModelBuilder
|
|
14
|
-
from warp.tests.unittest_utils import *
|
|
15
|
-
|
|
16
|
-
wp.init()
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
class TestModel(unittest.TestCase):
|
|
20
|
-
def test_add_triangles(self):
|
|
21
|
-
rng = np.random.default_rng(123)
|
|
22
|
-
|
|
23
|
-
pts = np.array(
|
|
24
|
-
[
|
|
25
|
-
[-0.00585869, 0.34189449, -1.17415233],
|
|
26
|
-
[-1.894547, 0.1788074, 0.9251329],
|
|
27
|
-
[-1.26141048, 0.16140787, 0.08823282],
|
|
28
|
-
[-0.08609255, -0.82722546, 0.65995427],
|
|
29
|
-
[0.78827592, -1.77375711, -0.55582718],
|
|
30
|
-
]
|
|
31
|
-
)
|
|
32
|
-
tris = np.array([[0, 3, 4], [0, 2, 3], [2, 1, 3], [1, 4, 3]])
|
|
33
|
-
|
|
34
|
-
builder1 = ModelBuilder()
|
|
35
|
-
builder2 = ModelBuilder()
|
|
36
|
-
for pt in pts:
|
|
37
|
-
builder1.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
38
|
-
builder2.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
39
|
-
|
|
40
|
-
# test add_triangle(s) with default arguments:
|
|
41
|
-
areas = builder2.add_triangles(tris[:, 0], tris[:, 1], tris[:, 2])
|
|
42
|
-
for i, t in enumerate(tris):
|
|
43
|
-
area = builder1.add_triangle(t[0], t[1], t[2])
|
|
44
|
-
self.assertAlmostEqual(area, areas[i], places=6)
|
|
45
|
-
|
|
46
|
-
# test add_triangle(s) with non default arguments:
|
|
47
|
-
tri_ke = rng.standard_normal(size=pts.shape[0])
|
|
48
|
-
tri_ka = rng.standard_normal(size=pts.shape[0])
|
|
49
|
-
tri_kd = rng.standard_normal(size=pts.shape[0])
|
|
50
|
-
tri_drag = rng.standard_normal(size=pts.shape[0])
|
|
51
|
-
tri_lift = rng.standard_normal(size=pts.shape[0])
|
|
52
|
-
for i, t in enumerate(tris):
|
|
53
|
-
builder1.add_triangle(
|
|
54
|
-
t[0],
|
|
55
|
-
t[1],
|
|
56
|
-
t[2],
|
|
57
|
-
tri_ke[i],
|
|
58
|
-
tri_ka[i],
|
|
59
|
-
tri_kd[i],
|
|
60
|
-
tri_drag[i],
|
|
61
|
-
tri_lift[i],
|
|
62
|
-
)
|
|
63
|
-
builder2.add_triangles(tris[:, 0], tris[:, 1], tris[:, 2], tri_ke, tri_ka, tri_kd, tri_drag, tri_lift)
|
|
64
|
-
|
|
65
|
-
assert_np_equal(np.array(builder1.tri_indices), np.array(builder2.tri_indices))
|
|
66
|
-
assert_np_equal(np.array(builder1.tri_poses), np.array(builder2.tri_poses), tol=1.0e-6)
|
|
67
|
-
assert_np_equal(np.array(builder1.tri_activations), np.array(builder2.tri_activations))
|
|
68
|
-
assert_np_equal(np.array(builder1.tri_materials), np.array(builder2.tri_materials))
|
|
69
|
-
|
|
70
|
-
def test_add_edges(self):
|
|
71
|
-
rng = np.random.default_rng(123)
|
|
72
|
-
|
|
73
|
-
pts = np.array(
|
|
74
|
-
[
|
|
75
|
-
[-0.00585869, 0.34189449, -1.17415233],
|
|
76
|
-
[-1.894547, 0.1788074, 0.9251329],
|
|
77
|
-
[-1.26141048, 0.16140787, 0.08823282],
|
|
78
|
-
[-0.08609255, -0.82722546, 0.65995427],
|
|
79
|
-
[0.78827592, -1.77375711, -0.55582718],
|
|
80
|
-
]
|
|
81
|
-
)
|
|
82
|
-
edges = np.array([[0, 4, 3, 1], [3, 2, 4, 1]])
|
|
83
|
-
|
|
84
|
-
builder1 = ModelBuilder()
|
|
85
|
-
builder2 = ModelBuilder()
|
|
86
|
-
for pt in pts:
|
|
87
|
-
builder1.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
88
|
-
builder2.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
89
|
-
|
|
90
|
-
# test defaults:
|
|
91
|
-
for i in range(2):
|
|
92
|
-
builder1.add_edge(edges[i, 0], edges[i, 1], edges[i, 2], edges[i, 3])
|
|
93
|
-
builder2.add_edges(edges[:, 0], edges[:, 1], edges[:, 2], edges[:, 3])
|
|
94
|
-
|
|
95
|
-
# test non defaults:
|
|
96
|
-
rest = rng.standard_normal(size=2)
|
|
97
|
-
edge_ke = rng.standard_normal(size=2)
|
|
98
|
-
edge_kd = rng.standard_normal(size=2)
|
|
99
|
-
for i in range(2):
|
|
100
|
-
builder1.add_edge(edges[i, 0], edges[i, 1], edges[i, 2], edges[i, 3], rest[i], edge_ke[i], edge_kd[i])
|
|
101
|
-
builder2.add_edges(edges[:, 0], edges[:, 1], edges[:, 2], edges[:, 3], rest, edge_ke, edge_kd)
|
|
102
|
-
|
|
103
|
-
assert_np_equal(np.array(builder1.edge_indices), np.array(builder2.edge_indices))
|
|
104
|
-
assert_np_equal(np.array(builder1.edge_rest_angle), np.array(builder2.edge_rest_angle), tol=1.0e-4)
|
|
105
|
-
assert_np_equal(np.array(builder1.edge_bending_properties), np.array(builder2.edge_bending_properties))
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
if __name__ == "__main__":
|
|
109
|
-
wp.build.clear_kernel_cache()
|
|
110
|
-
unittest.main(verbosity=2)
|
|
1
|
+
# Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
+
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
+
# and proprietary rights in and to this software, related documentation
|
|
4
|
+
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
+
# distribution of this software and related documentation without an express
|
|
6
|
+
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
+
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
10
|
+
import numpy as np
|
|
11
|
+
|
|
12
|
+
import warp as wp
|
|
13
|
+
from warp.sim import ModelBuilder
|
|
14
|
+
from warp.tests.unittest_utils import *
|
|
15
|
+
|
|
16
|
+
wp.init()
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class TestModel(unittest.TestCase):
|
|
20
|
+
def test_add_triangles(self):
|
|
21
|
+
rng = np.random.default_rng(123)
|
|
22
|
+
|
|
23
|
+
pts = np.array(
|
|
24
|
+
[
|
|
25
|
+
[-0.00585869, 0.34189449, -1.17415233],
|
|
26
|
+
[-1.894547, 0.1788074, 0.9251329],
|
|
27
|
+
[-1.26141048, 0.16140787, 0.08823282],
|
|
28
|
+
[-0.08609255, -0.82722546, 0.65995427],
|
|
29
|
+
[0.78827592, -1.77375711, -0.55582718],
|
|
30
|
+
]
|
|
31
|
+
)
|
|
32
|
+
tris = np.array([[0, 3, 4], [0, 2, 3], [2, 1, 3], [1, 4, 3]])
|
|
33
|
+
|
|
34
|
+
builder1 = ModelBuilder()
|
|
35
|
+
builder2 = ModelBuilder()
|
|
36
|
+
for pt in pts:
|
|
37
|
+
builder1.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
38
|
+
builder2.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
39
|
+
|
|
40
|
+
# test add_triangle(s) with default arguments:
|
|
41
|
+
areas = builder2.add_triangles(tris[:, 0], tris[:, 1], tris[:, 2])
|
|
42
|
+
for i, t in enumerate(tris):
|
|
43
|
+
area = builder1.add_triangle(t[0], t[1], t[2])
|
|
44
|
+
self.assertAlmostEqual(area, areas[i], places=6)
|
|
45
|
+
|
|
46
|
+
# test add_triangle(s) with non default arguments:
|
|
47
|
+
tri_ke = rng.standard_normal(size=pts.shape[0])
|
|
48
|
+
tri_ka = rng.standard_normal(size=pts.shape[0])
|
|
49
|
+
tri_kd = rng.standard_normal(size=pts.shape[0])
|
|
50
|
+
tri_drag = rng.standard_normal(size=pts.shape[0])
|
|
51
|
+
tri_lift = rng.standard_normal(size=pts.shape[0])
|
|
52
|
+
for i, t in enumerate(tris):
|
|
53
|
+
builder1.add_triangle(
|
|
54
|
+
t[0],
|
|
55
|
+
t[1],
|
|
56
|
+
t[2],
|
|
57
|
+
tri_ke[i],
|
|
58
|
+
tri_ka[i],
|
|
59
|
+
tri_kd[i],
|
|
60
|
+
tri_drag[i],
|
|
61
|
+
tri_lift[i],
|
|
62
|
+
)
|
|
63
|
+
builder2.add_triangles(tris[:, 0], tris[:, 1], tris[:, 2], tri_ke, tri_ka, tri_kd, tri_drag, tri_lift)
|
|
64
|
+
|
|
65
|
+
assert_np_equal(np.array(builder1.tri_indices), np.array(builder2.tri_indices))
|
|
66
|
+
assert_np_equal(np.array(builder1.tri_poses), np.array(builder2.tri_poses), tol=1.0e-6)
|
|
67
|
+
assert_np_equal(np.array(builder1.tri_activations), np.array(builder2.tri_activations))
|
|
68
|
+
assert_np_equal(np.array(builder1.tri_materials), np.array(builder2.tri_materials))
|
|
69
|
+
|
|
70
|
+
def test_add_edges(self):
|
|
71
|
+
rng = np.random.default_rng(123)
|
|
72
|
+
|
|
73
|
+
pts = np.array(
|
|
74
|
+
[
|
|
75
|
+
[-0.00585869, 0.34189449, -1.17415233],
|
|
76
|
+
[-1.894547, 0.1788074, 0.9251329],
|
|
77
|
+
[-1.26141048, 0.16140787, 0.08823282],
|
|
78
|
+
[-0.08609255, -0.82722546, 0.65995427],
|
|
79
|
+
[0.78827592, -1.77375711, -0.55582718],
|
|
80
|
+
]
|
|
81
|
+
)
|
|
82
|
+
edges = np.array([[0, 4, 3, 1], [3, 2, 4, 1]])
|
|
83
|
+
|
|
84
|
+
builder1 = ModelBuilder()
|
|
85
|
+
builder2 = ModelBuilder()
|
|
86
|
+
for pt in pts:
|
|
87
|
+
builder1.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
88
|
+
builder2.add_particle(wp.vec3(pt), wp.vec3(), 1.0)
|
|
89
|
+
|
|
90
|
+
# test defaults:
|
|
91
|
+
for i in range(2):
|
|
92
|
+
builder1.add_edge(edges[i, 0], edges[i, 1], edges[i, 2], edges[i, 3])
|
|
93
|
+
builder2.add_edges(edges[:, 0], edges[:, 1], edges[:, 2], edges[:, 3])
|
|
94
|
+
|
|
95
|
+
# test non defaults:
|
|
96
|
+
rest = rng.standard_normal(size=2)
|
|
97
|
+
edge_ke = rng.standard_normal(size=2)
|
|
98
|
+
edge_kd = rng.standard_normal(size=2)
|
|
99
|
+
for i in range(2):
|
|
100
|
+
builder1.add_edge(edges[i, 0], edges[i, 1], edges[i, 2], edges[i, 3], rest[i], edge_ke[i], edge_kd[i])
|
|
101
|
+
builder2.add_edges(edges[:, 0], edges[:, 1], edges[:, 2], edges[:, 3], rest, edge_ke, edge_kd)
|
|
102
|
+
|
|
103
|
+
assert_np_equal(np.array(builder1.edge_indices), np.array(builder2.edge_indices))
|
|
104
|
+
assert_np_equal(np.array(builder1.edge_rest_angle), np.array(builder2.edge_rest_angle), tol=1.0e-4)
|
|
105
|
+
assert_np_equal(np.array(builder1.edge_bending_properties), np.array(builder2.edge_bending_properties))
|
|
106
|
+
|
|
107
|
+
|
|
108
|
+
if __name__ == "__main__":
|
|
109
|
+
wp.build.clear_kernel_cache()
|
|
110
|
+
unittest.main(verbosity=2)
|
warp/tests/test_modules_lite.py
CHANGED
|
@@ -1,39 +1,39 @@
|
|
|
1
|
-
# Copyright (c) 2023 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
-
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
-
# and proprietary rights in and to this software, related documentation
|
|
4
|
-
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
-
# distribution of this software and related documentation without an express
|
|
6
|
-
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
-
|
|
8
|
-
import unittest
|
|
9
|
-
|
|
10
|
-
import warp as wp
|
|
11
|
-
from warp.tests.unittest_utils import *
|
|
12
|
-
|
|
13
|
-
wp.init()
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
devices = get_test_devices()
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
class TestModuleLite(unittest.TestCase):
|
|
20
|
-
def test_module_lite_load(self):
|
|
21
|
-
# Load current module
|
|
22
|
-
wp.load_module()
|
|
23
|
-
|
|
24
|
-
# Load named module
|
|
25
|
-
wp.load_module(wp.config)
|
|
26
|
-
|
|
27
|
-
# Load named module (string)
|
|
28
|
-
wp.load_module(wp.config, recursive=True)
|
|
29
|
-
|
|
30
|
-
def test_module_lite_options(self):
|
|
31
|
-
wp.set_module_options({"max_unroll": 8})
|
|
32
|
-
module_options = wp.get_module_options()
|
|
33
|
-
self.assertIsInstance(module_options, dict)
|
|
34
|
-
self.assertEqual(module_options["max_unroll"], 8)
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
if __name__ == "__main__":
|
|
38
|
-
wp.build.clear_kernel_cache()
|
|
39
|
-
unittest.main(verbosity=2)
|
|
1
|
+
# Copyright (c) 2023 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
+
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
+
# and proprietary rights in and to this software, related documentation
|
|
4
|
+
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
+
# distribution of this software and related documentation without an express
|
|
6
|
+
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
+
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
10
|
+
import warp as wp
|
|
11
|
+
from warp.tests.unittest_utils import *
|
|
12
|
+
|
|
13
|
+
wp.init()
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
devices = get_test_devices()
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
class TestModuleLite(unittest.TestCase):
|
|
20
|
+
def test_module_lite_load(self):
|
|
21
|
+
# Load current module
|
|
22
|
+
wp.load_module()
|
|
23
|
+
|
|
24
|
+
# Load named module
|
|
25
|
+
wp.load_module(wp.config)
|
|
26
|
+
|
|
27
|
+
# Load named module (string)
|
|
28
|
+
wp.load_module(wp.config, recursive=True)
|
|
29
|
+
|
|
30
|
+
def test_module_lite_options(self):
|
|
31
|
+
wp.set_module_options({"max_unroll": 8})
|
|
32
|
+
module_options = wp.get_module_options()
|
|
33
|
+
self.assertIsInstance(module_options, dict)
|
|
34
|
+
self.assertEqual(module_options["max_unroll"], 8)
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
if __name__ == "__main__":
|
|
38
|
+
wp.build.clear_kernel_cache()
|
|
39
|
+
unittest.main(verbosity=2)
|
warp/tests/test_multigpu.py
CHANGED
|
@@ -1,163 +1,163 @@
|
|
|
1
|
-
# Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
-
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
-
# and proprietary rights in and to this software, related documentation
|
|
4
|
-
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
-
# distribution of this software and related documentation without an express
|
|
6
|
-
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
-
|
|
8
|
-
import unittest
|
|
9
|
-
|
|
10
|
-
import numpy as np
|
|
11
|
-
|
|
12
|
-
import warp as wp
|
|
13
|
-
from warp.utils import check_iommu
|
|
14
|
-
from warp.tests.unittest_utils import *
|
|
15
|
-
|
|
16
|
-
wp.init()
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
@wp.kernel
|
|
20
|
-
def inc(a: wp.array(dtype=float)):
|
|
21
|
-
tid = wp.tid()
|
|
22
|
-
a[tid] = a[tid] + 1.0
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
@wp.kernel
|
|
26
|
-
def arange(start: int, step: int, a: wp.array(dtype=int)):
|
|
27
|
-
tid = wp.tid()
|
|
28
|
-
a[tid] = start + step * tid
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
class TestMultiGPU(unittest.TestCase):
|
|
32
|
-
@unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
|
|
33
|
-
def test_multigpu_set_device(self):
|
|
34
|
-
# save default device
|
|
35
|
-
saved_device = wp.get_device()
|
|
36
|
-
|
|
37
|
-
n = 32
|
|
38
|
-
|
|
39
|
-
wp.set_device("cuda:0")
|
|
40
|
-
a0 = wp.empty(n, dtype=int)
|
|
41
|
-
wp.launch(arange, dim=a0.size, inputs=[0, 1, a0])
|
|
42
|
-
|
|
43
|
-
wp.set_device("cuda:1")
|
|
44
|
-
a1 = wp.empty(n, dtype=int)
|
|
45
|
-
wp.launch(arange, dim=a1.size, inputs=[0, 1, a1])
|
|
46
|
-
|
|
47
|
-
# restore default device
|
|
48
|
-
wp.set_device(saved_device)
|
|
49
|
-
|
|
50
|
-
assert a0.device == "cuda:0"
|
|
51
|
-
assert a1.device == "cuda:1"
|
|
52
|
-
|
|
53
|
-
expected = np.arange(n, dtype=int)
|
|
54
|
-
|
|
55
|
-
assert_np_equal(a0.numpy(), expected)
|
|
56
|
-
assert_np_equal(a1.numpy(), expected)
|
|
57
|
-
|
|
58
|
-
@unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
|
|
59
|
-
def test_multigpu_scoped_device(self):
|
|
60
|
-
n = 32
|
|
61
|
-
|
|
62
|
-
with wp.ScopedDevice("cuda:0"):
|
|
63
|
-
a0 = wp.empty(n, dtype=int)
|
|
64
|
-
wp.launch(arange, dim=a0.size, inputs=[0, 1, a0])
|
|
65
|
-
|
|
66
|
-
with wp.ScopedDevice("cuda:1"):
|
|
67
|
-
a1 = wp.empty(n, dtype=int)
|
|
68
|
-
wp.launch(arange, dim=a1.size, inputs=[0, 1, a1])
|
|
69
|
-
|
|
70
|
-
assert a0.device == "cuda:0"
|
|
71
|
-
assert a1.device == "cuda:1"
|
|
72
|
-
|
|
73
|
-
expected = np.arange(n, dtype=int)
|
|
74
|
-
|
|
75
|
-
assert_np_equal(a0.numpy(), expected)
|
|
76
|
-
assert_np_equal(a1.numpy(), expected)
|
|
77
|
-
|
|
78
|
-
@unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
|
|
79
|
-
def test_multigpu_nesting(self):
|
|
80
|
-
initial_device = wp.get_device()
|
|
81
|
-
initial_cuda_device = wp.get_cuda_device()
|
|
82
|
-
|
|
83
|
-
with wp.ScopedDevice("cuda:1"):
|
|
84
|
-
assert wp.get_device() == "cuda:1"
|
|
85
|
-
assert wp.get_cuda_device() == "cuda:1"
|
|
86
|
-
|
|
87
|
-
with wp.ScopedDevice("cuda:0"):
|
|
88
|
-
assert wp.get_device() == "cuda:0"
|
|
89
|
-
assert wp.get_cuda_device() == "cuda:0"
|
|
90
|
-
|
|
91
|
-
with wp.ScopedDevice("cpu"):
|
|
92
|
-
assert wp.get_device() == "cpu"
|
|
93
|
-
assert wp.get_cuda_device() == "cuda:0"
|
|
94
|
-
|
|
95
|
-
wp.set_device("cuda:1")
|
|
96
|
-
|
|
97
|
-
assert wp.get_device() == "cuda:1"
|
|
98
|
-
assert wp.get_cuda_device() == "cuda:1"
|
|
99
|
-
|
|
100
|
-
assert wp.get_device() == "cuda:0"
|
|
101
|
-
assert wp.get_cuda_device() == "cuda:0"
|
|
102
|
-
|
|
103
|
-
assert wp.get_device() == "cuda:1"
|
|
104
|
-
assert wp.get_cuda_device() == "cuda:1"
|
|
105
|
-
|
|
106
|
-
assert wp.get_device() == initial_device
|
|
107
|
-
assert wp.get_cuda_device() == initial_cuda_device
|
|
108
|
-
|
|
109
|
-
@unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
@unittest.skipUnless(check_iommu(), "IOMMU seems enabled")
def test_multigpu_pingpong(self):
    # Pass a buffer back and forth between two GPUs, incrementing it once
    # on each side per round, with an explicit device synchronization
    # before every cross-device copy.
    count = 1024 * 1024
    rounds = 10

    # two increments per round (one per device), starting from zero
    reference = np.full(count, rounds * 2, dtype=np.float32)

    on_gpu0 = wp.zeros(count, dtype=float, device="cuda:0")
    on_gpu1 = wp.zeros(count, dtype=float, device="cuda:1")

    for _ in range(rounds):
        # increment on the first GPU, wait for it, then hand the data over
        wp.launch(inc, dim=on_gpu0.size, inputs=[on_gpu0], device=on_gpu0.device)
        wp.synchronize_device(on_gpu0.device)
        wp.copy(on_gpu1, on_gpu0)

        # same again in the opposite direction
        wp.launch(inc, dim=on_gpu1.size, inputs=[on_gpu1], device=on_gpu1.device)
        wp.synchronize_device(on_gpu1.device)
        wp.copy(on_gpu0, on_gpu1)

    assert_np_equal(on_gpu0.numpy(), reference)
    assert_np_equal(on_gpu1.numpy(), reference)
|
|
132
|
-
|
|
133
|
-
@unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
@unittest.skipUnless(check_iommu(), "IOMMU seems enabled")
def test_multigpu_pingpong_streams(self):
    # Stream-based variant of the ping-pong test: the two devices are
    # ordered with wait_stream() calls rather than whole-device
    # synchronization.
    count = 1024 * 1024
    rounds = 10

    # two increments per round (one per device), starting from zero
    reference = np.full(count, rounds * 2, dtype=np.float32)

    on_gpu0 = wp.zeros(count, dtype=float, device="cuda:0")
    on_gpu1 = wp.zeros(count, dtype=float, device="cuda:1")

    gpu0_stream = wp.get_stream("cuda:0")
    gpu1_stream = wp.get_stream("cuda:1")

    for _ in range(rounds):
        # increment on GPU 0; GPU 1's stream waits for it before copying
        wp.launch(inc, dim=on_gpu0.size, inputs=[on_gpu0], stream=gpu0_stream)
        gpu1_stream.wait_stream(gpu0_stream)
        wp.copy(on_gpu1, on_gpu0, stream=gpu1_stream)

        # increment on GPU 1; GPU 0's stream waits for it before copying back
        wp.launch(inc, dim=on_gpu1.size, inputs=[on_gpu1], stream=gpu1_stream)
        gpu0_stream.wait_stream(gpu1_stream)
        wp.copy(on_gpu0, on_gpu1, stream=gpu0_stream)

    assert_np_equal(on_gpu0.numpy(), reference)
    assert_np_equal(on_gpu1.numpy(), reference)
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
if __name__ == "__main__":
    # Direct execution: clear the Warp kernel cache, then run every test in
    # this module with verbose reporting and without stopping at the first
    # failure.
    wp.build.clear_kernel_cache()
    unittest.main(failfast=False, verbosity=2)
|
|
1
|
+
# Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
+
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
+
# and proprietary rights in and to this software, related documentation
|
|
4
|
+
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
+
# distribution of this software and related documentation without an express
|
|
6
|
+
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
+
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
10
|
+
import numpy as np
|
|
11
|
+
|
|
12
|
+
import warp as wp
|
|
13
|
+
from warp.tests.unittest_utils import *
|
|
14
|
+
from warp.utils import check_iommu
|
|
15
|
+
|
|
16
|
+
# Runs at import time, ahead of the kernel definitions and the
# wp.get_cuda_devices() calls in the skip decorators further down.
wp.init()
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@wp.kernel
def inc(a: wp.array(dtype=float)):
    # each thread adds one to the element at its own thread index
    i = wp.tid()
    a[i] = a[i] + 1.0
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
@wp.kernel
def arange(start: int, step: int, a: wp.array(dtype=int)):
    # each thread writes start + step * (its thread index) into its own slot
    i = wp.tid()
    a[i] = start + step * i
|
|
29
|
+
|
|
30
|
+
|
|
31
|
+
class TestMultiGPU(unittest.TestCase):
    """Tests that address "cuda:0" and "cuda:1" from a single process.

    Every test is skipped unless at least two CUDA devices are reported; the
    ping-pong tests are additionally skipped unless ``check_iommu()`` returns
    a true value.
    """

    @unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
    def test_multigpu_set_device(self):
        # Fill one integer array per GPU, selecting the device with
        # wp.set_device() instead of an explicit device argument.
        saved_device = wp.get_device()

        n = 32

        # set_device changes the default device for the whole process, so
        # restore it even when an allocation or launch raises; otherwise a
        # failure here would leave later tests on the wrong default device
        try:
            wp.set_device("cuda:0")
            a0 = wp.empty(n, dtype=int)
            wp.launch(arange, dim=a0.size, inputs=[0, 1, a0])

            wp.set_device("cuda:1")
            a1 = wp.empty(n, dtype=int)
            wp.launch(arange, dim=a1.size, inputs=[0, 1, a1])
        finally:
            # restore default device
            wp.set_device(saved_device)

        # each array must report the device that was current when it was created
        assert a0.device == "cuda:0"
        assert a1.device == "cuda:1"

        # start=0, step=1 must reproduce np.arange on both devices
        expected = np.arange(n, dtype=int)

        assert_np_equal(a0.numpy(), expected)
        assert_np_equal(a1.numpy(), expected)

    @unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
    def test_multigpu_scoped_device(self):
        # Same check as test_multigpu_set_device, but the device is selected
        # with wp.ScopedDevice blocks.
        n = 32

        with wp.ScopedDevice("cuda:0"):
            a0 = wp.empty(n, dtype=int)
            wp.launch(arange, dim=a0.size, inputs=[0, 1, a0])

        with wp.ScopedDevice("cuda:1"):
            a1 = wp.empty(n, dtype=int)
            wp.launch(arange, dim=a1.size, inputs=[0, 1, a1])

        assert a0.device == "cuda:0"
        assert a1.device == "cuda:1"

        expected = np.arange(n, dtype=int)

        assert_np_equal(a0.numpy(), expected)
        assert_np_equal(a1.numpy(), expected)

    @unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
    def test_multigpu_nesting(self):
        # Step into three nested ScopedDevice blocks and back out again,
        # checking the current device and current CUDA device at each level.
        initial_device = wp.get_device()
        initial_cuda_device = wp.get_cuda_device()

        with wp.ScopedDevice("cuda:1"):
            assert wp.get_device() == "cuda:1"
            assert wp.get_cuda_device() == "cuda:1"

            with wp.ScopedDevice("cuda:0"):
                assert wp.get_device() == "cuda:0"
                assert wp.get_cuda_device() == "cuda:0"

                with wp.ScopedDevice("cpu"):
                    # scoping the CPU is expected to leave the CUDA device as it was
                    assert wp.get_device() == "cpu"
                    assert wp.get_cuda_device() == "cuda:0"

                    # switch devices explicitly inside the innermost scope; the
                    # checks after this block expect the switch to be undone on exit
                    wp.set_device("cuda:1")

                    assert wp.get_device() == "cuda:1"
                    assert wp.get_cuda_device() == "cuda:1"

                # back in the "cuda:0" scope
                assert wp.get_device() == "cuda:0"
                assert wp.get_cuda_device() == "cuda:0"

            # back in the "cuda:1" scope
            assert wp.get_device() == "cuda:1"
            assert wp.get_cuda_device() == "cuda:1"

        # all scopes closed: both values must match what was recorded on entry
        assert wp.get_device() == initial_device
        assert wp.get_cuda_device() == initial_cuda_device

    @unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
    @unittest.skipUnless(check_iommu(), "IOMMU seems enabled")
    def test_multigpu_pingpong(self):
        # Pass a buffer back and forth between two GPUs, incrementing it once
        # on each side per iteration, with an explicit device synchronization
        # before every cross-device copy.
        n = 1024 * 1024

        a0 = wp.zeros(n, dtype=float, device="cuda:0")
        a1 = wp.zeros(n, dtype=float, device="cuda:1")

        iters = 10

        for _ in range(iters):
            wp.launch(inc, dim=a0.size, inputs=[a0], device=a0.device)
            wp.synchronize_device(a0.device)
            wp.copy(a1, a0)

            wp.launch(inc, dim=a1.size, inputs=[a1], device=a1.device)
            wp.synchronize_device(a1.device)
            wp.copy(a0, a1)

        # two increments per iteration (one per device), starting from zero
        expected = np.full(n, iters * 2, dtype=np.float32)

        assert_np_equal(a0.numpy(), expected)
        assert_np_equal(a1.numpy(), expected)

    @unittest.skipUnless(len(wp.get_cuda_devices()) > 1, "Requires at least two CUDA devices")
    @unittest.skipUnless(check_iommu(), "IOMMU seems enabled")
    def test_multigpu_pingpong_streams(self):
        # Stream-based variant of the ping-pong test: the two devices are
        # ordered with wait_stream() calls rather than whole-device
        # synchronization.
        n = 1024 * 1024

        a0 = wp.zeros(n, dtype=float, device="cuda:0")
        a1 = wp.zeros(n, dtype=float, device="cuda:1")

        stream0 = wp.get_stream("cuda:0")
        stream1 = wp.get_stream("cuda:1")

        iters = 10

        for _ in range(iters):
            # increment on GPU 0; GPU 1's stream waits for it before copying
            wp.launch(inc, dim=a0.size, inputs=[a0], stream=stream0)
            stream1.wait_stream(stream0)
            wp.copy(a1, a0, stream=stream1)

            # increment on GPU 1; GPU 0's stream waits for it before copying back
            wp.launch(inc, dim=a1.size, inputs=[a1], stream=stream1)
            stream0.wait_stream(stream1)
            wp.copy(a0, a1, stream=stream0)

        # two increments per iteration (one per device), starting from zero
        expected = np.full(n, iters * 2, dtype=np.float32)

        assert_np_equal(a0.numpy(), expected)
        assert_np_equal(a1.numpy(), expected)
|
|
159
|
+
|
|
160
|
+
|
|
161
|
+
if __name__ == "__main__":
    # Direct execution: clear the Warp kernel cache, then run every test in
    # this module with verbose reporting and without stopping at the first
    # failure.
    wp.build.clear_kernel_cache()
    unittest.main(failfast=False, verbosity=2)
|