warp-lang 1.0.0b2__py3-none-manylinux2014_x86_64.whl → 1.0.0b6__py3-none-manylinux2014_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- docs/conf.py +17 -5
- examples/env/env_ant.py +1 -1
- examples/env/env_cartpole.py +1 -1
- examples/env/env_humanoid.py +1 -1
- examples/env/env_usd.py +4 -1
- examples/env/environment.py +8 -9
- examples/example_dem.py +34 -33
- examples/example_diffray.py +364 -337
- examples/example_fluid.py +32 -23
- examples/example_jacobian_ik.py +97 -93
- examples/example_marching_cubes.py +6 -16
- examples/example_mesh.py +6 -16
- examples/example_mesh_intersect.py +16 -14
- examples/example_nvdb.py +14 -16
- examples/example_raycast.py +14 -13
- examples/example_raymarch.py +16 -23
- examples/example_render_opengl.py +19 -10
- examples/example_sim_cartpole.py +82 -78
- examples/example_sim_cloth.py +45 -48
- examples/example_sim_fk_grad.py +51 -44
- examples/example_sim_fk_grad_torch.py +47 -40
- examples/example_sim_grad_bounce.py +108 -133
- examples/example_sim_grad_cloth.py +99 -113
- examples/example_sim_granular.py +5 -6
- examples/{example_sim_sdf_shape.py → example_sim_granular_collision_sdf.py} +37 -26
- examples/example_sim_neo_hookean.py +51 -55
- examples/example_sim_particle_chain.py +4 -4
- examples/example_sim_quadruped.py +126 -81
- examples/example_sim_rigid_chain.py +54 -61
- examples/example_sim_rigid_contact.py +66 -70
- examples/example_sim_rigid_fem.py +3 -3
- examples/example_sim_rigid_force.py +1 -1
- examples/example_sim_rigid_gyroscopic.py +3 -4
- examples/example_sim_rigid_kinematics.py +28 -39
- examples/example_sim_trajopt.py +112 -110
- examples/example_sph.py +9 -8
- examples/example_wave.py +7 -7
- examples/fem/bsr_utils.py +30 -17
- examples/fem/example_apic_fluid.py +85 -69
- examples/fem/example_convection_diffusion.py +97 -93
- examples/fem/example_convection_diffusion_dg.py +142 -149
- examples/fem/example_convection_diffusion_dg0.py +141 -136
- examples/fem/example_deformed_geometry.py +146 -0
- examples/fem/example_diffusion.py +115 -84
- examples/fem/example_diffusion_3d.py +116 -86
- examples/fem/example_diffusion_mgpu.py +102 -79
- examples/fem/example_mixed_elasticity.py +139 -100
- examples/fem/example_navier_stokes.py +175 -162
- examples/fem/example_stokes.py +143 -111
- examples/fem/example_stokes_transfer.py +186 -157
- examples/fem/mesh_utils.py +59 -97
- examples/fem/plot_utils.py +138 -17
- tools/ci/publishing/build_nodes_info.py +54 -0
- warp/__init__.py +4 -3
- warp/__init__.pyi +1 -0
- warp/bin/warp-clang.so +0 -0
- warp/bin/warp.so +0 -0
- warp/build.py +5 -3
- warp/build_dll.py +29 -9
- warp/builtins.py +836 -492
- warp/codegen.py +864 -553
- warp/config.py +3 -1
- warp/context.py +389 -172
- warp/fem/__init__.py +24 -6
- warp/fem/cache.py +318 -25
- warp/fem/dirichlet.py +7 -3
- warp/fem/domain.py +14 -0
- warp/fem/field/__init__.py +30 -38
- warp/fem/field/field.py +149 -0
- warp/fem/field/nodal_field.py +244 -138
- warp/fem/field/restriction.py +8 -6
- warp/fem/field/test.py +127 -59
- warp/fem/field/trial.py +117 -60
- warp/fem/geometry/__init__.py +5 -1
- warp/fem/geometry/deformed_geometry.py +271 -0
- warp/fem/geometry/element.py +24 -1
- warp/fem/geometry/geometry.py +86 -14
- warp/fem/geometry/grid_2d.py +112 -54
- warp/fem/geometry/grid_3d.py +134 -65
- warp/fem/geometry/hexmesh.py +953 -0
- warp/fem/geometry/partition.py +85 -33
- warp/fem/geometry/quadmesh_2d.py +532 -0
- warp/fem/geometry/tetmesh.py +451 -115
- warp/fem/geometry/trimesh_2d.py +197 -92
- warp/fem/integrate.py +534 -268
- warp/fem/operator.py +58 -31
- warp/fem/polynomial.py +11 -0
- warp/fem/quadrature/__init__.py +1 -1
- warp/fem/quadrature/pic_quadrature.py +150 -58
- warp/fem/quadrature/quadrature.py +209 -57
- warp/fem/space/__init__.py +230 -53
- warp/fem/space/basis_space.py +489 -0
- warp/fem/space/collocated_function_space.py +105 -0
- warp/fem/space/dof_mapper.py +49 -2
- warp/fem/space/function_space.py +90 -39
- warp/fem/space/grid_2d_function_space.py +149 -496
- warp/fem/space/grid_3d_function_space.py +173 -538
- warp/fem/space/hexmesh_function_space.py +352 -0
- warp/fem/space/partition.py +129 -76
- warp/fem/space/quadmesh_2d_function_space.py +369 -0
- warp/fem/space/restriction.py +46 -34
- warp/fem/space/shape/__init__.py +15 -0
- warp/fem/space/shape/cube_shape_function.py +738 -0
- warp/fem/space/shape/shape_function.py +103 -0
- warp/fem/space/shape/square_shape_function.py +611 -0
- warp/fem/space/shape/tet_shape_function.py +567 -0
- warp/fem/space/shape/triangle_shape_function.py +429 -0
- warp/fem/space/tetmesh_function_space.py +132 -1039
- warp/fem/space/topology.py +295 -0
- warp/fem/space/trimesh_2d_function_space.py +104 -742
- warp/fem/types.py +13 -11
- warp/fem/utils.py +335 -60
- warp/native/array.h +120 -34
- warp/native/builtin.h +101 -72
- warp/native/bvh.cpp +73 -325
- warp/native/bvh.cu +406 -23
- warp/native/bvh.h +22 -40
- warp/native/clang/clang.cpp +1 -0
- warp/native/crt.h +2 -0
- warp/native/cuda_util.cpp +8 -3
- warp/native/cuda_util.h +1 -0
- warp/native/exports.h +1522 -1243
- warp/native/intersect.h +19 -4
- warp/native/intersect_adj.h +8 -8
- warp/native/mat.h +76 -17
- warp/native/mesh.cpp +33 -108
- warp/native/mesh.cu +114 -18
- warp/native/mesh.h +395 -40
- warp/native/noise.h +272 -329
- warp/native/quat.h +51 -8
- warp/native/rand.h +44 -34
- warp/native/reduce.cpp +1 -1
- warp/native/sparse.cpp +4 -4
- warp/native/sparse.cu +163 -155
- warp/native/spatial.h +2 -2
- warp/native/temp_buffer.h +18 -14
- warp/native/vec.h +103 -21
- warp/native/warp.cpp +2 -1
- warp/native/warp.cu +28 -3
- warp/native/warp.h +4 -3
- warp/render/render_opengl.py +261 -109
- warp/sim/__init__.py +1 -2
- warp/sim/articulation.py +385 -185
- warp/sim/import_mjcf.py +59 -48
- warp/sim/import_urdf.py +15 -15
- warp/sim/import_usd.py +174 -102
- warp/sim/inertia.py +17 -18
- warp/sim/integrator_xpbd.py +4 -3
- warp/sim/model.py +330 -250
- warp/sim/render.py +1 -1
- warp/sparse.py +625 -152
- warp/stubs.py +341 -309
- warp/tape.py +9 -6
- warp/tests/__main__.py +3 -6
- warp/tests/assets/curlnoise_golden.npy +0 -0
- warp/tests/assets/pnoise_golden.npy +0 -0
- warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
- warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
- warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
- warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
- warp/tests/aux_test_unresolved_func.py +14 -0
- warp/tests/aux_test_unresolved_symbol.py +14 -0
- warp/tests/disabled_kinematics.py +239 -0
- warp/tests/run_coverage_serial.py +31 -0
- warp/tests/test_adam.py +103 -106
- warp/tests/test_arithmetic.py +94 -74
- warp/tests/test_array.py +82 -101
- warp/tests/test_array_reduce.py +57 -23
- warp/tests/test_atomic.py +64 -28
- warp/tests/test_bool.py +22 -12
- warp/tests/test_builtins_resolution.py +1292 -0
- warp/tests/test_bvh.py +18 -18
- warp/tests/test_closest_point_edge_edge.py +54 -57
- warp/tests/test_codegen.py +165 -134
- warp/tests/test_compile_consts.py +28 -20
- warp/tests/test_conditional.py +108 -24
- warp/tests/test_copy.py +10 -12
- warp/tests/test_ctypes.py +112 -88
- warp/tests/test_dense.py +21 -14
- warp/tests/test_devices.py +98 -0
- warp/tests/test_dlpack.py +75 -75
- warp/tests/test_examples.py +237 -0
- warp/tests/test_fabricarray.py +22 -24
- warp/tests/test_fast_math.py +15 -11
- warp/tests/test_fem.py +1034 -124
- warp/tests/test_fp16.py +23 -16
- warp/tests/test_func.py +187 -86
- warp/tests/test_generics.py +194 -49
- warp/tests/test_grad.py +123 -181
- warp/tests/test_grad_customs.py +176 -0
- warp/tests/test_hash_grid.py +35 -34
- warp/tests/test_import.py +10 -23
- warp/tests/test_indexedarray.py +24 -25
- warp/tests/test_intersect.py +18 -9
- warp/tests/test_large.py +141 -0
- warp/tests/test_launch.py +14 -41
- warp/tests/test_lerp.py +64 -65
- warp/tests/test_lvalue.py +493 -0
- warp/tests/test_marching_cubes.py +12 -13
- warp/tests/test_mat.py +517 -2898
- warp/tests/test_mat_lite.py +115 -0
- warp/tests/test_mat_scalar_ops.py +2889 -0
- warp/tests/test_math.py +103 -9
- warp/tests/test_matmul.py +304 -69
- warp/tests/test_matmul_lite.py +410 -0
- warp/tests/test_mesh.py +60 -22
- warp/tests/test_mesh_query_aabb.py +21 -25
- warp/tests/test_mesh_query_point.py +111 -22
- warp/tests/test_mesh_query_ray.py +12 -24
- warp/tests/test_mlp.py +30 -22
- warp/tests/test_model.py +92 -89
- warp/tests/test_modules_lite.py +39 -0
- warp/tests/test_multigpu.py +88 -114
- warp/tests/test_noise.py +12 -11
- warp/tests/test_operators.py +16 -20
- warp/tests/test_options.py +11 -11
- warp/tests/test_pinned.py +17 -18
- warp/tests/test_print.py +32 -11
- warp/tests/test_quat.py +275 -129
- warp/tests/test_rand.py +18 -16
- warp/tests/test_reload.py +38 -34
- warp/tests/test_rounding.py +50 -43
- warp/tests/test_runlength_encode.py +168 -20
- warp/tests/test_smoothstep.py +9 -11
- warp/tests/test_snippet.py +143 -0
- warp/tests/test_sparse.py +261 -63
- warp/tests/test_spatial.py +276 -243
- warp/tests/test_streams.py +110 -85
- warp/tests/test_struct.py +268 -63
- warp/tests/test_tape.py +39 -21
- warp/tests/test_torch.py +90 -86
- warp/tests/test_transient_module.py +10 -12
- warp/tests/test_types.py +363 -0
- warp/tests/test_utils.py +451 -0
- warp/tests/test_vec.py +354 -2050
- warp/tests/test_vec_lite.py +73 -0
- warp/tests/test_vec_scalar_ops.py +2099 -0
- warp/tests/test_volume.py +418 -376
- warp/tests/test_volume_write.py +124 -134
- warp/tests/unittest_serial.py +35 -0
- warp/tests/unittest_suites.py +291 -0
- warp/tests/unittest_utils.py +342 -0
- warp/tests/{test_misc.py → unused_test_misc.py} +13 -5
- warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
- warp/thirdparty/appdirs.py +36 -45
- warp/thirdparty/unittest_parallel.py +589 -0
- warp/types.py +622 -211
- warp/utils.py +54 -393
- warp_lang-1.0.0b6.dist-info/METADATA +238 -0
- warp_lang-1.0.0b6.dist-info/RECORD +409 -0
- {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/WHEEL +1 -1
- examples/example_cache_management.py +0 -40
- examples/example_multigpu.py +0 -54
- examples/example_struct.py +0 -65
- examples/fem/example_stokes_transfer_3d.py +0 -210
- warp/fem/field/discrete_field.py +0 -80
- warp/fem/space/nodal_function_space.py +0 -233
- warp/tests/test_all.py +0 -223
- warp/tests/test_array_scan.py +0 -60
- warp/tests/test_base.py +0 -208
- warp/tests/test_unresolved_func.py +0 -7
- warp/tests/test_unresolved_symbol.py +0 -7
- warp_lang-1.0.0b2.dist-info/METADATA +0 -26
- warp_lang-1.0.0b2.dist-info/RECORD +0 -378
- /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
- /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
- /warp/tests/{test_square.py → aux_test_square.py} +0 -0
- {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/LICENSE.md +0 -0
- {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/top_level.txt +0 -0
warp/tests/test_hash_grid.py
CHANGED
|
@@ -5,12 +5,12 @@
|
|
|
5
5
|
# distribution of this software and related documentation without an express
|
|
6
6
|
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
7
|
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
8
10
|
import numpy as np
|
|
9
11
|
|
|
10
12
|
import warp as wp
|
|
11
|
-
from warp.tests.
|
|
12
|
-
|
|
13
|
-
np.random.seed(532)
|
|
13
|
+
from warp.tests.unittest_utils import *
|
|
14
14
|
|
|
15
15
|
wp.init()
|
|
16
16
|
|
|
@@ -72,6 +72,9 @@ def count_neighbors_reference(
|
|
|
72
72
|
|
|
73
73
|
|
|
74
74
|
def test_hashgrid_query(test, device):
|
|
75
|
+
wp.load_module(device=device)
|
|
76
|
+
rng = np.random.default_rng(123)
|
|
77
|
+
|
|
75
78
|
grid = wp.HashGrid(dim_x, dim_y, dim_z, device)
|
|
76
79
|
|
|
77
80
|
for i in range(num_runs):
|
|
@@ -79,15 +82,14 @@ def test_hashgrid_query(test, device):
|
|
|
79
82
|
print(f"Run: {i+1}")
|
|
80
83
|
print("---------")
|
|
81
84
|
|
|
82
|
-
|
|
83
|
-
points = np.random.rand(num_points, 3) * scale - np.array((scale, scale, scale)) * 0.5
|
|
85
|
+
points = rng.random(size=(num_points, 3)) * scale - np.array((scale, scale, scale)) * 0.5
|
|
84
86
|
|
|
85
87
|
def particle_grid(dim_x, dim_y, dim_z, lower, radius, jitter):
|
|
86
88
|
points = np.meshgrid(
|
|
87
89
|
np.linspace(0, dim_x, dim_x), np.linspace(0, dim_y, dim_y), np.linspace(0, dim_z, dim_z)
|
|
88
90
|
)
|
|
89
91
|
points_t = np.array((points[0], points[1], points[2])).T * radius * 2.0 + np.array(lower)
|
|
90
|
-
points_t = points_t +
|
|
92
|
+
points_t = points_t + rng.random(size=points_t.shape) * radius * jitter
|
|
91
93
|
|
|
92
94
|
return points_t.reshape((-1, 3))
|
|
93
95
|
|
|
@@ -97,27 +99,28 @@ def test_hashgrid_query(test, device):
|
|
|
97
99
|
counts_arr = wp.zeros(len(points), dtype=int, device=device)
|
|
98
100
|
counts_arr_ref = wp.zeros(len(points), dtype=int, device=device)
|
|
99
101
|
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
102
|
+
profiler = {}
|
|
103
|
+
|
|
104
|
+
with wp.ScopedTimer("grid operations", print=print_enabled, dict=profiler, synchronize=True):
|
|
105
|
+
with wp.ScopedTimer("brute", print=print_enabled, dict=profiler, synchronize=True):
|
|
106
|
+
wp.launch(
|
|
107
|
+
kernel=count_neighbors_reference,
|
|
108
|
+
dim=len(points) * len(points),
|
|
109
|
+
inputs=[query_radius, points_arr, counts_arr_ref, len(points)],
|
|
110
|
+
device=device,
|
|
111
|
+
)
|
|
112
|
+
wp.synchronize()
|
|
113
|
+
|
|
114
|
+
with wp.ScopedTimer("grid build", print=print_enabled, dict=profiler, synchronize=True):
|
|
115
|
+
grid.build(points_arr, cell_radius)
|
|
116
|
+
|
|
117
|
+
with wp.ScopedTimer("grid query", print=print_enabled, dict=profiler, synchronize=True):
|
|
118
|
+
wp.launch(
|
|
119
|
+
kernel=count_neighbors,
|
|
120
|
+
dim=len(points),
|
|
121
|
+
inputs=[grid.id, query_radius, points_arr, counts_arr],
|
|
122
|
+
device=device,
|
|
123
|
+
)
|
|
121
124
|
|
|
122
125
|
counts = counts_arr.numpy()
|
|
123
126
|
counts_ref = counts_arr_ref.numpy()
|
|
@@ -131,17 +134,15 @@ def test_hashgrid_query(test, device):
|
|
|
131
134
|
test.assertTrue(np.array_equal(counts, counts_ref))
|
|
132
135
|
|
|
133
136
|
|
|
134
|
-
|
|
135
|
-
devices = get_test_devices()
|
|
137
|
+
devices = get_test_devices()
|
|
136
138
|
|
|
137
|
-
class TestHashGrid(parent):
|
|
138
|
-
pass
|
|
139
139
|
|
|
140
|
-
|
|
140
|
+
class TestHashGrid(unittest.TestCase):
|
|
141
|
+
pass
|
|
141
142
|
|
|
142
|
-
return TestHashGrid
|
|
143
143
|
|
|
144
|
+
add_function_test(TestHashGrid, "test_hashgrid_query", test_hashgrid_query, devices=devices)
|
|
144
145
|
|
|
145
146
|
if __name__ == "__main__":
|
|
146
|
-
|
|
147
|
+
wp.build.clear_kernel_cache()
|
|
147
148
|
unittest.main(verbosity=2, failfast=False)
|
warp/tests/test_import.py
CHANGED
|
@@ -5,20 +5,14 @@
|
|
|
5
5
|
# distribution of this software and related documentation without an express
|
|
6
6
|
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
7
|
|
|
8
|
-
|
|
9
|
-
import numpy as np
|
|
10
|
-
import math
|
|
8
|
+
import unittest
|
|
11
9
|
|
|
12
10
|
import warp as wp
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
import unittest
|
|
11
|
+
import warp.tests.test_func as test_func
|
|
12
|
+
from warp.tests.unittest_utils import *
|
|
16
13
|
|
|
17
14
|
wp.init()
|
|
18
15
|
|
|
19
|
-
# from test_func import sqr
|
|
20
|
-
import warp.tests.test_func as test_func
|
|
21
|
-
|
|
22
16
|
|
|
23
17
|
@wp.kernel
|
|
24
18
|
def test_import_func():
|
|
@@ -30,23 +24,16 @@ def test_import_func():
|
|
|
30
24
|
wp.expect_eq(y, 8.0)
|
|
31
25
|
|
|
32
26
|
|
|
33
|
-
|
|
34
|
-
devices = get_test_devices()
|
|
35
|
-
|
|
36
|
-
class TestImport(parent):
|
|
37
|
-
pass
|
|
27
|
+
devices = get_test_devices()
|
|
38
28
|
|
|
39
|
-
add_kernel_test(TestImport, kernel=test_import_func, name="test_import_func", dim=1, devices=devices)
|
|
40
29
|
|
|
41
|
-
|
|
30
|
+
class TestImport(unittest.TestCase):
|
|
31
|
+
pass
|
|
42
32
|
|
|
43
33
|
|
|
44
|
-
|
|
45
|
-
c = register(unittest.TestCase)
|
|
46
|
-
# unittest.main(verbosity=2)
|
|
34
|
+
add_kernel_test(TestImport, kernel=test_import_func, name="test_import_func", dim=1, devices=devices)
|
|
47
35
|
|
|
48
|
-
wp.force_load()
|
|
49
36
|
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
37
|
+
if __name__ == "__main__":
|
|
38
|
+
wp.build.clear_kernel_cache()
|
|
39
|
+
unittest.main(verbosity=2)
|
warp/tests/test_indexedarray.py
CHANGED
|
@@ -12,7 +12,7 @@ import numpy as np
|
|
|
12
12
|
|
|
13
13
|
import warp as wp
|
|
14
14
|
from warp.tests.test_array import FillStruct
|
|
15
|
-
from warp.tests.
|
|
15
|
+
from warp.tests.unittest_utils import *
|
|
16
16
|
|
|
17
17
|
wp.init()
|
|
18
18
|
|
|
@@ -36,7 +36,7 @@ def test_indexedarray_1d(test, device):
|
|
|
36
36
|
|
|
37
37
|
indices = wp.array([1, 3, 5, 7, 9], dtype=int, device=device)
|
|
38
38
|
|
|
39
|
-
iarr = wp.
|
|
39
|
+
iarr = wp.indexedarray1d(arr, [indices])
|
|
40
40
|
|
|
41
41
|
test.assertEqual(iarr.dtype, arr.dtype)
|
|
42
42
|
test.assertEqual(iarr.ndim, 1)
|
|
@@ -72,7 +72,7 @@ def test_indexedarray_2d(test, device):
|
|
|
72
72
|
indices0 = wp.array([1, 3], dtype=int, device=device)
|
|
73
73
|
indices1 = wp.array([2, 4, 8], dtype=int, device=device)
|
|
74
74
|
|
|
75
|
-
iarr = wp.
|
|
75
|
+
iarr = wp.indexedarray2d(arr, [indices0, indices1])
|
|
76
76
|
|
|
77
77
|
test.assertEqual(iarr.dtype, arr.dtype)
|
|
78
78
|
test.assertEqual(iarr.ndim, 2)
|
|
@@ -112,7 +112,7 @@ def test_indexedarray_3d(test, device):
|
|
|
112
112
|
indices1 = wp.array([2, 4, 8], dtype=int, device=device)
|
|
113
113
|
indices2 = wp.array([0, 5], dtype=int, device=device)
|
|
114
114
|
|
|
115
|
-
iarr = wp.
|
|
115
|
+
iarr = wp.indexedarray3d(arr, [indices0, indices1, indices2])
|
|
116
116
|
|
|
117
117
|
test.assertEqual(iarr.dtype, arr.dtype)
|
|
118
118
|
test.assertEqual(iarr.ndim, 3)
|
|
@@ -157,7 +157,7 @@ def test_indexedarray_4d(test, device):
|
|
|
157
157
|
indices2 = wp.array([0, 5], dtype=int, device=device)
|
|
158
158
|
indices3 = wp.array([6, 7, 9], dtype=int, device=device)
|
|
159
159
|
|
|
160
|
-
iarr = wp.
|
|
160
|
+
iarr = wp.indexedarray4d(arr, [indices0, indices1, indices2, indices3])
|
|
161
161
|
|
|
162
162
|
test.assertEqual(iarr.dtype, arr.dtype)
|
|
163
163
|
test.assertEqual(iarr.ndim, 4)
|
|
@@ -1106,30 +1106,29 @@ def test_indexedarray_fill_struct(test, device):
|
|
|
1106
1106
|
assert_np_equal(a4.numpy(), np.zeros(a4.shape, dtype=nptype))
|
|
1107
1107
|
|
|
1108
1108
|
|
|
1109
|
-
|
|
1110
|
-
devices = get_test_devices()
|
|
1109
|
+
devices = get_test_devices()
|
|
1111
1110
|
|
|
1112
|
-
class TestIndexedArray(parent):
|
|
1113
|
-
pass
|
|
1114
1111
|
|
|
1115
|
-
|
|
1116
|
-
|
|
1117
|
-
add_function_test(TestIndexedArray, "test_indexedarray_3d", test_indexedarray_3d, devices=devices)
|
|
1118
|
-
add_function_test(TestIndexedArray, "test_indexedarray_4d", test_indexedarray_4d, devices=devices)
|
|
1119
|
-
add_function_test(TestIndexedArray, "test_indexedarray_mixed", test_indexedarray_mixed, devices=devices)
|
|
1120
|
-
add_function_test(TestIndexedArray, "test_indexedarray_shape", test_indexedarray_shape, devices=devices)
|
|
1121
|
-
add_function_test(TestIndexedArray, "test_indexedarray_getitem", test_indexedarray_getitem, devices=devices)
|
|
1122
|
-
add_function_test(TestIndexedArray, "test_indexedarray_slicing", test_indexedarray_slicing, devices=devices)
|
|
1123
|
-
add_function_test(TestIndexedArray, "test_indexedarray_generics", test_indexedarray_generics, devices=devices)
|
|
1124
|
-
add_function_test(TestIndexedArray, "test_indexedarray_empty", test_indexedarray_empty, devices=devices)
|
|
1125
|
-
add_function_test(TestIndexedArray, "test_indexedarray_fill_scalar", test_indexedarray_fill_scalar, devices=devices)
|
|
1126
|
-
add_function_test(TestIndexedArray, "test_indexedarray_fill_vector", test_indexedarray_fill_vector, devices=devices)
|
|
1127
|
-
add_function_test(TestIndexedArray, "test_indexedarray_fill_matrix", test_indexedarray_fill_matrix, devices=devices)
|
|
1128
|
-
add_function_test(TestIndexedArray, "test_indexedarray_fill_struct", test_indexedarray_fill_struct, devices=devices)
|
|
1112
|
+
class TestIndexedArray(unittest.TestCase):
|
|
1113
|
+
pass
|
|
1129
1114
|
|
|
1130
|
-
|
|
1115
|
+
|
|
1116
|
+
add_function_test(TestIndexedArray, "test_indexedarray_1d", test_indexedarray_1d, devices=devices)
|
|
1117
|
+
add_function_test(TestIndexedArray, "test_indexedarray_2d", test_indexedarray_2d, devices=devices)
|
|
1118
|
+
add_function_test(TestIndexedArray, "test_indexedarray_3d", test_indexedarray_3d, devices=devices)
|
|
1119
|
+
add_function_test(TestIndexedArray, "test_indexedarray_4d", test_indexedarray_4d, devices=devices)
|
|
1120
|
+
add_function_test(TestIndexedArray, "test_indexedarray_mixed", test_indexedarray_mixed, devices=devices)
|
|
1121
|
+
add_function_test(TestIndexedArray, "test_indexedarray_shape", test_indexedarray_shape, devices=devices)
|
|
1122
|
+
add_function_test(TestIndexedArray, "test_indexedarray_getitem", test_indexedarray_getitem, devices=devices)
|
|
1123
|
+
add_function_test(TestIndexedArray, "test_indexedarray_slicing", test_indexedarray_slicing, devices=devices)
|
|
1124
|
+
add_function_test(TestIndexedArray, "test_indexedarray_generics", test_indexedarray_generics, devices=devices)
|
|
1125
|
+
add_function_test(TestIndexedArray, "test_indexedarray_empty", test_indexedarray_empty, devices=devices)
|
|
1126
|
+
add_function_test(TestIndexedArray, "test_indexedarray_fill_scalar", test_indexedarray_fill_scalar, devices=devices)
|
|
1127
|
+
add_function_test(TestIndexedArray, "test_indexedarray_fill_vector", test_indexedarray_fill_vector, devices=devices)
|
|
1128
|
+
add_function_test(TestIndexedArray, "test_indexedarray_fill_matrix", test_indexedarray_fill_matrix, devices=devices)
|
|
1129
|
+
add_function_test(TestIndexedArray, "test_indexedarray_fill_struct", test_indexedarray_fill_struct, devices=devices)
|
|
1131
1130
|
|
|
1132
1131
|
|
|
1133
1132
|
if __name__ == "__main__":
|
|
1134
|
-
|
|
1133
|
+
wp.build.clear_kernel_cache()
|
|
1135
1134
|
unittest.main(verbosity=2)
|
warp/tests/test_intersect.py
CHANGED
|
@@ -1,6 +1,16 @@
|
|
|
1
|
-
|
|
1
|
+
# Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
+
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
+
# and proprietary rights in and to this software, related documentation
|
|
4
|
+
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
+
# distribution of this software and related documentation without an express
|
|
6
|
+
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
+
|
|
8
|
+
import unittest
|
|
9
|
+
|
|
2
10
|
import numpy as np
|
|
3
|
-
|
|
11
|
+
|
|
12
|
+
import warp as wp
|
|
13
|
+
from warp.tests.unittest_utils import *
|
|
4
14
|
|
|
5
15
|
wp.init()
|
|
6
16
|
|
|
@@ -42,17 +52,16 @@ def test_intersect_tri(test, device):
|
|
|
42
52
|
assert_np_equal(result.numpy(), np.array([0]))
|
|
43
53
|
|
|
44
54
|
|
|
45
|
-
|
|
46
|
-
|
|
55
|
+
devices = get_test_devices()
|
|
56
|
+
|
|
47
57
|
|
|
48
|
-
|
|
49
|
-
|
|
58
|
+
class TestIntersect(unittest.TestCase):
|
|
59
|
+
pass
|
|
50
60
|
|
|
51
|
-
add_function_test(TestIntersect, "test_intersect_tri", test_intersect_tri, devices=devices)
|
|
52
61
|
|
|
53
|
-
|
|
62
|
+
add_function_test(TestIntersect, "test_intersect_tri", test_intersect_tri, devices=devices)
|
|
54
63
|
|
|
55
64
|
|
|
56
65
|
if __name__ == "__main__":
|
|
57
|
-
|
|
66
|
+
wp.build.clear_kernel_cache()
|
|
58
67
|
unittest.main(verbosity=2, failfast=False)
|
warp/tests/test_large.py
ADDED
|
@@ -0,0 +1,141 @@
|
|
|
1
|
+
# Copyright (c) 2023 NVIDIA CORPORATION. All rights reserved.
|
|
2
|
+
# NVIDIA CORPORATION and its licensors retain all intellectual property
|
|
3
|
+
# and proprietary rights in and to this software, related documentation
|
|
4
|
+
# and any modifications thereto. Any use, reproduction, disclosure or
|
|
5
|
+
# distribution of this software and related documentation without an express
|
|
6
|
+
# license agreement from NVIDIA CORPORATION is strictly prohibited.
|
|
7
|
+
|
|
8
|
+
import math
|
|
9
|
+
import unittest
|
|
10
|
+
|
|
11
|
+
import warp as wp
|
|
12
|
+
from warp.tests.unittest_utils import *
|
|
13
|
+
|
|
14
|
+
wp.init()
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
@wp.kernel
|
|
18
|
+
def conditional_sum(result: wp.array(dtype=wp.uint64)):
|
|
19
|
+
i, j, k = wp.tid()
|
|
20
|
+
|
|
21
|
+
if i == 0:
|
|
22
|
+
wp.atomic_add(result, 0, wp.uint64(1))
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def test_large_launch_large_kernel(test, device):
|
|
26
|
+
"""Test tid() on kernel launch of 2**33 threads.
|
|
27
|
+
|
|
28
|
+
The function conditional sum will add 1 to result for every thread that has an i index of 0.
|
|
29
|
+
Due to the size of the grid, this test is not run on CPUs
|
|
30
|
+
"""
|
|
31
|
+
test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
|
|
32
|
+
|
|
33
|
+
large_dim_length = 2**16
|
|
34
|
+
half_result = large_dim_length * large_dim_length
|
|
35
|
+
|
|
36
|
+
wp.launch(kernel=conditional_sum, dim=[2, large_dim_length, large_dim_length], inputs=[test_result], device=device)
|
|
37
|
+
test.assertEqual(test_result.numpy()[0], half_result)
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
@wp.kernel
|
|
41
|
+
def count_elements(result: wp.array(dtype=wp.uint64)):
|
|
42
|
+
wp.atomic_add(result, 0, wp.uint64(1))
|
|
43
|
+
|
|
44
|
+
|
|
45
|
+
def test_large_launch_max_blocks(test, device):
|
|
46
|
+
# Loop over 1000x1x1 elements using a grid of 256 threads
|
|
47
|
+
test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
|
|
48
|
+
wp.launch(count_elements, (1000,), inputs=[test_result], max_blocks=1, device=device)
|
|
49
|
+
test.assertEqual(test_result.numpy()[0], 1000)
|
|
50
|
+
|
|
51
|
+
# Loop over 2x10x10 elements using a grid of 256 threads, using the tid() index to count half the elements
|
|
52
|
+
test_result.zero_()
|
|
53
|
+
wp.launch(
|
|
54
|
+
conditional_sum,
|
|
55
|
+
(
|
|
56
|
+
2,
|
|
57
|
+
50,
|
|
58
|
+
10,
|
|
59
|
+
),
|
|
60
|
+
inputs=[test_result],
|
|
61
|
+
max_blocks=1,
|
|
62
|
+
device=device,
|
|
63
|
+
)
|
|
64
|
+
test.assertEqual(test_result.numpy()[0], 500)
|
|
65
|
+
|
|
66
|
+
|
|
67
|
+
def test_large_launch_very_large_kernel(test, device):
|
|
68
|
+
"""Due to the size of the grid, this test is not run on CPUs"""
|
|
69
|
+
|
|
70
|
+
# Dim is chosen to be larger than the maximum CUDA one-dimensional grid size (total threads)
|
|
71
|
+
dim = (2**31 - 1) * 256 + 1
|
|
72
|
+
test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
|
|
73
|
+
wp.launch(count_elements, (dim,), inputs=[test_result], device=device)
|
|
74
|
+
test.assertEqual(test_result.numpy()[0], dim)
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
def test_large_arrays_slow(test, device):
|
|
78
|
+
# The goal of this test is to use arrays just large enough to know
|
|
79
|
+
# if there's a flaw in handling arrays with more than 2**31-1 elements
|
|
80
|
+
# Unfortunately, it takes a long time to run so it won't be run automatically
|
|
81
|
+
# without changes to support how frequently a test may be run
|
|
82
|
+
total_elements = 2**31 + 8
|
|
83
|
+
|
|
84
|
+
# 1-D to 4-D arrays: test zero_, fill_, then zero_ for scalar data types:
|
|
85
|
+
for total_dims in range(1, 5):
|
|
86
|
+
dim_x = math.ceil(total_elements ** (1 / total_dims))
|
|
87
|
+
shape_tuple = tuple([dim_x] * total_dims)
|
|
88
|
+
|
|
89
|
+
for nptype, wptype in wp.types.np_dtype_to_warp_type.items():
|
|
90
|
+
a1 = wp.zeros(shape_tuple, dtype=wptype, device=device)
|
|
91
|
+
assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
|
|
92
|
+
|
|
93
|
+
a1.fill_(127)
|
|
94
|
+
assert_np_equal(a1.numpy(), 127 * np.ones_like(a1.numpy()))
|
|
95
|
+
|
|
96
|
+
a1.zero_()
|
|
97
|
+
assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
|
|
98
|
+
|
|
99
|
+
|
|
100
|
+
def test_large_arrays_fast(test, device):
|
|
101
|
+
# A truncated version of test_large_arrays_slow meant to catch basic errors
|
|
102
|
+
total_elements = 2**31 + 8
|
|
103
|
+
|
|
104
|
+
nptype = np.dtype(np.int8)
|
|
105
|
+
wptype = wp.types.np_dtype_to_warp_type[nptype]
|
|
106
|
+
|
|
107
|
+
a1 = wp.zeros((total_elements,), dtype=wptype, device=device)
|
|
108
|
+
assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
|
|
109
|
+
|
|
110
|
+
a1.fill_(127)
|
|
111
|
+
assert_np_equal(a1.numpy(), 127 * np.ones_like(a1.numpy()))
|
|
112
|
+
|
|
113
|
+
a1.zero_()
|
|
114
|
+
assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
|
|
115
|
+
|
|
116
|
+
|
|
117
|
+
devices = get_test_devices()
|
|
118
|
+
|
|
119
|
+
|
|
120
|
+
class TestLarge(unittest.TestCase):
|
|
121
|
+
pass
|
|
122
|
+
|
|
123
|
+
|
|
124
|
+
add_function_test(
|
|
125
|
+
TestLarge, "test_large_launch_large_kernel", test_large_launch_large_kernel, devices=get_unique_cuda_test_devices()
|
|
126
|
+
)
|
|
127
|
+
|
|
128
|
+
add_function_test(TestLarge, "test_large_launch_max_blocks", test_large_launch_max_blocks, devices=devices)
|
|
129
|
+
add_function_test(
|
|
130
|
+
TestLarge,
|
|
131
|
+
"test_large_launch_very_large_kernel",
|
|
132
|
+
test_large_launch_very_large_kernel,
|
|
133
|
+
devices=get_unique_cuda_test_devices(),
|
|
134
|
+
)
|
|
135
|
+
|
|
136
|
+
add_function_test(TestLarge, "test_large_arrays_fast", test_large_arrays_fast, devices=devices)
|
|
137
|
+
|
|
138
|
+
|
|
139
|
+
if __name__ == "__main__":
|
|
140
|
+
wp.build.clear_kernel_cache()
|
|
141
|
+
unittest.main(verbosity=2)
|
warp/tests/test_launch.py
CHANGED
|
@@ -7,11 +7,10 @@
|
|
|
7
7
|
|
|
8
8
|
import unittest
|
|
9
9
|
|
|
10
|
-
# include parent path
|
|
11
10
|
import numpy as np
|
|
12
11
|
|
|
13
12
|
import warp as wp
|
|
14
|
-
from warp.tests.
|
|
13
|
+
from warp.tests.unittest_utils import *
|
|
15
14
|
|
|
16
15
|
wp.init()
|
|
17
16
|
|
|
@@ -306,51 +305,25 @@ def test_launch_tuple_args(test, device):
|
|
|
306
305
|
assert_np_equal(out.numpy(), np.array((0, 3, 6, 9)))
|
|
307
306
|
|
|
308
307
|
|
|
309
|
-
|
|
310
|
-
def conditional_sum(result: wp.array(dtype=wp.uint64)):
|
|
311
|
-
i, j, k = wp.tid()
|
|
312
|
-
|
|
313
|
-
if i == 0:
|
|
314
|
-
wp.atomic_add(result, 0, wp.uint64(1))
|
|
315
|
-
|
|
316
|
-
|
|
317
|
-
def test_launch_large_kernel(test, device):
|
|
318
|
-
"""Test tid() on kernel launch of 2**33 threads.
|
|
319
|
-
|
|
320
|
-
The function conditional sum will add 1 to result for every thread that has an i index of 0.
|
|
321
|
-
Due to the size of the grid, this test is not run on CPUs
|
|
322
|
-
"""
|
|
323
|
-
test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
|
|
324
|
-
|
|
325
|
-
large_dim_length = 2**16
|
|
326
|
-
half_result = large_dim_length * large_dim_length
|
|
327
|
-
|
|
328
|
-
wp.launch(kernel=conditional_sum, dim=[2, large_dim_length, large_dim_length], inputs=[test_result], device=device)
|
|
329
|
-
test.assertEqual(test_result.numpy()[0], half_result)
|
|
330
|
-
|
|
331
|
-
|
|
332
|
-
def register(parent):
|
|
333
|
-
devices = get_test_devices()
|
|
308
|
+
devices = get_test_devices()
|
|
334
309
|
|
|
335
|
-
class TestLaunch(parent):
|
|
336
|
-
pass
|
|
337
310
|
|
|
338
|
-
|
|
339
|
-
|
|
340
|
-
add_function_test(TestLaunch, "test_launch_3d", test3d, devices=devices)
|
|
341
|
-
add_function_test(TestLaunch, "test_launch_4d", test4d, devices=devices)
|
|
311
|
+
class TestLaunch(unittest.TestCase):
|
|
312
|
+
pass
|
|
342
313
|
|
|
343
|
-
add_function_test(TestLaunch, "test_launch_cmd", test_launch_cmd, devices=devices)
|
|
344
|
-
add_function_test(TestLaunch, "test_launch_cmd_set_param", test_launch_cmd_set_param, devices=devices)
|
|
345
|
-
add_function_test(TestLaunch, "test_launch_cmd_set_ctype", test_launch_cmd_set_ctype, devices=devices)
|
|
346
|
-
add_function_test(TestLaunch, "test_launch_cmd_set_dim", test_launch_cmd_set_dim, devices=devices)
|
|
347
|
-
add_function_test(TestLaunch, "test_launch_cmd_empty", test_launch_cmd_empty, devices=devices)
|
|
348
314
|
|
|
349
|
-
|
|
315
|
+
add_function_test(TestLaunch, "test_launch_1d", test1d, devices=devices)
|
|
316
|
+
add_function_test(TestLaunch, "test_launch_2d", test2d, devices=devices)
|
|
317
|
+
add_function_test(TestLaunch, "test_launch_3d", test3d, devices=devices)
|
|
318
|
+
add_function_test(TestLaunch, "test_launch_4d", test4d, devices=devices)
|
|
350
319
|
|
|
351
|
-
|
|
320
|
+
add_function_test(TestLaunch, "test_launch_cmd", test_launch_cmd, devices=devices)
|
|
321
|
+
add_function_test(TestLaunch, "test_launch_cmd_set_param", test_launch_cmd_set_param, devices=devices)
|
|
322
|
+
add_function_test(TestLaunch, "test_launch_cmd_set_ctype", test_launch_cmd_set_ctype, devices=devices)
|
|
323
|
+
add_function_test(TestLaunch, "test_launch_cmd_set_dim", test_launch_cmd_set_dim, devices=devices)
|
|
324
|
+
add_function_test(TestLaunch, "test_launch_cmd_empty", test_launch_cmd_empty, devices=devices)
|
|
352
325
|
|
|
353
326
|
|
|
354
327
|
if __name__ == "__main__":
|
|
355
|
-
|
|
328
|
+
wp.build.clear_kernel_cache()
|
|
356
329
|
unittest.main(verbosity=2)
|