warp-lang 1.0.0b2__py3-none-win_amd64.whl → 1.0.0b6__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (271) hide show
  1. docs/conf.py +17 -5
  2. examples/env/env_ant.py +1 -1
  3. examples/env/env_cartpole.py +1 -1
  4. examples/env/env_humanoid.py +1 -1
  5. examples/env/env_usd.py +4 -1
  6. examples/env/environment.py +8 -9
  7. examples/example_dem.py +34 -33
  8. examples/example_diffray.py +364 -337
  9. examples/example_fluid.py +32 -23
  10. examples/example_jacobian_ik.py +97 -93
  11. examples/example_marching_cubes.py +6 -16
  12. examples/example_mesh.py +6 -16
  13. examples/example_mesh_intersect.py +16 -14
  14. examples/example_nvdb.py +14 -16
  15. examples/example_raycast.py +14 -13
  16. examples/example_raymarch.py +16 -23
  17. examples/example_render_opengl.py +19 -10
  18. examples/example_sim_cartpole.py +82 -78
  19. examples/example_sim_cloth.py +45 -48
  20. examples/example_sim_fk_grad.py +51 -44
  21. examples/example_sim_fk_grad_torch.py +47 -40
  22. examples/example_sim_grad_bounce.py +108 -133
  23. examples/example_sim_grad_cloth.py +99 -113
  24. examples/example_sim_granular.py +5 -6
  25. examples/{example_sim_sdf_shape.py → example_sim_granular_collision_sdf.py} +37 -26
  26. examples/example_sim_neo_hookean.py +51 -55
  27. examples/example_sim_particle_chain.py +4 -4
  28. examples/example_sim_quadruped.py +126 -81
  29. examples/example_sim_rigid_chain.py +54 -61
  30. examples/example_sim_rigid_contact.py +66 -70
  31. examples/example_sim_rigid_fem.py +3 -3
  32. examples/example_sim_rigid_force.py +1 -1
  33. examples/example_sim_rigid_gyroscopic.py +3 -4
  34. examples/example_sim_rigid_kinematics.py +28 -39
  35. examples/example_sim_trajopt.py +112 -110
  36. examples/example_sph.py +9 -8
  37. examples/example_wave.py +7 -7
  38. examples/fem/bsr_utils.py +30 -17
  39. examples/fem/example_apic_fluid.py +85 -69
  40. examples/fem/example_convection_diffusion.py +97 -93
  41. examples/fem/example_convection_diffusion_dg.py +142 -149
  42. examples/fem/example_convection_diffusion_dg0.py +141 -136
  43. examples/fem/example_deformed_geometry.py +146 -0
  44. examples/fem/example_diffusion.py +115 -84
  45. examples/fem/example_diffusion_3d.py +116 -86
  46. examples/fem/example_diffusion_mgpu.py +102 -79
  47. examples/fem/example_mixed_elasticity.py +139 -100
  48. examples/fem/example_navier_stokes.py +175 -162
  49. examples/fem/example_stokes.py +143 -111
  50. examples/fem/example_stokes_transfer.py +186 -157
  51. examples/fem/mesh_utils.py +59 -97
  52. examples/fem/plot_utils.py +138 -17
  53. tools/ci/publishing/build_nodes_info.py +54 -0
  54. warp/__init__.py +4 -3
  55. warp/__init__.pyi +1 -0
  56. warp/bin/warp-clang.dll +0 -0
  57. warp/bin/warp.dll +0 -0
  58. warp/build.py +5 -3
  59. warp/build_dll.py +29 -9
  60. warp/builtins.py +836 -492
  61. warp/codegen.py +864 -553
  62. warp/config.py +3 -1
  63. warp/context.py +389 -172
  64. warp/fem/__init__.py +24 -6
  65. warp/fem/cache.py +318 -25
  66. warp/fem/dirichlet.py +7 -3
  67. warp/fem/domain.py +14 -0
  68. warp/fem/field/__init__.py +30 -38
  69. warp/fem/field/field.py +149 -0
  70. warp/fem/field/nodal_field.py +244 -138
  71. warp/fem/field/restriction.py +8 -6
  72. warp/fem/field/test.py +127 -59
  73. warp/fem/field/trial.py +117 -60
  74. warp/fem/geometry/__init__.py +5 -1
  75. warp/fem/geometry/deformed_geometry.py +271 -0
  76. warp/fem/geometry/element.py +24 -1
  77. warp/fem/geometry/geometry.py +86 -14
  78. warp/fem/geometry/grid_2d.py +112 -54
  79. warp/fem/geometry/grid_3d.py +134 -65
  80. warp/fem/geometry/hexmesh.py +953 -0
  81. warp/fem/geometry/partition.py +85 -33
  82. warp/fem/geometry/quadmesh_2d.py +532 -0
  83. warp/fem/geometry/tetmesh.py +451 -115
  84. warp/fem/geometry/trimesh_2d.py +197 -92
  85. warp/fem/integrate.py +534 -268
  86. warp/fem/operator.py +58 -31
  87. warp/fem/polynomial.py +11 -0
  88. warp/fem/quadrature/__init__.py +1 -1
  89. warp/fem/quadrature/pic_quadrature.py +150 -58
  90. warp/fem/quadrature/quadrature.py +209 -57
  91. warp/fem/space/__init__.py +230 -53
  92. warp/fem/space/basis_space.py +489 -0
  93. warp/fem/space/collocated_function_space.py +105 -0
  94. warp/fem/space/dof_mapper.py +49 -2
  95. warp/fem/space/function_space.py +90 -39
  96. warp/fem/space/grid_2d_function_space.py +149 -496
  97. warp/fem/space/grid_3d_function_space.py +173 -538
  98. warp/fem/space/hexmesh_function_space.py +352 -0
  99. warp/fem/space/partition.py +129 -76
  100. warp/fem/space/quadmesh_2d_function_space.py +369 -0
  101. warp/fem/space/restriction.py +46 -34
  102. warp/fem/space/shape/__init__.py +15 -0
  103. warp/fem/space/shape/cube_shape_function.py +738 -0
  104. warp/fem/space/shape/shape_function.py +103 -0
  105. warp/fem/space/shape/square_shape_function.py +611 -0
  106. warp/fem/space/shape/tet_shape_function.py +567 -0
  107. warp/fem/space/shape/triangle_shape_function.py +429 -0
  108. warp/fem/space/tetmesh_function_space.py +132 -1039
  109. warp/fem/space/topology.py +295 -0
  110. warp/fem/space/trimesh_2d_function_space.py +104 -742
  111. warp/fem/types.py +13 -11
  112. warp/fem/utils.py +335 -60
  113. warp/native/array.h +120 -34
  114. warp/native/builtin.h +101 -72
  115. warp/native/bvh.cpp +73 -325
  116. warp/native/bvh.cu +406 -23
  117. warp/native/bvh.h +22 -40
  118. warp/native/clang/clang.cpp +1 -0
  119. warp/native/crt.h +2 -0
  120. warp/native/cuda_util.cpp +8 -3
  121. warp/native/cuda_util.h +1 -0
  122. warp/native/exports.h +1522 -1243
  123. warp/native/intersect.h +19 -4
  124. warp/native/intersect_adj.h +8 -8
  125. warp/native/mat.h +76 -17
  126. warp/native/mesh.cpp +33 -108
  127. warp/native/mesh.cu +114 -18
  128. warp/native/mesh.h +395 -40
  129. warp/native/noise.h +272 -329
  130. warp/native/quat.h +51 -8
  131. warp/native/rand.h +44 -34
  132. warp/native/reduce.cpp +1 -1
  133. warp/native/sparse.cpp +4 -4
  134. warp/native/sparse.cu +163 -155
  135. warp/native/spatial.h +2 -2
  136. warp/native/temp_buffer.h +18 -14
  137. warp/native/vec.h +103 -21
  138. warp/native/warp.cpp +2 -1
  139. warp/native/warp.cu +28 -3
  140. warp/native/warp.h +4 -3
  141. warp/render/render_opengl.py +261 -109
  142. warp/sim/__init__.py +1 -2
  143. warp/sim/articulation.py +385 -185
  144. warp/sim/import_mjcf.py +59 -48
  145. warp/sim/import_urdf.py +15 -15
  146. warp/sim/import_usd.py +174 -102
  147. warp/sim/inertia.py +17 -18
  148. warp/sim/integrator_xpbd.py +4 -3
  149. warp/sim/model.py +330 -250
  150. warp/sim/render.py +1 -1
  151. warp/sparse.py +625 -152
  152. warp/stubs.py +341 -309
  153. warp/tape.py +9 -6
  154. warp/tests/__main__.py +3 -6
  155. warp/tests/assets/curlnoise_golden.npy +0 -0
  156. warp/tests/assets/pnoise_golden.npy +0 -0
  157. warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
  158. warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
  159. warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
  160. warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
  161. warp/tests/aux_test_unresolved_func.py +14 -0
  162. warp/tests/aux_test_unresolved_symbol.py +14 -0
  163. warp/tests/disabled_kinematics.py +239 -0
  164. warp/tests/run_coverage_serial.py +31 -0
  165. warp/tests/test_adam.py +103 -106
  166. warp/tests/test_arithmetic.py +94 -74
  167. warp/tests/test_array.py +82 -101
  168. warp/tests/test_array_reduce.py +57 -23
  169. warp/tests/test_atomic.py +64 -28
  170. warp/tests/test_bool.py +22 -12
  171. warp/tests/test_builtins_resolution.py +1292 -0
  172. warp/tests/test_bvh.py +18 -18
  173. warp/tests/test_closest_point_edge_edge.py +54 -57
  174. warp/tests/test_codegen.py +165 -134
  175. warp/tests/test_compile_consts.py +28 -20
  176. warp/tests/test_conditional.py +108 -24
  177. warp/tests/test_copy.py +10 -12
  178. warp/tests/test_ctypes.py +112 -88
  179. warp/tests/test_dense.py +21 -14
  180. warp/tests/test_devices.py +98 -0
  181. warp/tests/test_dlpack.py +75 -75
  182. warp/tests/test_examples.py +237 -0
  183. warp/tests/test_fabricarray.py +22 -24
  184. warp/tests/test_fast_math.py +15 -11
  185. warp/tests/test_fem.py +1034 -124
  186. warp/tests/test_fp16.py +23 -16
  187. warp/tests/test_func.py +187 -86
  188. warp/tests/test_generics.py +194 -49
  189. warp/tests/test_grad.py +123 -181
  190. warp/tests/test_grad_customs.py +176 -0
  191. warp/tests/test_hash_grid.py +35 -34
  192. warp/tests/test_import.py +10 -23
  193. warp/tests/test_indexedarray.py +24 -25
  194. warp/tests/test_intersect.py +18 -9
  195. warp/tests/test_large.py +141 -0
  196. warp/tests/test_launch.py +14 -41
  197. warp/tests/test_lerp.py +64 -65
  198. warp/tests/test_lvalue.py +493 -0
  199. warp/tests/test_marching_cubes.py +12 -13
  200. warp/tests/test_mat.py +517 -2898
  201. warp/tests/test_mat_lite.py +115 -0
  202. warp/tests/test_mat_scalar_ops.py +2889 -0
  203. warp/tests/test_math.py +103 -9
  204. warp/tests/test_matmul.py +304 -69
  205. warp/tests/test_matmul_lite.py +410 -0
  206. warp/tests/test_mesh.py +60 -22
  207. warp/tests/test_mesh_query_aabb.py +21 -25
  208. warp/tests/test_mesh_query_point.py +111 -22
  209. warp/tests/test_mesh_query_ray.py +12 -24
  210. warp/tests/test_mlp.py +30 -22
  211. warp/tests/test_model.py +92 -89
  212. warp/tests/test_modules_lite.py +39 -0
  213. warp/tests/test_multigpu.py +88 -114
  214. warp/tests/test_noise.py +12 -11
  215. warp/tests/test_operators.py +16 -20
  216. warp/tests/test_options.py +11 -11
  217. warp/tests/test_pinned.py +17 -18
  218. warp/tests/test_print.py +32 -11
  219. warp/tests/test_quat.py +275 -129
  220. warp/tests/test_rand.py +18 -16
  221. warp/tests/test_reload.py +38 -34
  222. warp/tests/test_rounding.py +50 -43
  223. warp/tests/test_runlength_encode.py +168 -20
  224. warp/tests/test_smoothstep.py +9 -11
  225. warp/tests/test_snippet.py +143 -0
  226. warp/tests/test_sparse.py +261 -63
  227. warp/tests/test_spatial.py +276 -243
  228. warp/tests/test_streams.py +110 -85
  229. warp/tests/test_struct.py +268 -63
  230. warp/tests/test_tape.py +39 -21
  231. warp/tests/test_torch.py +90 -86
  232. warp/tests/test_transient_module.py +10 -12
  233. warp/tests/test_types.py +363 -0
  234. warp/tests/test_utils.py +451 -0
  235. warp/tests/test_vec.py +354 -2050
  236. warp/tests/test_vec_lite.py +73 -0
  237. warp/tests/test_vec_scalar_ops.py +2099 -0
  238. warp/tests/test_volume.py +418 -376
  239. warp/tests/test_volume_write.py +124 -134
  240. warp/tests/unittest_serial.py +35 -0
  241. warp/tests/unittest_suites.py +291 -0
  242. warp/tests/unittest_utils.py +342 -0
  243. warp/tests/{test_misc.py → unused_test_misc.py} +13 -5
  244. warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
  245. warp/thirdparty/appdirs.py +36 -45
  246. warp/thirdparty/unittest_parallel.py +589 -0
  247. warp/types.py +622 -211
  248. warp/utils.py +54 -393
  249. warp_lang-1.0.0b6.dist-info/METADATA +238 -0
  250. warp_lang-1.0.0b6.dist-info/RECORD +409 -0
  251. {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/WHEEL +1 -1
  252. examples/example_cache_management.py +0 -40
  253. examples/example_multigpu.py +0 -54
  254. examples/example_struct.py +0 -65
  255. examples/fem/example_stokes_transfer_3d.py +0 -210
  256. warp/bin/warp-clang.so +0 -0
  257. warp/bin/warp.so +0 -0
  258. warp/fem/field/discrete_field.py +0 -80
  259. warp/fem/space/nodal_function_space.py +0 -233
  260. warp/tests/test_all.py +0 -223
  261. warp/tests/test_array_scan.py +0 -60
  262. warp/tests/test_base.py +0 -208
  263. warp/tests/test_unresolved_func.py +0 -7
  264. warp/tests/test_unresolved_symbol.py +0 -7
  265. warp_lang-1.0.0b2.dist-info/METADATA +0 -26
  266. warp_lang-1.0.0b2.dist-info/RECORD +0 -380
  267. /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
  268. /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
  269. /warp/tests/{test_square.py → aux_test_square.py} +0 -0
  270. {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/LICENSE.md +0 -0
  271. {warp_lang-1.0.0b2.dist-info → warp_lang-1.0.0b6.dist-info}/top_level.txt +0 -0
warp/tests/test_hash_grid.py CHANGED
@@ -5,12 +5,12 @@
5
5
  # distribution of this software and related documentation without an express
6
6
  # license agreement from NVIDIA CORPORATION is strictly prohibited.
7
7
 
8
+ import unittest
9
+
8
10
  import numpy as np
9
11
 
10
12
  import warp as wp
11
- from warp.tests.test_base import *
12
-
13
- np.random.seed(532)
13
+ from warp.tests.unittest_utils import *
14
14
 
15
15
  wp.init()
16
16
 
@@ -72,6 +72,9 @@ def count_neighbors_reference(
72
72
 
73
73
 
74
74
  def test_hashgrid_query(test, device):
75
+ wp.load_module(device=device)
76
+ rng = np.random.default_rng(123)
77
+
75
78
  grid = wp.HashGrid(dim_x, dim_y, dim_z, device)
76
79
 
77
80
  for i in range(num_runs):
@@ -79,15 +82,14 @@ def test_hashgrid_query(test, device):
79
82
  print(f"Run: {i+1}")
80
83
  print("---------")
81
84
 
82
- np.random.seed(532)
83
- points = np.random.rand(num_points, 3) * scale - np.array((scale, scale, scale)) * 0.5
85
+ points = rng.random(size=(num_points, 3)) * scale - np.array((scale, scale, scale)) * 0.5
84
86
 
85
87
  def particle_grid(dim_x, dim_y, dim_z, lower, radius, jitter):
86
88
  points = np.meshgrid(
87
89
  np.linspace(0, dim_x, dim_x), np.linspace(0, dim_y, dim_y), np.linspace(0, dim_z, dim_z)
88
90
  )
89
91
  points_t = np.array((points[0], points[1], points[2])).T * radius * 2.0 + np.array(lower)
90
- points_t = points_t + np.random.rand(*points_t.shape) * radius * jitter
92
+ points_t = points_t + rng.random(size=points_t.shape) * radius * jitter
91
93
 
92
94
  return points_t.reshape((-1, 3))
93
95
 
@@ -97,27 +99,28 @@ def test_hashgrid_query(test, device):
97
99
  counts_arr = wp.zeros(len(points), dtype=int, device=device)
98
100
  counts_arr_ref = wp.zeros(len(points), dtype=int, device=device)
99
101
 
100
- with wp.ScopedTimer("brute", active=print_enabled):
101
- wp.launch(
102
- kernel=count_neighbors_reference,
103
- dim=len(points) * len(points),
104
- inputs=[query_radius, points_arr, counts_arr_ref, len(points)],
105
- device=device,
106
- )
107
- wp.synchronize()
108
-
109
- with wp.ScopedTimer("grid build", active=print_enabled):
110
- grid.build(points_arr, cell_radius)
111
- wp.synchronize()
112
-
113
- with wp.ScopedTimer("grid query", active=print_enabled):
114
- wp.launch(
115
- kernel=count_neighbors,
116
- dim=len(points),
117
- inputs=[grid.id, query_radius, points_arr, counts_arr],
118
- device=device,
119
- )
120
- wp.synchronize()
102
+ profiler = {}
103
+
104
+ with wp.ScopedTimer("grid operations", print=print_enabled, dict=profiler, synchronize=True):
105
+ with wp.ScopedTimer("brute", print=print_enabled, dict=profiler, synchronize=True):
106
+ wp.launch(
107
+ kernel=count_neighbors_reference,
108
+ dim=len(points) * len(points),
109
+ inputs=[query_radius, points_arr, counts_arr_ref, len(points)],
110
+ device=device,
111
+ )
112
+ wp.synchronize()
113
+
114
+ with wp.ScopedTimer("grid build", print=print_enabled, dict=profiler, synchronize=True):
115
+ grid.build(points_arr, cell_radius)
116
+
117
+ with wp.ScopedTimer("grid query", print=print_enabled, dict=profiler, synchronize=True):
118
+ wp.launch(
119
+ kernel=count_neighbors,
120
+ dim=len(points),
121
+ inputs=[grid.id, query_radius, points_arr, counts_arr],
122
+ device=device,
123
+ )
121
124
 
122
125
  counts = counts_arr.numpy()
123
126
  counts_ref = counts_arr_ref.numpy()
@@ -131,17 +134,15 @@ def test_hashgrid_query(test, device):
131
134
  test.assertTrue(np.array_equal(counts, counts_ref))
132
135
 
133
136
 
134
- def register(parent):
135
- devices = get_test_devices()
137
+ devices = get_test_devices()
136
138
 
137
- class TestHashGrid(parent):
138
- pass
139
139
 
140
- add_function_test(TestHashGrid, "test_hashgrid_query", test_hashgrid_query, devices=devices)
140
+ class TestHashGrid(unittest.TestCase):
141
+ pass
141
142
 
142
- return TestHashGrid
143
143
 
144
+ add_function_test(TestHashGrid, "test_hashgrid_query", test_hashgrid_query, devices=devices)
144
145
 
145
146
  if __name__ == "__main__":
146
- c = register(unittest.TestCase)
147
+ wp.build.clear_kernel_cache()
147
148
  unittest.main(verbosity=2, failfast=False)
warp/tests/test_import.py CHANGED
@@ -5,20 +5,14 @@
5
5
  # distribution of this software and related documentation without an express
6
6
  # license agreement from NVIDIA CORPORATION is strictly prohibited.
7
7
 
8
- # include parent path
9
- import numpy as np
10
- import math
8
+ import unittest
11
9
 
12
10
  import warp as wp
13
- from warp.tests.test_base import *
14
-
15
- import unittest
11
+ import warp.tests.test_func as test_func
12
+ from warp.tests.unittest_utils import *
16
13
 
17
14
  wp.init()
18
15
 
19
- # from test_func import sqr
20
- import warp.tests.test_func as test_func
21
-
22
16
 
23
17
  @wp.kernel
24
18
  def test_import_func():
@@ -30,23 +24,16 @@ def test_import_func():
30
24
  wp.expect_eq(y, 8.0)
31
25
 
32
26
 
33
- def register(parent):
34
- devices = get_test_devices()
35
-
36
- class TestImport(parent):
37
- pass
27
+ devices = get_test_devices()
38
28
 
39
- add_kernel_test(TestImport, kernel=test_import_func, name="test_import_func", dim=1, devices=devices)
40
29
 
41
- return TestImport
30
+ class TestImport(unittest.TestCase):
31
+ pass
42
32
 
43
33
 
44
- if __name__ == "__main__":
45
- c = register(unittest.TestCase)
46
- # unittest.main(verbosity=2)
34
+ add_kernel_test(TestImport, kernel=test_import_func, name="test_import_func", dim=1, devices=devices)
47
35
 
48
- wp.force_load()
49
36
 
50
- loader = unittest.defaultTestLoader
51
- testSuite = loader.loadTestsFromTestCase(c)
52
- testSuite.debug()
37
+ if __name__ == "__main__":
38
+ wp.build.clear_kernel_cache()
39
+ unittest.main(verbosity=2)
warp/tests/test_indexedarray.py CHANGED
@@ -12,7 +12,7 @@ import numpy as np
12
12
 
13
13
  import warp as wp
14
14
  from warp.tests.test_array import FillStruct
15
- from warp.tests.test_base import *
15
+ from warp.tests.unittest_utils import *
16
16
 
17
17
  wp.init()
18
18
 
@@ -36,7 +36,7 @@ def test_indexedarray_1d(test, device):
36
36
 
37
37
  indices = wp.array([1, 3, 5, 7, 9], dtype=int, device=device)
38
38
 
39
- iarr = wp.indexedarray(arr, [indices])
39
+ iarr = wp.indexedarray1d(arr, [indices])
40
40
 
41
41
  test.assertEqual(iarr.dtype, arr.dtype)
42
42
  test.assertEqual(iarr.ndim, 1)
@@ -72,7 +72,7 @@ def test_indexedarray_2d(test, device):
72
72
  indices0 = wp.array([1, 3], dtype=int, device=device)
73
73
  indices1 = wp.array([2, 4, 8], dtype=int, device=device)
74
74
 
75
- iarr = wp.indexedarray(arr, [indices0, indices1])
75
+ iarr = wp.indexedarray2d(arr, [indices0, indices1])
76
76
 
77
77
  test.assertEqual(iarr.dtype, arr.dtype)
78
78
  test.assertEqual(iarr.ndim, 2)
@@ -112,7 +112,7 @@ def test_indexedarray_3d(test, device):
112
112
  indices1 = wp.array([2, 4, 8], dtype=int, device=device)
113
113
  indices2 = wp.array([0, 5], dtype=int, device=device)
114
114
 
115
- iarr = wp.indexedarray(arr, [indices0, indices1, indices2])
115
+ iarr = wp.indexedarray3d(arr, [indices0, indices1, indices2])
116
116
 
117
117
  test.assertEqual(iarr.dtype, arr.dtype)
118
118
  test.assertEqual(iarr.ndim, 3)
@@ -157,7 +157,7 @@ def test_indexedarray_4d(test, device):
157
157
  indices2 = wp.array([0, 5], dtype=int, device=device)
158
158
  indices3 = wp.array([6, 7, 9], dtype=int, device=device)
159
159
 
160
- iarr = wp.indexedarray(arr, [indices0, indices1, indices2, indices3])
160
+ iarr = wp.indexedarray4d(arr, [indices0, indices1, indices2, indices3])
161
161
 
162
162
  test.assertEqual(iarr.dtype, arr.dtype)
163
163
  test.assertEqual(iarr.ndim, 4)
@@ -1106,30 +1106,29 @@ def test_indexedarray_fill_struct(test, device):
1106
1106
  assert_np_equal(a4.numpy(), np.zeros(a4.shape, dtype=nptype))
1107
1107
 
1108
1108
 
1109
- def register(parent):
1110
- devices = get_test_devices()
1109
+ devices = get_test_devices()
1111
1110
 
1112
- class TestIndexedArray(parent):
1113
- pass
1114
1111
 
1115
- add_function_test(TestIndexedArray, "test_indexedarray_1d", test_indexedarray_1d, devices=devices)
1116
- add_function_test(TestIndexedArray, "test_indexedarray_2d", test_indexedarray_2d, devices=devices)
1117
- add_function_test(TestIndexedArray, "test_indexedarray_3d", test_indexedarray_3d, devices=devices)
1118
- add_function_test(TestIndexedArray, "test_indexedarray_4d", test_indexedarray_4d, devices=devices)
1119
- add_function_test(TestIndexedArray, "test_indexedarray_mixed", test_indexedarray_mixed, devices=devices)
1120
- add_function_test(TestIndexedArray, "test_indexedarray_shape", test_indexedarray_shape, devices=devices)
1121
- add_function_test(TestIndexedArray, "test_indexedarray_getitem", test_indexedarray_getitem, devices=devices)
1122
- add_function_test(TestIndexedArray, "test_indexedarray_slicing", test_indexedarray_slicing, devices=devices)
1123
- add_function_test(TestIndexedArray, "test_indexedarray_generics", test_indexedarray_generics, devices=devices)
1124
- add_function_test(TestIndexedArray, "test_indexedarray_empty", test_indexedarray_empty, devices=devices)
1125
- add_function_test(TestIndexedArray, "test_indexedarray_fill_scalar", test_indexedarray_fill_scalar, devices=devices)
1126
- add_function_test(TestIndexedArray, "test_indexedarray_fill_vector", test_indexedarray_fill_vector, devices=devices)
1127
- add_function_test(TestIndexedArray, "test_indexedarray_fill_matrix", test_indexedarray_fill_matrix, devices=devices)
1128
- add_function_test(TestIndexedArray, "test_indexedarray_fill_struct", test_indexedarray_fill_struct, devices=devices)
1112
+ class TestIndexedArray(unittest.TestCase):
1113
+ pass
1129
1114
 
1130
- return TestIndexedArray
1115
+
1116
+ add_function_test(TestIndexedArray, "test_indexedarray_1d", test_indexedarray_1d, devices=devices)
1117
+ add_function_test(TestIndexedArray, "test_indexedarray_2d", test_indexedarray_2d, devices=devices)
1118
+ add_function_test(TestIndexedArray, "test_indexedarray_3d", test_indexedarray_3d, devices=devices)
1119
+ add_function_test(TestIndexedArray, "test_indexedarray_4d", test_indexedarray_4d, devices=devices)
1120
+ add_function_test(TestIndexedArray, "test_indexedarray_mixed", test_indexedarray_mixed, devices=devices)
1121
+ add_function_test(TestIndexedArray, "test_indexedarray_shape", test_indexedarray_shape, devices=devices)
1122
+ add_function_test(TestIndexedArray, "test_indexedarray_getitem", test_indexedarray_getitem, devices=devices)
1123
+ add_function_test(TestIndexedArray, "test_indexedarray_slicing", test_indexedarray_slicing, devices=devices)
1124
+ add_function_test(TestIndexedArray, "test_indexedarray_generics", test_indexedarray_generics, devices=devices)
1125
+ add_function_test(TestIndexedArray, "test_indexedarray_empty", test_indexedarray_empty, devices=devices)
1126
+ add_function_test(TestIndexedArray, "test_indexedarray_fill_scalar", test_indexedarray_fill_scalar, devices=devices)
1127
+ add_function_test(TestIndexedArray, "test_indexedarray_fill_vector", test_indexedarray_fill_vector, devices=devices)
1128
+ add_function_test(TestIndexedArray, "test_indexedarray_fill_matrix", test_indexedarray_fill_matrix, devices=devices)
1129
+ add_function_test(TestIndexedArray, "test_indexedarray_fill_struct", test_indexedarray_fill_struct, devices=devices)
1131
1130
 
1132
1131
 
1133
1132
  if __name__ == "__main__":
1134
- c = register(unittest.TestCase)
1133
+ wp.build.clear_kernel_cache()
1135
1134
  unittest.main(verbosity=2)
warp/tests/test_intersect.py CHANGED
@@ -1,6 +1,16 @@
1
- import warp as wp
1
+ # Copyright (c) 2022 NVIDIA CORPORATION. All rights reserved.
2
+ # NVIDIA CORPORATION and its licensors retain all intellectual property
3
+ # and proprietary rights in and to this software, related documentation
4
+ # and any modifications thereto. Any use, reproduction, disclosure or
5
+ # distribution of this software and related documentation without an express
6
+ # license agreement from NVIDIA CORPORATION is strictly prohibited.
7
+
8
+ import unittest
9
+
2
10
  import numpy as np
3
- from warp.tests.test_base import *
11
+
12
+ import warp as wp
13
+ from warp.tests.unittest_utils import *
4
14
 
5
15
  wp.init()
6
16
 
@@ -42,17 +52,16 @@ def test_intersect_tri(test, device):
42
52
  assert_np_equal(result.numpy(), np.array([0]))
43
53
 
44
54
 
45
- def register(parent):
46
- devices = get_test_devices()
55
+ devices = get_test_devices()
56
+
47
57
 
48
- class TestIntersect(parent):
49
- pass
58
+ class TestIntersect(unittest.TestCase):
59
+ pass
50
60
 
51
- add_function_test(TestIntersect, "test_intersect_tri", test_intersect_tri, devices=devices)
52
61
 
53
- return TestIntersect
62
+ add_function_test(TestIntersect, "test_intersect_tri", test_intersect_tri, devices=devices)
54
63
 
55
64
 
56
65
  if __name__ == "__main__":
57
- c = register(unittest.TestCase)
66
+ wp.build.clear_kernel_cache()
58
67
  unittest.main(verbosity=2, failfast=False)
warp/tests/test_large.py ADDED
@@ -0,0 +1,141 @@
1
+ # Copyright (c) 2023 NVIDIA CORPORATION. All rights reserved.
2
+ # NVIDIA CORPORATION and its licensors retain all intellectual property
3
+ # and proprietary rights in and to this software, related documentation
4
+ # and any modifications thereto. Any use, reproduction, disclosure or
5
+ # distribution of this software and related documentation without an express
6
+ # license agreement from NVIDIA CORPORATION is strictly prohibited.
7
+
8
+ import math
9
+ import unittest
10
+
11
+ import warp as wp
12
+ from warp.tests.unittest_utils import *
13
+
14
+ wp.init()
15
+
16
+
17
+ @wp.kernel
18
+ def conditional_sum(result: wp.array(dtype=wp.uint64)):
19
+ i, j, k = wp.tid()
20
+
21
+ if i == 0:
22
+ wp.atomic_add(result, 0, wp.uint64(1))
23
+
24
+
25
+ def test_large_launch_large_kernel(test, device):
26
+ """Test tid() on kernel launch of 2**33 threads.
27
+
28
+ The function conditional sum will add 1 to result for every thread that has an i index of 0.
29
+ Due to the size of the grid, this test is not run on CPUs
30
+ """
31
+ test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
32
+
33
+ large_dim_length = 2**16
34
+ half_result = large_dim_length * large_dim_length
35
+
36
+ wp.launch(kernel=conditional_sum, dim=[2, large_dim_length, large_dim_length], inputs=[test_result], device=device)
37
+ test.assertEqual(test_result.numpy()[0], half_result)
38
+
39
+
40
+ @wp.kernel
41
+ def count_elements(result: wp.array(dtype=wp.uint64)):
42
+ wp.atomic_add(result, 0, wp.uint64(1))
43
+
44
+
45
+ def test_large_launch_max_blocks(test, device):
46
+ # Loop over 1000x1x1 elements using a grid of 256 threads
47
+ test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
48
+ wp.launch(count_elements, (1000,), inputs=[test_result], max_blocks=1, device=device)
49
+ test.assertEqual(test_result.numpy()[0], 1000)
50
+
51
+ # Loop over 2x50x10 elements using a grid of 256 threads, using the tid() index to count half the elements
52
+ test_result.zero_()
53
+ wp.launch(
54
+ conditional_sum,
55
+ (
56
+ 2,
57
+ 50,
58
+ 10,
59
+ ),
60
+ inputs=[test_result],
61
+ max_blocks=1,
62
+ device=device,
63
+ )
64
+ test.assertEqual(test_result.numpy()[0], 500)
65
+
66
+
67
+ def test_large_launch_very_large_kernel(test, device):
68
+ """Due to the size of the grid, this test is not run on CPUs"""
69
+
70
+ # Dim is chosen to be larger than the maximum CUDA one-dimensional grid size (total threads)
71
+ dim = (2**31 - 1) * 256 + 1
72
+ test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
73
+ wp.launch(count_elements, (dim,), inputs=[test_result], device=device)
74
+ test.assertEqual(test_result.numpy()[0], dim)
75
+
76
+
77
+ def test_large_arrays_slow(test, device):
78
+ # The goal of this test is to use arrays just large enough to know
79
+ # if there's a flaw in handling arrays with more than 2**31-1 elements
80
+ # Unfortunately, it takes a long time to run so it won't be run automatically
81
+ # without changes to support how frequently a test may be run
82
+ total_elements = 2**31 + 8
83
+
84
+ # 1-D to 4-D arrays: test zero_, fill_, then zero_ for scalar data types:
85
+ for total_dims in range(1, 5):
86
+ dim_x = math.ceil(total_elements ** (1 / total_dims))
87
+ shape_tuple = tuple([dim_x] * total_dims)
88
+
89
+ for nptype, wptype in wp.types.np_dtype_to_warp_type.items():
90
+ a1 = wp.zeros(shape_tuple, dtype=wptype, device=device)
91
+ assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
92
+
93
+ a1.fill_(127)
94
+ assert_np_equal(a1.numpy(), 127 * np.ones_like(a1.numpy()))
95
+
96
+ a1.zero_()
97
+ assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
98
+
99
+
100
+ def test_large_arrays_fast(test, device):
101
+ # A truncated version of test_large_arrays_slow meant to catch basic errors
102
+ total_elements = 2**31 + 8
103
+
104
+ nptype = np.dtype(np.int8)
105
+ wptype = wp.types.np_dtype_to_warp_type[nptype]
106
+
107
+ a1 = wp.zeros((total_elements,), dtype=wptype, device=device)
108
+ assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
109
+
110
+ a1.fill_(127)
111
+ assert_np_equal(a1.numpy(), 127 * np.ones_like(a1.numpy()))
112
+
113
+ a1.zero_()
114
+ assert_np_equal(a1.numpy(), np.zeros_like(a1.numpy()))
115
+
116
+
117
+ devices = get_test_devices()
118
+
119
+
120
+ class TestLarge(unittest.TestCase):
121
+ pass
122
+
123
+
124
+ add_function_test(
125
+ TestLarge, "test_large_launch_large_kernel", test_large_launch_large_kernel, devices=get_unique_cuda_test_devices()
126
+ )
127
+
128
+ add_function_test(TestLarge, "test_large_launch_max_blocks", test_large_launch_max_blocks, devices=devices)
129
+ add_function_test(
130
+ TestLarge,
131
+ "test_large_launch_very_large_kernel",
132
+ test_large_launch_very_large_kernel,
133
+ devices=get_unique_cuda_test_devices(),
134
+ )
135
+
136
+ add_function_test(TestLarge, "test_large_arrays_fast", test_large_arrays_fast, devices=devices)
137
+
138
+
139
+ if __name__ == "__main__":
140
+ wp.build.clear_kernel_cache()
141
+ unittest.main(verbosity=2)
warp/tests/test_launch.py CHANGED
@@ -7,11 +7,10 @@
7
7
 
8
8
  import unittest
9
9
 
10
- # include parent path
11
10
  import numpy as np
12
11
 
13
12
  import warp as wp
14
- from warp.tests.test_base import *
13
+ from warp.tests.unittest_utils import *
15
14
 
16
15
  wp.init()
17
16
 
@@ -306,51 +305,25 @@ def test_launch_tuple_args(test, device):
306
305
  assert_np_equal(out.numpy(), np.array((0, 3, 6, 9)))
307
306
 
308
307
 
309
- @wp.kernel
310
- def conditional_sum(result: wp.array(dtype=wp.uint64)):
311
- i, j, k = wp.tid()
312
-
313
- if i == 0:
314
- wp.atomic_add(result, 0, wp.uint64(1))
315
-
316
-
317
- def test_launch_large_kernel(test, device):
318
- """Test tid() on kernel launch of 2**33 threads.
319
-
320
- The function conditional sum will add 1 to result for every thread that has an i index of 0.
321
- Due to the size of the grid, this test is not run on CPUs
322
- """
323
- test_result = wp.zeros(shape=(1,), dtype=wp.uint64, device=device)
324
-
325
- large_dim_length = 2**16
326
- half_result = large_dim_length * large_dim_length
327
-
328
- wp.launch(kernel=conditional_sum, dim=[2, large_dim_length, large_dim_length], inputs=[test_result], device=device)
329
- test.assertEqual(test_result.numpy()[0], half_result)
330
-
331
-
332
- def register(parent):
333
- devices = get_test_devices()
308
+ devices = get_test_devices()
334
309
 
335
- class TestLaunch(parent):
336
- pass
337
310
 
338
- add_function_test(TestLaunch, "test_launch_1d", test1d, devices=devices)
339
- add_function_test(TestLaunch, "test_launch_2d", test2d, devices=devices)
340
- add_function_test(TestLaunch, "test_launch_3d", test3d, devices=devices)
341
- add_function_test(TestLaunch, "test_launch_4d", test4d, devices=devices)
311
+ class TestLaunch(unittest.TestCase):
312
+ pass
342
313
 
343
- add_function_test(TestLaunch, "test_launch_cmd", test_launch_cmd, devices=devices)
344
- add_function_test(TestLaunch, "test_launch_cmd_set_param", test_launch_cmd_set_param, devices=devices)
345
- add_function_test(TestLaunch, "test_launch_cmd_set_ctype", test_launch_cmd_set_ctype, devices=devices)
346
- add_function_test(TestLaunch, "test_launch_cmd_set_dim", test_launch_cmd_set_dim, devices=devices)
347
- add_function_test(TestLaunch, "test_launch_cmd_empty", test_launch_cmd_empty, devices=devices)
348
314
 
349
- add_function_test(TestLaunch, "test_launch_large_kernel", test_launch_large_kernel, devices=wp.get_cuda_devices())
315
+ add_function_test(TestLaunch, "test_launch_1d", test1d, devices=devices)
316
+ add_function_test(TestLaunch, "test_launch_2d", test2d, devices=devices)
317
+ add_function_test(TestLaunch, "test_launch_3d", test3d, devices=devices)
318
+ add_function_test(TestLaunch, "test_launch_4d", test4d, devices=devices)
350
319
 
351
- return TestLaunch
320
+ add_function_test(TestLaunch, "test_launch_cmd", test_launch_cmd, devices=devices)
321
+ add_function_test(TestLaunch, "test_launch_cmd_set_param", test_launch_cmd_set_param, devices=devices)
322
+ add_function_test(TestLaunch, "test_launch_cmd_set_ctype", test_launch_cmd_set_ctype, devices=devices)
323
+ add_function_test(TestLaunch, "test_launch_cmd_set_dim", test_launch_cmd_set_dim, devices=devices)
324
+ add_function_test(TestLaunch, "test_launch_cmd_empty", test_launch_cmd_empty, devices=devices)
352
325
 
353
326
 
354
327
  if __name__ == "__main__":
355
- c = register(unittest.TestCase)
328
+ wp.build.clear_kernel_cache()
356
329
  unittest.main(verbosity=2)