warp-lang 1.10.0__py3-none-macosx_11_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (468) hide show
  1. warp/__init__.py +334 -0
  2. warp/__init__.pyi +5856 -0
  3. warp/_src/__init__.py +14 -0
  4. warp/_src/autograd.py +1077 -0
  5. warp/_src/build.py +620 -0
  6. warp/_src/build_dll.py +642 -0
  7. warp/_src/builtins.py +10555 -0
  8. warp/_src/codegen.py +4361 -0
  9. warp/_src/config.py +178 -0
  10. warp/_src/constants.py +59 -0
  11. warp/_src/context.py +8352 -0
  12. warp/_src/dlpack.py +464 -0
  13. warp/_src/fabric.py +362 -0
  14. warp/_src/fem/__init__.py +14 -0
  15. warp/_src/fem/adaptivity.py +510 -0
  16. warp/_src/fem/cache.py +689 -0
  17. warp/_src/fem/dirichlet.py +190 -0
  18. warp/_src/fem/domain.py +553 -0
  19. warp/_src/fem/field/__init__.py +131 -0
  20. warp/_src/fem/field/field.py +703 -0
  21. warp/_src/fem/field/nodal_field.py +403 -0
  22. warp/_src/fem/field/restriction.py +39 -0
  23. warp/_src/fem/field/virtual.py +1021 -0
  24. warp/_src/fem/geometry/__init__.py +32 -0
  25. warp/_src/fem/geometry/adaptive_nanogrid.py +782 -0
  26. warp/_src/fem/geometry/closest_point.py +99 -0
  27. warp/_src/fem/geometry/deformed_geometry.py +277 -0
  28. warp/_src/fem/geometry/element.py +854 -0
  29. warp/_src/fem/geometry/geometry.py +693 -0
  30. warp/_src/fem/geometry/grid_2d.py +478 -0
  31. warp/_src/fem/geometry/grid_3d.py +539 -0
  32. warp/_src/fem/geometry/hexmesh.py +956 -0
  33. warp/_src/fem/geometry/nanogrid.py +660 -0
  34. warp/_src/fem/geometry/partition.py +483 -0
  35. warp/_src/fem/geometry/quadmesh.py +597 -0
  36. warp/_src/fem/geometry/tetmesh.py +762 -0
  37. warp/_src/fem/geometry/trimesh.py +588 -0
  38. warp/_src/fem/integrate.py +2507 -0
  39. warp/_src/fem/linalg.py +385 -0
  40. warp/_src/fem/operator.py +398 -0
  41. warp/_src/fem/polynomial.py +231 -0
  42. warp/_src/fem/quadrature/__init__.py +17 -0
  43. warp/_src/fem/quadrature/pic_quadrature.py +318 -0
  44. warp/_src/fem/quadrature/quadrature.py +665 -0
  45. warp/_src/fem/space/__init__.py +248 -0
  46. warp/_src/fem/space/basis_function_space.py +499 -0
  47. warp/_src/fem/space/basis_space.py +681 -0
  48. warp/_src/fem/space/dof_mapper.py +253 -0
  49. warp/_src/fem/space/function_space.py +312 -0
  50. warp/_src/fem/space/grid_2d_function_space.py +179 -0
  51. warp/_src/fem/space/grid_3d_function_space.py +229 -0
  52. warp/_src/fem/space/hexmesh_function_space.py +255 -0
  53. warp/_src/fem/space/nanogrid_function_space.py +199 -0
  54. warp/_src/fem/space/partition.py +435 -0
  55. warp/_src/fem/space/quadmesh_function_space.py +222 -0
  56. warp/_src/fem/space/restriction.py +221 -0
  57. warp/_src/fem/space/shape/__init__.py +152 -0
  58. warp/_src/fem/space/shape/cube_shape_function.py +1107 -0
  59. warp/_src/fem/space/shape/shape_function.py +134 -0
  60. warp/_src/fem/space/shape/square_shape_function.py +928 -0
  61. warp/_src/fem/space/shape/tet_shape_function.py +829 -0
  62. warp/_src/fem/space/shape/triangle_shape_function.py +674 -0
  63. warp/_src/fem/space/tetmesh_function_space.py +270 -0
  64. warp/_src/fem/space/topology.py +461 -0
  65. warp/_src/fem/space/trimesh_function_space.py +193 -0
  66. warp/_src/fem/types.py +114 -0
  67. warp/_src/fem/utils.py +488 -0
  68. warp/_src/jax.py +188 -0
  69. warp/_src/jax_experimental/__init__.py +14 -0
  70. warp/_src/jax_experimental/custom_call.py +389 -0
  71. warp/_src/jax_experimental/ffi.py +1286 -0
  72. warp/_src/jax_experimental/xla_ffi.py +658 -0
  73. warp/_src/marching_cubes.py +710 -0
  74. warp/_src/math.py +416 -0
  75. warp/_src/optim/__init__.py +14 -0
  76. warp/_src/optim/adam.py +165 -0
  77. warp/_src/optim/linear.py +1608 -0
  78. warp/_src/optim/sgd.py +114 -0
  79. warp/_src/paddle.py +408 -0
  80. warp/_src/render/__init__.py +14 -0
  81. warp/_src/render/imgui_manager.py +291 -0
  82. warp/_src/render/render_opengl.py +3638 -0
  83. warp/_src/render/render_usd.py +939 -0
  84. warp/_src/render/utils.py +162 -0
  85. warp/_src/sparse.py +2718 -0
  86. warp/_src/tape.py +1208 -0
  87. warp/_src/thirdparty/__init__.py +0 -0
  88. warp/_src/thirdparty/appdirs.py +598 -0
  89. warp/_src/thirdparty/dlpack.py +145 -0
  90. warp/_src/thirdparty/unittest_parallel.py +676 -0
  91. warp/_src/torch.py +393 -0
  92. warp/_src/types.py +5888 -0
  93. warp/_src/utils.py +1695 -0
  94. warp/autograd.py +33 -0
  95. warp/bin/libwarp-clang.dylib +0 -0
  96. warp/bin/libwarp.dylib +0 -0
  97. warp/build.py +29 -0
  98. warp/build_dll.py +24 -0
  99. warp/codegen.py +24 -0
  100. warp/constants.py +24 -0
  101. warp/context.py +33 -0
  102. warp/dlpack.py +24 -0
  103. warp/examples/__init__.py +24 -0
  104. warp/examples/assets/bear.usd +0 -0
  105. warp/examples/assets/bunny.usd +0 -0
  106. warp/examples/assets/cube.usd +0 -0
  107. warp/examples/assets/nonuniform.usd +0 -0
  108. warp/examples/assets/nvidia_logo.png +0 -0
  109. warp/examples/assets/pixel.jpg +0 -0
  110. warp/examples/assets/rocks.nvdb +0 -0
  111. warp/examples/assets/rocks.usd +0 -0
  112. warp/examples/assets/sphere.usd +0 -0
  113. warp/examples/assets/square_cloth.usd +0 -0
  114. warp/examples/benchmarks/benchmark_api.py +389 -0
  115. warp/examples/benchmarks/benchmark_cloth.py +296 -0
  116. warp/examples/benchmarks/benchmark_cloth_cupy.py +96 -0
  117. warp/examples/benchmarks/benchmark_cloth_jax.py +105 -0
  118. warp/examples/benchmarks/benchmark_cloth_numba.py +161 -0
  119. warp/examples/benchmarks/benchmark_cloth_numpy.py +85 -0
  120. warp/examples/benchmarks/benchmark_cloth_paddle.py +94 -0
  121. warp/examples/benchmarks/benchmark_cloth_pytorch.py +94 -0
  122. warp/examples/benchmarks/benchmark_cloth_taichi.py +120 -0
  123. warp/examples/benchmarks/benchmark_cloth_warp.py +153 -0
  124. warp/examples/benchmarks/benchmark_gemm.py +164 -0
  125. warp/examples/benchmarks/benchmark_interop_paddle.py +166 -0
  126. warp/examples/benchmarks/benchmark_interop_torch.py +166 -0
  127. warp/examples/benchmarks/benchmark_launches.py +301 -0
  128. warp/examples/benchmarks/benchmark_tile_load_store.py +103 -0
  129. warp/examples/benchmarks/benchmark_tile_sort.py +155 -0
  130. warp/examples/browse.py +37 -0
  131. warp/examples/core/example_cupy.py +86 -0
  132. warp/examples/core/example_dem.py +241 -0
  133. warp/examples/core/example_fluid.py +299 -0
  134. warp/examples/core/example_graph_capture.py +150 -0
  135. warp/examples/core/example_marching_cubes.py +195 -0
  136. warp/examples/core/example_mesh.py +180 -0
  137. warp/examples/core/example_mesh_intersect.py +211 -0
  138. warp/examples/core/example_nvdb.py +182 -0
  139. warp/examples/core/example_raycast.py +111 -0
  140. warp/examples/core/example_raymarch.py +205 -0
  141. warp/examples/core/example_render_opengl.py +290 -0
  142. warp/examples/core/example_sample_mesh.py +300 -0
  143. warp/examples/core/example_sph.py +411 -0
  144. warp/examples/core/example_spin_lock.py +93 -0
  145. warp/examples/core/example_torch.py +211 -0
  146. warp/examples/core/example_wave.py +269 -0
  147. warp/examples/core/example_work_queue.py +118 -0
  148. warp/examples/distributed/example_jacobi_mpi.py +506 -0
  149. warp/examples/fem/example_adaptive_grid.py +286 -0
  150. warp/examples/fem/example_apic_fluid.py +469 -0
  151. warp/examples/fem/example_burgers.py +261 -0
  152. warp/examples/fem/example_convection_diffusion.py +181 -0
  153. warp/examples/fem/example_convection_diffusion_dg.py +225 -0
  154. warp/examples/fem/example_darcy_ls_optimization.py +489 -0
  155. warp/examples/fem/example_deformed_geometry.py +172 -0
  156. warp/examples/fem/example_diffusion.py +196 -0
  157. warp/examples/fem/example_diffusion_3d.py +225 -0
  158. warp/examples/fem/example_diffusion_mgpu.py +225 -0
  159. warp/examples/fem/example_distortion_energy.py +228 -0
  160. warp/examples/fem/example_elastic_shape_optimization.py +387 -0
  161. warp/examples/fem/example_magnetostatics.py +242 -0
  162. warp/examples/fem/example_mixed_elasticity.py +293 -0
  163. warp/examples/fem/example_navier_stokes.py +263 -0
  164. warp/examples/fem/example_nonconforming_contact.py +300 -0
  165. warp/examples/fem/example_stokes.py +213 -0
  166. warp/examples/fem/example_stokes_transfer.py +262 -0
  167. warp/examples/fem/example_streamlines.py +357 -0
  168. warp/examples/fem/utils.py +1047 -0
  169. warp/examples/interop/example_jax_callable.py +146 -0
  170. warp/examples/interop/example_jax_ffi_callback.py +132 -0
  171. warp/examples/interop/example_jax_kernel.py +232 -0
  172. warp/examples/optim/example_diffray.py +561 -0
  173. warp/examples/optim/example_fluid_checkpoint.py +497 -0
  174. warp/examples/tile/example_tile_block_cholesky.py +502 -0
  175. warp/examples/tile/example_tile_cholesky.py +88 -0
  176. warp/examples/tile/example_tile_convolution.py +66 -0
  177. warp/examples/tile/example_tile_fft.py +55 -0
  178. warp/examples/tile/example_tile_filtering.py +113 -0
  179. warp/examples/tile/example_tile_matmul.py +85 -0
  180. warp/examples/tile/example_tile_mcgp.py +191 -0
  181. warp/examples/tile/example_tile_mlp.py +385 -0
  182. warp/examples/tile/example_tile_nbody.py +199 -0
  183. warp/fabric.py +24 -0
  184. warp/fem/__init__.py +173 -0
  185. warp/fem/adaptivity.py +26 -0
  186. warp/fem/cache.py +30 -0
  187. warp/fem/dirichlet.py +24 -0
  188. warp/fem/field/__init__.py +24 -0
  189. warp/fem/field/field.py +26 -0
  190. warp/fem/geometry/__init__.py +21 -0
  191. warp/fem/geometry/closest_point.py +31 -0
  192. warp/fem/linalg.py +38 -0
  193. warp/fem/operator.py +32 -0
  194. warp/fem/polynomial.py +29 -0
  195. warp/fem/space/__init__.py +22 -0
  196. warp/fem/space/basis_space.py +24 -0
  197. warp/fem/space/shape/__init__.py +68 -0
  198. warp/fem/space/topology.py +24 -0
  199. warp/fem/types.py +24 -0
  200. warp/fem/utils.py +32 -0
  201. warp/jax.py +29 -0
  202. warp/jax_experimental/__init__.py +29 -0
  203. warp/jax_experimental/custom_call.py +29 -0
  204. warp/jax_experimental/ffi.py +39 -0
  205. warp/jax_experimental/xla_ffi.py +24 -0
  206. warp/marching_cubes.py +24 -0
  207. warp/math.py +37 -0
  208. warp/native/array.h +1687 -0
  209. warp/native/builtin.h +2327 -0
  210. warp/native/bvh.cpp +562 -0
  211. warp/native/bvh.cu +826 -0
  212. warp/native/bvh.h +555 -0
  213. warp/native/clang/clang.cpp +541 -0
  214. warp/native/coloring.cpp +622 -0
  215. warp/native/crt.cpp +51 -0
  216. warp/native/crt.h +568 -0
  217. warp/native/cuda_crt.h +1058 -0
  218. warp/native/cuda_util.cpp +677 -0
  219. warp/native/cuda_util.h +313 -0
  220. warp/native/error.cpp +77 -0
  221. warp/native/error.h +36 -0
  222. warp/native/exports.h +2023 -0
  223. warp/native/fabric.h +246 -0
  224. warp/native/hashgrid.cpp +311 -0
  225. warp/native/hashgrid.cu +89 -0
  226. warp/native/hashgrid.h +240 -0
  227. warp/native/initializer_array.h +41 -0
  228. warp/native/intersect.h +1253 -0
  229. warp/native/intersect_adj.h +375 -0
  230. warp/native/intersect_tri.h +348 -0
  231. warp/native/mat.h +5189 -0
  232. warp/native/mathdx.cpp +93 -0
  233. warp/native/matnn.h +221 -0
  234. warp/native/mesh.cpp +266 -0
  235. warp/native/mesh.cu +406 -0
  236. warp/native/mesh.h +2097 -0
  237. warp/native/nanovdb/GridHandle.h +533 -0
  238. warp/native/nanovdb/HostBuffer.h +591 -0
  239. warp/native/nanovdb/NanoVDB.h +6246 -0
  240. warp/native/nanovdb/NodeManager.h +323 -0
  241. warp/native/nanovdb/PNanoVDB.h +3390 -0
  242. warp/native/noise.h +859 -0
  243. warp/native/quat.h +1664 -0
  244. warp/native/rand.h +342 -0
  245. warp/native/range.h +145 -0
  246. warp/native/reduce.cpp +174 -0
  247. warp/native/reduce.cu +363 -0
  248. warp/native/runlength_encode.cpp +79 -0
  249. warp/native/runlength_encode.cu +61 -0
  250. warp/native/scan.cpp +47 -0
  251. warp/native/scan.cu +55 -0
  252. warp/native/scan.h +23 -0
  253. warp/native/solid_angle.h +466 -0
  254. warp/native/sort.cpp +251 -0
  255. warp/native/sort.cu +286 -0
  256. warp/native/sort.h +35 -0
  257. warp/native/sparse.cpp +241 -0
  258. warp/native/sparse.cu +435 -0
  259. warp/native/spatial.h +1306 -0
  260. warp/native/svd.h +727 -0
  261. warp/native/temp_buffer.h +46 -0
  262. warp/native/tile.h +4124 -0
  263. warp/native/tile_radix_sort.h +1112 -0
  264. warp/native/tile_reduce.h +838 -0
  265. warp/native/tile_scan.h +240 -0
  266. warp/native/tuple.h +189 -0
  267. warp/native/vec.h +2199 -0
  268. warp/native/version.h +23 -0
  269. warp/native/volume.cpp +501 -0
  270. warp/native/volume.cu +68 -0
  271. warp/native/volume.h +970 -0
  272. warp/native/volume_builder.cu +483 -0
  273. warp/native/volume_builder.h +52 -0
  274. warp/native/volume_impl.h +70 -0
  275. warp/native/warp.cpp +1143 -0
  276. warp/native/warp.cu +4604 -0
  277. warp/native/warp.h +358 -0
  278. warp/optim/__init__.py +20 -0
  279. warp/optim/adam.py +24 -0
  280. warp/optim/linear.py +35 -0
  281. warp/optim/sgd.py +24 -0
  282. warp/paddle.py +24 -0
  283. warp/py.typed +0 -0
  284. warp/render/__init__.py +22 -0
  285. warp/render/imgui_manager.py +29 -0
  286. warp/render/render_opengl.py +24 -0
  287. warp/render/render_usd.py +24 -0
  288. warp/render/utils.py +24 -0
  289. warp/sparse.py +51 -0
  290. warp/tape.py +24 -0
  291. warp/tests/__init__.py +1 -0
  292. warp/tests/__main__.py +4 -0
  293. warp/tests/assets/curlnoise_golden.npy +0 -0
  294. warp/tests/assets/mlp_golden.npy +0 -0
  295. warp/tests/assets/pixel.npy +0 -0
  296. warp/tests/assets/pnoise_golden.npy +0 -0
  297. warp/tests/assets/spiky.usd +0 -0
  298. warp/tests/assets/test_grid.nvdb +0 -0
  299. warp/tests/assets/test_index_grid.nvdb +0 -0
  300. warp/tests/assets/test_int32_grid.nvdb +0 -0
  301. warp/tests/assets/test_vec_grid.nvdb +0 -0
  302. warp/tests/assets/torus.nvdb +0 -0
  303. warp/tests/assets/torus.usda +105 -0
  304. warp/tests/aux_test_class_kernel.py +34 -0
  305. warp/tests/aux_test_compile_consts_dummy.py +18 -0
  306. warp/tests/aux_test_conditional_unequal_types_kernels.py +29 -0
  307. warp/tests/aux_test_dependent.py +29 -0
  308. warp/tests/aux_test_grad_customs.py +29 -0
  309. warp/tests/aux_test_instancing_gc.py +26 -0
  310. warp/tests/aux_test_module_aot.py +7 -0
  311. warp/tests/aux_test_module_unload.py +23 -0
  312. warp/tests/aux_test_name_clash1.py +40 -0
  313. warp/tests/aux_test_name_clash2.py +40 -0
  314. warp/tests/aux_test_reference.py +9 -0
  315. warp/tests/aux_test_reference_reference.py +8 -0
  316. warp/tests/aux_test_square.py +16 -0
  317. warp/tests/aux_test_unresolved_func.py +22 -0
  318. warp/tests/aux_test_unresolved_symbol.py +22 -0
  319. warp/tests/cuda/__init__.py +0 -0
  320. warp/tests/cuda/test_async.py +676 -0
  321. warp/tests/cuda/test_conditional_captures.py +1147 -0
  322. warp/tests/cuda/test_ipc.py +124 -0
  323. warp/tests/cuda/test_mempool.py +233 -0
  324. warp/tests/cuda/test_multigpu.py +169 -0
  325. warp/tests/cuda/test_peer.py +139 -0
  326. warp/tests/cuda/test_pinned.py +84 -0
  327. warp/tests/cuda/test_streams.py +691 -0
  328. warp/tests/geometry/__init__.py +0 -0
  329. warp/tests/geometry/test_bvh.py +335 -0
  330. warp/tests/geometry/test_hash_grid.py +259 -0
  331. warp/tests/geometry/test_marching_cubes.py +294 -0
  332. warp/tests/geometry/test_mesh.py +318 -0
  333. warp/tests/geometry/test_mesh_query_aabb.py +392 -0
  334. warp/tests/geometry/test_mesh_query_point.py +935 -0
  335. warp/tests/geometry/test_mesh_query_ray.py +323 -0
  336. warp/tests/geometry/test_volume.py +1103 -0
  337. warp/tests/geometry/test_volume_write.py +346 -0
  338. warp/tests/interop/__init__.py +0 -0
  339. warp/tests/interop/test_dlpack.py +730 -0
  340. warp/tests/interop/test_jax.py +1673 -0
  341. warp/tests/interop/test_paddle.py +800 -0
  342. warp/tests/interop/test_torch.py +1001 -0
  343. warp/tests/run_coverage_serial.py +39 -0
  344. warp/tests/test_adam.py +162 -0
  345. warp/tests/test_arithmetic.py +1096 -0
  346. warp/tests/test_array.py +3756 -0
  347. warp/tests/test_array_reduce.py +156 -0
  348. warp/tests/test_assert.py +303 -0
  349. warp/tests/test_atomic.py +336 -0
  350. warp/tests/test_atomic_bitwise.py +209 -0
  351. warp/tests/test_atomic_cas.py +312 -0
  352. warp/tests/test_bool.py +220 -0
  353. warp/tests/test_builtins_resolution.py +732 -0
  354. warp/tests/test_closest_point_edge_edge.py +327 -0
  355. warp/tests/test_codegen.py +974 -0
  356. warp/tests/test_codegen_instancing.py +1495 -0
  357. warp/tests/test_compile_consts.py +215 -0
  358. warp/tests/test_conditional.py +298 -0
  359. warp/tests/test_context.py +35 -0
  360. warp/tests/test_copy.py +319 -0
  361. warp/tests/test_ctypes.py +618 -0
  362. warp/tests/test_dense.py +73 -0
  363. warp/tests/test_devices.py +127 -0
  364. warp/tests/test_enum.py +136 -0
  365. warp/tests/test_examples.py +424 -0
  366. warp/tests/test_fabricarray.py +998 -0
  367. warp/tests/test_fast_math.py +72 -0
  368. warp/tests/test_fem.py +2204 -0
  369. warp/tests/test_fixedarray.py +229 -0
  370. warp/tests/test_fp16.py +136 -0
  371. warp/tests/test_func.py +501 -0
  372. warp/tests/test_future_annotations.py +100 -0
  373. warp/tests/test_generics.py +656 -0
  374. warp/tests/test_grad.py +893 -0
  375. warp/tests/test_grad_customs.py +339 -0
  376. warp/tests/test_grad_debug.py +341 -0
  377. warp/tests/test_implicit_init.py +411 -0
  378. warp/tests/test_import.py +45 -0
  379. warp/tests/test_indexedarray.py +1140 -0
  380. warp/tests/test_intersect.py +103 -0
  381. warp/tests/test_iter.py +76 -0
  382. warp/tests/test_large.py +177 -0
  383. warp/tests/test_launch.py +411 -0
  384. warp/tests/test_lerp.py +151 -0
  385. warp/tests/test_linear_solvers.py +223 -0
  386. warp/tests/test_lvalue.py +427 -0
  387. warp/tests/test_map.py +526 -0
  388. warp/tests/test_mat.py +3515 -0
  389. warp/tests/test_mat_assign_copy.py +178 -0
  390. warp/tests/test_mat_constructors.py +573 -0
  391. warp/tests/test_mat_lite.py +122 -0
  392. warp/tests/test_mat_scalar_ops.py +2913 -0
  393. warp/tests/test_math.py +212 -0
  394. warp/tests/test_module_aot.py +287 -0
  395. warp/tests/test_module_hashing.py +258 -0
  396. warp/tests/test_modules_lite.py +70 -0
  397. warp/tests/test_noise.py +252 -0
  398. warp/tests/test_operators.py +299 -0
  399. warp/tests/test_options.py +129 -0
  400. warp/tests/test_overwrite.py +551 -0
  401. warp/tests/test_print.py +408 -0
  402. warp/tests/test_quat.py +2653 -0
  403. warp/tests/test_quat_assign_copy.py +145 -0
  404. warp/tests/test_rand.py +339 -0
  405. warp/tests/test_reload.py +303 -0
  406. warp/tests/test_rounding.py +157 -0
  407. warp/tests/test_runlength_encode.py +196 -0
  408. warp/tests/test_scalar_ops.py +133 -0
  409. warp/tests/test_smoothstep.py +108 -0
  410. warp/tests/test_snippet.py +318 -0
  411. warp/tests/test_sparse.py +845 -0
  412. warp/tests/test_spatial.py +2859 -0
  413. warp/tests/test_spatial_assign_copy.py +160 -0
  414. warp/tests/test_special_values.py +361 -0
  415. warp/tests/test_static.py +640 -0
  416. warp/tests/test_struct.py +901 -0
  417. warp/tests/test_tape.py +242 -0
  418. warp/tests/test_transient_module.py +93 -0
  419. warp/tests/test_triangle_closest_point.py +192 -0
  420. warp/tests/test_tuple.py +361 -0
  421. warp/tests/test_types.py +615 -0
  422. warp/tests/test_utils.py +594 -0
  423. warp/tests/test_vec.py +1408 -0
  424. warp/tests/test_vec_assign_copy.py +143 -0
  425. warp/tests/test_vec_constructors.py +325 -0
  426. warp/tests/test_vec_lite.py +80 -0
  427. warp/tests/test_vec_scalar_ops.py +2327 -0
  428. warp/tests/test_verify_fp.py +100 -0
  429. warp/tests/test_version.py +75 -0
  430. warp/tests/tile/__init__.py +0 -0
  431. warp/tests/tile/test_tile.py +1519 -0
  432. warp/tests/tile/test_tile_atomic_bitwise.py +403 -0
  433. warp/tests/tile/test_tile_cholesky.py +608 -0
  434. warp/tests/tile/test_tile_load.py +724 -0
  435. warp/tests/tile/test_tile_mathdx.py +156 -0
  436. warp/tests/tile/test_tile_matmul.py +179 -0
  437. warp/tests/tile/test_tile_mlp.py +400 -0
  438. warp/tests/tile/test_tile_reduce.py +950 -0
  439. warp/tests/tile/test_tile_shared_memory.py +376 -0
  440. warp/tests/tile/test_tile_sort.py +121 -0
  441. warp/tests/tile/test_tile_view.py +173 -0
  442. warp/tests/unittest_serial.py +47 -0
  443. warp/tests/unittest_suites.py +430 -0
  444. warp/tests/unittest_utils.py +469 -0
  445. warp/tests/walkthrough_debug.py +95 -0
  446. warp/torch.py +24 -0
  447. warp/types.py +51 -0
  448. warp/utils.py +31 -0
  449. warp_lang-1.10.0.dist-info/METADATA +459 -0
  450. warp_lang-1.10.0.dist-info/RECORD +468 -0
  451. warp_lang-1.10.0.dist-info/WHEEL +5 -0
  452. warp_lang-1.10.0.dist-info/licenses/LICENSE.md +176 -0
  453. warp_lang-1.10.0.dist-info/licenses/licenses/Gaia-LICENSE.txt +6 -0
  454. warp_lang-1.10.0.dist-info/licenses/licenses/appdirs-LICENSE.txt +22 -0
  455. warp_lang-1.10.0.dist-info/licenses/licenses/asset_pixel_jpg-LICENSE.txt +3 -0
  456. warp_lang-1.10.0.dist-info/licenses/licenses/cuda-LICENSE.txt +1582 -0
  457. warp_lang-1.10.0.dist-info/licenses/licenses/dlpack-LICENSE.txt +201 -0
  458. warp_lang-1.10.0.dist-info/licenses/licenses/fp16-LICENSE.txt +28 -0
  459. warp_lang-1.10.0.dist-info/licenses/licenses/libmathdx-LICENSE.txt +220 -0
  460. warp_lang-1.10.0.dist-info/licenses/licenses/llvm-LICENSE.txt +279 -0
  461. warp_lang-1.10.0.dist-info/licenses/licenses/moller-LICENSE.txt +16 -0
  462. warp_lang-1.10.0.dist-info/licenses/licenses/nanovdb-LICENSE.txt +2 -0
  463. warp_lang-1.10.0.dist-info/licenses/licenses/nvrtc-LICENSE.txt +1592 -0
  464. warp_lang-1.10.0.dist-info/licenses/licenses/svd-LICENSE.txt +23 -0
  465. warp_lang-1.10.0.dist-info/licenses/licenses/unittest_parallel-LICENSE.txt +21 -0
  466. warp_lang-1.10.0.dist-info/licenses/licenses/usd-LICENSE.txt +213 -0
  467. warp_lang-1.10.0.dist-info/licenses/licenses/windingnumber-LICENSE.txt +21 -0
  468. warp_lang-1.10.0.dist-info/top_level.txt +1 -0
@@ -0,0 +1,296 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ # this script's own directory is added to sys.path below so the sibling benchmark_cloth_* modules can be imported
17
+ import csv
18
+ import os
19
+ import sys
20
+
21
+ import numpy as np
22
+
23
+ sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), ".")))
24
+
25
+ from pxr import Usd, UsdGeom
26
+
27
+ import warp as wp
28
+
29
+
30
class Cloth:
    """Rectangular mass-spring cloth description stored as NumPy arrays.

    Particles are laid out on a ``dx`` x ``dy`` grid in the XZ plane, starting
    at ``lower`` and spaced ``radius`` apart; particle ``(x, y)`` has index
    ``y * dx + x``.  Two triangles are emitted per grid cell, and springs are
    created between horizontal/vertical neighbours (stretch), second
    neighbours (bend) and diagonal neighbours (shear).

    Attributes set by the constructor:
        triangles: flat Python list of vertex indices, three per triangle.
        positions, velocities: float32 arrays with one row per particle.
        inv_masses: float32 array, ``1 / mass`` or ``0`` for pinned corners.
        spring_indices: flat int32 array, two particle indices per spring.
        spring_lengths, spring_stiffness, spring_damping: float32, per spring.
        num_particles, num_springs, num_tris: element counts.
    """

    def __init__(
        self, lower, dx, dy, radius, stretch_stiffness, bend_stiffness, shear_stiffness, mass, fix_corners=True
    ):
        def node(col, row):
            # flattened particle index of grid cell (col, row)
            return row * dx + col

        points = []
        inverse_masses = []
        tri_indices = []

        for row in range(dy):
            for col in range(dx):
                offset = np.array((float(col), float(0.0), float(row)))
                points.append(np.array(lower) + radius * offset)

                # two triangles covering the cell whose far corner is (col, row)
                if col > 0 and row > 0:
                    tri_indices.extend(
                        (
                            node(col - 1, row - 1),
                            node(col, row - 1),
                            node(col, row),
                            node(col - 1, row - 1),
                            node(col, row),
                            node(col - 1, row),
                        )
                    )

                # the two corners of the first row are pinned (zero inverse mass)
                pinned = fix_corners and row == 0 and (col == 0 or col == dx - 1)
                inverse_masses.append(0.0 if pinned else 1.0 / mass)

        # (particle i, particle j, stiffness) in creation order; the order is
        # significant because it fixes the layout of the per-spring arrays
        links = []

        # row-wise pass: stretch, bend and both shear diagonals
        for row in range(dy):
            for col in range(dx):
                here = node(col, row)

                if col > 0:
                    links.append((here, node(col - 1, row), stretch_stiffness))

                if col > 1 and bend_stiffness > 0.0:
                    links.append((here, node(col - 2, row), bend_stiffness))

                if row > 0 and col < dx - 1 and shear_stiffness > 0.0:
                    links.append((here, node(col + 1, row - 1), shear_stiffness))

                if row > 0 and col > 0 and shear_stiffness > 0.0:
                    links.append((here, node(col - 1, row - 1), shear_stiffness))

        # column-wise pass: stretch and bend only
        for col in range(dx):
            for row in range(dy):
                here = node(col, row)

                if row > 0:
                    links.append((here, node(col, row - 1), stretch_stiffness))

                if row > 1 and bend_stiffness > 0.0:
                    links.append((here, node(col, row - 2), bend_stiffness))

        # rest lengths are measured on the un-rounded positions before the
        # float32 conversion below
        rest_lengths = [np.linalg.norm(np.array(points[i]) - np.array(points[j])) for i, j, _ in links]
        flat_indices = [index for i, j, _ in links for index in (i, j)]

        self.triangles = tri_indices

        # harden to np arrays
        self.positions = np.array(points, dtype=np.float32)
        self.velocities = np.array([np.zeros(3) for _ in points], dtype=np.float32)
        self.inv_masses = np.array(inverse_masses, dtype=np.float32)
        self.spring_lengths = np.array(rest_lengths, dtype=np.float32)
        self.spring_indices = np.array(flat_indices, dtype=np.int32)
        self.spring_stiffness = np.array([stiffness for _, _, stiffness in links], dtype=np.float32)
        self.spring_damping = np.array([10.0] * len(links), dtype=np.float32)

        self.num_particles = len(self.positions)
        self.num_springs = len(self.spring_lengths)
        self.num_tris = len(self.triangles) // 3
126
+
127
+
128
def _create_integrator(mode, cloth):
    """Import the backend module selected by ``mode`` and build its integrator.

    Raises:
        RuntimeError: if ``mode`` is not one of the known backend names.
    """
    import importlib

    # mode -> (module name, integrator class, extra constructor args, JAX platform)
    backends = {
        "warp_cpu": ("benchmark_cloth_warp", "WpIntegrator", ("cpu",), None),
        "warp_gpu": ("benchmark_cloth_warp", "WpIntegrator", ("cuda",), None),
        "taichi_cpu": ("benchmark_cloth_taichi", "TiIntegrator", ("cpu",), None),
        "taichi_gpu": ("benchmark_cloth_taichi", "TiIntegrator", ("cuda",), None),
        "numpy": ("benchmark_cloth_numpy", "NpIntegrator", (), None),
        "cupy": ("benchmark_cloth_cupy", "CpIntegrator", (), None),
        "numba": ("benchmark_cloth_numba", "NbIntegrator", (), None),
        "torch_cpu": ("benchmark_cloth_pytorch", "TrIntegrator", ("cpu",), None),
        "torch_gpu": ("benchmark_cloth_pytorch", "TrIntegrator", ("cuda",), None),
        "jax_cpu": ("benchmark_cloth_jax", "JxIntegrator", (), "cpu"),
        "jax_gpu": ("benchmark_cloth_jax", "JxIntegrator", (), "gpu"),
        "paddle_cpu": ("benchmark_cloth_paddle", "TrIntegrator", ("cpu",), None),
        "paddle_gpu": ("benchmark_cloth_paddle", "TrIntegrator", ("gpu",), None),
    }

    try:
        module_name, class_name, extra_args, jax_platform = backends[mode]
    except (KeyError, TypeError):
        raise RuntimeError(f"Unknown simulation backend: {mode!r}") from None

    # the platform must be selected before the JAX benchmark module is imported
    if jax_platform is not None:
        os.environ["JAX_PLATFORM_NAME"] = jax_platform

    # backends are imported lazily so only the selected framework must be installed
    backend_module = importlib.import_module(module_name)
    return getattr(backend_module, class_name)(cloth, *extra_args)


def run_benchmark(mode, dim, timers, render=False):
    """Simulate a ``dim`` x ``dim`` cloth for one second with the chosen backend.

    Args:
        mode: backend name, e.g. ``"warp_gpu"``, ``"numpy"``, ``"torch_cpu"``.
        dim: number of particles along each side of the cloth grid.
        timers: dictionary handed to ``wp.ScopedTimer(dict=...)``; timings are
            recorded under ``"Initialization"`` and ``"Dim (<dim>^2)"``
            (presumably appended as lists of elapsed times - confirm against
            ``wp.ScopedTimer``).
        render: when true, write the animated mesh to ``benchmark.usd``.

    Raises:
        RuntimeError: if ``mode`` does not name a known backend.
    """
    # params
    sim_width = dim
    sim_height = dim

    sim_fps = 60.0
    sim_substeps = 16
    sim_duration = 1.0
    sim_frames = int(sim_duration * sim_fps)
    sim_dt = 1.0 / sim_fps

    # cloth spring constants
    k_stretch = 1000.0
    k_shear = 1000.0
    k_bend = 1000.0

    cloth = Cloth(
        lower=(0.0, 0.0, 0.0),
        dx=sim_width,
        dy=sim_height,
        radius=0.1,
        stretch_stiffness=k_stretch,
        bend_stiffness=k_bend,
        shear_stiffness=k_shear,
        mass=0.1,
        fix_corners=True,
    )

    if render:
        # set up grid for visualization
        stage = Usd.Stage.CreateNew("benchmark.usd")
        stage.SetStartTimeCode(0.0)
        stage.SetEndTimeCode(sim_duration * sim_fps)
        stage.SetFramesPerSecond(sim_fps)

        grid = UsdGeom.Mesh.Define(stage, "/root")
        grid.GetPointsAttr().Set(cloth.positions, 0.0)
        grid.GetFaceVertexIndicesAttr().Set(cloth.triangles, 0.0)
        grid.GetFaceVertexCountsAttr().Set([3] * cloth.num_tris, 0.0)

    with wp.ScopedTimer("Initialization", dict=timers):
        integrator = _create_integrator(mode, cloth)

        # run one warm-up iteration to accurately measure initialization time (some engines do lazy init)
        positions = integrator.simulate(sim_dt, sim_substeps)

    label = f"Dim ({dim}^2)"

    # run simulation
    for frame in range(sim_frames):
        # simulate
        with wp.ScopedTimer(label, dict=timers):
            positions = integrator.simulate(sim_dt, sim_substeps)

        if render:
            # key the sample on the frame index: accumulating sim_dt and
            # multiplying back by sim_fps drifts off the integer time codes
            grid.GetPointsAttr().Set(positions, float(frame))

    if render:
        stage.Save()
261
+
262
+
263
# record profiling information
timers = {}

# the backend is chosen by the first command-line argument (default: Warp on GPU)
mode = sys.argv[1] if len(sys.argv) > 1 else "warp_gpu"

run_benchmark(mode, 32, timers, render=False)
run_benchmark(mode, 64, timers, render=False)
run_benchmark(mode, 128, timers, render=False)

# write results

for k, v in timers.items():
    print(f"{k:16} min: {np.min(v):8.2f} max: {np.max(v):8.2f} avg: {np.mean(v):8.2f}")

# Append one row per run to benchmark.csv in the current working directory.
# newline="" is required by the csv module so it controls line endings itself,
# and the with-block closes the file even if a timer entry is missing.
with open("benchmark.csv", "a", newline="") as report:
    writer = csv.writer(report, delimiter=",")

    # an empty file has no header row yet
    if report.tell() == 0:
        writer.writerow(["Name", "Init", "Dim (32^2)", "Dim (64^2)", "Dim (128^2)"])

    writer.writerow(
        [
            mode,
            np.max(timers["Initialization"]),
            np.mean(timers["Dim (32^2)"]),
            np.mean(timers["Dim (64^2)"]),
            np.mean(timers["Dim (128^2)"]),
        ]
    )
@@ -0,0 +1,96 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import cupy as cp
17
+ import cupyx as cpx
18
+
19
+
20
def eval_springs(x, v, indices, rest, ke, kd, f):
    """Accumulate damped spring forces into ``f`` in place.

    Each row of ``indices`` holds the two particle indices joined by one
    spring. The scalar force of a spring is
    ``ke * (length - rest) + kd * d(length)/dt`` and acts along the unit
    vector pointing from the second particle towards the first. The first
    particle receives the negated force vector and the second particle the
    force vector itself.

    Nothing is returned; ``f`` is updated through ``cupyx.scatter_add``.
    """
    first = indices[:, 0]
    second = indices[:, 1]

    # relative position and velocity of the two end points of every spring
    delta_x = x[first] - x[second]
    delta_v = v[first] - v[second]

    length = cp.linalg.norm(delta_x, axis=1)
    inv_length = 1.0 / length

    # normalized spring direction
    unit = (delta_x.T * inv_length).T

    stretch = length - rest
    stretch_rate = cp.sum(unit * delta_v, axis=1)

    # elastic term plus damping based on relative velocity
    force = unit.T * (ke * stretch + kd * stretch_rate)

    # scatter_add accumulates correctly when a particle index occurs several times
    cpx.scatter_add(f, first, -force.T)
    cpx.scatter_add(f, second, force.T)
47
+
48
+
49
def integrate_particles(x, v, f, w, dt):
    """Advance ``x`` and ``v`` in place by one time step ``dt`` and reset ``f``.

    ``w`` is used as a per-particle multiplier on the force (the callers in
    this file pass inverse masses). Gravity is only applied to particles
    whose ``w`` is positive. Nothing is returned.
    """
    gravity = cp.array((0.0, 0.0 - 9.8, 0.0))
    movable = w > 0.0

    # one gravity row per particle, zeroed where w is not positive
    external_accel = gravity * movable[:, None]

    # simple semi-implicit Euler. v1 = v0 + a dt, x1 = x0 + v1 dt
    accel = (f.T * w).T + external_accel
    v += accel * dt
    x += v * dt

    # clear forces
    f *= 0.0
61
+
62
+
63
class CpIntegrator:
    """Cloth integrator that keeps the simulation state in CuPy arrays."""

    def __init__(self, cloth):
        """Copy the particle and spring data of ``cloth`` into CuPy arrays."""
        self.cloth = cloth

        # particle state
        self.positions = cp.array(cloth.positions)
        self.velocities = cp.array(cloth.velocities)
        self.inv_mass = cp.array(cloth.inv_masses)

        # spring topology and material parameters
        self.spring_indices = cp.array(cloth.spring_indices)
        self.spring_lengths = cp.array(cloth.spring_lengths)
        self.spring_stiffness = cp.array(cloth.spring_stiffness)
        self.spring_damping = cp.array(cloth.spring_damping)

        # force accumulator, one 3-vector per particle
        self.forces = cp.zeros((cloth.num_particles, 3), dtype=cp.float32)

    def simulate(self, dt, substeps):
        """Advance the cloth by ``dt`` using ``substeps`` equal sub-steps.

        Returns the result of ``self.positions.get()``, i.e. the positions
        copied off the device after the last sub-step.
        """
        step = dt / substeps

        # view the spring indices as one (first, second) pair per spring
        pairs = self.spring_indices.reshape((self.cloth.num_springs, 2))

        for _ in range(substeps):
            # accumulate spring forces into self.forces
            eval_springs(
                self.positions,
                self.velocities,
                pairs,
                self.spring_lengths,
                self.spring_stiffness,
                self.spring_damping,
                self.forces,
            )

            # integrate (this also clears self.forces for the next sub-step)
            integrate_particles(self.positions, self.velocities, self.forces, self.inv_mass, step)

        return self.positions.get()
@@ -0,0 +1,105 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import jax.lax
17
+ import jax.numpy as jnp
18
+ import numpy as np
19
+
20
+
21
@jax.jit
def eval_springs(x, v, indices, rest, ke, kd):
    """Return the per-particle spring forces for the given state.

    Each row of ``indices`` holds the two particle indices joined by one
    spring. The scalar force of a spring is
    ``ke * (length - rest) + kd * d(length)/dt`` and acts along the unit
    vector pointing from the second particle towards the first. The first
    particle receives the negated force vector and the second particle the
    force vector itself.

    Returns:
        An array shaped like ``v`` holding the summed force on every particle.
    """
    i = indices[:, 0]
    j = indices[:, 1]

    # relative position and velocity of the two end points of every spring
    xij = x[i] - x[j]
    vij = v[i] - v[j]

    length = jnp.linalg.norm(xij, axis=1)
    inv_length = 1.0 / length

    # normalized spring direction
    direction = (xij.T * inv_length).T

    c = length - rest
    dcdt = jnp.sum(direction * vij, axis=1)

    # elastic term plus damping based on relative velocity
    fs = direction.T * (ke * c + kd * dcdt)

    # JAX arrays are immutable: .at[...].add() returns a new array instead of
    # modifying f, so the result has to be rebound or the forces are lost.
    f = jnp.zeros_like(v)
    f = f.at[i].add(-fs.T)
    f = f.at[j].add(fs.T)

    return f
56
+
57
+
58
@jax.jit
def integrate_particles(x, v, f, w, dt):
    """Return the positions and velocities after one time step ``dt``.

    ``w`` is used as a per-particle multiplier on the force (the caller in
    this file passes inverse masses). Gravity is only applied to particles
    whose ``w`` is positive.

    Returns:
        A tuple ``(x, v)`` with the updated positions and velocities.
    """
    gravity = jnp.array((0.0, 0.0 - 9.8, 0.0))
    movable = w > 0.0

    # one gravity row per particle, zeroed where w is not positive
    external_accel = gravity * movable[:, None]

    # simple semi-implicit Euler. v1 = v0 + a dt, x1 = x0 + v1 dt
    next_v = v + ((f.T * w).T + external_accel) * dt
    next_x = x + next_v * dt

    return (next_x, next_v)
70
+
71
+
72
class JxIntegrator:
    """Cloth integrator that keeps the simulation state in JAX arrays."""

    def __init__(self, cloth):
        """Copy the particle and spring data of ``cloth`` into JAX arrays."""
        self.cloth = cloth

        # particle state
        self.positions = jnp.array(cloth.positions)
        self.velocities = jnp.array(cloth.velocities)
        self.inv_mass = jnp.array(cloth.inv_masses)

        # Report the device that holds the state. Array.devices() is used
        # because the device_buffer property is not available on jax.Array in
        # current JAX releases.
        print(next(iter(self.positions.devices())))

        # spring topology and material parameters
        self.spring_indices = jnp.array(cloth.spring_indices)
        self.spring_lengths = jnp.array(cloth.spring_lengths)
        self.spring_stiffness = jnp.array(cloth.spring_stiffness)
        self.spring_damping = jnp.array(cloth.spring_damping)

    def simulate(self, dt, substeps):
        """Advance the cloth by ``dt`` using ``substeps`` equal sub-steps.

        Returns:
            The positions after the last sub-step, converted to a NumPy array.
        """
        sim_dt = dt / substeps

        for _s in range(substeps):
            # spring forces for the current state (returned as a new array)
            f = eval_springs(
                self.positions,
                self.velocities,
                self.spring_indices.reshape((self.cloth.num_springs, 2)),
                self.spring_lengths,
                self.spring_stiffness,
                self.spring_damping,
            )

            # integrate; the state is rebound to the arrays that are returned
            (self.positions, self.velocities) = integrate_particles(
                self.positions, self.velocities, f, self.inv_mass, sim_dt
            )

        return np.array(self.positions)
@@ -0,0 +1,161 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import math
17
+
18
+ import cupy as cp
19
+ import numpy as np
20
+ from numba import cuda, float32
21
+
22
+ # Notes:
23
+ #
24
+ # Current implementation requires some familiarity with writing custom CUDA kernels.
25
+ # May be improved with cuda ufuncs and/or writing custom numba type extensions.
26
+
27
+
28
@cuda.jit(device=True)
def norm(x):
    """Return the Euclidean length of the first three components of ``x``."""
    # accumulate the squared length in single precision
    sum_sq = float32(0.0)
    for axis in range(3):
        sum_sq += x[axis] * x[axis]
    return math.sqrt(sum_sq)
34
+
35
+
36
@cuda.jit(device=True)
def dot(x, y):
    """Return the dot product of the first three components of ``x`` and ``y``."""
    # accumulate the products in single precision
    acc = float32(0.0)
    for axis in range(3):
        acc += x[axis] * y[axis]
    return acc
42
+
43
+
44
@cuda.jit
def eval_springs_cuda(
    num_springs,  # number of springs
    xs,  # position (N, 3)
    vs,  # velocities (N, 3)
    indices,  # spring indices (S, 2)
    rests,  # spring rest length (S,)
    kes,  # stiffness (S,)
    kds,  # damping (S,)
    fs,  # forces (N, 3)
):
    """Accumulate damped spring forces into ``fs``, one thread per spring.

    The scalar force of a spring is ``ke * (length - rest) + kd * d(length)/dt``
    and acts along the unit vector pointing from the second particle towards
    the first. The first particle receives the negated force vector and the
    second particle the force vector itself, both through atomic adds.
    """
    spring = cuda.grid(1)

    # threads beyond the last spring have nothing to do
    if spring >= num_springs:
        return

    first = indices[spring][0]
    second = indices[spring][1]
    x_first, x_second = xs[first], xs[second]
    v_first, v_second = vs[first], vs[second]
    rest, ke, kd = rests[spring], kes[spring], kds[spring]

    # relative position and velocity of the two end points
    xij = cuda.local.array(3, dtype=cp.float32)
    vij = cuda.local.array(3, dtype=cp.float32)
    for k in range(3):
        xij[k] = x_first[k] - x_second[k]
        vij[k] = v_first[k] - v_second[k]

    length = norm(xij)
    inv_length = float32(1.0) / length

    # normalized spring direction
    unit = cuda.local.array(3, dtype=cp.float32)
    for k in range(3):
        unit[k] = xij[k] * inv_length

    stretch = length - rest
    stretch_rate = dot(unit, vij)

    # mass-spring-damper model
    magnitude = ke * stretch + kd * stretch_rate
    force = cuda.local.array(3, dtype=cp.float32)
    for k in range(3):
        force[k] = unit[k] * magnitude

    # atomics are used because several springs can touch the same particle
    for k in range(3):
        cuda.atomic.add(fs[first], k, -force[k])
        cuda.atomic.add(fs[second], k, force[k])
90
+
91
+
92
# Host-side float32 3-vectors handed to cuda.const.array_like inside
# integrate_particles_cuda: the gravity acceleration and a zero vector.
# Support const array with cp array?
g = np.array([0.0, -9.8, 0.0], dtype=np.float32)
z = np.zeros(3, dtype=np.float32)
95
+
96
+
97
@cuda.jit
def integrate_particles_cuda(
    xs,  # position (N, 3)
    vs,  # velocity (N, 3)
    fs,  # force (N, 3)
    ws,  # inverse of mass (N,)
    dt,  # time step
):
    """Advance one particle per thread by ``dt`` and clear its force.

    Positions and velocities are updated in place with semi-implicit Euler.
    Gravity is only applied to particles whose inverse mass is positive.
    """
    particle = cuda.grid(1)

    # threads beyond the last particle have nothing to do
    if particle >= xs.shape[0]:
        return

    inv_mass = ws[particle]

    # external acceleration: gravity for particles with positive inverse mass, zero otherwise
    accel = cuda.const.array_like(g) if inv_mass > 0.0 else cuda.const.array_like(z)

    for axis in range(3):
        # vs[i] += ((f * w) + a) * dt (ideally)
        vs[particle, axis] = vs[particle, axis] + ((fs[particle, axis] * inv_mass) + accel[axis]) * dt
        # the position update reads back the velocity that was just stored
        xs[particle, axis] = xs[particle, axis] + vs[particle, axis] * dt

    # clear the force of this particle
    fs[particle] = 0.0
117
+
118
+
119
class NbIntegrator:
    """Cloth integrator that runs Numba CUDA kernels on CuPy arrays."""

    def __init__(self, cloth):
        """Copy the data of ``cloth`` into CuPy arrays and set the launch sizes."""
        self.cloth = cloth

        # particle state
        self.positions = cp.array(cloth.positions)
        self.velocities = cp.array(cloth.velocities)
        self.inv_mass = cp.array(cloth.inv_masses)

        # spring topology and material parameters
        self.spring_indices = cp.array(cloth.spring_indices)
        self.spring_lengths = cp.array(cloth.spring_lengths)
        self.spring_stiffness = cp.array(cloth.spring_stiffness)
        self.spring_damping = cp.array(cloth.spring_damping)

        # force accumulator, one 3-vector per particle
        self.forces = cp.zeros((cloth.num_particles, 3), dtype=cp.float32)

        self.num_particles = self.positions.shape[0]

        # launch configuration of the integration kernel: threads per block
        # and number of blocks (count // tpb + 1 always covers every particle)
        self.integrate_tpb = 4
        self.integrate_nb = self.num_particles // self.integrate_tpb + 1

        # launch configuration of the spring kernel, sized the same way
        self.spring_tpb = 4
        self.spring_nb = cloth.num_springs // self.spring_tpb + 1

    def simulate(self, dt, substeps):
        """Advance the cloth by ``dt`` using ``substeps`` equal sub-steps.

        Returns the result of ``self.positions.get()``, i.e. the positions
        copied off the device after the last sub-step.
        """
        step = dt / substeps

        spring_count = self.cloth.num_springs
        # view the spring indices as one (first, second) pair per spring
        pairs = self.spring_indices.reshape((spring_count, 2))

        spring_kernel = eval_springs_cuda[self.spring_nb, self.spring_tpb]
        integrate_kernel = integrate_particles_cuda[self.integrate_nb, self.integrate_tpb]

        for _ in range(substeps):
            # accumulate spring forces into self.forces
            spring_kernel(
                spring_count,
                self.positions,
                self.velocities,
                pairs,
                self.spring_lengths,
                self.spring_stiffness,
                self.spring_damping,
                self.forces,
            )

            # integrate (the kernel also clears the forces)
            integrate_kernel(self.positions, self.velocities, self.forces, self.inv_mass, step)

        return self.positions.get()