warp-lang 1.10.0__py3-none-macosx_11_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (468) hide show
  1. warp/__init__.py +334 -0
  2. warp/__init__.pyi +5856 -0
  3. warp/_src/__init__.py +14 -0
  4. warp/_src/autograd.py +1077 -0
  5. warp/_src/build.py +620 -0
  6. warp/_src/build_dll.py +642 -0
  7. warp/_src/builtins.py +10555 -0
  8. warp/_src/codegen.py +4361 -0
  9. warp/_src/config.py +178 -0
  10. warp/_src/constants.py +59 -0
  11. warp/_src/context.py +8352 -0
  12. warp/_src/dlpack.py +464 -0
  13. warp/_src/fabric.py +362 -0
  14. warp/_src/fem/__init__.py +14 -0
  15. warp/_src/fem/adaptivity.py +510 -0
  16. warp/_src/fem/cache.py +689 -0
  17. warp/_src/fem/dirichlet.py +190 -0
  18. warp/_src/fem/domain.py +553 -0
  19. warp/_src/fem/field/__init__.py +131 -0
  20. warp/_src/fem/field/field.py +703 -0
  21. warp/_src/fem/field/nodal_field.py +403 -0
  22. warp/_src/fem/field/restriction.py +39 -0
  23. warp/_src/fem/field/virtual.py +1021 -0
  24. warp/_src/fem/geometry/__init__.py +32 -0
  25. warp/_src/fem/geometry/adaptive_nanogrid.py +782 -0
  26. warp/_src/fem/geometry/closest_point.py +99 -0
  27. warp/_src/fem/geometry/deformed_geometry.py +277 -0
  28. warp/_src/fem/geometry/element.py +854 -0
  29. warp/_src/fem/geometry/geometry.py +693 -0
  30. warp/_src/fem/geometry/grid_2d.py +478 -0
  31. warp/_src/fem/geometry/grid_3d.py +539 -0
  32. warp/_src/fem/geometry/hexmesh.py +956 -0
  33. warp/_src/fem/geometry/nanogrid.py +660 -0
  34. warp/_src/fem/geometry/partition.py +483 -0
  35. warp/_src/fem/geometry/quadmesh.py +597 -0
  36. warp/_src/fem/geometry/tetmesh.py +762 -0
  37. warp/_src/fem/geometry/trimesh.py +588 -0
  38. warp/_src/fem/integrate.py +2507 -0
  39. warp/_src/fem/linalg.py +385 -0
  40. warp/_src/fem/operator.py +398 -0
  41. warp/_src/fem/polynomial.py +231 -0
  42. warp/_src/fem/quadrature/__init__.py +17 -0
  43. warp/_src/fem/quadrature/pic_quadrature.py +318 -0
  44. warp/_src/fem/quadrature/quadrature.py +665 -0
  45. warp/_src/fem/space/__init__.py +248 -0
  46. warp/_src/fem/space/basis_function_space.py +499 -0
  47. warp/_src/fem/space/basis_space.py +681 -0
  48. warp/_src/fem/space/dof_mapper.py +253 -0
  49. warp/_src/fem/space/function_space.py +312 -0
  50. warp/_src/fem/space/grid_2d_function_space.py +179 -0
  51. warp/_src/fem/space/grid_3d_function_space.py +229 -0
  52. warp/_src/fem/space/hexmesh_function_space.py +255 -0
  53. warp/_src/fem/space/nanogrid_function_space.py +199 -0
  54. warp/_src/fem/space/partition.py +435 -0
  55. warp/_src/fem/space/quadmesh_function_space.py +222 -0
  56. warp/_src/fem/space/restriction.py +221 -0
  57. warp/_src/fem/space/shape/__init__.py +152 -0
  58. warp/_src/fem/space/shape/cube_shape_function.py +1107 -0
  59. warp/_src/fem/space/shape/shape_function.py +134 -0
  60. warp/_src/fem/space/shape/square_shape_function.py +928 -0
  61. warp/_src/fem/space/shape/tet_shape_function.py +829 -0
  62. warp/_src/fem/space/shape/triangle_shape_function.py +674 -0
  63. warp/_src/fem/space/tetmesh_function_space.py +270 -0
  64. warp/_src/fem/space/topology.py +461 -0
  65. warp/_src/fem/space/trimesh_function_space.py +193 -0
  66. warp/_src/fem/types.py +114 -0
  67. warp/_src/fem/utils.py +488 -0
  68. warp/_src/jax.py +188 -0
  69. warp/_src/jax_experimental/__init__.py +14 -0
  70. warp/_src/jax_experimental/custom_call.py +389 -0
  71. warp/_src/jax_experimental/ffi.py +1286 -0
  72. warp/_src/jax_experimental/xla_ffi.py +658 -0
  73. warp/_src/marching_cubes.py +710 -0
  74. warp/_src/math.py +416 -0
  75. warp/_src/optim/__init__.py +14 -0
  76. warp/_src/optim/adam.py +165 -0
  77. warp/_src/optim/linear.py +1608 -0
  78. warp/_src/optim/sgd.py +114 -0
  79. warp/_src/paddle.py +408 -0
  80. warp/_src/render/__init__.py +14 -0
  81. warp/_src/render/imgui_manager.py +291 -0
  82. warp/_src/render/render_opengl.py +3638 -0
  83. warp/_src/render/render_usd.py +939 -0
  84. warp/_src/render/utils.py +162 -0
  85. warp/_src/sparse.py +2718 -0
  86. warp/_src/tape.py +1208 -0
  87. warp/_src/thirdparty/__init__.py +0 -0
  88. warp/_src/thirdparty/appdirs.py +598 -0
  89. warp/_src/thirdparty/dlpack.py +145 -0
  90. warp/_src/thirdparty/unittest_parallel.py +676 -0
  91. warp/_src/torch.py +393 -0
  92. warp/_src/types.py +5888 -0
  93. warp/_src/utils.py +1695 -0
  94. warp/autograd.py +33 -0
  95. warp/bin/libwarp-clang.dylib +0 -0
  96. warp/bin/libwarp.dylib +0 -0
  97. warp/build.py +29 -0
  98. warp/build_dll.py +24 -0
  99. warp/codegen.py +24 -0
  100. warp/constants.py +24 -0
  101. warp/context.py +33 -0
  102. warp/dlpack.py +24 -0
  103. warp/examples/__init__.py +24 -0
  104. warp/examples/assets/bear.usd +0 -0
  105. warp/examples/assets/bunny.usd +0 -0
  106. warp/examples/assets/cube.usd +0 -0
  107. warp/examples/assets/nonuniform.usd +0 -0
  108. warp/examples/assets/nvidia_logo.png +0 -0
  109. warp/examples/assets/pixel.jpg +0 -0
  110. warp/examples/assets/rocks.nvdb +0 -0
  111. warp/examples/assets/rocks.usd +0 -0
  112. warp/examples/assets/sphere.usd +0 -0
  113. warp/examples/assets/square_cloth.usd +0 -0
  114. warp/examples/benchmarks/benchmark_api.py +389 -0
  115. warp/examples/benchmarks/benchmark_cloth.py +296 -0
  116. warp/examples/benchmarks/benchmark_cloth_cupy.py +96 -0
  117. warp/examples/benchmarks/benchmark_cloth_jax.py +105 -0
  118. warp/examples/benchmarks/benchmark_cloth_numba.py +161 -0
  119. warp/examples/benchmarks/benchmark_cloth_numpy.py +85 -0
  120. warp/examples/benchmarks/benchmark_cloth_paddle.py +94 -0
  121. warp/examples/benchmarks/benchmark_cloth_pytorch.py +94 -0
  122. warp/examples/benchmarks/benchmark_cloth_taichi.py +120 -0
  123. warp/examples/benchmarks/benchmark_cloth_warp.py +153 -0
  124. warp/examples/benchmarks/benchmark_gemm.py +164 -0
  125. warp/examples/benchmarks/benchmark_interop_paddle.py +166 -0
  126. warp/examples/benchmarks/benchmark_interop_torch.py +166 -0
  127. warp/examples/benchmarks/benchmark_launches.py +301 -0
  128. warp/examples/benchmarks/benchmark_tile_load_store.py +103 -0
  129. warp/examples/benchmarks/benchmark_tile_sort.py +155 -0
  130. warp/examples/browse.py +37 -0
  131. warp/examples/core/example_cupy.py +86 -0
  132. warp/examples/core/example_dem.py +241 -0
  133. warp/examples/core/example_fluid.py +299 -0
  134. warp/examples/core/example_graph_capture.py +150 -0
  135. warp/examples/core/example_marching_cubes.py +195 -0
  136. warp/examples/core/example_mesh.py +180 -0
  137. warp/examples/core/example_mesh_intersect.py +211 -0
  138. warp/examples/core/example_nvdb.py +182 -0
  139. warp/examples/core/example_raycast.py +111 -0
  140. warp/examples/core/example_raymarch.py +205 -0
  141. warp/examples/core/example_render_opengl.py +290 -0
  142. warp/examples/core/example_sample_mesh.py +300 -0
  143. warp/examples/core/example_sph.py +411 -0
  144. warp/examples/core/example_spin_lock.py +93 -0
  145. warp/examples/core/example_torch.py +211 -0
  146. warp/examples/core/example_wave.py +269 -0
  147. warp/examples/core/example_work_queue.py +118 -0
  148. warp/examples/distributed/example_jacobi_mpi.py +506 -0
  149. warp/examples/fem/example_adaptive_grid.py +286 -0
  150. warp/examples/fem/example_apic_fluid.py +469 -0
  151. warp/examples/fem/example_burgers.py +261 -0
  152. warp/examples/fem/example_convection_diffusion.py +181 -0
  153. warp/examples/fem/example_convection_diffusion_dg.py +225 -0
  154. warp/examples/fem/example_darcy_ls_optimization.py +489 -0
  155. warp/examples/fem/example_deformed_geometry.py +172 -0
  156. warp/examples/fem/example_diffusion.py +196 -0
  157. warp/examples/fem/example_diffusion_3d.py +225 -0
  158. warp/examples/fem/example_diffusion_mgpu.py +225 -0
  159. warp/examples/fem/example_distortion_energy.py +228 -0
  160. warp/examples/fem/example_elastic_shape_optimization.py +387 -0
  161. warp/examples/fem/example_magnetostatics.py +242 -0
  162. warp/examples/fem/example_mixed_elasticity.py +293 -0
  163. warp/examples/fem/example_navier_stokes.py +263 -0
  164. warp/examples/fem/example_nonconforming_contact.py +300 -0
  165. warp/examples/fem/example_stokes.py +213 -0
  166. warp/examples/fem/example_stokes_transfer.py +262 -0
  167. warp/examples/fem/example_streamlines.py +357 -0
  168. warp/examples/fem/utils.py +1047 -0
  169. warp/examples/interop/example_jax_callable.py +146 -0
  170. warp/examples/interop/example_jax_ffi_callback.py +132 -0
  171. warp/examples/interop/example_jax_kernel.py +232 -0
  172. warp/examples/optim/example_diffray.py +561 -0
  173. warp/examples/optim/example_fluid_checkpoint.py +497 -0
  174. warp/examples/tile/example_tile_block_cholesky.py +502 -0
  175. warp/examples/tile/example_tile_cholesky.py +88 -0
  176. warp/examples/tile/example_tile_convolution.py +66 -0
  177. warp/examples/tile/example_tile_fft.py +55 -0
  178. warp/examples/tile/example_tile_filtering.py +113 -0
  179. warp/examples/tile/example_tile_matmul.py +85 -0
  180. warp/examples/tile/example_tile_mcgp.py +191 -0
  181. warp/examples/tile/example_tile_mlp.py +385 -0
  182. warp/examples/tile/example_tile_nbody.py +199 -0
  183. warp/fabric.py +24 -0
  184. warp/fem/__init__.py +173 -0
  185. warp/fem/adaptivity.py +26 -0
  186. warp/fem/cache.py +30 -0
  187. warp/fem/dirichlet.py +24 -0
  188. warp/fem/field/__init__.py +24 -0
  189. warp/fem/field/field.py +26 -0
  190. warp/fem/geometry/__init__.py +21 -0
  191. warp/fem/geometry/closest_point.py +31 -0
  192. warp/fem/linalg.py +38 -0
  193. warp/fem/operator.py +32 -0
  194. warp/fem/polynomial.py +29 -0
  195. warp/fem/space/__init__.py +22 -0
  196. warp/fem/space/basis_space.py +24 -0
  197. warp/fem/space/shape/__init__.py +68 -0
  198. warp/fem/space/topology.py +24 -0
  199. warp/fem/types.py +24 -0
  200. warp/fem/utils.py +32 -0
  201. warp/jax.py +29 -0
  202. warp/jax_experimental/__init__.py +29 -0
  203. warp/jax_experimental/custom_call.py +29 -0
  204. warp/jax_experimental/ffi.py +39 -0
  205. warp/jax_experimental/xla_ffi.py +24 -0
  206. warp/marching_cubes.py +24 -0
  207. warp/math.py +37 -0
  208. warp/native/array.h +1687 -0
  209. warp/native/builtin.h +2327 -0
  210. warp/native/bvh.cpp +562 -0
  211. warp/native/bvh.cu +826 -0
  212. warp/native/bvh.h +555 -0
  213. warp/native/clang/clang.cpp +541 -0
  214. warp/native/coloring.cpp +622 -0
  215. warp/native/crt.cpp +51 -0
  216. warp/native/crt.h +568 -0
  217. warp/native/cuda_crt.h +1058 -0
  218. warp/native/cuda_util.cpp +677 -0
  219. warp/native/cuda_util.h +313 -0
  220. warp/native/error.cpp +77 -0
  221. warp/native/error.h +36 -0
  222. warp/native/exports.h +2023 -0
  223. warp/native/fabric.h +246 -0
  224. warp/native/hashgrid.cpp +311 -0
  225. warp/native/hashgrid.cu +89 -0
  226. warp/native/hashgrid.h +240 -0
  227. warp/native/initializer_array.h +41 -0
  228. warp/native/intersect.h +1253 -0
  229. warp/native/intersect_adj.h +375 -0
  230. warp/native/intersect_tri.h +348 -0
  231. warp/native/mat.h +5189 -0
  232. warp/native/mathdx.cpp +93 -0
  233. warp/native/matnn.h +221 -0
  234. warp/native/mesh.cpp +266 -0
  235. warp/native/mesh.cu +406 -0
  236. warp/native/mesh.h +2097 -0
  237. warp/native/nanovdb/GridHandle.h +533 -0
  238. warp/native/nanovdb/HostBuffer.h +591 -0
  239. warp/native/nanovdb/NanoVDB.h +6246 -0
  240. warp/native/nanovdb/NodeManager.h +323 -0
  241. warp/native/nanovdb/PNanoVDB.h +3390 -0
  242. warp/native/noise.h +859 -0
  243. warp/native/quat.h +1664 -0
  244. warp/native/rand.h +342 -0
  245. warp/native/range.h +145 -0
  246. warp/native/reduce.cpp +174 -0
  247. warp/native/reduce.cu +363 -0
  248. warp/native/runlength_encode.cpp +79 -0
  249. warp/native/runlength_encode.cu +61 -0
  250. warp/native/scan.cpp +47 -0
  251. warp/native/scan.cu +55 -0
  252. warp/native/scan.h +23 -0
  253. warp/native/solid_angle.h +466 -0
  254. warp/native/sort.cpp +251 -0
  255. warp/native/sort.cu +286 -0
  256. warp/native/sort.h +35 -0
  257. warp/native/sparse.cpp +241 -0
  258. warp/native/sparse.cu +435 -0
  259. warp/native/spatial.h +1306 -0
  260. warp/native/svd.h +727 -0
  261. warp/native/temp_buffer.h +46 -0
  262. warp/native/tile.h +4124 -0
  263. warp/native/tile_radix_sort.h +1112 -0
  264. warp/native/tile_reduce.h +838 -0
  265. warp/native/tile_scan.h +240 -0
  266. warp/native/tuple.h +189 -0
  267. warp/native/vec.h +2199 -0
  268. warp/native/version.h +23 -0
  269. warp/native/volume.cpp +501 -0
  270. warp/native/volume.cu +68 -0
  271. warp/native/volume.h +970 -0
  272. warp/native/volume_builder.cu +483 -0
  273. warp/native/volume_builder.h +52 -0
  274. warp/native/volume_impl.h +70 -0
  275. warp/native/warp.cpp +1143 -0
  276. warp/native/warp.cu +4604 -0
  277. warp/native/warp.h +358 -0
  278. warp/optim/__init__.py +20 -0
  279. warp/optim/adam.py +24 -0
  280. warp/optim/linear.py +35 -0
  281. warp/optim/sgd.py +24 -0
  282. warp/paddle.py +24 -0
  283. warp/py.typed +0 -0
  284. warp/render/__init__.py +22 -0
  285. warp/render/imgui_manager.py +29 -0
  286. warp/render/render_opengl.py +24 -0
  287. warp/render/render_usd.py +24 -0
  288. warp/render/utils.py +24 -0
  289. warp/sparse.py +51 -0
  290. warp/tape.py +24 -0
  291. warp/tests/__init__.py +1 -0
  292. warp/tests/__main__.py +4 -0
  293. warp/tests/assets/curlnoise_golden.npy +0 -0
  294. warp/tests/assets/mlp_golden.npy +0 -0
  295. warp/tests/assets/pixel.npy +0 -0
  296. warp/tests/assets/pnoise_golden.npy +0 -0
  297. warp/tests/assets/spiky.usd +0 -0
  298. warp/tests/assets/test_grid.nvdb +0 -0
  299. warp/tests/assets/test_index_grid.nvdb +0 -0
  300. warp/tests/assets/test_int32_grid.nvdb +0 -0
  301. warp/tests/assets/test_vec_grid.nvdb +0 -0
  302. warp/tests/assets/torus.nvdb +0 -0
  303. warp/tests/assets/torus.usda +105 -0
  304. warp/tests/aux_test_class_kernel.py +34 -0
  305. warp/tests/aux_test_compile_consts_dummy.py +18 -0
  306. warp/tests/aux_test_conditional_unequal_types_kernels.py +29 -0
  307. warp/tests/aux_test_dependent.py +29 -0
  308. warp/tests/aux_test_grad_customs.py +29 -0
  309. warp/tests/aux_test_instancing_gc.py +26 -0
  310. warp/tests/aux_test_module_aot.py +7 -0
  311. warp/tests/aux_test_module_unload.py +23 -0
  312. warp/tests/aux_test_name_clash1.py +40 -0
  313. warp/tests/aux_test_name_clash2.py +40 -0
  314. warp/tests/aux_test_reference.py +9 -0
  315. warp/tests/aux_test_reference_reference.py +8 -0
  316. warp/tests/aux_test_square.py +16 -0
  317. warp/tests/aux_test_unresolved_func.py +22 -0
  318. warp/tests/aux_test_unresolved_symbol.py +22 -0
  319. warp/tests/cuda/__init__.py +0 -0
  320. warp/tests/cuda/test_async.py +676 -0
  321. warp/tests/cuda/test_conditional_captures.py +1147 -0
  322. warp/tests/cuda/test_ipc.py +124 -0
  323. warp/tests/cuda/test_mempool.py +233 -0
  324. warp/tests/cuda/test_multigpu.py +169 -0
  325. warp/tests/cuda/test_peer.py +139 -0
  326. warp/tests/cuda/test_pinned.py +84 -0
  327. warp/tests/cuda/test_streams.py +691 -0
  328. warp/tests/geometry/__init__.py +0 -0
  329. warp/tests/geometry/test_bvh.py +335 -0
  330. warp/tests/geometry/test_hash_grid.py +259 -0
  331. warp/tests/geometry/test_marching_cubes.py +294 -0
  332. warp/tests/geometry/test_mesh.py +318 -0
  333. warp/tests/geometry/test_mesh_query_aabb.py +392 -0
  334. warp/tests/geometry/test_mesh_query_point.py +935 -0
  335. warp/tests/geometry/test_mesh_query_ray.py +323 -0
  336. warp/tests/geometry/test_volume.py +1103 -0
  337. warp/tests/geometry/test_volume_write.py +346 -0
  338. warp/tests/interop/__init__.py +0 -0
  339. warp/tests/interop/test_dlpack.py +730 -0
  340. warp/tests/interop/test_jax.py +1673 -0
  341. warp/tests/interop/test_paddle.py +800 -0
  342. warp/tests/interop/test_torch.py +1001 -0
  343. warp/tests/run_coverage_serial.py +39 -0
  344. warp/tests/test_adam.py +162 -0
  345. warp/tests/test_arithmetic.py +1096 -0
  346. warp/tests/test_array.py +3756 -0
  347. warp/tests/test_array_reduce.py +156 -0
  348. warp/tests/test_assert.py +303 -0
  349. warp/tests/test_atomic.py +336 -0
  350. warp/tests/test_atomic_bitwise.py +209 -0
  351. warp/tests/test_atomic_cas.py +312 -0
  352. warp/tests/test_bool.py +220 -0
  353. warp/tests/test_builtins_resolution.py +732 -0
  354. warp/tests/test_closest_point_edge_edge.py +327 -0
  355. warp/tests/test_codegen.py +974 -0
  356. warp/tests/test_codegen_instancing.py +1495 -0
  357. warp/tests/test_compile_consts.py +215 -0
  358. warp/tests/test_conditional.py +298 -0
  359. warp/tests/test_context.py +35 -0
  360. warp/tests/test_copy.py +319 -0
  361. warp/tests/test_ctypes.py +618 -0
  362. warp/tests/test_dense.py +73 -0
  363. warp/tests/test_devices.py +127 -0
  364. warp/tests/test_enum.py +136 -0
  365. warp/tests/test_examples.py +424 -0
  366. warp/tests/test_fabricarray.py +998 -0
  367. warp/tests/test_fast_math.py +72 -0
  368. warp/tests/test_fem.py +2204 -0
  369. warp/tests/test_fixedarray.py +229 -0
  370. warp/tests/test_fp16.py +136 -0
  371. warp/tests/test_func.py +501 -0
  372. warp/tests/test_future_annotations.py +100 -0
  373. warp/tests/test_generics.py +656 -0
  374. warp/tests/test_grad.py +893 -0
  375. warp/tests/test_grad_customs.py +339 -0
  376. warp/tests/test_grad_debug.py +341 -0
  377. warp/tests/test_implicit_init.py +411 -0
  378. warp/tests/test_import.py +45 -0
  379. warp/tests/test_indexedarray.py +1140 -0
  380. warp/tests/test_intersect.py +103 -0
  381. warp/tests/test_iter.py +76 -0
  382. warp/tests/test_large.py +177 -0
  383. warp/tests/test_launch.py +411 -0
  384. warp/tests/test_lerp.py +151 -0
  385. warp/tests/test_linear_solvers.py +223 -0
  386. warp/tests/test_lvalue.py +427 -0
  387. warp/tests/test_map.py +526 -0
  388. warp/tests/test_mat.py +3515 -0
  389. warp/tests/test_mat_assign_copy.py +178 -0
  390. warp/tests/test_mat_constructors.py +573 -0
  391. warp/tests/test_mat_lite.py +122 -0
  392. warp/tests/test_mat_scalar_ops.py +2913 -0
  393. warp/tests/test_math.py +212 -0
  394. warp/tests/test_module_aot.py +287 -0
  395. warp/tests/test_module_hashing.py +258 -0
  396. warp/tests/test_modules_lite.py +70 -0
  397. warp/tests/test_noise.py +252 -0
  398. warp/tests/test_operators.py +299 -0
  399. warp/tests/test_options.py +129 -0
  400. warp/tests/test_overwrite.py +551 -0
  401. warp/tests/test_print.py +408 -0
  402. warp/tests/test_quat.py +2653 -0
  403. warp/tests/test_quat_assign_copy.py +145 -0
  404. warp/tests/test_rand.py +339 -0
  405. warp/tests/test_reload.py +303 -0
  406. warp/tests/test_rounding.py +157 -0
  407. warp/tests/test_runlength_encode.py +196 -0
  408. warp/tests/test_scalar_ops.py +133 -0
  409. warp/tests/test_smoothstep.py +108 -0
  410. warp/tests/test_snippet.py +318 -0
  411. warp/tests/test_sparse.py +845 -0
  412. warp/tests/test_spatial.py +2859 -0
  413. warp/tests/test_spatial_assign_copy.py +160 -0
  414. warp/tests/test_special_values.py +361 -0
  415. warp/tests/test_static.py +640 -0
  416. warp/tests/test_struct.py +901 -0
  417. warp/tests/test_tape.py +242 -0
  418. warp/tests/test_transient_module.py +93 -0
  419. warp/tests/test_triangle_closest_point.py +192 -0
  420. warp/tests/test_tuple.py +361 -0
  421. warp/tests/test_types.py +615 -0
  422. warp/tests/test_utils.py +594 -0
  423. warp/tests/test_vec.py +1408 -0
  424. warp/tests/test_vec_assign_copy.py +143 -0
  425. warp/tests/test_vec_constructors.py +325 -0
  426. warp/tests/test_vec_lite.py +80 -0
  427. warp/tests/test_vec_scalar_ops.py +2327 -0
  428. warp/tests/test_verify_fp.py +100 -0
  429. warp/tests/test_version.py +75 -0
  430. warp/tests/tile/__init__.py +0 -0
  431. warp/tests/tile/test_tile.py +1519 -0
  432. warp/tests/tile/test_tile_atomic_bitwise.py +403 -0
  433. warp/tests/tile/test_tile_cholesky.py +608 -0
  434. warp/tests/tile/test_tile_load.py +724 -0
  435. warp/tests/tile/test_tile_mathdx.py +156 -0
  436. warp/tests/tile/test_tile_matmul.py +179 -0
  437. warp/tests/tile/test_tile_mlp.py +400 -0
  438. warp/tests/tile/test_tile_reduce.py +950 -0
  439. warp/tests/tile/test_tile_shared_memory.py +376 -0
  440. warp/tests/tile/test_tile_sort.py +121 -0
  441. warp/tests/tile/test_tile_view.py +173 -0
  442. warp/tests/unittest_serial.py +47 -0
  443. warp/tests/unittest_suites.py +430 -0
  444. warp/tests/unittest_utils.py +469 -0
  445. warp/tests/walkthrough_debug.py +95 -0
  446. warp/torch.py +24 -0
  447. warp/types.py +51 -0
  448. warp/utils.py +31 -0
  449. warp_lang-1.10.0.dist-info/METADATA +459 -0
  450. warp_lang-1.10.0.dist-info/RECORD +468 -0
  451. warp_lang-1.10.0.dist-info/WHEEL +5 -0
  452. warp_lang-1.10.0.dist-info/licenses/LICENSE.md +176 -0
  453. warp_lang-1.10.0.dist-info/licenses/licenses/Gaia-LICENSE.txt +6 -0
  454. warp_lang-1.10.0.dist-info/licenses/licenses/appdirs-LICENSE.txt +22 -0
  455. warp_lang-1.10.0.dist-info/licenses/licenses/asset_pixel_jpg-LICENSE.txt +3 -0
  456. warp_lang-1.10.0.dist-info/licenses/licenses/cuda-LICENSE.txt +1582 -0
  457. warp_lang-1.10.0.dist-info/licenses/licenses/dlpack-LICENSE.txt +201 -0
  458. warp_lang-1.10.0.dist-info/licenses/licenses/fp16-LICENSE.txt +28 -0
  459. warp_lang-1.10.0.dist-info/licenses/licenses/libmathdx-LICENSE.txt +220 -0
  460. warp_lang-1.10.0.dist-info/licenses/licenses/llvm-LICENSE.txt +279 -0
  461. warp_lang-1.10.0.dist-info/licenses/licenses/moller-LICENSE.txt +16 -0
  462. warp_lang-1.10.0.dist-info/licenses/licenses/nanovdb-LICENSE.txt +2 -0
  463. warp_lang-1.10.0.dist-info/licenses/licenses/nvrtc-LICENSE.txt +1592 -0
  464. warp_lang-1.10.0.dist-info/licenses/licenses/svd-LICENSE.txt +23 -0
  465. warp_lang-1.10.0.dist-info/licenses/licenses/unittest_parallel-LICENSE.txt +21 -0
  466. warp_lang-1.10.0.dist-info/licenses/licenses/usd-LICENSE.txt +213 -0
  467. warp_lang-1.10.0.dist-info/licenses/licenses/windingnumber-LICENSE.txt +21 -0
  468. warp_lang-1.10.0.dist-info/top_level.txt +1 -0
warp/_src/math.py ADDED
@@ -0,0 +1,416 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from typing import Any
17
+
18
+ import warp as wp
19
+
20
+ """
21
+ Vector norm functions
22
+ """
23
+
24
# Module name associated with the functions defined in this file.
# NOTE(review): presumably read by Warp so that these functions are attributed to the
# public ``warp.math`` module rather than ``warp._src.math`` — confirm against Warp's
# module-resolution code.
_wp_module_name_ = "warp.math"

# Public names exported by this module; each one is defined further down in this file.
__all__ = [
    "norm_huber",
    "norm_l1",
    "norm_l2",
    "norm_pseudo_huber",
    "smooth_normalize",
    "transform_compose",
    "transform_decompose",
    "transform_from_matrix",
    "transform_to_matrix",
]
37
+
38
+
39
@wp.func
def norm_l1(v: Any):
    """
    Return the L1 norm of a vector ``v``, i.e. the sum of the absolute values of its components.

    .. math:: \\|v\\|_1 = \\sum_i |v_i|

    Args:
        v (Vector[Any,Float]): The vector whose L1 norm is computed.

    Returns:
        float: The sum of ``|v_i|`` over all components of ``v``.
    """
    # running sum of the absolute component values
    total = float(0.0)
    for idx in range(len(v)):
        total += wp.abs(v[idx])
    return total
56
+
57
+
58
+ @wp.func
59
+ def norm_l2(v: Any):
60
+ """
61
+ Computes the L2 norm of a vector v.
62
+
63
+ .. math:: \\|v\\|_2 = \\sqrt{\\sum_i v_i^2}
64
+
65
+ Args:
66
+ v (Vector[Any,Float]): The vector to compute the L2 norm of.
67
+
68
+ Returns:
69
+ float: The L2 norm of the vector.
70
+ """
71
+ return wp.length(v)
72
+
73
+
74
+ @wp.func
75
+ def norm_huber(v: Any, delta: float = 1.0):
76
+ """
77
+ Computes the Huber norm of a vector v with a given delta.
78
+
79
+ .. math::
80
+ H(v) = \\begin{cases} \\frac{1}{2} \\|v\\|^2 & \\text{if } \\|v\\| \\leq \\delta \\\\ \\delta(\\|v\\| - \\frac{1}{2}\\delta) & \\text{otherwise} \\end{cases}
81
+
82
+ .. image:: /img/norm_huber.svg
83
+ :align: center
84
+
85
+ Args:
86
+ v (Vector[Any,Float]): The vector to compute the Huber norm of.
87
+ delta (float): The threshold value, defaults to 1.0.
88
+
89
+ Returns:
90
+ float: The Huber norm of the vector.
91
+ """
92
+ a = wp.dot(v, v)
93
+ if a <= delta * delta:
94
+ return 0.5 * a
95
+ return delta * (wp.sqrt(a) - 0.5 * delta)
96
+
97
+
98
+ @wp.func
99
+ def norm_pseudo_huber(v: Any, delta: float = 1.0):
100
+ """
101
+ Computes the "pseudo" Huber norm of a vector v with a given delta.
102
+
103
+ .. math::
104
+ H^\\prime(v) = \\delta \\sqrt{1 + \\frac{\\|v\\|^2}{\\delta^2}}
105
+
106
+ .. image:: /img/norm_pseudo_huber.svg
107
+ :align: center
108
+
109
+ Args:
110
+ v (Vector[Any,Float]): The vector to compute the Huber norm of.
111
+ delta (float): The threshold value, defaults to 1.0.
112
+
113
+ Returns:
114
+ float: The Huber norm of the vector.
115
+ """
116
+ a = wp.dot(v, v)
117
+ return delta * wp.sqrt(1.0 + a / (delta * delta))
118
+
119
+
120
+ @wp.func
121
+ def smooth_normalize(v: Any, delta: float = 1.0):
122
+ """
123
+ Normalizes a vector using the pseudo-Huber norm.
124
+
125
+ See :func:`norm_pseudo_huber`.
126
+
127
+ .. math::
128
+ \\frac{v}{H^\\prime(v)}
129
+
130
+ Args:
131
+ v (Vector[Any,Float]): The vector to normalize.
132
+ delta (float): The threshold value, defaults to 1.0.
133
+
134
+ Returns:
135
+ Vector[Any,Float]: The normalized vector.
136
+ """
137
+ return v / norm_pseudo_huber(v, delta)
138
+
139
+
140
def create_transform_from_matrix_func(dtype):
    """
    Build the ``transform_from_matrix`` implementation specialized for the scalar type ``dtype``.

    Args:
        dtype: Scalar type used to construct the 4x4 matrix, 3D vector, and transformation
            types that annotate and are used by the returned function.

    Returns:
        The nested Python function ``transform_from_matrix``; it is not wrapped with
        ``wp.func`` here.
    """
    # concrete types for this scalar type; they are captured by the nested function below
    mat44 = wp._src.types.matrix((4, 4), dtype)
    vec3 = wp._src.types.vector(3, dtype)
    transform = wp._src.types.transformation(dtype)

    def transform_from_matrix(mat: mat44) -> transform:
        """
        Construct a transformation from a 4x4 matrix.

        .. math::
            M = \\begin{bmatrix}
                    R_{00} & R_{01} & R_{02} & p_x \\\\
                    R_{10} & R_{11} & R_{12} & p_y \\\\
                    R_{20} & R_{21} & R_{22} & p_z \\\\
                    0 & 0 & 0 & 1
                \\end{bmatrix}

        Where:

        * :math:`R` is the 3x3 rotation part of the input matrix; the orientation quaternion of the returned transform is obtained by passing the matrix to ``wp.quat_from_matrix``.
        * :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` read from the last column of the input matrix.

        Args:
            mat (Matrix[4, 4, Float]): Matrix to convert.

        Returns:
            Transformation[Float]: The transformation.
        """
        # translation: first three entries of the last column
        p = vec3(mat[0][3], mat[1][3], mat[2][3])
        # orientation: the full 4x4 matrix is handed to quat_from_matrix
        q = wp.quat_from_matrix(mat)
        return transform(p, q)

    return transform_from_matrix
173
+
174
+
175
# Wrap the float32 specialization with ``wp.func`` and bind it to the module-level name
# ``transform_from_matrix``.
transform_from_matrix = wp.func(
    create_transform_from_matrix_func(wp.float32),
    name="transform_from_matrix",
)
# The float16 and float64 specializations are wrapped under the same name and the return
# values are discarded.
# NOTE(review): presumably Warp records these as additional overloads of the function
# above — confirm against the ``wp.func`` documentation.
wp.func(
    create_transform_from_matrix_func(wp.float16),
    name="transform_from_matrix",
)
wp.func(
    create_transform_from_matrix_func(wp.float64),
    name="transform_from_matrix",
)
187
+
188
+
189
def create_transform_to_matrix_func(dtype):
    """
    Build the ``transform_to_matrix`` implementation specialized for the scalar type ``dtype``.

    Args:
        dtype: Scalar type used to construct the 4x4 matrix and transformation types that
            annotate the returned function; it is also called to create the constants of the
            matrix's last row.

    Returns:
        The nested Python function ``transform_to_matrix``; it is not wrapped with
        ``wp.func`` here.
    """
    # concrete types for this scalar type; they are captured by the nested function below
    mat44 = wp._src.types.matrix((4, 4), dtype)
    transform = wp._src.types.transformation(dtype)

    def transform_to_matrix(xform: transform) -> mat44:
        """
        Convert a transformation to a 4x4 matrix.

        .. math::
            M = \\begin{bmatrix}
                    R_{00} & R_{01} & R_{02} & p_x \\\\
                    R_{10} & R_{11} & R_{12} & p_y \\\\
                    R_{20} & R_{21} & R_{22} & p_z \\\\
                    0 & 0 & 0 & 1
                \\end{bmatrix}

        Where:

        * :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
        * :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.

        Args:
            xform (Transformation[Float]): Transformation to convert.

        Returns:
            Matrix[4, 4, Float]: The matrix.
        """
        # split the transform into its translation and rotation parts
        p = wp.transform_get_translation(xform)
        q = wp.transform_get_rotation(xform)
        rot = wp.quat_to_matrix(q)
        # rotation goes in the upper-left 3x3 block, translation in the last column,
        # and the last row is the constant (0, 0, 0, 1) created in the requested scalar type
        # fmt: off
        return mat44(
            rot[0][0], rot[0][1], rot[0][2], p[0],
            rot[1][0], rot[1][1], rot[1][2], p[1],
            rot[2][0], rot[2][1], rot[2][2], p[2],
            dtype(0.0), dtype(0.0), dtype(0.0), dtype(1.0),
        )
        # fmt: on

    return transform_to_matrix
229
+
230
+
231
# Wrap the float32 specialization with ``wp.func`` and bind it to the module-level name
# ``transform_to_matrix``.
transform_to_matrix = wp.func(
    create_transform_to_matrix_func(wp.float32),
    name="transform_to_matrix",
)
# The float16 and float64 specializations are wrapped under the same name and the return
# values are discarded.
# NOTE(review): presumably Warp records these as additional overloads of the function
# above — confirm against the ``wp.func`` documentation.
wp.func(
    create_transform_to_matrix_func(wp.float16),
    name="transform_to_matrix",
)
wp.func(
    create_transform_to_matrix_func(wp.float64),
    name="transform_to_matrix",
)
243
+
244
+
245
def create_transform_compose_func(dtype):
    """
    Build the ``transform_compose`` implementation specialized for the scalar type ``dtype``.

    Args:
        dtype: Scalar type used to construct the 4x4 matrix, quaternion, and 3D vector types
            that the returned function uses; it is also called to create the constants of the
            matrix's last row.

    Returns:
        The nested Python function ``transform_compose``; it is not wrapped with
        ``wp.func`` here.
    """
    # concrete types for this scalar type; they are captured by the nested function below
    mat44 = wp._src.types.matrix((4, 4), dtype)
    quat = wp._src.types.quaternion(dtype)
    vec3 = wp._src.types.vector(3, dtype)

    def transform_compose(position: vec3, rotation: quat, scale: vec3):
        """
        Compose a 4x4 transformation matrix from a 3D position, quaternion orientation, and 3D scale.

        .. math::
            M = \\begin{bmatrix}
                    s_x R_{00} & s_y R_{01} & s_z R_{02} & p_x \\\\
                    s_x R_{10} & s_y R_{11} & s_z R_{12} & p_y \\\\
                    s_x R_{20} & s_y R_{21} & s_z R_{22} & p_z \\\\
                    0 & 0 & 0 & 1
                \\end{bmatrix}

        Where:

        * :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
        * :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
        * :math:`s` is the 3D scale vector :math:`[s_x, s_y, s_z]` of the input transform.

        Args:
            position (Vector[3, Float]): The 3D position vector.
            rotation (Quaternion[Float]): The quaternion orientation.
            scale (Vector[3, Float]): The 3D scale vector.

        Returns:
            Matrix[4, 4, Float]: The transformation matrix.
        """
        R = wp.quat_to_matrix(rotation)
        # column j of the rotation matrix is multiplied by scale[j]; the position fills
        # the last column and the last row is the constant (0, 0, 0, 1)
        # fmt: off
        return mat44(
            scale[0] * R[0,0], scale[1] * R[0,1], scale[2] * R[0,2], position[0],
            scale[0] * R[1,0], scale[1] * R[1,1], scale[2] * R[1,2], position[1],
            scale[0] * R[2,0], scale[1] * R[2,1], scale[2] * R[2,2], position[2],
            dtype(0.0), dtype(0.0), dtype(0.0), dtype(1.0),
        )
        # fmt: on

    return transform_compose
287
+
288
+
289
# Wrap the float32 specialization with ``wp.func`` and bind it to the module-level name
# ``transform_compose``.
transform_compose = wp.func(
    create_transform_compose_func(wp.float32),
    name="transform_compose",
)
# The float16 and float64 specializations are wrapped under the same name and the return
# values are discarded.
# NOTE(review): presumably Warp records these as additional overloads of the function
# above — confirm against the ``wp.func`` documentation.
wp.func(
    create_transform_compose_func(wp.float16),
    name="transform_compose",
)
wp.func(
    create_transform_compose_func(wp.float64),
    name="transform_compose",
)
301
+
302
+
303
def create_transform_decompose_func(dtype):
    """
    Build the ``transform_decompose`` implementation specialized for the scalar type ``dtype``.

    Args:
        dtype: Scalar type used to construct the 4x4 matrix, 3x3 matrix, and 3D vector types
            that the returned function uses, and the zero constant it compares against.

    Returns:
        The nested Python function ``transform_decompose``; it is not wrapped with
        ``wp.func`` here.
    """
    # concrete types and constants for this scalar type; captured by the nested function below
    mat44 = wp._src.types.matrix((4, 4), dtype)
    vec3 = wp._src.types.vector(3, dtype)
    mat33 = wp._src.types.matrix((3, 3), dtype)
    zero = dtype(0.0)

    def transform_decompose(m: mat44):
        """
        Decompose a 4x4 transformation matrix into 3D position, quaternion orientation, and 3D scale.

        .. math::
            M = \\begin{bmatrix}
                    s_x R_{00} & s_y R_{01} & s_z R_{02} & p_x \\\\
                    s_x R_{10} & s_y R_{11} & s_z R_{12} & p_y \\\\
                    s_x R_{20} & s_y R_{21} & s_z R_{22} & p_z \\\\
                    0 & 0 & 0 & 1
                \\end{bmatrix}

        Where:

        * :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
        * :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
        * :math:`s` is the 3D scale vector :math:`[s_x, s_y, s_z]` of the input transform.

        Each scale component is computed as the Euclidean length of the corresponding column
        of the upper-left 3x3 block of ``m``.

        Args:
            m (Matrix[4, 4, Float]): The matrix to decompose.

        Returns:
            Tuple[Vector[3, Float], Quaternion[Float], Vector[3, Float]]: A tuple containing the position vector, quaternion orientation, and scale vector.
        """
        # extract position
        position = vec3(m[0, 3], m[1, 3], m[2, 3])
        # extract rotation matrix components
        r00, r01, r02 = m[0, 0], m[0, 1], m[0, 2]
        r10, r11, r12 = m[1, 0], m[1, 1], m[1, 2]
        r20, r21, r22 = m[2, 0], m[2, 1], m[2, 2]
        # get scale magnitudes (length of each column of the 3x3 block)
        sx = wp.sqrt(r00 * r00 + r10 * r10 + r20 * r20)
        sy = wp.sqrt(r01 * r01 + r11 * r11 + r21 * r21)
        sz = wp.sqrt(r02 * r02 + r12 * r12 + r22 * r22)
        # normalize rotation matrix components; a column whose length is exactly zero is
        # left untouched so that no division by zero takes place
        if sx != zero:
            r00 /= sx
            r10 /= sx
            r20 /= sx
        if sy != zero:
            r01 /= sy
            r11 /= sy
            r21 /= sy
        if sz != zero:
            r02 /= sz
            r12 /= sz
            r22 /= sz
        # extract rotation (quaternion) from the column-normalized 3x3 block
        rotation = wp.quat_from_matrix(mat33(r00, r01, r02, r10, r11, r12, r20, r21, r22))
        # extract scale
        scale = vec3(sx, sy, sz)
        return position, rotation, scale

    return transform_decompose
363
+
364
+
365
# Wrap the float32 specialization with ``wp.func`` and bind it to the module-level name
# ``transform_decompose``.
transform_decompose = wp.func(
    create_transform_decompose_func(wp.float32),
    name="transform_decompose",
)
# The float16 and float64 specializations are wrapped under the same name and the return
# values are discarded.
# NOTE(review): presumably Warp records these as additional overloads of the function
# above — confirm against the ``wp.func`` documentation.
wp.func(
    create_transform_decompose_func(wp.float16),
    name="transform_decompose",
)
wp.func(
    create_transform_decompose_func(wp.float64),
    name="transform_decompose",
)
377
+
378
+
379
# register API functions so they appear in the documentation
# Each call passes one of the functions defined in this file together with the name of
# the group it is registered under: the norm helpers and ``smooth_normalize`` use
# "Vector Math", the ``transform_*`` helpers use "Transformations".

wp._src.context.register_api_function(
    norm_l1,
    group="Vector Math",
)
wp._src.context.register_api_function(
    norm_l2,
    group="Vector Math",
)
wp._src.context.register_api_function(
    norm_huber,
    group="Vector Math",
)
wp._src.context.register_api_function(
    norm_pseudo_huber,
    group="Vector Math",
)
wp._src.context.register_api_function(
    smooth_normalize,
    group="Vector Math",
)
wp._src.context.register_api_function(
    transform_from_matrix,
    group="Transformations",
)
wp._src.context.register_api_function(
    transform_to_matrix,
    group="Transformations",
)
wp._src.context.register_api_function(
    transform_compose,
    group="Transformations",
)
wp._src.context.register_api_function(
    transform_decompose,
    group="Transformations",
)
@@ -0,0 +1,14 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
@@ -0,0 +1,165 @@
1
+ # SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
+ # SPDX-License-Identifier: Apache-2.0
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import warp as wp
17
+
18
+ _wp_module_name_ = "warp.optim.adam"
19
+
20
+
21
@wp.kernel
def adam_step_kernel_vec3(
    g: wp.array(dtype=wp.vec3),
    m: wp.array(dtype=wp.vec3),
    v: wp.array(dtype=wp.vec3),
    lr: float,
    beta1: float,
    beta2: float,
    t: float,
    eps: float,
    params: wp.array(dtype=wp.vec3),
):
    """Apply one Adam update to a ``wp.vec3`` parameter array, one element per thread.

    Args:
        g: Gradients, one per parameter element.
        m: First-moment estimates, updated in place.
        v: Second-moment estimates (component-wise), updated in place.
        lr: Learning rate.
        beta1: Decay rate of the first moment.
        beta2: Decay rate of the second moment.
        t: Step counter; ``t + 1`` is the exponent used for bias correction.
        eps: Term added to the denominator.
        params: Parameters, updated in place.
    """
    tid = wp.tid()
    grad = g[tid]

    # exponentially decayed moment estimates
    first_moment = beta1 * m[tid] + (1.0 - beta1) * grad
    m[tid] = first_moment
    second_moment = beta2 * v[tid] + (1.0 - beta2) * wp.cw_mul(grad, grad)
    v[tid] = second_moment

    # bias correction
    step_count = t + 1.0
    m_corrected = first_moment / (1.0 - wp.pow(beta1, step_count))
    v_corrected = second_moment / (1.0 - wp.pow(beta2, step_count))

    # component-wise sqrt(v) + eps
    root = wp.vec3(wp.sqrt(v_corrected[0]), wp.sqrt(v_corrected[1]), wp.sqrt(v_corrected[2]))
    denominator = root + wp.vec3(eps, eps, eps)

    # plain read-modify-write on purpose: no augmented assignment on the array element
    params[tid] = params[tid] - lr * wp.cw_div(m_corrected, denominator)
41
+
42
+
43
@wp.kernel
def adam_step_kernel_float(
    g: wp.array(dtype=float),
    m: wp.array(dtype=float),
    v: wp.array(dtype=float),
    lr: float,
    beta1: float,
    beta2: float,
    t: float,
    eps: float,
    params: wp.array(dtype=float),
):
    """Apply one Adam update to a scalar ``float`` parameter array, one element per thread.

    Args:
        g: Gradients, one per parameter element.
        m: First-moment estimates, updated in place.
        v: Second-moment estimates, updated in place.
        lr: Learning rate.
        beta1: Decay rate of the first moment.
        beta2: Decay rate of the second moment.
        t: Step counter; ``t + 1`` is the exponent used for bias correction.
        eps: Term added to the denominator.
        params: Parameters, updated in place.
    """
    tid = wp.tid()
    grad = g[tid]

    # exponentially decayed moment estimates
    first_moment = beta1 * m[tid] + (1.0 - beta1) * grad
    m[tid] = first_moment
    second_moment = beta2 * v[tid] + (1.0 - beta2) * grad * grad
    v[tid] = second_moment

    # bias correction
    step_count = t + 1.0
    m_corrected = first_moment / (1.0 - wp.pow(beta1, step_count))
    v_corrected = second_moment / (1.0 - wp.pow(beta2, step_count))

    # plain read-modify-write on purpose: no augmented assignment on the array element
    params[tid] = params[tid] - lr * m_corrected / (wp.sqrt(v_corrected) + eps)
61
+
62
+
63
@wp.kernel
def adam_step_kernel_half(
    g: wp.array(dtype=wp.float16),
    m: wp.array(dtype=float),
    v: wp.array(dtype=float),
    lr: float,
    beta1: float,
    beta2: float,
    t: float,
    eps: float,
    params: wp.array(dtype=wp.float16),
):
    """Apply one Adam update to a ``wp.float16`` parameter array, one element per thread.

    The gradient is converted to ``float`` before use and the moments are
    ``float`` arrays; only the final update is converted back to ``wp.float16``.

    Args:
        g: Half-precision gradients, one per parameter element.
        m: First-moment estimates (``float``), updated in place.
        v: Second-moment estimates (``float``), updated in place.
        lr: Learning rate.
        beta1: Decay rate of the first moment.
        beta2: Decay rate of the second moment.
        t: Step counter; ``t + 1`` is the exponent used for bias correction.
        eps: Term added to the denominator.
        params: Half-precision parameters, updated in place.
    """
    tid = wp.tid()
    grad = float(g[tid])

    # exponentially decayed moment estimates
    first_moment = beta1 * m[tid] + (1.0 - beta1) * grad
    m[tid] = first_moment
    second_moment = beta2 * v[tid] + (1.0 - beta2) * grad * grad
    v[tid] = second_moment

    # bias correction
    step_count = t + 1.0
    m_corrected = first_moment / (1.0 - wp.pow(beta1, step_count))
    v_corrected = second_moment / (1.0 - wp.pow(beta2, step_count))

    # compute the update in float, then narrow it to half before subtracting
    update = wp.float16(lr * m_corrected / (wp.sqrt(v_corrected) + eps))
    params[tid] = params[tid] - update
81
+
82
+
83
class Adam:
    """An implementation of the Adam Optimizer
    It is designed to mimic Pytorch's version.
    https://pytorch.org/docs/stable/generated/torch.optim.Adam.html#torch.optim.Adam

    Parameters are given as a list of Warp arrays whose dtype is ``wp.vec3``,
    ``wp.float32`` or ``wp.float16``. One first-moment and one second-moment
    array is kept per parameter array; for ``wp.float16`` parameters the
    moments are stored as ``wp.float32``.

    Args:
        params: List of Warp arrays to optimize, or ``None`` to supply them
            later through :meth:`set_params`.
        lr: Learning rate.
        betas: Pair ``(beta1, beta2)`` of decay rates for the first and
            second moment estimates.
        eps: Term added to the denominator of the update.
    """

    def __init__(self, params=None, lr=0.001, betas=(0.9, 0.999), eps=1e-08):
        self.m = []  # first moment
        self.v = []  # second moment
        self.set_params(params)
        self.lr = lr
        self.beta1 = betas[0]
        self.beta2 = betas[1]
        self.eps = eps
        self.t = 0  # number of completed steps

    @staticmethod
    def _moment_needs_alloc(moment, param, moment_dtype):
        """Return True when ``moment`` cannot be reused as a moment buffer for ``param``."""
        return (
            moment is None
            or moment.shape != param.shape
            # Compare against the moment dtype, not the parameter dtype: fp16
            # parameters keep fp32 moments, so comparing with ``param.dtype``
            # would discard the accumulated state on every call.
            or moment.dtype != moment_dtype
            # A buffer on another device cannot be used in the same launch.
            or moment.device != param.device
        )

    def set_params(self, params):
        """Set the arrays to optimize and make sure matching moment buffers exist.

        Existing moment buffers are kept when their shape, dtype and device
        still match the corresponding parameter; otherwise they are replaced
        by zero-initialized arrays. Nothing is allocated unless ``params`` is
        a non-empty list.

        Args:
            params: List of Warp arrays, or ``None``.

        Raises:
            RuntimeError: If a parameter array has an unsupported dtype.
        """
        self.params = params
        if params is None or not isinstance(params, list) or not params:
            return

        if len(self.m) != len(params):
            self.m = [None] * len(params)  # reset first moment
        if len(self.v) != len(params):
            self.v = [None] * len(params)  # reset second moment

        for i, param in enumerate(params):
            if param.dtype == wp.vec3:
                moment_dtype = wp.vec3
            elif param.dtype == wp.float32:
                moment_dtype = wp.float32
            elif param.dtype == wp.float16:
                moment_dtype = wp.float32  # we always use fp32 for moments, even if params are fp16
            else:
                raise RuntimeError(f"Unsupported dtype for Warp Adam optimizer: {param.dtype}")

            if Adam._moment_needs_alloc(self.m[i], param, moment_dtype):
                self.m[i] = wp.zeros(shape=param.shape, dtype=moment_dtype, device=param.device)
            if Adam._moment_needs_alloc(self.v[i], param, moment_dtype):
                self.v[i] = wp.zeros(shape=param.shape, dtype=moment_dtype, device=param.device)

    def reset_internal_state(self):
        """Zero all moment buffers and reset the step counter."""
        for m_i in self.m:
            m_i.zero_()
        for v_i in self.v:
            v_i.zero_()
        self.t = 0

    def step(self, grad):
        """Apply one Adam update to every parameter array.

        Args:
            grad: Sequence of gradient arrays, indexed like the parameter list.
        """
        assert self.params is not None
        for i, param in enumerate(self.params):
            Adam.step_detail(grad[i], self.m[i], self.v[i], self.lr, self.beta1, self.beta2, self.t, self.eps, param)
        self.t = self.t + 1

    @staticmethod
    def step_detail(g, m, v, lr, beta1, beta2, t, eps, params):
        """Launch the Adam step kernel matching the dtype of ``params``.

        Args:
            g: Gradient array with the same dtype and shape as ``params``.
            m: First-moment array, updated in place.
            v: Second-moment array, updated in place.
            lr: Learning rate.
            beta1: Decay rate of the first moment.
            beta2: Decay rate of the second moment.
            t: Number of steps already taken; the kernels use ``t + 1`` for
                bias correction.
            eps: Term added to the denominator of the update.
            params: Parameter array, updated in place.

        Raises:
            RuntimeError: If the dtype of ``params`` has no step kernel.
        """
        assert params.dtype == g.dtype
        assert params.shape == g.shape

        if params.dtype == wp.float32:
            kernel = adam_step_kernel_float
        elif params.dtype == wp.float16:
            kernel = adam_step_kernel_half
        elif params.dtype == wp.vec3:
            kernel = adam_step_kernel_vec3
        else:
            raise RuntimeError("Params data type not supported in Adam step kernels.")

        wp.launch(
            kernel=kernel,
            dim=len(params),
            inputs=[g, m, v, lr, beta1, beta2, t, eps, params],
            device=params.device,
        )