warp-lang 0.10.1__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (300) hide show
  1. warp/__init__.py +10 -4
  2. warp/__init__.pyi +1 -0
  3. warp/bin/warp-clang.dll +0 -0
  4. warp/bin/warp.dll +0 -0
  5. warp/build.py +5 -3
  6. warp/build_dll.py +29 -9
  7. warp/builtins.py +868 -507
  8. warp/codegen.py +1074 -638
  9. warp/config.py +3 -3
  10. warp/constants.py +6 -0
  11. warp/context.py +715 -222
  12. warp/fabric.py +326 -0
  13. warp/fem/__init__.py +27 -0
  14. warp/fem/cache.py +389 -0
  15. warp/fem/dirichlet.py +181 -0
  16. warp/fem/domain.py +263 -0
  17. warp/fem/field/__init__.py +101 -0
  18. warp/fem/field/field.py +149 -0
  19. warp/fem/field/nodal_field.py +299 -0
  20. warp/fem/field/restriction.py +21 -0
  21. warp/fem/field/test.py +181 -0
  22. warp/fem/field/trial.py +183 -0
  23. warp/fem/geometry/__init__.py +19 -0
  24. warp/fem/geometry/closest_point.py +70 -0
  25. warp/fem/geometry/deformed_geometry.py +271 -0
  26. warp/fem/geometry/element.py +744 -0
  27. warp/fem/geometry/geometry.py +186 -0
  28. warp/fem/geometry/grid_2d.py +373 -0
  29. warp/fem/geometry/grid_3d.py +435 -0
  30. warp/fem/geometry/hexmesh.py +953 -0
  31. warp/fem/geometry/partition.py +376 -0
  32. warp/fem/geometry/quadmesh_2d.py +532 -0
  33. warp/fem/geometry/tetmesh.py +840 -0
  34. warp/fem/geometry/trimesh_2d.py +577 -0
  35. warp/fem/integrate.py +1616 -0
  36. warp/fem/operator.py +191 -0
  37. warp/fem/polynomial.py +213 -0
  38. warp/fem/quadrature/__init__.py +2 -0
  39. warp/fem/quadrature/pic_quadrature.py +245 -0
  40. warp/fem/quadrature/quadrature.py +294 -0
  41. warp/fem/space/__init__.py +292 -0
  42. warp/fem/space/basis_space.py +489 -0
  43. warp/fem/space/collocated_function_space.py +105 -0
  44. warp/fem/space/dof_mapper.py +236 -0
  45. warp/fem/space/function_space.py +145 -0
  46. warp/fem/space/grid_2d_function_space.py +267 -0
  47. warp/fem/space/grid_3d_function_space.py +306 -0
  48. warp/fem/space/hexmesh_function_space.py +352 -0
  49. warp/fem/space/partition.py +350 -0
  50. warp/fem/space/quadmesh_2d_function_space.py +369 -0
  51. warp/fem/space/restriction.py +160 -0
  52. warp/fem/space/shape/__init__.py +15 -0
  53. warp/fem/space/shape/cube_shape_function.py +738 -0
  54. warp/fem/space/shape/shape_function.py +103 -0
  55. warp/fem/space/shape/square_shape_function.py +611 -0
  56. warp/fem/space/shape/tet_shape_function.py +567 -0
  57. warp/fem/space/shape/triangle_shape_function.py +429 -0
  58. warp/fem/space/tetmesh_function_space.py +292 -0
  59. warp/fem/space/topology.py +295 -0
  60. warp/fem/space/trimesh_2d_function_space.py +221 -0
  61. warp/fem/types.py +77 -0
  62. warp/fem/utils.py +495 -0
  63. warp/native/array.h +147 -44
  64. warp/native/builtin.h +122 -149
  65. warp/native/bvh.cpp +73 -325
  66. warp/native/bvh.cu +406 -23
  67. warp/native/bvh.h +34 -43
  68. warp/native/clang/clang.cpp +13 -8
  69. warp/native/crt.h +2 -0
  70. warp/native/cuda_crt.h +5 -0
  71. warp/native/cuda_util.cpp +15 -3
  72. warp/native/cuda_util.h +3 -1
  73. warp/native/cutlass/tools/library/scripts/conv2d_operation.py +463 -0
  74. warp/native/cutlass/tools/library/scripts/conv3d_operation.py +321 -0
  75. warp/native/cutlass/tools/library/scripts/gemm_operation.py +988 -0
  76. warp/native/cutlass/tools/library/scripts/generator.py +4625 -0
  77. warp/native/cutlass/tools/library/scripts/library.py +799 -0
  78. warp/native/cutlass/tools/library/scripts/manifest.py +402 -0
  79. warp/native/cutlass/tools/library/scripts/pycutlass/docs/source/conf.py +96 -0
  80. warp/native/cutlass/tools/library/scripts/pycutlass/profile/conv/conv2d_f16_sm80.py +106 -0
  81. warp/native/cutlass/tools/library/scripts/pycutlass/profile/gemm/gemm_f32_sm80.py +91 -0
  82. warp/native/cutlass/tools/library/scripts/pycutlass/setup.py +80 -0
  83. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/__init__.py +48 -0
  84. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/arguments.py +118 -0
  85. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/c_types.py +241 -0
  86. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/compiler.py +432 -0
  87. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/conv2d_operation.py +631 -0
  88. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/epilogue.py +1026 -0
  89. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/frontend.py +104 -0
  90. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/gemm_operation.py +1276 -0
  91. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/library.py +744 -0
  92. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/memory_manager.py +74 -0
  93. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/operation.py +110 -0
  94. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/parser.py +619 -0
  95. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/reduction_operation.py +398 -0
  96. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/tensor_ref.py +70 -0
  97. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/__init__.py +4 -0
  98. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/conv2d_testbed.py +646 -0
  99. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_grouped_testbed.py +235 -0
  100. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_testbed.py +557 -0
  101. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/profiler.py +70 -0
  102. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/type_hint.py +39 -0
  103. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/__init__.py +1 -0
  104. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/device.py +76 -0
  105. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/reference_model.py +255 -0
  106. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/__init__.py +0 -0
  107. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +201 -0
  108. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +177 -0
  109. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +98 -0
  110. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +95 -0
  111. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_few_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +163 -0
  112. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_fixed_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +187 -0
  113. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +309 -0
  114. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +54 -0
  115. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  116. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  117. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +253 -0
  118. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +97 -0
  119. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +242 -0
  120. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  121. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  122. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/run_all_tests.py +10 -0
  123. warp/native/cutlass/tools/library/scripts/pycutlass/test/frontend/test_frontend.py +146 -0
  124. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/__init__.py +0 -0
  125. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_bf16_sm80.py +96 -0
  126. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f16_sm80.py +447 -0
  127. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f32_sm80.py +146 -0
  128. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f64_sm80.py +102 -0
  129. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_grouped_sm80.py +203 -0
  130. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_s8_sm80.py +229 -0
  131. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/run_all_tests.py +9 -0
  132. warp/native/cutlass/tools/library/scripts/pycutlass/test/unit/test_sm80.py +453 -0
  133. warp/native/cutlass/tools/library/scripts/rank_2k_operation.py +398 -0
  134. warp/native/cutlass/tools/library/scripts/rank_k_operation.py +387 -0
  135. warp/native/cutlass/tools/library/scripts/rt.py +796 -0
  136. warp/native/cutlass/tools/library/scripts/symm_operation.py +400 -0
  137. warp/native/cutlass/tools/library/scripts/trmm_operation.py +407 -0
  138. warp/native/cutlass_gemm.cu +5 -3
  139. warp/native/exports.h +1240 -952
  140. warp/native/fabric.h +228 -0
  141. warp/native/hashgrid.cpp +4 -4
  142. warp/native/hashgrid.h +22 -2
  143. warp/native/intersect.h +22 -7
  144. warp/native/intersect_adj.h +8 -8
  145. warp/native/intersect_tri.h +1 -1
  146. warp/native/marching.cu +157 -161
  147. warp/native/mat.h +80 -19
  148. warp/native/matnn.h +2 -2
  149. warp/native/mesh.cpp +33 -108
  150. warp/native/mesh.cu +114 -23
  151. warp/native/mesh.h +446 -46
  152. warp/native/noise.h +272 -329
  153. warp/native/quat.h +51 -8
  154. warp/native/rand.h +45 -35
  155. warp/native/range.h +6 -2
  156. warp/native/reduce.cpp +1 -1
  157. warp/native/reduce.cu +10 -12
  158. warp/native/runlength_encode.cu +6 -10
  159. warp/native/scan.cu +8 -11
  160. warp/native/sparse.cpp +4 -4
  161. warp/native/sparse.cu +164 -154
  162. warp/native/spatial.h +2 -2
  163. warp/native/temp_buffer.h +14 -30
  164. warp/native/vec.h +107 -23
  165. warp/native/volume.h +120 -0
  166. warp/native/warp.cpp +560 -30
  167. warp/native/warp.cu +431 -44
  168. warp/native/warp.h +13 -4
  169. warp/optim/__init__.py +1 -0
  170. warp/optim/linear.py +922 -0
  171. warp/optim/sgd.py +92 -0
  172. warp/render/render_opengl.py +335 -119
  173. warp/render/render_usd.py +11 -11
  174. warp/sim/__init__.py +2 -2
  175. warp/sim/articulation.py +385 -185
  176. warp/sim/collide.py +8 -0
  177. warp/sim/import_mjcf.py +297 -106
  178. warp/sim/import_urdf.py +389 -210
  179. warp/sim/import_usd.py +198 -97
  180. warp/sim/inertia.py +17 -18
  181. warp/sim/integrator_euler.py +14 -8
  182. warp/sim/integrator_xpbd.py +158 -16
  183. warp/sim/model.py +795 -291
  184. warp/sim/render.py +3 -3
  185. warp/sim/utils.py +3 -0
  186. warp/sparse.py +640 -150
  187. warp/stubs.py +606 -267
  188. warp/tape.py +61 -10
  189. warp/tests/__main__.py +3 -6
  190. warp/tests/assets/curlnoise_golden.npy +0 -0
  191. warp/tests/assets/pnoise_golden.npy +0 -0
  192. warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
  193. warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
  194. warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
  195. warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
  196. warp/tests/aux_test_unresolved_func.py +14 -0
  197. warp/tests/aux_test_unresolved_symbol.py +14 -0
  198. warp/tests/disabled_kinematics.py +239 -0
  199. warp/tests/run_coverage_serial.py +31 -0
  200. warp/tests/test_adam.py +103 -106
  201. warp/tests/test_arithmetic.py +128 -74
  202. warp/tests/test_array.py +212 -97
  203. warp/tests/test_array_reduce.py +57 -23
  204. warp/tests/test_atomic.py +64 -28
  205. warp/tests/test_bool.py +99 -0
  206. warp/tests/test_builtins_resolution.py +1292 -0
  207. warp/tests/test_bvh.py +42 -18
  208. warp/tests/test_closest_point_edge_edge.py +54 -57
  209. warp/tests/test_codegen.py +208 -130
  210. warp/tests/test_compile_consts.py +28 -20
  211. warp/tests/test_conditional.py +108 -24
  212. warp/tests/test_copy.py +10 -12
  213. warp/tests/test_ctypes.py +112 -88
  214. warp/tests/test_dense.py +21 -14
  215. warp/tests/test_devices.py +98 -0
  216. warp/tests/test_dlpack.py +75 -75
  217. warp/tests/test_examples.py +277 -0
  218. warp/tests/test_fabricarray.py +955 -0
  219. warp/tests/test_fast_math.py +15 -11
  220. warp/tests/test_fem.py +1271 -0
  221. warp/tests/test_fp16.py +53 -19
  222. warp/tests/test_func.py +187 -86
  223. warp/tests/test_generics.py +194 -49
  224. warp/tests/test_grad.py +178 -109
  225. warp/tests/test_grad_customs.py +176 -0
  226. warp/tests/test_hash_grid.py +52 -37
  227. warp/tests/test_import.py +10 -23
  228. warp/tests/test_indexedarray.py +32 -31
  229. warp/tests/test_intersect.py +18 -9
  230. warp/tests/test_large.py +141 -0
  231. warp/tests/test_launch.py +14 -41
  232. warp/tests/test_lerp.py +64 -65
  233. warp/tests/test_linear_solvers.py +154 -0
  234. warp/tests/test_lvalue.py +493 -0
  235. warp/tests/test_marching_cubes.py +12 -13
  236. warp/tests/test_mat.py +517 -2898
  237. warp/tests/test_mat_lite.py +115 -0
  238. warp/tests/test_mat_scalar_ops.py +2889 -0
  239. warp/tests/test_math.py +103 -9
  240. warp/tests/test_matmul.py +305 -69
  241. warp/tests/test_matmul_lite.py +410 -0
  242. warp/tests/test_mesh.py +71 -14
  243. warp/tests/test_mesh_query_aabb.py +41 -25
  244. warp/tests/test_mesh_query_point.py +140 -22
  245. warp/tests/test_mesh_query_ray.py +39 -22
  246. warp/tests/test_mlp.py +30 -22
  247. warp/tests/test_model.py +92 -89
  248. warp/tests/test_modules_lite.py +39 -0
  249. warp/tests/test_multigpu.py +88 -114
  250. warp/tests/test_noise.py +12 -11
  251. warp/tests/test_operators.py +16 -20
  252. warp/tests/test_options.py +11 -11
  253. warp/tests/test_pinned.py +17 -18
  254. warp/tests/test_print.py +32 -11
  255. warp/tests/test_quat.py +275 -129
  256. warp/tests/test_rand.py +18 -16
  257. warp/tests/test_reload.py +38 -34
  258. warp/tests/test_rounding.py +50 -43
  259. warp/tests/test_runlength_encode.py +168 -20
  260. warp/tests/test_smoothstep.py +9 -11
  261. warp/tests/test_snippet.py +143 -0
  262. warp/tests/test_sparse.py +261 -63
  263. warp/tests/test_spatial.py +276 -243
  264. warp/tests/test_streams.py +110 -85
  265. warp/tests/test_struct.py +268 -63
  266. warp/tests/test_tape.py +39 -21
  267. warp/tests/test_torch.py +118 -89
  268. warp/tests/test_transient_module.py +12 -13
  269. warp/tests/test_types.py +614 -0
  270. warp/tests/test_utils.py +494 -0
  271. warp/tests/test_vec.py +354 -2050
  272. warp/tests/test_vec_lite.py +73 -0
  273. warp/tests/test_vec_scalar_ops.py +2099 -0
  274. warp/tests/test_volume.py +457 -293
  275. warp/tests/test_volume_write.py +124 -134
  276. warp/tests/unittest_serial.py +35 -0
  277. warp/tests/unittest_suites.py +341 -0
  278. warp/tests/unittest_utils.py +568 -0
  279. warp/tests/unused_test_misc.py +71 -0
  280. warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
  281. warp/thirdparty/appdirs.py +36 -45
  282. warp/thirdparty/unittest_parallel.py +549 -0
  283. warp/torch.py +9 -6
  284. warp/types.py +1089 -366
  285. warp/utils.py +93 -387
  286. warp_lang-0.11.0.dist-info/METADATA +238 -0
  287. warp_lang-0.11.0.dist-info/RECORD +332 -0
  288. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/WHEEL +1 -1
  289. warp/tests/test_all.py +0 -219
  290. warp/tests/test_array_scan.py +0 -60
  291. warp/tests/test_base.py +0 -208
  292. warp/tests/test_unresolved_func.py +0 -7
  293. warp/tests/test_unresolved_symbol.py +0 -7
  294. warp_lang-0.10.1.dist-info/METADATA +0 -21
  295. warp_lang-0.10.1.dist-info/RECORD +0 -188
  296. /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
  297. /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
  298. /warp/tests/{test_square.py → aux_test_square.py} +0 -0
  299. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/LICENSE.md +0 -0
  300. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,840 @@
1
+ from typing import Optional
2
+
3
+ import warp as wp
4
+ from warp.fem.cache import (
5
+ TemporaryStore,
6
+ borrow_temporary,
7
+ borrow_temporary_like,
8
+ cached_arg_value,
9
+ )
10
+ from warp.fem.types import (
11
+ NULL_ELEMENT_INDEX,
12
+ OUTSIDE,
13
+ Coords,
14
+ ElementIndex,
15
+ Sample,
16
+ make_free_sample,
17
+ )
18
+
19
+ from .closest_point import project_on_tet_at_origin
20
+ from .element import Tetrahedron, Triangle
21
+ from .geometry import Geometry
22
+
23
+
24
@wp.struct
class TetmeshCellArg:
    """Arguments passed to the Warp functions that evaluate tetrahedral cells."""

    # vertex indices of each tet, read as [tet_index, 0..3] by the cell functions
    tet_vertex_indices: wp.array2d(dtype=int)
    # 3d position of each mesh vertex
    positions: wp.array(dtype=wp.vec3)

    # for neighbor cell lookup
    # tets around vertex v are vertex_tet_indices[vertex_tet_offsets[v] : vertex_tet_offsets[v + 1]]
    vertex_tet_offsets: wp.array(dtype=int)
    vertex_tet_indices: wp.array(dtype=int)

    # for transforming reference gradient
    # one 3x3 matrix per tet, indexed by element index
    deformation_gradients: wp.array(dtype=wp.mat33f)
35
+
36
+
37
@wp.struct
class TetmeshSideArg:
    """Arguments passed to the Warp functions that evaluate sides (triangular faces)."""

    # cell-level arguments, needed to reach positions and per-tet data from a side
    cell_arg: TetmeshCellArg
    # the three vertex indices of each face
    face_vertex_indices: wp.array(dtype=wp.vec3i)
    # adjacent tets of each face: component 0 is the inner cell, component 1 the outer cell
    face_tet_indices: wp.array(dtype=wp.vec2i)
42
+
43
+
44
# 3x2 float matrix type; used to pack the two edge vectors of a side as columns/rows
# of its deformation gradient (see side_deformation_gradient) -- TODO confirm layout
_mat32 = wp.mat(shape=(3, 2), dtype=float)
45
+
46
+
47
+ class Tetmesh(Geometry):
48
+ """Tetrahedral mesh geometry"""
49
+
50
+ dimension = 3
51
+
52
def __init__(
    self, tet_vertex_indices: wp.array, positions: wp.array, temporary_store: Optional[TemporaryStore] = None
):
    """
    Constructs a tetrahedral mesh.

    Topology (faces, vertex-to-tet adjacency, boundary faces) and per-tet deformation
    gradients are computed immediately; tet edges are computed on first request.

    Args:
        tet_vertex_indices: warp array of shape (num_tets, 4) containing vertex indices for each tet
        positions: warp array of shape (num_vertices, 3) containing 3d position for each vertex
        temporary_store: shared pool from which to allocate temporary arrays
    """

    # User-provided mesh description
    self.positions = positions
    self.tet_vertex_indices = tet_vertex_indices

    # Edge data is built lazily by `_compute_tet_edges`
    self._edge_count = 0
    self._tet_edge_indices: wp.array = None

    # Placeholders for the data filled in by the two builders below
    self._vertex_tet_offsets: wp.array = None
    self._vertex_tet_indices: wp.array = None
    self._face_vertex_indices: wp.array = None
    self._face_tet_indices: wp.array = None
    self._deformation_gradients: wp.array = None

    self._build_topology(temporary_store)
    self._compute_deformation_gradients()
77
+
78
def cell_count(self):
    """Number of tetrahedra, i.e. the first dimension of ``tet_vertex_indices``."""
    tet_shape = self.tet_vertex_indices.shape
    return tet_shape[0]
80
+
81
def vertex_count(self):
    """Number of mesh vertices, i.e. the first dimension of ``positions``."""
    position_shape = self.positions.shape
    return position_shape[0]
83
+
84
def side_count(self):
    """Number of sides (faces), i.e. the first dimension of the face vertex index array."""
    face_shape = self._face_vertex_indices.shape
    return face_shape[0]
86
+
87
def edge_count(self):
    """Number of edges; triggers the edge computation if it has not run yet."""
    edges_missing = self._tet_edge_indices is None
    if edges_missing:
        # `_compute_tet_edges` is expected to update `_edge_count` as a side effect
        self._compute_tet_edges()
    return self._edge_count
91
+
92
def boundary_side_count(self):
    """Number of boundary sides, i.e. the length of the boundary face index array."""
    boundary_shape = self._boundary_face_indices.shape
    return boundary_shape[0]
94
+
95
def reference_cell(self) -> Tetrahedron:
    """Return a new ``Tetrahedron`` reference element for the cells of this mesh."""
    reference = Tetrahedron()
    return reference
97
+
98
def reference_side(self) -> Triangle:
    """Return a new ``Triangle`` reference element for the sides of this mesh."""
    reference = Triangle()
    return reference
100
+
101
@property
def tet_edge_indices(self) -> wp.array:
    """Per-tet edge indices, computed on first access."""
    if self._tet_edge_indices is not None:
        return self._tet_edge_indices

    # Not built yet: compute, then hand back the freshly stored array
    self._compute_tet_edges()
    return self._tet_edge_indices
106
+
107
@property
def face_tet_indices(self) -> wp.array:
    """Array holding, for each face, the indices of its two adjacent tets."""
    adjacent_tets = self._face_tet_indices
    return adjacent_tets
110
+
111
@property
def face_vertex_indices(self) -> wp.array:
    """Array holding, for each face, the indices of its three vertices."""
    face_vertices = self._face_vertex_indices
    return face_vertices
114
+
115
# Struct types exposed under the generic names used in the annotations of the methods below
CellArg = TetmeshCellArg
SideArg = TetmeshSideArg
117
+
118
@wp.struct
class SideIndexArg:
    # maps a boundary side index to the index of that side in the full face list
    boundary_face_indices: wp.array(dtype=int)
121
+
122
+ # Geometry device interface
123
+
124
@cached_arg_value
def cell_arg_value(self, device) -> CellArg:
    """Fill a ``CellArg`` struct with this mesh's cell arrays, each passed through ``.to(device)``."""
    cell_arg = self.CellArg()

    # Connectivity and vertex positions
    cell_arg.tet_vertex_indices = self.tet_vertex_indices.to(device)
    cell_arg.positions = self.positions.to(device)

    # Vertex-to-tet adjacency used by the neighbor lookup
    cell_arg.vertex_tet_offsets = self._vertex_tet_offsets.to(device)
    cell_arg.vertex_tet_indices = self._vertex_tet_indices.to(device)

    # Per-tet deformation gradients
    cell_arg.deformation_gradients = self._deformation_gradients.to(device)

    return cell_arg
135
+
136
@wp.func
def cell_position(args: CellArg, s: Sample):
    """Position of sample ``s``, interpolated from the four vertices of its tet."""
    vtx = args.tet_vertex_indices[s.element_index]
    coords = s.element_coords

    # The weight of vertex 0 is implicit: the four barycentric weights sum to one
    w0 = 1.0 - coords[0] - coords[1] - coords[2]

    p0 = args.positions[vtx[0]]
    p1 = args.positions[vtx[1]]
    p2 = args.positions[vtx[2]]
    p3 = args.positions[vtx[3]]

    return w0 * p0 + coords[0] * p1 + coords[1] * p2 + coords[2] * p3
146
+
147
@wp.func
def cell_deformation_gradient(args: CellArg, s: Sample):
    """Deformation gradient stored for the tet containing sample ``s``."""
    cell_index = s.element_index
    return args.deformation_gradients[cell_index]
150
+
151
@wp.func
def cell_inverse_deformation_gradient(args: CellArg, s: Sample):
    """Inverse of the deformation gradient stored for the tet containing sample ``s``."""
    grad = args.deformation_gradients[s.element_index]
    return wp.inverse(grad)
154
+
155
@wp.func
def _project_on_tet(args: CellArg, pos: wp.vec3, tet_index: int):
    """Project ``pos`` onto tet ``tet_index``; returns the (distance, coordinates) pair
    produced by ``project_on_tet_at_origin``."""
    origin = args.positions[args.tet_vertex_indices[tet_index, 0]]
    p1 = args.positions[args.tet_vertex_indices[tet_index, 1]]
    p2 = args.positions[args.tet_vertex_indices[tet_index, 2]]
    p3 = args.positions[args.tet_vertex_indices[tet_index, 3]]

    # Express the query point and the three edges relative to vertex 0
    rel_pos = pos - origin
    edge1 = p1 - origin
    edge2 = p2 - origin
    edge3 = p3 - origin

    dist, coords = project_on_tet_at_origin(rel_pos, edge1, edge2, edge3)
    return dist, coords
166
+
167
@wp.func
def cell_lookup(args: CellArg, pos: wp.vec3, guess: Sample):
    """Find the tet closest to ``pos`` among the tets sharing a vertex with the guess element.

    Returns a free sample for the best candidate. If no candidate projects within the
    initial distance bound, the sample keeps ``NULL_ELEMENT_INDEX`` and ``OUTSIDE`` coords.
    """
    closest_tet = int(NULL_ELEMENT_INDEX)
    closest_coords = Coords(OUTSIDE)
    # initial search bound; candidates farther than this are never accepted
    closest_dist = float(1.0e8)

    # visit the four vertices of the guess tet
    for v in range(4):
        vtx = args.tet_vertex_indices[guess.element_index, v]
        # range of tets adjacent to this vertex in the flattened adjacency list
        tet_beg = args.vertex_tet_offsets[vtx]
        tet_end = args.vertex_tet_offsets[vtx + 1]

        for t in range(tet_beg, tet_end):
            tet = args.vertex_tet_indices[t]
            dist, coords = Tetmesh._project_on_tet(args, pos, tet)
            # `<=` means that on equal distance the candidate visited last wins
            if dist <= closest_dist:
                closest_dist = dist
                closest_tet = tet
                closest_coords = coords

    return make_free_sample(closest_tet, closest_coords)
187
+
188
@wp.func
def cell_measure(args: CellArg, s: Sample):
    """Measure of the tet containing ``s``: |det(deformation gradient)| / 6."""
    grad = args.deformation_gradients[s.element_index]
    return wp.abs(wp.determinant(grad)) / 6.0
191
+
192
@wp.func
def cell_measure_ratio(args: CellArg, s: Sample):
    """Measure ratio for cells; constant 1.0 for this geometry."""
    ratio = 1.0
    return ratio
195
+
196
@wp.func
def cell_normal(args: CellArg, s: Sample):
    """Cell normal; always the zero vector for this geometry."""
    zero_normal = wp.vec3(0.0)
    return zero_normal
199
+
200
@cached_arg_value
def side_index_arg_value(self, device) -> SideIndexArg:
    """Fill a ``SideIndexArg`` struct with the boundary face indices passed through ``.to(device)``."""
    index_arg = self.SideIndexArg()
    index_arg.boundary_face_indices = self._boundary_face_indices.to(device)
    return index_arg
207
+
208
@wp.func
def boundary_side_index(args: SideIndexArg, boundary_side_index: int):
    """Convert an index into the boundary side list to an index into the full side list"""

    side_index = args.boundary_face_indices[boundary_side_index]
    return side_index
213
+
214
@cached_arg_value
def side_arg_value(self, device) -> SideArg:
    """Fill a ``SideArg`` struct with this mesh's side arrays, each passed through ``.to(device)``.

    The embedded cell arguments are obtained from ``cell_arg_value(device)``.
    """
    # NOTE: the return annotation is ``SideArg`` (it was ``CellArg``), matching the
    # struct that is actually constructed and returned here.
    args = self.SideArg()

    args.cell_arg = self.cell_arg_value(device)
    args.face_vertex_indices = self._face_vertex_indices.to(device)
    args.face_tet_indices = self._face_tet_indices.to(device)

    return args
223
+
224
@wp.func
def side_position(args: SideArg, s: Sample):
    """Position of sample ``s`` on its face, interpolated from the three face vertices."""
    vtx = args.face_vertex_indices[s.element_index]
    coords = s.element_coords

    p0 = args.cell_arg.positions[vtx[0]]
    p1 = args.cell_arg.positions[vtx[1]]
    p2 = args.cell_arg.positions[vtx[2]]

    return coords[0] * p0 + coords[1] * p1 + coords[2] * p2
232
+
233
@wp.func
def _side_vecs(args: SideArg, side_index: ElementIndex):
    """Return the two edge vectors of face ``side_index`` that start at its first vertex."""
    vtx = args.face_vertex_indices[side_index]

    origin = args.cell_arg.positions[vtx[0]]
    edge_a = args.cell_arg.positions[vtx[1]] - origin
    edge_b = args.cell_arg.positions[vtx[2]] - origin

    return edge_a, edge_b
241
+
242
@wp.func
def side_deformation_gradient(args: SideArg, s: Sample):
    """3x2 deformation gradient of the face containing ``s``, built from its two edge vectors."""
    edge_a, edge_b = Tetmesh._side_vecs(args, s.element_index)
    return _mat32(edge_a, edge_b)
246
+
247
@wp.func
def side_inner_inverse_deformation_gradient(args: SideArg, s: Sample):
    """Inverse deformation gradient of the inner tet adjacent to the face containing ``s``."""
    inner_cell = Tetmesh.side_inner_cell_index(args, s.element_index)
    inner_grad = args.cell_arg.deformation_gradients[inner_cell]
    return wp.inverse(inner_grad)
251
+
252
@wp.func
def side_outer_inverse_deformation_gradient(args: SideArg, s: Sample):
    """Inverse deformation gradient of the outer tet adjacent to the face containing ``s``."""
    outer_cell = Tetmesh.side_outer_cell_index(args, s.element_index)
    outer_grad = args.cell_arg.deformation_gradients[outer_cell]
    return wp.inverse(outer_grad)
256
+
257
@wp.func
def side_measure(args: SideArg, s: Sample):
    """Area of the face containing ``s``: half the norm of the cross product of its edge vectors."""
    edge_a, edge_b = Tetmesh._side_vecs(args, s.element_index)
    area_vec = wp.cross(edge_a, edge_b)
    return 0.5 * wp.length(area_vec)
261
+
262
@wp.func
def side_measure_ratio(args: SideArg, s: Sample):
    """Face measure divided by the smaller of the measures of its two adjacent tets."""
    inner_cell = Tetmesh.side_inner_cell_index(args, s.element_index)
    outer_cell = Tetmesh.side_outer_cell_index(args, s.element_index)

    face_measure = Tetmesh.side_measure(args, s)

    # The cell measure does not depend on coordinates, so default coords are enough
    inner_measure = Tetmesh.cell_measure(args.cell_arg, make_free_sample(inner_cell, Coords()))
    outer_measure = Tetmesh.cell_measure(args.cell_arg, make_free_sample(outer_cell, Coords()))

    return face_measure / wp.min(inner_measure, outer_measure)
270
+
271
@wp.func
def side_normal(args: SideArg, s: Sample):
    """Unit normal of the face containing ``s``: normalized cross product of its edge vectors."""
    edge_a, edge_b = Tetmesh._side_vecs(args, s.element_index)
    unnormalized = wp.cross(edge_a, edge_b)
    return wp.normalize(unnormalized)
275
+
276
@wp.func
def side_inner_cell_index(arg: SideArg, side_index: ElementIndex):
    """Index of the inner tet of face ``side_index`` (component 0 of ``face_tet_indices``)."""
    adjacent_tets = arg.face_tet_indices[side_index]
    return adjacent_tets[0]
279
+
280
@wp.func
def side_outer_cell_index(arg: SideArg, side_index: ElementIndex):
    """Index of the outer tet of face ``side_index`` (component 1 of ``face_tet_indices``)."""
    adjacent_tets = arg.face_tet_indices[side_index]
    return adjacent_tets[1]
283
+
284
@wp.func
def face_to_tet_coords(args: SideArg, side_index: ElementIndex, tet_index: ElementIndex, side_coords: Coords):
    """Convert coordinates on face ``side_index`` to coordinates in tet ``tet_index``.

    Each face vertex is matched by index against tet vertices 1, 2 and 3, and its face
    coordinate is copied to the matching tet coordinate. A face vertex that matches none
    of them (e.g. tet vertex 0) contributes to no explicit coordinate.
    """
    fvi = args.face_vertex_indices[side_index]

    # tet vertex 0 is not fetched: its weight is implicit in the returned coords
    tv1 = args.cell_arg.tet_vertex_indices[tet_index, 1]
    tv2 = args.cell_arg.tet_vertex_indices[tet_index, 2]
    tv3 = args.cell_arg.tet_vertex_indices[tet_index, 3]

    # coordinates default to zero for tet vertices that are not on the face
    c1 = float(0.0)
    c2 = float(0.0)
    c3 = float(0.0)

    for k in range(3):
        if tv1 == fvi[k]:
            c1 = side_coords[k]
        elif tv2 == fvi[k]:
            c2 = side_coords[k]
        elif tv3 == fvi[k]:
            c3 = side_coords[k]

    return Coords(c1, c2, c3)
305
+
306
@wp.func
def side_inner_cell_coords(args: SideArg, side_index: ElementIndex, side_coords: Coords):
    """Coordinates of a face point expressed in the inner tet adjacent to the face."""
    inner_cell = Tetmesh.side_inner_cell_index(args, side_index)
    inner_coords = Tetmesh.face_to_tet_coords(args, side_index, inner_cell, side_coords)
    return inner_coords
310
+
311
@wp.func
def side_outer_cell_coords(args: SideArg, side_index: ElementIndex, side_coords: Coords):
    """Coordinates of a face point expressed in the outer tet adjacent to the face."""
    outer_cell = Tetmesh.side_outer_cell_index(args, side_index)
    outer_coords = Tetmesh.face_to_tet_coords(args, side_index, outer_cell, side_coords)
    return outer_coords
315
+
316
@wp.func
def side_from_cell_coords(args: SideArg, side_index: ElementIndex, tet_index: ElementIndex, tet_coords: Coords):
    """Convert coordinates in tet ``tet_index`` to coordinates on face ``side_index``.

    For each of the three face vertices, the weight of the matching tet vertex is picked:
    tet vertices 1, 2, 3 map to ``tet_coords[0..2]``; any other face vertex gets the
    implicit weight ``1 - sum(tet_coords)`` (the weight of tet vertex 0).
    """
    fvi = args.face_vertex_indices[side_index]

    tv1 = args.cell_arg.tet_vertex_indices[tet_index, 1]
    tv2 = args.cell_arg.tet_vertex_indices[tet_index, 2]
    tv3 = args.cell_arg.tet_vertex_indices[tet_index, 3]

    # weight of the first face vertex
    if tv1 == fvi[0]:
        c0 = tet_coords[0]
    elif tv2 == fvi[0]:
        c0 = tet_coords[1]
    elif tv3 == fvi[0]:
        c0 = tet_coords[2]
    else:
        c0 = 1.0 - tet_coords[0] - tet_coords[1] - tet_coords[2]

    # weight of the second face vertex
    if tv1 == fvi[1]:
        c1 = tet_coords[0]
    elif tv2 == fvi[1]:
        c1 = tet_coords[1]
    elif tv3 == fvi[1]:
        c1 = tet_coords[2]
    else:
        c1 = 1.0 - tet_coords[0] - tet_coords[1] - tet_coords[2]

    # weight of the third face vertex
    if tv1 == fvi[2]:
        c2 = tet_coords[0]
    elif tv2 == fvi[2]:
        c2 = tet_coords[1]
    elif tv3 == fvi[2]:
        c2 = tet_coords[2]
    else:
        c2 = 1.0 - tet_coords[0] - tet_coords[1] - tet_coords[2]

    # NOTE(review): assuming Warp's `wp.select(cond, value_if_false, value_if_true)` argument
    # order, the face coords are returned only when the three weights sum to (almost) one,
    # i.e. the point lies on this face; otherwise OUTSIDE is returned -- confirm against docs
    return wp.select(c0 + c1 + c2 > 0.999, Coords(OUTSIDE), Coords(c0, c1, c2))
352
+
353
@wp.func
def side_to_cell_arg(side_arg: SideArg):
    """Extract the cell arguments embedded in the side arguments."""
    cell_arg = side_arg.cell_arg
    return cell_arg
356
+
357
def _build_topology(self, temporary_store: TemporaryStore):
    """Build the mesh connectivity arrays from ``tet_vertex_indices``.

    Populates ``_vertex_tet_offsets`` / ``_vertex_tet_indices``, ``_face_vertex_indices``,
    ``_face_tet_indices`` and ``_boundary_face_indices``.

    Args:
        temporary_store: pool from which the intermediate arrays are borrowed
    """
    from warp.fem.utils import compress_node_indices, masked_indices
    from warp.utils import array_scan

    device = self.tet_vertex_indices.device

    # Vertex-to-tet adjacency as an offsets/indices pair (consumed by `cell_lookup`)
    vertex_tet_offsets, vertex_tet_indices, _, __ = compress_node_indices(
        self.vertex_count(), self.tet_vertex_indices, temporary_store=temporary_store
    )
    self._vertex_tet_offsets = vertex_tet_offsets.detach()
    self._vertex_tet_indices = vertex_tet_indices.detach()

    vertex_start_face_count = borrow_temporary(temporary_store, dtype=int, device=device, shape=self.vertex_count())
    vertex_start_face_count.array.zero_()
    vertex_start_face_offsets = borrow_temporary_like(vertex_start_face_count, temporary_store=temporary_store)

    # Scratch storage sized for the non-deduplicated faces: 4 per tet
    vertex_face_other_vs = borrow_temporary(
        temporary_store, dtype=wp.vec2i, device=device, shape=(4 * self.cell_count())
    )
    vertex_face_tets = borrow_temporary(temporary_store, dtype=int, device=device, shape=(4 * self.cell_count(), 2))

    # Count faces starting at each vertex
    wp.launch(
        kernel=Tetmesh._count_starting_faces_kernel,
        device=device,
        dim=self.cell_count(),
        inputs=[self.tet_vertex_indices, vertex_start_face_count.array],
    )

    # Exclusive prefix sum: start offset of each vertex's faces in the scratch arrays
    array_scan(in_array=vertex_start_face_count.array, out_array=vertex_start_face_offsets.array, inclusive=False)

    # Count number of unique faces (deduplicate across tets)
    # NOTE: this is an alias, the count array is reused (presumably overwritten in place by the kernel)
    vertex_unique_face_count = vertex_start_face_count
    wp.launch(
        kernel=Tetmesh._count_unique_starting_faces_kernel,
        device=device,
        dim=self.vertex_count(),
        inputs=[
            self._vertex_tet_offsets,
            self._vertex_tet_indices,
            self.tet_vertex_indices,
            vertex_start_face_offsets.array,
            vertex_unique_face_count.array,
            vertex_face_other_vs.array,
            vertex_face_tets.array,
        ],
    )

    # Exclusive prefix sum of the (aliased) unique counts
    vertex_unique_face_offsets = borrow_temporary_like(vertex_start_face_offsets, temporary_store=temporary_store)
    array_scan(in_array=vertex_start_face_count.array, out_array=vertex_unique_face_offsets.array, inclusive=False)

    # Get back face count to host
    if device.is_cuda:
        face_count = borrow_temporary(temporary_store, shape=(1,), dtype=int, device="cpu", pinned=True)
        # Last vertex will not own any face, so its count will be zero; just fetching last prefix count is ok
        # (relies on the counting kernels never assigning a face to the last vertex -- TODO confirm)
        wp.copy(
            dest=face_count.array, src=vertex_unique_face_offsets.array, src_offset=self.vertex_count() - 1, count=1
        )
        # wait for the copy before reading the value on the host
        wp.synchronize_stream(wp.get_stream(device))
        face_count = int(face_count.array.numpy()[0])
    else:
        face_count = int(vertex_unique_face_offsets.array.numpy()[self.vertex_count() - 1])

    self._face_vertex_indices = wp.empty(shape=(face_count,), dtype=wp.vec3i, device=device)
    self._face_tet_indices = wp.empty(shape=(face_count,), dtype=wp.vec2i, device=device)

    boundary_mask = borrow_temporary(temporary_store, shape=(face_count,), dtype=int, device=device)

    # Compress face data
    wp.launch(
        kernel=Tetmesh._compress_faces_kernel,
        device=device,
        dim=self.vertex_count(),
        inputs=[
            vertex_start_face_offsets.array,
            vertex_unique_face_offsets.array,
            vertex_unique_face_count.array,
            vertex_face_other_vs.array,
            vertex_face_tets.array,
            self._face_vertex_indices,
            self._face_tet_indices,
            boundary_mask.array,
        ],
    )

    # Scratch arrays are no longer needed
    # (`vertex_unique_face_count` is the same temporary as `vertex_start_face_count`)
    vertex_start_face_offsets.release()
    vertex_unique_face_offsets.release()
    vertex_unique_face_count.release()
    vertex_face_other_vs.release()
    vertex_face_tets.release()

    # Flip normals if necessary
    wp.launch(
        kernel=Tetmesh._flip_face_normals,
        device=device,
        dim=self.side_count(),
        inputs=[self._face_vertex_indices, self._face_tet_indices, self.tet_vertex_indices, self.positions],
    )

    # Gather the indices of the faces flagged in the boundary mask
    boundary_face_indices, _ = masked_indices(boundary_mask.array)
    self._boundary_face_indices = boundary_face_indices.detach()
458
+
459
def _compute_tet_edges(self, temporary_store: Optional[TemporaryStore] = None):
    """Number the unique edges of the mesh and build the per-tet edge table.

    On return, ``self._edge_count`` holds the number of unique edges and
    ``self._tet_edge_indices`` is a ``(cell_count, 6)`` integer array
    filled by ``Tetmesh._compress_edges_kernel``.

    Each edge is attributed to its lowest-index endpoint (the kernels test
    ``v == wp.min(v0, v1)``), which lets every vertex deduplicate its own
    edges independently.

    Args:
        temporary_store: Store from which the scratch buffers are borrowed;
            passed through unchanged to ``borrow_temporary``.
    """
    from warp.utils import array_scan

    device = self.tet_vertex_indices.device
    vertex_count = self.vertex_count()
    cell_count = self.cell_count()

    vertex_start_edge_count = borrow_temporary(temporary_store, dtype=int, device=device, shape=vertex_count)
    vertex_start_edge_count.array.zero_()
    vertex_start_edge_offsets = borrow_temporary_like(vertex_start_edge_count, temporary_store=temporary_store)

    # A tet has 6 edges, so 6 * cell_count slots bound the non-deduplicated edge list
    vertex_edge_ends = borrow_temporary(temporary_store, dtype=int, device=device, shape=(6 * cell_count))

    # Count tet edges starting at each vertex (with duplicates across tets)
    wp.launch(
        kernel=Tetmesh._count_starting_edges_kernel,
        device=device,
        dim=cell_count,
        inputs=[self.tet_vertex_indices, vertex_start_edge_count.array],
    )

    array_scan(in_array=vertex_start_edge_count.array, out_array=vertex_start_edge_offsets.array, inclusive=False)

    # Count number of unique edges (deduplicate across tets).
    # The kernel overwrites the per-vertex counts in place, hence the alias.
    vertex_unique_edge_count = vertex_start_edge_count
    wp.launch(
        kernel=Tetmesh._count_unique_starting_edges_kernel,
        device=device,
        dim=vertex_count,
        inputs=[
            self._vertex_tet_offsets,
            self._vertex_tet_indices,
            self.tet_vertex_indices,
            vertex_start_edge_offsets.array,
            vertex_unique_edge_count.array,
            vertex_edge_ends.array,
        ],
    )

    vertex_unique_edge_offsets = borrow_temporary_like(vertex_start_edge_offsets, temporary_store=temporary_store)
    array_scan(in_array=vertex_unique_edge_count.array, out_array=vertex_unique_edge_offsets.array, inclusive=False)

    # Get back edge count to host.
    # The last vertex cannot be the lowest endpoint of any edge, so its count is zero and
    # the last entry of the exclusive scan is already the total number of unique edges.
    if device.is_cuda:
        edge_count = borrow_temporary(temporary_store, shape=(1,), dtype=int, device="cpu", pinned=True)
        wp.copy(
            dest=edge_count.array,
            src=vertex_unique_edge_offsets.array,
            src_offset=vertex_count - 1,
            count=1,
        )
        # The value is read on the host right after, so wait for the copy to finish
        wp.synchronize_stream(wp.get_stream(device))
        self._edge_count = int(edge_count.array.numpy()[0])
        # Release the staging buffer explicitly, like every other temporary of this method
        edge_count.release()
    else:
        self._edge_count = int(vertex_unique_edge_offsets.array.numpy()[vertex_count - 1])

    self._tet_edge_indices = wp.empty(dtype=int, device=device, shape=(cell_count, 6))

    # Compress edge data
    wp.launch(
        kernel=Tetmesh._compress_edges_kernel,
        device=device,
        dim=vertex_count,
        inputs=[
            self._vertex_tet_offsets,
            self._vertex_tet_indices,
            self.tet_vertex_indices,
            vertex_start_edge_offsets.array,
            vertex_unique_edge_offsets.array,
            vertex_unique_edge_count.array,
            vertex_edge_ends.array,
            self._tet_edge_indices,
        ],
    )

    # vertex_start_edge_count is the same object as vertex_unique_edge_count
    vertex_start_edge_offsets.release()
    vertex_unique_edge_offsets.release()
    vertex_unique_edge_count.release()
    vertex_edge_ends.release()
541
+
542
def _compute_deformation_gradients(self):
    """Allocate ``self._deformation_gradients`` and fill it with one 3x3 matrix per cell.

    The array lives on the device of ``self.positions`` and is populated by
    ``Tetmesh._compute_deformation_gradients_kernel``.
    """
    gradients = wp.empty(dtype=wp.mat33f, device=self.positions.device, shape=(self.cell_count()))
    self._deformation_gradients = gradients

    # One thread per entry of the freshly allocated array
    wp.launch(
        kernel=Tetmesh._compute_deformation_gradients_kernel,
        dim=gradients.shape,
        device=gradients.device,
        inputs=[self.tet_vertex_indices, self.positions, gradients],
    )
551
+
552
@wp.kernel
def _count_starting_faces_kernel(
    tet_vertex_indices: wp.array2d(dtype=int), vertex_start_face_count: wp.array(dtype=int)
):
    # One thread per tet. For each of the four vertex triples (k, k+1, k+2) mod 4,
    # increment the counter of the triple's lowest vertex index, once per corner
    # that equals that lowest index.
    tet = wp.tid()
    for k in range(4):
        a = tet_vertex_indices[tet, k]
        b = tet_vertex_indices[tet, (k + 1) % 4]
        c = tet_vertex_indices[tet, (k + 2) % 4]
        lowest = wp.min(wp.vec3i(a, b, c))

        if lowest == a:
            wp.atomic_add(vertex_start_face_count, lowest, 1)
        if lowest == b:
            wp.atomic_add(vertex_start_face_count, lowest, 1)
        if lowest == c:
            wp.atomic_add(vertex_start_face_count, lowest, 1)
566
+
567
@wp.func
def _find_face(
    needle: wp.vec2i,
    values: wp.array(dtype=wp.vec2i),
    beg: int,
    end: int,
):
    # Linear search of values[beg:end] for needle.
    # Returns the index of the first match, or -1 when there is none.
    for slot in range(beg, end):
        if values[slot] == needle:
            return slot

    return -1
579
+
580
@wp.kernel
def _count_unique_starting_faces_kernel(
    vertex_tet_offsets: wp.array(dtype=int),
    vertex_tet_indices: wp.array(dtype=int),
    tet_vertex_indices: wp.array2d(dtype=int),
    vertex_start_face_offsets: wp.array(dtype=int),
    vertex_start_face_count: wp.array(dtype=int),
    face_other_vs: wp.array(dtype=wp.vec2i),
    face_tets: wp.array2d(dtype=int),
):
    # One thread per vertex. Walks the tets listed for this vertex and records, in the
    # slot range starting at vertex_start_face_offsets[vertex], each distinct face whose
    # lowest vertex index is this vertex. A face is keyed by its (middle, highest) indices.
    vertex = wp.tid()

    first_slot = vertex_start_face_offsets[vertex]
    next_slot = first_slot

    first_entry = vertex_tet_offsets[vertex]
    last_entry = vertex_tet_offsets[vertex + 1]

    for entry in range(first_entry, last_entry):
        tet = vertex_tet_indices[entry]

        for k in range(4):
            tri = wp.vec3i(
                tet_vertex_indices[tet, k],
                tet_vertex_indices[tet, (k + 1) % 4],
                tet_vertex_indices[tet, (k + 2) % 4],
            )
            lowest = wp.min(tri)

            if vertex == lowest:
                highest = wp.max(tri)
                # The remaining index is what is left of the sum once both extremes are removed
                middle = tri[0] + tri[1] + tri[2] - lowest - highest
                key = wp.vec2i(middle, highest)

                # Has this face already been recorded for this vertex?
                hit = Tetmesh._find_face(key, face_other_vs, first_slot, next_slot)

                if hit != -1:
                    # Second sighting: remember the other adjacent tet
                    face_tets[hit, 1] = tet
                else:
                    # First sighting: both tet entries start out equal
                    face_other_vs[next_slot] = key
                    face_tets[next_slot, 0] = tet
                    face_tets[next_slot, 1] = tet
                    next_slot += 1

    # Overwrite the raw count with the number of distinct faces found
    vertex_start_face_count[vertex] = next_slot - first_slot
625
+
626
@wp.kernel
def _compress_faces_kernel(
    vertex_start_face_offsets: wp.array(dtype=int),
    vertex_unique_face_offsets: wp.array(dtype=int),
    vertex_unique_face_count: wp.array(dtype=int),
    uncompressed_face_other_vs: wp.array(dtype=wp.vec2i),
    uncompressed_face_tets: wp.array2d(dtype=int),
    face_vertex_indices: wp.array(dtype=wp.vec3i),
    face_tet_indices: wp.array(dtype=wp.vec2i),
    boundary_mask: wp.array(dtype=int),
):
    # One thread per vertex. Copies this vertex's faces from the uncompressed arrays to
    # their final positions and flags faces whose two tet entries are equal.
    vertex = wp.tid()

    src_base = vertex_start_face_offsets[vertex]
    dst_base = vertex_unique_face_offsets[vertex]
    face_total = vertex_unique_face_count[vertex]

    for local in range(face_total):
        src = src_base + local
        dst = dst_base + local

        others = uncompressed_face_other_vs[src]
        face_vertex_indices[dst] = wp.vec3i(vertex, others[0], others[1])

        first_tet = uncompressed_face_tets[src, 0]
        second_tet = uncompressed_face_tets[src, 1]
        face_tet_indices[dst] = wp.vec2i(first_tet, second_tet)

        # Mask is 1 when both entries name the same tet, 0 otherwise
        if first_tet != second_tet:
            boundary_mask[dst] = 0
        else:
            boundary_mask[dst] = 1
660
+
661
@wp.kernel
def _flip_face_normals(
    face_vertex_indices: wp.array(dtype=wp.vec3i),
    face_tet_indices: wp.array(dtype=wp.vec2i),
    tet_vertex_indices: wp.array2d(dtype=int),
    positions: wp.array(dtype=wp.vec3),
):
    # One thread per face. Swaps the last two vertex indices of a face whenever its
    # normal, cross(v1 - v0, v2 - v0), points toward the centroid of the face's first tet.
    side = wp.tid()

    corners = face_vertex_indices[side]
    v0 = positions[corners[0]]
    v1 = positions[corners[1]]
    v2 = positions[corners[2]]

    first_tet = face_tet_indices[side][0]
    tet_corners = tet_vertex_indices[first_tet]
    tet_centroid = (
        positions[tet_corners[0]]
        + positions[tet_corners[1]]
        + positions[tet_corners[2]]
        + positions[tet_corners[3]]
    ) / 4.0

    face_center = (v1 + v0 + v2) / 3.0
    normal = wp.cross(v1 - v0, v2 - v0)

    to_centroid = tet_centroid - face_center
    if wp.dot(to_centroid, normal) > 0.0:
        face_vertex_indices[side] = wp.vec3i(corners[0], corners[2], corners[1])
689
+
690
@wp.kernel
def _count_starting_edges_kernel(
    tri_vertex_indices: wp.array2d(dtype=int), vertex_start_edge_count: wp.array(dtype=int)
):
    # One thread per element. Each of the six edges of the four-vertex element adds one
    # to the counter of its lower-index endpoint.
    # NOTE(review): the array is indexed up to column 3, so despite its name
    # `tri_vertex_indices` holds four vertex indices per row.
    elem = wp.tid()

    # Edges among vertices 0, 1, 2
    for k in range(3):
        a = tri_vertex_indices[elem, k]
        b = tri_vertex_indices[elem, (k + 1) % 3]
        wp.atomic_add(vertex_start_edge_count, wp.min(a, b), 1)

    # Edges joining vertices 0, 1, 2 to vertex 3
    for k in range(3):
        a = tri_vertex_indices[elem, k]
        b = tri_vertex_indices[elem, 3]
        wp.atomic_add(vertex_start_edge_count, wp.min(a, b), 1)
712
+
713
@wp.func
def _find_edge(
    needle: int,
    values: wp.array(dtype=int),
    beg: int,
    end: int,
):
    # Linear search of values[beg:end] for needle.
    # Returns the index of the first match, or -1 when there is none.
    for slot in range(beg, end):
        if values[slot] == needle:
            return slot

    return -1
725
+
726
@wp.kernel
def _count_unique_starting_edges_kernel(
    vertex_tet_offsets: wp.array(dtype=int),
    vertex_tet_indices: wp.array(dtype=int),
    tet_vertex_indices: wp.array2d(dtype=int),
    vertex_start_edge_offsets: wp.array(dtype=int),
    vertex_start_edge_count: wp.array(dtype=int),
    edge_ends: wp.array(dtype=int),
):
    # One thread per vertex. Walks the tets listed for this vertex and stores, in the slot
    # range starting at vertex_start_edge_offsets[vertex], the distinct far endpoints of
    # the edges whose lower-index endpoint is this vertex.
    vertex = wp.tid()

    first_slot = vertex_start_edge_offsets[vertex]
    next_slot = first_slot

    first_entry = vertex_tet_offsets[vertex]
    last_entry = vertex_tet_offsets[vertex + 1]

    for entry in range(first_entry, last_entry):
        tet = vertex_tet_indices[entry]

        # Edges among vertices 0, 1, 2
        for k in range(3):
            a = tet_vertex_indices[tet, k]
            b = tet_vertex_indices[tet, (k + 1) % 3]

            if vertex == wp.min(a, b):
                far_end = wp.max(a, b)
                hit = Tetmesh._find_edge(far_end, edge_ends, first_slot, next_slot)
                if hit == -1:
                    edge_ends[next_slot] = far_end
                    next_slot += 1

        # Edges joining vertices 0, 1, 2 to vertex 3
        for k in range(3):
            a = tet_vertex_indices[tet, k]
            b = tet_vertex_indices[tet, 3]

            if vertex == wp.min(a, b):
                far_end = wp.max(a, b)
                hit = Tetmesh._find_edge(far_end, edge_ends, first_slot, next_slot)
                if hit == -1:
                    edge_ends[next_slot] = far_end
                    next_slot += 1

    # Overwrite the raw count with the number of distinct edges found
    vertex_start_edge_count[vertex] = next_slot - first_slot
768
+
769
@wp.kernel
def _compress_edges_kernel(
    vertex_tet_offsets: wp.array(dtype=int),
    vertex_tet_indices: wp.array(dtype=int),
    tet_vertex_indices: wp.array2d(dtype=int),
    vertex_start_edge_offsets: wp.array(dtype=int),
    vertex_unique_edge_offsets: wp.array(dtype=int),
    vertex_unique_edge_count: wp.array(dtype=int),
    uncompressed_edge_ends: wp.array(dtype=int),
    tet_edge_indices: wp.array2d(dtype=int),
):
    # One thread per vertex. For every tet listed for this vertex, each edge whose
    # lower-index endpoint is this vertex gets its final index written to tet_edge_indices:
    # columns 0..2 for edges among vertices 0, 1, 2 and columns 3..5 for edges to vertex 3.
    vertex = wp.tid()

    # This vertex's range in the uncompressed list, and where that range starts once compressed
    src_beg = vertex_start_edge_offsets[vertex]
    src_end = src_beg + vertex_unique_edge_count[vertex]
    dst_beg = vertex_unique_edge_offsets[vertex]

    first_entry = vertex_tet_offsets[vertex]
    last_entry = vertex_tet_offsets[vertex + 1]

    for entry in range(first_entry, last_entry):
        tet = vertex_tet_indices[entry]

        for k in range(3):
            a = tet_vertex_indices[tet, k]
            b = tet_vertex_indices[tet, (k + 1) % 3]

            if vertex == wp.min(a, b):
                slot = Tetmesh._find_edge(wp.max(a, b), uncompressed_edge_ends, src_beg, src_end)
                # Shift the uncompressed position into the compressed numbering
                tet_edge_indices[tet, k] = slot - src_beg + dst_beg

        for k in range(3):
            a = tet_vertex_indices[tet, k]
            b = tet_vertex_indices[tet, 3]

            if vertex == wp.min(a, b):
                slot = Tetmesh._find_edge(wp.max(a, b), uncompressed_edge_ends, src_beg, src_end)
                tet_edge_indices[tet, k + 3] = slot - src_beg + dst_beg
822
+
823
@wp.kernel
def _compute_deformation_gradients_kernel(
    tet_vertex_indices: wp.array2d(dtype=int),
    positions: wp.array(dtype=wp.vec3f),
    transforms: wp.array(dtype=wp.mat33f),
):
    # One thread per tet. Stores the 3x3 matrix built by wp.mat33 from the three edge
    # vectors going from the tet's vertex 0 to its vertices 1, 2 and 3.
    cell = wp.tid()

    origin = positions[tet_vertex_indices[cell, 0]]

    edge_1 = positions[tet_vertex_indices[cell, 1]] - origin
    edge_2 = positions[tet_vertex_indices[cell, 2]] - origin
    edge_3 = positions[tet_vertex_indices[cell, 3]] - origin

    transforms[cell] = wp.mat33(edge_1, edge_2, edge_3)