warp-lang 0.10.1__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (300) hide show
  1. warp/__init__.py +10 -4
  2. warp/__init__.pyi +1 -0
  3. warp/bin/warp-clang.dll +0 -0
  4. warp/bin/warp.dll +0 -0
  5. warp/build.py +5 -3
  6. warp/build_dll.py +29 -9
  7. warp/builtins.py +868 -507
  8. warp/codegen.py +1074 -638
  9. warp/config.py +3 -3
  10. warp/constants.py +6 -0
  11. warp/context.py +715 -222
  12. warp/fabric.py +326 -0
  13. warp/fem/__init__.py +27 -0
  14. warp/fem/cache.py +389 -0
  15. warp/fem/dirichlet.py +181 -0
  16. warp/fem/domain.py +263 -0
  17. warp/fem/field/__init__.py +101 -0
  18. warp/fem/field/field.py +149 -0
  19. warp/fem/field/nodal_field.py +299 -0
  20. warp/fem/field/restriction.py +21 -0
  21. warp/fem/field/test.py +181 -0
  22. warp/fem/field/trial.py +183 -0
  23. warp/fem/geometry/__init__.py +19 -0
  24. warp/fem/geometry/closest_point.py +70 -0
  25. warp/fem/geometry/deformed_geometry.py +271 -0
  26. warp/fem/geometry/element.py +744 -0
  27. warp/fem/geometry/geometry.py +186 -0
  28. warp/fem/geometry/grid_2d.py +373 -0
  29. warp/fem/geometry/grid_3d.py +435 -0
  30. warp/fem/geometry/hexmesh.py +953 -0
  31. warp/fem/geometry/partition.py +376 -0
  32. warp/fem/geometry/quadmesh_2d.py +532 -0
  33. warp/fem/geometry/tetmesh.py +840 -0
  34. warp/fem/geometry/trimesh_2d.py +577 -0
  35. warp/fem/integrate.py +1616 -0
  36. warp/fem/operator.py +191 -0
  37. warp/fem/polynomial.py +213 -0
  38. warp/fem/quadrature/__init__.py +2 -0
  39. warp/fem/quadrature/pic_quadrature.py +245 -0
  40. warp/fem/quadrature/quadrature.py +294 -0
  41. warp/fem/space/__init__.py +292 -0
  42. warp/fem/space/basis_space.py +489 -0
  43. warp/fem/space/collocated_function_space.py +105 -0
  44. warp/fem/space/dof_mapper.py +236 -0
  45. warp/fem/space/function_space.py +145 -0
  46. warp/fem/space/grid_2d_function_space.py +267 -0
  47. warp/fem/space/grid_3d_function_space.py +306 -0
  48. warp/fem/space/hexmesh_function_space.py +352 -0
  49. warp/fem/space/partition.py +350 -0
  50. warp/fem/space/quadmesh_2d_function_space.py +369 -0
  51. warp/fem/space/restriction.py +160 -0
  52. warp/fem/space/shape/__init__.py +15 -0
  53. warp/fem/space/shape/cube_shape_function.py +738 -0
  54. warp/fem/space/shape/shape_function.py +103 -0
  55. warp/fem/space/shape/square_shape_function.py +611 -0
  56. warp/fem/space/shape/tet_shape_function.py +567 -0
  57. warp/fem/space/shape/triangle_shape_function.py +429 -0
  58. warp/fem/space/tetmesh_function_space.py +292 -0
  59. warp/fem/space/topology.py +295 -0
  60. warp/fem/space/trimesh_2d_function_space.py +221 -0
  61. warp/fem/types.py +77 -0
  62. warp/fem/utils.py +495 -0
  63. warp/native/array.h +147 -44
  64. warp/native/builtin.h +122 -149
  65. warp/native/bvh.cpp +73 -325
  66. warp/native/bvh.cu +406 -23
  67. warp/native/bvh.h +34 -43
  68. warp/native/clang/clang.cpp +13 -8
  69. warp/native/crt.h +2 -0
  70. warp/native/cuda_crt.h +5 -0
  71. warp/native/cuda_util.cpp +15 -3
  72. warp/native/cuda_util.h +3 -1
  73. warp/native/cutlass/tools/library/scripts/conv2d_operation.py +463 -0
  74. warp/native/cutlass/tools/library/scripts/conv3d_operation.py +321 -0
  75. warp/native/cutlass/tools/library/scripts/gemm_operation.py +988 -0
  76. warp/native/cutlass/tools/library/scripts/generator.py +4625 -0
  77. warp/native/cutlass/tools/library/scripts/library.py +799 -0
  78. warp/native/cutlass/tools/library/scripts/manifest.py +402 -0
  79. warp/native/cutlass/tools/library/scripts/pycutlass/docs/source/conf.py +96 -0
  80. warp/native/cutlass/tools/library/scripts/pycutlass/profile/conv/conv2d_f16_sm80.py +106 -0
  81. warp/native/cutlass/tools/library/scripts/pycutlass/profile/gemm/gemm_f32_sm80.py +91 -0
  82. warp/native/cutlass/tools/library/scripts/pycutlass/setup.py +80 -0
  83. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/__init__.py +48 -0
  84. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/arguments.py +118 -0
  85. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/c_types.py +241 -0
  86. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/compiler.py +432 -0
  87. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/conv2d_operation.py +631 -0
  88. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/epilogue.py +1026 -0
  89. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/frontend.py +104 -0
  90. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/gemm_operation.py +1276 -0
  91. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/library.py +744 -0
  92. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/memory_manager.py +74 -0
  93. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/operation.py +110 -0
  94. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/parser.py +619 -0
  95. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/reduction_operation.py +398 -0
  96. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/tensor_ref.py +70 -0
  97. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/__init__.py +4 -0
  98. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/conv2d_testbed.py +646 -0
  99. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_grouped_testbed.py +235 -0
  100. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_testbed.py +557 -0
  101. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/profiler.py +70 -0
  102. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/type_hint.py +39 -0
  103. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/__init__.py +1 -0
  104. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/device.py +76 -0
  105. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/reference_model.py +255 -0
  106. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/__init__.py +0 -0
  107. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +201 -0
  108. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +177 -0
  109. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +98 -0
  110. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +95 -0
  111. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_few_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +163 -0
  112. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_fixed_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +187 -0
  113. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +309 -0
  114. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +54 -0
  115. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  116. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  117. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +253 -0
  118. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +97 -0
  119. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +242 -0
  120. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  121. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  122. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/run_all_tests.py +10 -0
  123. warp/native/cutlass/tools/library/scripts/pycutlass/test/frontend/test_frontend.py +146 -0
  124. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/__init__.py +0 -0
  125. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_bf16_sm80.py +96 -0
  126. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f16_sm80.py +447 -0
  127. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f32_sm80.py +146 -0
  128. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f64_sm80.py +102 -0
  129. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_grouped_sm80.py +203 -0
  130. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_s8_sm80.py +229 -0
  131. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/run_all_tests.py +9 -0
  132. warp/native/cutlass/tools/library/scripts/pycutlass/test/unit/test_sm80.py +453 -0
  133. warp/native/cutlass/tools/library/scripts/rank_2k_operation.py +398 -0
  134. warp/native/cutlass/tools/library/scripts/rank_k_operation.py +387 -0
  135. warp/native/cutlass/tools/library/scripts/rt.py +796 -0
  136. warp/native/cutlass/tools/library/scripts/symm_operation.py +400 -0
  137. warp/native/cutlass/tools/library/scripts/trmm_operation.py +407 -0
  138. warp/native/cutlass_gemm.cu +5 -3
  139. warp/native/exports.h +1240 -952
  140. warp/native/fabric.h +228 -0
  141. warp/native/hashgrid.cpp +4 -4
  142. warp/native/hashgrid.h +22 -2
  143. warp/native/intersect.h +22 -7
  144. warp/native/intersect_adj.h +8 -8
  145. warp/native/intersect_tri.h +1 -1
  146. warp/native/marching.cu +157 -161
  147. warp/native/mat.h +80 -19
  148. warp/native/matnn.h +2 -2
  149. warp/native/mesh.cpp +33 -108
  150. warp/native/mesh.cu +114 -23
  151. warp/native/mesh.h +446 -46
  152. warp/native/noise.h +272 -329
  153. warp/native/quat.h +51 -8
  154. warp/native/rand.h +45 -35
  155. warp/native/range.h +6 -2
  156. warp/native/reduce.cpp +1 -1
  157. warp/native/reduce.cu +10 -12
  158. warp/native/runlength_encode.cu +6 -10
  159. warp/native/scan.cu +8 -11
  160. warp/native/sparse.cpp +4 -4
  161. warp/native/sparse.cu +164 -154
  162. warp/native/spatial.h +2 -2
  163. warp/native/temp_buffer.h +14 -30
  164. warp/native/vec.h +107 -23
  165. warp/native/volume.h +120 -0
  166. warp/native/warp.cpp +560 -30
  167. warp/native/warp.cu +431 -44
  168. warp/native/warp.h +13 -4
  169. warp/optim/__init__.py +1 -0
  170. warp/optim/linear.py +922 -0
  171. warp/optim/sgd.py +92 -0
  172. warp/render/render_opengl.py +335 -119
  173. warp/render/render_usd.py +11 -11
  174. warp/sim/__init__.py +2 -2
  175. warp/sim/articulation.py +385 -185
  176. warp/sim/collide.py +8 -0
  177. warp/sim/import_mjcf.py +297 -106
  178. warp/sim/import_urdf.py +389 -210
  179. warp/sim/import_usd.py +198 -97
  180. warp/sim/inertia.py +17 -18
  181. warp/sim/integrator_euler.py +14 -8
  182. warp/sim/integrator_xpbd.py +158 -16
  183. warp/sim/model.py +795 -291
  184. warp/sim/render.py +3 -3
  185. warp/sim/utils.py +3 -0
  186. warp/sparse.py +640 -150
  187. warp/stubs.py +606 -267
  188. warp/tape.py +61 -10
  189. warp/tests/__main__.py +3 -6
  190. warp/tests/assets/curlnoise_golden.npy +0 -0
  191. warp/tests/assets/pnoise_golden.npy +0 -0
  192. warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
  193. warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
  194. warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
  195. warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
  196. warp/tests/aux_test_unresolved_func.py +14 -0
  197. warp/tests/aux_test_unresolved_symbol.py +14 -0
  198. warp/tests/disabled_kinematics.py +239 -0
  199. warp/tests/run_coverage_serial.py +31 -0
  200. warp/tests/test_adam.py +103 -106
  201. warp/tests/test_arithmetic.py +128 -74
  202. warp/tests/test_array.py +212 -97
  203. warp/tests/test_array_reduce.py +57 -23
  204. warp/tests/test_atomic.py +64 -28
  205. warp/tests/test_bool.py +99 -0
  206. warp/tests/test_builtins_resolution.py +1292 -0
  207. warp/tests/test_bvh.py +42 -18
  208. warp/tests/test_closest_point_edge_edge.py +54 -57
  209. warp/tests/test_codegen.py +208 -130
  210. warp/tests/test_compile_consts.py +28 -20
  211. warp/tests/test_conditional.py +108 -24
  212. warp/tests/test_copy.py +10 -12
  213. warp/tests/test_ctypes.py +112 -88
  214. warp/tests/test_dense.py +21 -14
  215. warp/tests/test_devices.py +98 -0
  216. warp/tests/test_dlpack.py +75 -75
  217. warp/tests/test_examples.py +277 -0
  218. warp/tests/test_fabricarray.py +955 -0
  219. warp/tests/test_fast_math.py +15 -11
  220. warp/tests/test_fem.py +1271 -0
  221. warp/tests/test_fp16.py +53 -19
  222. warp/tests/test_func.py +187 -86
  223. warp/tests/test_generics.py +194 -49
  224. warp/tests/test_grad.py +178 -109
  225. warp/tests/test_grad_customs.py +176 -0
  226. warp/tests/test_hash_grid.py +52 -37
  227. warp/tests/test_import.py +10 -23
  228. warp/tests/test_indexedarray.py +32 -31
  229. warp/tests/test_intersect.py +18 -9
  230. warp/tests/test_large.py +141 -0
  231. warp/tests/test_launch.py +14 -41
  232. warp/tests/test_lerp.py +64 -65
  233. warp/tests/test_linear_solvers.py +154 -0
  234. warp/tests/test_lvalue.py +493 -0
  235. warp/tests/test_marching_cubes.py +12 -13
  236. warp/tests/test_mat.py +517 -2898
  237. warp/tests/test_mat_lite.py +115 -0
  238. warp/tests/test_mat_scalar_ops.py +2889 -0
  239. warp/tests/test_math.py +103 -9
  240. warp/tests/test_matmul.py +305 -69
  241. warp/tests/test_matmul_lite.py +410 -0
  242. warp/tests/test_mesh.py +71 -14
  243. warp/tests/test_mesh_query_aabb.py +41 -25
  244. warp/tests/test_mesh_query_point.py +140 -22
  245. warp/tests/test_mesh_query_ray.py +39 -22
  246. warp/tests/test_mlp.py +30 -22
  247. warp/tests/test_model.py +92 -89
  248. warp/tests/test_modules_lite.py +39 -0
  249. warp/tests/test_multigpu.py +88 -114
  250. warp/tests/test_noise.py +12 -11
  251. warp/tests/test_operators.py +16 -20
  252. warp/tests/test_options.py +11 -11
  253. warp/tests/test_pinned.py +17 -18
  254. warp/tests/test_print.py +32 -11
  255. warp/tests/test_quat.py +275 -129
  256. warp/tests/test_rand.py +18 -16
  257. warp/tests/test_reload.py +38 -34
  258. warp/tests/test_rounding.py +50 -43
  259. warp/tests/test_runlength_encode.py +168 -20
  260. warp/tests/test_smoothstep.py +9 -11
  261. warp/tests/test_snippet.py +143 -0
  262. warp/tests/test_sparse.py +261 -63
  263. warp/tests/test_spatial.py +276 -243
  264. warp/tests/test_streams.py +110 -85
  265. warp/tests/test_struct.py +268 -63
  266. warp/tests/test_tape.py +39 -21
  267. warp/tests/test_torch.py +118 -89
  268. warp/tests/test_transient_module.py +12 -13
  269. warp/tests/test_types.py +614 -0
  270. warp/tests/test_utils.py +494 -0
  271. warp/tests/test_vec.py +354 -2050
  272. warp/tests/test_vec_lite.py +73 -0
  273. warp/tests/test_vec_scalar_ops.py +2099 -0
  274. warp/tests/test_volume.py +457 -293
  275. warp/tests/test_volume_write.py +124 -134
  276. warp/tests/unittest_serial.py +35 -0
  277. warp/tests/unittest_suites.py +341 -0
  278. warp/tests/unittest_utils.py +568 -0
  279. warp/tests/unused_test_misc.py +71 -0
  280. warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
  281. warp/thirdparty/appdirs.py +36 -45
  282. warp/thirdparty/unittest_parallel.py +549 -0
  283. warp/torch.py +9 -6
  284. warp/types.py +1089 -366
  285. warp/utils.py +93 -387
  286. warp_lang-0.11.0.dist-info/METADATA +238 -0
  287. warp_lang-0.11.0.dist-info/RECORD +332 -0
  288. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/WHEEL +1 -1
  289. warp/tests/test_all.py +0 -219
  290. warp/tests/test_array_scan.py +0 -60
  291. warp/tests/test_base.py +0 -208
  292. warp/tests/test_unresolved_func.py +0 -7
  293. warp/tests/test_unresolved_symbol.py +0 -7
  294. warp_lang-0.10.1.dist-info/METADATA +0 -21
  295. warp_lang-0.10.1.dist-info/RECORD +0 -188
  296. /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
  297. /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
  298. /warp/tests/{test_square.py → aux_test_square.py} +0 -0
  299. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/LICENSE.md +0 -0
  300. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,567 @@
1
+ import math
2
+
3
+ import warp as wp
4
+ import numpy as np
5
+
6
+ from warp.fem.types import Coords
7
+ from warp.fem import cache
8
+
9
+
10
def _tet_node_index(tx: int, ty: int, tz: int, degree: int):
    """Return the element-local index of the node at lattice position (tx, ty, tz).

    Numbering is hierarchical, in an order similar to e.g. VTK:

    * vertices first: (0, 0, 0) -> 0, (degree, 0, 0) -> 1, (0, degree, 0) -> 2,
      (0, 0, degree) -> 3;
    * then the ``degree - 1`` interior nodes of each of the six edges, in the edge
      order 0-1, 1-2, 2-0, 0-3, 1-3, 2-3;
    * then the interior nodes of each of the four faces, in the face order
      0-1-2, 1-2-3, 2-3-0, 3-0-1, each numbered by ``_triangle_node_index``
      on a triangle of degree ``degree - 3``;
    * finally the nodes strictly inside the tetrahedron, numbered by recursing
      on a tetrahedron of degree ``degree - 4``.

    Args:
        tx: Lattice coordinate along the 0-1 edge direction.
        ty: Lattice coordinate along the 0-2 edge direction.
        tz: Lattice coordinate along the 0-3 edge direction.
        degree: Polynomial degree of the element.

    Returns:
        The integer node index. Inputs are not validated; callers are expected
        to pass non-negative coordinates with ``tx + ty + tz <= degree``.
    """
    from .triangle_shape_function import _triangle_node_index

    vertex_count = 4
    nodes_per_edge = degree - 1
    nodes_per_face = (degree - 1) * (degree - 2) // 2
    first_face_node = vertex_count + 6 * nodes_per_edge
    first_interior_node = first_face_node + 4 * nodes_per_face

    def edge_node(edge, rank):
        # ``rank`` is the position of the node among the interior nodes of ``edge``
        return vertex_count + nodes_per_edge * edge + rank

    def face_node(face, u, v):
        # (u, v) are lattice coordinates inside the face once its boundary is peeled off
        return first_face_node + nodes_per_face * face + _triangle_node_index(u, v, degree - 3)

    if tx == 0:
        if ty == 0:
            # On the line through vertices 0 and 3
            if tz == 0:
                return 0
            if tz == degree:
                return 3
            return edge_node(3, tz - 1)

        if tz == 0:
            # On the line through vertices 0 and 2; the 2-0 edge runs from vertex 2 to vertex 0
            if ty == degree:
                return 2
            return edge_node(2, nodes_per_edge - ty)

        if tz + ty == degree:
            # 2-3 edge
            return edge_node(5, tz - 1)

        # 2-3-0 face
        return face_node(2, degree - 1 - ty - tz, tz - 1)

    if ty == 0:
        if tz == 0:
            # On the line through vertices 0 and 1 (vertex 0 itself was handled above)
            if tx == degree:
                return 1
            return edge_node(0, tx - 1)

        if tz + tx == degree:
            # 1-3 edge
            return edge_node(4, tz - 1)

        # 3-0-1 face
        return face_node(3, tx - 1, tz - 1)

    if tz == 0:
        if tx + ty == degree:
            # 1-2 edge
            return edge_node(1, ty - 1)

        # 0-1-2 face
        return face_node(0, tx - 1, ty - 1)

    if tx + ty + tz == degree:
        # 1-2-3 face
        return face_node(1, tx - 1, tz - 1)

    # Strictly interior node: peel off one boundary layer and recurse
    return first_interior_node + _tet_node_index(tx - 1, ty - 1, tz - 1, degree - 4)
94
+
95
+
96
class TetrahedronPolynomialShapeFunctions:
    """Nodal polynomial shape functions on a reference tetrahedron.

    Nodes sit on the integer lattice ``(tx, ty, tz)`` with ``tx + ty + tz <= degree``
    and are numbered by ``_tet_node_index`` (vertices, then edges, then faces, then
    interior nodes). Shape-function weights and gradients are only provided for
    degrees 1, 2 and 3; the corresponding factory methods return ``None`` for any
    other degree.

    The ``make_*`` methods return functions built through ``warp.fem.cache``
    (``cache.get_func`` / ``cache.dynamic_func``), suffixed with ``self.name``.
    NOTE(review): presumably these are Warp functions callable from kernels --
    confirm against ``warp.fem.cache``.
    """

    # Node categories returned by ``node_type_and_type_index``
    INVALID = wp.constant(-1)
    VERTEX = wp.constant(0)
    EDGE = wp.constant(1)
    FACE = wp.constant(2)
    INTERIOR = wp.constant(3)

    def __init__(self, degree: int):
        """Precompute node counts and the node-index -> lattice-coordinates table.

        Args:
            degree: Polynomial degree of the shape functions.
        """
        self.ORDER = wp.constant(degree)

        # Number of lattice points in the whole tetrahedron and on one triangular side
        self.NODES_PER_ELEMENT = wp.constant((degree + 1) * (degree + 2) * (degree + 3) // 6)
        self.NODES_PER_SIDE = wp.constant((degree + 1) * (degree + 2) // 2)

        # Inverse of _tet_node_index: row ``i`` holds the lattice coordinates of node ``i``
        tet_coords = np.empty((self.NODES_PER_ELEMENT, 3), dtype=int)

        for tx in range(degree + 1):
            for ty in range(degree + 1 - tx):
                for tz in range(degree + 1 - tx - ty):
                    index = _tet_node_index(tx, ty, tz, degree)
                    tet_coords[index] = [tx, ty, tz]

        CoordTypeVec = wp.mat(dtype=int, shape=(self.NODES_PER_ELEMENT, 3))
        self.NODE_TET_COORDS = wp.constant(CoordTypeVec(tet_coords))

        self.node_type_and_type_index = self._get_node_type_and_type_index()
        self._node_tet_coordinates = self._get_node_tet_coordinates()

    @property
    def name(self) -> str:
        """Identifier of this shape-function family, e.g. ``Tet_P2`` for degree 2."""
        return f"Tet_P{self.ORDER}"

    def _get_node_tet_coordinates(self):
        """Build the function returning the lattice coordinates of a node as a ``wp.vec3i``."""
        NODE_TET_COORDS = self.NODE_TET_COORDS

        def node_tet_coordinates(
            node_index_in_elt: int,
        ):
            return wp.vec3i(
                NODE_TET_COORDS[node_index_in_elt, 0],
                NODE_TET_COORDS[node_index_in_elt, 1],
                NODE_TET_COORDS[node_index_in_elt, 2],
            )

        return cache.get_func(node_tet_coordinates, self.name)

    def _get_node_type_and_type_index(self):
        """Build the function classifying a node index.

        The built function returns ``(node_type, type_index)`` where ``node_type`` is
        one of ``INVALID``, ``VERTEX``, ``EDGE``, ``FACE``, ``INTERIOR`` and
        ``type_index`` is the rank of the node among the nodes of that type.
        Out-of-range indices yield ``(INVALID, INVALID)``.
        """
        ORDER = self.ORDER
        NODES_PER_ELEMENT = self.NODES_PER_ELEMENT

        def node_type_and_index(
            node_index_in_elt: int,
        ):
            if node_index_in_elt < 0 or node_index_in_elt >= NODES_PER_ELEMENT:
                return TetrahedronPolynomialShapeFunctions.INVALID, TetrahedronPolynomialShapeFunctions.INVALID

            if node_index_in_elt < 4:
                return TetrahedronPolynomialShapeFunctions.VERTEX, node_index_in_elt

            # 4 vertices + 6 * (ORDER - 1) edge nodes == 6 * ORDER - 2
            if node_index_in_elt < (6 * ORDER - 2):
                return TetrahedronPolynomialShapeFunctions.EDGE, (node_index_in_elt - 4)

            # adding 4 * (ORDER - 1) * (ORDER - 2) / 2 face nodes gives 2 * ORDER^2 + 2
            if node_index_in_elt < (2 * ORDER * ORDER + 2):
                return TetrahedronPolynomialShapeFunctions.FACE, (node_index_in_elt - (6 * ORDER - 2))

            return TetrahedronPolynomialShapeFunctions.INTERIOR, (node_index_in_elt - (2 * ORDER * ORDER + 2))

        return cache.get_func(node_type_and_index, self.name)

    def make_node_coords_in_element(self):
        """Build the function mapping a node index to its ``Coords`` in the reference element.

        Coordinates are the node's lattice coordinates divided by the degree.
        """
        ORDER = self.ORDER

        def node_coords_in_element(
            node_index_in_elt: int,
        ):
            tet_coords = self._node_tet_coordinates(node_index_in_elt)
            cx = float(tet_coords[0]) / float(ORDER)
            cy = float(tet_coords[1]) / float(ORDER)
            cz = float(tet_coords[2]) / float(ORDER)
            return Coords(cx, cy, cz)

        return cache.get_func(node_coords_in_element, self.name)

    def make_node_quadrature_weight(self):
        """Build the function returning the nodal quadrature weight of an element node.

        Degree 3 uses hard-coded per-node-type weights; every other degree uses the
        uniform weight ``1 / NODES_PER_ELEMENT``.
        """
        if self.ORDER == 3:
            # Order 1, but optimized quadrature weights for monomials of order <= 6
            vertex_weight = 0.007348845656
            edge_weight = 0.020688129855
            face_weight = 0.180586764778
            interior_weight = 0.0
        else:
            vertex_weight = 1.0 / self.NODES_PER_ELEMENT
            edge_weight = 1.0 / self.NODES_PER_ELEMENT
            face_weight = 1.0 / self.NODES_PER_ELEMENT
            interior_weight = 1.0 / self.NODES_PER_ELEMENT

        VERTEX_WEIGHT = wp.constant(vertex_weight)
        EDGE_WEIGHT = wp.constant(edge_weight)
        FACE_WEIGHT = wp.constant(face_weight)
        INTERIOR_WEIGHT = wp.constant(interior_weight)

        @cache.dynamic_func(suffix=self.name)
        def node_quadrature_weight(node_index_in_element: int):
            node_type, type_index = self.node_type_and_type_index(node_index_in_element)

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                return VERTEX_WEIGHT
            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                return EDGE_WEIGHT
            elif node_type == TetrahedronPolynomialShapeFunctions.FACE:
                return FACE_WEIGHT

            return INTERIOR_WEIGHT

        return node_quadrature_weight

    def make_trace_node_quadrature_weight(self):
        """Build the function returning the nodal quadrature weight on an element side.

        The built function still takes a node index within the element and picks the
        weight from that node's type; nodes that are neither vertices nor edge nodes
        get the side-interior weight. Degrees 2 and 3 use hard-coded weights, other
        degrees the uniform weight ``1 / NODES_PER_SIDE``.
        """
        if self.ORDER == 3:
            # P3 intrinsic quadrature
            vertex_weight = 1.0 / 30
            edge_weight = 0.075
            interior_weight = 0.45
        elif self.ORDER == 2:
            # Order 1, but optimized quadrature weights for monomials of order <= 4
            vertex_weight = 0.022335964126
            edge_weight = 0.310997369207
            interior_weight = 0.0
        else:
            vertex_weight = 1.0 / self.NODES_PER_SIDE
            edge_weight = 1.0 / self.NODES_PER_SIDE
            interior_weight = 1.0 / self.NODES_PER_SIDE

        VERTEX_WEIGHT = wp.constant(vertex_weight)
        EDGE_WEIGHT = wp.constant(edge_weight)
        FACE_INTERIOR_WEIGHT = wp.constant(interior_weight)

        @cache.dynamic_func(suffix=self.name)
        def trace_node_quadrature_weight(node_index_in_element: int):
            node_type, type_index = self.node_type_and_type_index(node_index_in_element)

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                return VERTEX_WEIGHT
            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                return EDGE_WEIGHT

            return FACE_INTERIOR_WEIGHT

        return trace_node_quadrature_weight

    def make_element_inner_weight(self):
        """Build the function evaluating a node's shape function at given coordinates.

        The built function takes ``(coords, node_index_in_elt)`` and returns a float.

        Returns:
            The linear, quadratic or cubic implementation for degree 1, 2 or 3, and
            ``None`` for any other degree.
        """
        ORDER = self.ORDER

        def element_inner_weight_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            if node_index_in_elt < 0 or node_index_in_elt >= 4:
                return 0.0

            # Barycentric coordinates; entry i is the weight of vertex i
            tet_coords = wp.vec4(1.0 - coords[0] - coords[1] - coords[2], coords[0], coords[1], coords[2])
            return tet_coords[node_index_in_elt]

        def element_inner_weight_quadratic(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

            tet_coords = wp.vec4(1.0 - coords[0] - coords[1] - coords[2], coords[0], coords[1], coords[2])

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                # Vertex
                return tet_coords[type_index] * (2.0 * tet_coords[type_index] - 1.0)

            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                # Edge; edges 0..2 are 0-1, 1-2, 2-0 and edges 3..5 join vertices 0..2 to vertex 3
                if type_index < 3:
                    c1 = type_index
                    c2 = (type_index + 1) % 3
                else:
                    c1 = type_index - 3
                    c2 = 3
                return 4.0 * tet_coords[c1] * tet_coords[c2]

            return 0.0

        def element_inner_weight_cubic(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

            tet_coords = wp.vec4(1.0 - coords[0] - coords[1] - coords[2], coords[0], coords[1], coords[2])

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                # Vertex
                return (
                    0.5
                    * tet_coords[type_index]
                    * (3.0 * tet_coords[type_index] - 1.0)
                    * (3.0 * tet_coords[type_index] - 2.0)
                )

            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                # Edge; two nodes per edge, c1 is the vertex the node is closest to
                edge = type_index // 2
                edge_node = type_index - 2 * edge

                if edge < 3:
                    c1 = (edge + edge_node) % 3
                    c2 = (edge + 1 - edge_node) % 3
                elif edge_node == 0:
                    c1 = edge - 3
                    c2 = 3
                else:
                    c1 = 3
                    c2 = edge - 3

                return 4.5 * tet_coords[c1] * tet_coords[c2] * (3.0 * tet_coords[c1] - 1.0)

            elif node_type == TetrahedronPolynomialShapeFunctions.FACE:
                # Face node; face f has vertices f, f + 1 and f + 2 (modulo 4)
                c1 = type_index
                c2 = (c1 + 1) % 4
                c3 = (c1 + 2) % 4
                return 27.0 * tet_coords[c1] * tet_coords[c2] * tet_coords[c3]

            return 0.0

        if ORDER == 1:
            return cache.get_func(element_inner_weight_linear, self.name)
        elif ORDER == 2:
            return cache.get_func(element_inner_weight_quadratic, self.name)
        elif ORDER == 3:
            return cache.get_func(element_inner_weight_cubic, self.name)

        return None

    def make_element_inner_weight_gradient(self):
        """Build the function evaluating the gradient of a node's shape function.

        The built function takes ``(coords, node_index_in_elt)`` and returns a
        ``wp.vec3`` holding the derivatives with respect to the three element
        coordinates.

        Returns:
            The linear, quadratic or cubic implementation for degree 1, 2 or 3, and
            ``None`` for any other degree.
        """
        ORDER = self.ORDER

        def element_inner_weight_gradient_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            if node_index_in_elt < 0 or node_index_in_elt >= 4:
                return wp.vec3(0.0)

            # Derivative with respect to each barycentric coordinate
            dw_dc = wp.vec4(0.0)
            dw_dc[node_index_in_elt] = 1.0

            # The first barycentric coordinate is 1 - u0 - u1 - u2, hence the subtraction
            dw_du = wp.vec3(dw_dc[1] - dw_dc[0], dw_dc[2] - dw_dc[0], dw_dc[3] - dw_dc[0])

            return dw_du

        def element_inner_weight_gradient_quadratic(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

            tet_coords = wp.vec4(1.0 - coords[0] - coords[1] - coords[2], coords[0], coords[1], coords[2])
            dw_dc = wp.vec4(0.0)

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                # Vertex
                dw_dc[type_index] = 4.0 * tet_coords[type_index] - 1.0

            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                # Edge
                if type_index < 3:
                    c1 = type_index
                    c2 = (type_index + 1) % 3
                else:
                    c1 = type_index - 3
                    c2 = 3
                dw_dc[c1] = 4.0 * tet_coords[c2]
                dw_dc[c2] = 4.0 * tet_coords[c1]

            dw_du = wp.vec3(dw_dc[1] - dw_dc[0], dw_dc[2] - dw_dc[0], dw_dc[3] - dw_dc[0])
            return dw_du

        def element_inner_weight_gradient_cubic(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

            tet_coords = wp.vec4(1.0 - coords[0] - coords[1] - coords[2], coords[0], coords[1], coords[2])

            dw_dc = wp.vec4(0.0)

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                # Vertex
                dw_dc[type_index] = (
                    0.5 * 27.0 * tet_coords[type_index] * tet_coords[type_index] - 9.0 * tet_coords[type_index] + 1.0
                )

            elif node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                # Edge
                edge = type_index // 2
                edge_node = type_index - 2 * edge

                if edge < 3:
                    c1 = (edge + edge_node) % 3
                    c2 = (edge + 1 - edge_node) % 3
                elif edge_node == 0:
                    c1 = edge - 3
                    c2 = 3
                else:
                    c1 = 3
                    c2 = edge - 3

                dw_dc[c1] = 4.5 * tet_coords[c2] * (6.0 * tet_coords[c1] - 1.0)
                dw_dc[c2] = 4.5 * tet_coords[c1] * (3.0 * tet_coords[c1] - 1.0)

            elif node_type == TetrahedronPolynomialShapeFunctions.FACE:
                # Face node
                c1 = type_index
                c2 = (c1 + 1) % 4
                c3 = (c1 + 2) % 4

                dw_dc[c1] = 27.0 * tet_coords[c2] * tet_coords[c3]
                dw_dc[c2] = 27.0 * tet_coords[c3] * tet_coords[c1]
                dw_dc[c3] = 27.0 * tet_coords[c1] * tet_coords[c2]

            dw_du = wp.vec3(dw_dc[1] - dw_dc[0], dw_dc[2] - dw_dc[0], dw_dc[3] - dw_dc[0])
            return dw_du

        if ORDER == 1:
            return cache.get_func(element_inner_weight_gradient_linear, self.name)
        elif ORDER == 2:
            return cache.get_func(element_inner_weight_gradient_quadratic, self.name)
        elif ORDER == 3:
            return cache.get_func(element_inner_weight_gradient_cubic, self.name)

        return None

    def element_node_tets(self):
        """Return tetrahedra whose corners are node indices of this element.

        Returns:
            An ``(n, 4)`` integer array: one tetrahedron for degree 1, eight for
            degree 2.

        Raises:
            NotImplementedError: For any degree other than 1 or 2.
        """
        if self.ORDER == 1:
            element_tets = [[0, 1, 2, 3]]
        elif self.ORDER == 2:
            element_tets = [
                [0, 4, 6, 7],
                [1, 5, 4, 8],
                [2, 6, 5, 9],
                [3, 7, 8, 9],
                [4, 5, 6, 8],
                [8, 7, 9, 6],
                [6, 5, 9, 8],
                [6, 8, 7, 4],
            ]
        else:
            # Previously only degree 3 raised; other degrees fell through to an
            # unbound local variable instead of a meaningful error.
            raise NotImplementedError(f"element_node_tets is not implemented for degree {self.ORDER}")

        return np.array(element_tets)
451
+
452
+
453
class TetrahedronNonConformingPolynomialShapeFunctions:
    """Non-conforming counterpart of ``TetrahedronPolynomialShapeFunctions``.

    Wraps a conforming shape of the same degree and moves its nodes with the affine
    map ``TET_SCALE * coords + TET_OFFSET``, where the offset is
    ``(1 - TET_SCALE) * (0.25, 0.25, 0.25)``. Shape functions are evaluated by
    applying the inverse map to the query coordinates and delegating to the
    wrapped shape.
    """

    def __init__(self, degree: int):
        """Create the wrapped conforming shape and pick the degree-dependent node scaling.

        Args:
            degree: Polynomial degree of the shape functions.
        """
        conforming = TetrahedronPolynomialShapeFunctions(degree=degree)

        self._tet_shape = conforming
        self.ORDER = conforming.ORDER
        self.NODES_PER_ELEMENT = conforming.NODES_PER_ELEMENT

        self.element_node_tets = conforming.element_node_tets

        if self.ORDER == 1:
            # so v at 0.5854101966249680 (order 2)
            scale = 0.4472135955
        elif self.ORDER == 2:
            # optimized for low intrinsic quadrature error of deg 4
            scale = 0.6123779296874996
        elif self.ORDER == 3:
            # optimized for low intrinsic quadrature error of deg 6
            scale = 0.7153564453124999
        else:
            scale = 1.0

        self._TET_SCALE = wp.constant(scale)
        self._TET_OFFSET = wp.constant((1.0 - self._TET_SCALE) * wp.vec3(0.25, 0.25, 0.25))

    @property
    def name(self) -> str:
        """Identifier of this shape-function family, e.g. ``Tet_P2d`` for degree 2."""
        return f"Tet_P{self.ORDER}d"

    def make_node_coords_in_element(self):
        """Build the function mapping a node index to its scaled and offset ``Coords``."""
        scale = self._TET_SCALE
        offset = self._TET_OFFSET
        conforming_node_coords = self._tet_shape.make_node_coords_in_element()

        @cache.dynamic_func(suffix=self.name)
        def node_coords_in_element(
            node_index_in_elt: int,
        ):
            return scale * conforming_node_coords(node_index_in_elt) + offset

        return node_coords_in_element

    def make_node_quadrature_weight(self):
        """Build the function returning the nodal quadrature weight of an element node.

        Degrees 2 and 3 use hard-coded weights per node type; other degrees use the
        uniform weight ``1 / NODES_PER_ELEMENT``. Nodes that are neither vertices nor
        edge nodes all share the face/interior weight.
        """
        # Intrinsic quadrature -- precomputed integral of node shape functions
        # over element. Order equal to self.ORDER

        if self.ORDER == 2:
            vertex_weight, edge_weight, face_interior_weight = 0.07499641, 0.11666908, 0.0
        elif self.ORDER == 3:
            vertex_weight, edge_weight, face_interior_weight = 0.03345134, 0.04521887, 0.08089206
        else:
            vertex_weight = 1.0 / self.NODES_PER_ELEMENT
            edge_weight = 1.0 / self.NODES_PER_ELEMENT
            face_interior_weight = 1.0 / self.NODES_PER_ELEMENT

        VERTEX_WEIGHT = wp.constant(vertex_weight)
        EDGE_WEIGHT = wp.constant(edge_weight)
        FACE_INTERIOR_WEIGHT = wp.constant(face_interior_weight)

        # Node classification is delegated to the wrapped conforming shape
        node_type_and_type_index = self._tet_shape.node_type_and_type_index

        @cache.dynamic_func(suffix=self.name)
        def node_quadrature_weight(node_index_in_element: int):
            node_type, type_index = node_type_and_type_index(node_index_in_element)

            if node_type == TetrahedronPolynomialShapeFunctions.VERTEX:
                return VERTEX_WEIGHT

            if node_type == TetrahedronPolynomialShapeFunctions.EDGE:
                return EDGE_WEIGHT

            return FACE_INTERIOR_WEIGHT

        return node_quadrature_weight

    def make_trace_node_quadrature_weight(self):
        """Build the side quadrature weight function, which is identically zero."""
        # Non-conforming, zero measure on sides

        @wp.func
        def zero(node_index_in_elt: int):
            return 0.0

        return zero

    def make_element_inner_weight(self):
        """Build the function evaluating a node's shape function at given coordinates.

        The query coordinates are mapped back through the inverse of the node
        scaling before the wrapped conforming shape function is evaluated.
        """
        scale = self._TET_SCALE
        offset = self._TET_OFFSET
        conforming_inner_weight = self._tet_shape.make_element_inner_weight()

        @cache.dynamic_func(suffix=self.name)
        def element_inner_weight(
            coords: Coords,
            node_index_in_elt: int,
        ):
            return conforming_inner_weight((coords - offset) / scale, node_index_in_elt)

        return element_inner_weight

    def make_element_inner_weight_gradient(self):
        """Build the function evaluating the gradient of a node's shape function.

        Same inverse mapping as ``make_element_inner_weight``; the wrapped gradient
        is divided by the scale to account for the change of coordinates.
        """
        scale = self._TET_SCALE
        offset = self._TET_OFFSET
        conforming_inner_weight_gradient = self._tet_shape.make_element_inner_weight_gradient()

        @cache.dynamic_func(suffix=self.name)
        def element_inner_weight_gradient(
            coords: Coords,
            node_index_in_elt: int,
        ):
            return conforming_inner_weight_gradient((coords - offset) / scale, node_index_in_elt) / scale

        return element_inner_weight_gradient