warp-lang 0.10.1__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (300)
  1. warp/__init__.py +10 -4
  2. warp/__init__.pyi +1 -0
  3. warp/bin/warp-clang.dll +0 -0
  4. warp/bin/warp.dll +0 -0
  5. warp/build.py +5 -3
  6. warp/build_dll.py +29 -9
  7. warp/builtins.py +868 -507
  8. warp/codegen.py +1074 -638
  9. warp/config.py +3 -3
  10. warp/constants.py +6 -0
  11. warp/context.py +715 -222
  12. warp/fabric.py +326 -0
  13. warp/fem/__init__.py +27 -0
  14. warp/fem/cache.py +389 -0
  15. warp/fem/dirichlet.py +181 -0
  16. warp/fem/domain.py +263 -0
  17. warp/fem/field/__init__.py +101 -0
  18. warp/fem/field/field.py +149 -0
  19. warp/fem/field/nodal_field.py +299 -0
  20. warp/fem/field/restriction.py +21 -0
  21. warp/fem/field/test.py +181 -0
  22. warp/fem/field/trial.py +183 -0
  23. warp/fem/geometry/__init__.py +19 -0
  24. warp/fem/geometry/closest_point.py +70 -0
  25. warp/fem/geometry/deformed_geometry.py +271 -0
  26. warp/fem/geometry/element.py +744 -0
  27. warp/fem/geometry/geometry.py +186 -0
  28. warp/fem/geometry/grid_2d.py +373 -0
  29. warp/fem/geometry/grid_3d.py +435 -0
  30. warp/fem/geometry/hexmesh.py +953 -0
  31. warp/fem/geometry/partition.py +376 -0
  32. warp/fem/geometry/quadmesh_2d.py +532 -0
  33. warp/fem/geometry/tetmesh.py +840 -0
  34. warp/fem/geometry/trimesh_2d.py +577 -0
  35. warp/fem/integrate.py +1616 -0
  36. warp/fem/operator.py +191 -0
  37. warp/fem/polynomial.py +213 -0
  38. warp/fem/quadrature/__init__.py +2 -0
  39. warp/fem/quadrature/pic_quadrature.py +245 -0
  40. warp/fem/quadrature/quadrature.py +294 -0
  41. warp/fem/space/__init__.py +292 -0
  42. warp/fem/space/basis_space.py +489 -0
  43. warp/fem/space/collocated_function_space.py +105 -0
  44. warp/fem/space/dof_mapper.py +236 -0
  45. warp/fem/space/function_space.py +145 -0
  46. warp/fem/space/grid_2d_function_space.py +267 -0
  47. warp/fem/space/grid_3d_function_space.py +306 -0
  48. warp/fem/space/hexmesh_function_space.py +352 -0
  49. warp/fem/space/partition.py +350 -0
  50. warp/fem/space/quadmesh_2d_function_space.py +369 -0
  51. warp/fem/space/restriction.py +160 -0
  52. warp/fem/space/shape/__init__.py +15 -0
  53. warp/fem/space/shape/cube_shape_function.py +738 -0
  54. warp/fem/space/shape/shape_function.py +103 -0
  55. warp/fem/space/shape/square_shape_function.py +611 -0
  56. warp/fem/space/shape/tet_shape_function.py +567 -0
  57. warp/fem/space/shape/triangle_shape_function.py +429 -0
  58. warp/fem/space/tetmesh_function_space.py +292 -0
  59. warp/fem/space/topology.py +295 -0
  60. warp/fem/space/trimesh_2d_function_space.py +221 -0
  61. warp/fem/types.py +77 -0
  62. warp/fem/utils.py +495 -0
  63. warp/native/array.h +147 -44
  64. warp/native/builtin.h +122 -149
  65. warp/native/bvh.cpp +73 -325
  66. warp/native/bvh.cu +406 -23
  67. warp/native/bvh.h +34 -43
  68. warp/native/clang/clang.cpp +13 -8
  69. warp/native/crt.h +2 -0
  70. warp/native/cuda_crt.h +5 -0
  71. warp/native/cuda_util.cpp +15 -3
  72. warp/native/cuda_util.h +3 -1
  73. warp/native/cutlass/tools/library/scripts/conv2d_operation.py +463 -0
  74. warp/native/cutlass/tools/library/scripts/conv3d_operation.py +321 -0
  75. warp/native/cutlass/tools/library/scripts/gemm_operation.py +988 -0
  76. warp/native/cutlass/tools/library/scripts/generator.py +4625 -0
  77. warp/native/cutlass/tools/library/scripts/library.py +799 -0
  78. warp/native/cutlass/tools/library/scripts/manifest.py +402 -0
  79. warp/native/cutlass/tools/library/scripts/pycutlass/docs/source/conf.py +96 -0
  80. warp/native/cutlass/tools/library/scripts/pycutlass/profile/conv/conv2d_f16_sm80.py +106 -0
  81. warp/native/cutlass/tools/library/scripts/pycutlass/profile/gemm/gemm_f32_sm80.py +91 -0
  82. warp/native/cutlass/tools/library/scripts/pycutlass/setup.py +80 -0
  83. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/__init__.py +48 -0
  84. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/arguments.py +118 -0
  85. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/c_types.py +241 -0
  86. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/compiler.py +432 -0
  87. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/conv2d_operation.py +631 -0
  88. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/epilogue.py +1026 -0
  89. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/frontend.py +104 -0
  90. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/gemm_operation.py +1276 -0
  91. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/library.py +744 -0
  92. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/memory_manager.py +74 -0
  93. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/operation.py +110 -0
  94. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/parser.py +619 -0
  95. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/reduction_operation.py +398 -0
  96. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/tensor_ref.py +70 -0
  97. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/__init__.py +4 -0
  98. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/conv2d_testbed.py +646 -0
  99. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_grouped_testbed.py +235 -0
  100. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_testbed.py +557 -0
  101. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/profiler.py +70 -0
  102. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/type_hint.py +39 -0
  103. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/__init__.py +1 -0
  104. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/device.py +76 -0
  105. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/reference_model.py +255 -0
  106. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/__init__.py +0 -0
  107. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +201 -0
  108. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +177 -0
  109. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +98 -0
  110. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +95 -0
  111. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_few_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +163 -0
  112. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_fixed_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +187 -0
  113. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +309 -0
  114. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +54 -0
  115. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  116. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  117. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +253 -0
  118. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +97 -0
  119. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +242 -0
  120. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  121. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  122. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/run_all_tests.py +10 -0
  123. warp/native/cutlass/tools/library/scripts/pycutlass/test/frontend/test_frontend.py +146 -0
  124. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/__init__.py +0 -0
  125. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_bf16_sm80.py +96 -0
  126. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f16_sm80.py +447 -0
  127. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f32_sm80.py +146 -0
  128. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f64_sm80.py +102 -0
  129. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_grouped_sm80.py +203 -0
  130. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_s8_sm80.py +229 -0
  131. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/run_all_tests.py +9 -0
  132. warp/native/cutlass/tools/library/scripts/pycutlass/test/unit/test_sm80.py +453 -0
  133. warp/native/cutlass/tools/library/scripts/rank_2k_operation.py +398 -0
  134. warp/native/cutlass/tools/library/scripts/rank_k_operation.py +387 -0
  135. warp/native/cutlass/tools/library/scripts/rt.py +796 -0
  136. warp/native/cutlass/tools/library/scripts/symm_operation.py +400 -0
  137. warp/native/cutlass/tools/library/scripts/trmm_operation.py +407 -0
  138. warp/native/cutlass_gemm.cu +5 -3
  139. warp/native/exports.h +1240 -952
  140. warp/native/fabric.h +228 -0
  141. warp/native/hashgrid.cpp +4 -4
  142. warp/native/hashgrid.h +22 -2
  143. warp/native/intersect.h +22 -7
  144. warp/native/intersect_adj.h +8 -8
  145. warp/native/intersect_tri.h +1 -1
  146. warp/native/marching.cu +157 -161
  147. warp/native/mat.h +80 -19
  148. warp/native/matnn.h +2 -2
  149. warp/native/mesh.cpp +33 -108
  150. warp/native/mesh.cu +114 -23
  151. warp/native/mesh.h +446 -46
  152. warp/native/noise.h +272 -329
  153. warp/native/quat.h +51 -8
  154. warp/native/rand.h +45 -35
  155. warp/native/range.h +6 -2
  156. warp/native/reduce.cpp +1 -1
  157. warp/native/reduce.cu +10 -12
  158. warp/native/runlength_encode.cu +6 -10
  159. warp/native/scan.cu +8 -11
  160. warp/native/sparse.cpp +4 -4
  161. warp/native/sparse.cu +164 -154
  162. warp/native/spatial.h +2 -2
  163. warp/native/temp_buffer.h +14 -30
  164. warp/native/vec.h +107 -23
  165. warp/native/volume.h +120 -0
  166. warp/native/warp.cpp +560 -30
  167. warp/native/warp.cu +431 -44
  168. warp/native/warp.h +13 -4
  169. warp/optim/__init__.py +1 -0
  170. warp/optim/linear.py +922 -0
  171. warp/optim/sgd.py +92 -0
  172. warp/render/render_opengl.py +335 -119
  173. warp/render/render_usd.py +11 -11
  174. warp/sim/__init__.py +2 -2
  175. warp/sim/articulation.py +385 -185
  176. warp/sim/collide.py +8 -0
  177. warp/sim/import_mjcf.py +297 -106
  178. warp/sim/import_urdf.py +389 -210
  179. warp/sim/import_usd.py +198 -97
  180. warp/sim/inertia.py +17 -18
  181. warp/sim/integrator_euler.py +14 -8
  182. warp/sim/integrator_xpbd.py +158 -16
  183. warp/sim/model.py +795 -291
  184. warp/sim/render.py +3 -3
  185. warp/sim/utils.py +3 -0
  186. warp/sparse.py +640 -150
  187. warp/stubs.py +606 -267
  188. warp/tape.py +61 -10
  189. warp/tests/__main__.py +3 -6
  190. warp/tests/assets/curlnoise_golden.npy +0 -0
  191. warp/tests/assets/pnoise_golden.npy +0 -0
  192. warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
  193. warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
  194. warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
  195. warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
  196. warp/tests/aux_test_unresolved_func.py +14 -0
  197. warp/tests/aux_test_unresolved_symbol.py +14 -0
  198. warp/tests/disabled_kinematics.py +239 -0
  199. warp/tests/run_coverage_serial.py +31 -0
  200. warp/tests/test_adam.py +103 -106
  201. warp/tests/test_arithmetic.py +128 -74
  202. warp/tests/test_array.py +212 -97
  203. warp/tests/test_array_reduce.py +57 -23
  204. warp/tests/test_atomic.py +64 -28
  205. warp/tests/test_bool.py +99 -0
  206. warp/tests/test_builtins_resolution.py +1292 -0
  207. warp/tests/test_bvh.py +42 -18
  208. warp/tests/test_closest_point_edge_edge.py +54 -57
  209. warp/tests/test_codegen.py +208 -130
  210. warp/tests/test_compile_consts.py +28 -20
  211. warp/tests/test_conditional.py +108 -24
  212. warp/tests/test_copy.py +10 -12
  213. warp/tests/test_ctypes.py +112 -88
  214. warp/tests/test_dense.py +21 -14
  215. warp/tests/test_devices.py +98 -0
  216. warp/tests/test_dlpack.py +75 -75
  217. warp/tests/test_examples.py +277 -0
  218. warp/tests/test_fabricarray.py +955 -0
  219. warp/tests/test_fast_math.py +15 -11
  220. warp/tests/test_fem.py +1271 -0
  221. warp/tests/test_fp16.py +53 -19
  222. warp/tests/test_func.py +187 -86
  223. warp/tests/test_generics.py +194 -49
  224. warp/tests/test_grad.py +178 -109
  225. warp/tests/test_grad_customs.py +176 -0
  226. warp/tests/test_hash_grid.py +52 -37
  227. warp/tests/test_import.py +10 -23
  228. warp/tests/test_indexedarray.py +32 -31
  229. warp/tests/test_intersect.py +18 -9
  230. warp/tests/test_large.py +141 -0
  231. warp/tests/test_launch.py +14 -41
  232. warp/tests/test_lerp.py +64 -65
  233. warp/tests/test_linear_solvers.py +154 -0
  234. warp/tests/test_lvalue.py +493 -0
  235. warp/tests/test_marching_cubes.py +12 -13
  236. warp/tests/test_mat.py +517 -2898
  237. warp/tests/test_mat_lite.py +115 -0
  238. warp/tests/test_mat_scalar_ops.py +2889 -0
  239. warp/tests/test_math.py +103 -9
  240. warp/tests/test_matmul.py +305 -69
  241. warp/tests/test_matmul_lite.py +410 -0
  242. warp/tests/test_mesh.py +71 -14
  243. warp/tests/test_mesh_query_aabb.py +41 -25
  244. warp/tests/test_mesh_query_point.py +140 -22
  245. warp/tests/test_mesh_query_ray.py +39 -22
  246. warp/tests/test_mlp.py +30 -22
  247. warp/tests/test_model.py +92 -89
  248. warp/tests/test_modules_lite.py +39 -0
  249. warp/tests/test_multigpu.py +88 -114
  250. warp/tests/test_noise.py +12 -11
  251. warp/tests/test_operators.py +16 -20
  252. warp/tests/test_options.py +11 -11
  253. warp/tests/test_pinned.py +17 -18
  254. warp/tests/test_print.py +32 -11
  255. warp/tests/test_quat.py +275 -129
  256. warp/tests/test_rand.py +18 -16
  257. warp/tests/test_reload.py +38 -34
  258. warp/tests/test_rounding.py +50 -43
  259. warp/tests/test_runlength_encode.py +168 -20
  260. warp/tests/test_smoothstep.py +9 -11
  261. warp/tests/test_snippet.py +143 -0
  262. warp/tests/test_sparse.py +261 -63
  263. warp/tests/test_spatial.py +276 -243
  264. warp/tests/test_streams.py +110 -85
  265. warp/tests/test_struct.py +268 -63
  266. warp/tests/test_tape.py +39 -21
  267. warp/tests/test_torch.py +118 -89
  268. warp/tests/test_transient_module.py +12 -13
  269. warp/tests/test_types.py +614 -0
  270. warp/tests/test_utils.py +494 -0
  271. warp/tests/test_vec.py +354 -2050
  272. warp/tests/test_vec_lite.py +73 -0
  273. warp/tests/test_vec_scalar_ops.py +2099 -0
  274. warp/tests/test_volume.py +457 -293
  275. warp/tests/test_volume_write.py +124 -134
  276. warp/tests/unittest_serial.py +35 -0
  277. warp/tests/unittest_suites.py +341 -0
  278. warp/tests/unittest_utils.py +568 -0
  279. warp/tests/unused_test_misc.py +71 -0
  280. warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
  281. warp/thirdparty/appdirs.py +36 -45
  282. warp/thirdparty/unittest_parallel.py +549 -0
  283. warp/torch.py +9 -6
  284. warp/types.py +1089 -366
  285. warp/utils.py +93 -387
  286. warp_lang-0.11.0.dist-info/METADATA +238 -0
  287. warp_lang-0.11.0.dist-info/RECORD +332 -0
  288. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/WHEEL +1 -1
  289. warp/tests/test_all.py +0 -219
  290. warp/tests/test_array_scan.py +0 -60
  291. warp/tests/test_base.py +0 -208
  292. warp/tests/test_unresolved_func.py +0 -7
  293. warp/tests/test_unresolved_symbol.py +0 -7
  294. warp_lang-0.10.1.dist-info/METADATA +0 -21
  295. warp_lang-0.10.1.dist-info/RECORD +0 -188
  296. /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
  297. /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
  298. /warp/tests/{test_square.py → aux_test_square.py} +0 -0
  299. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/LICENSE.md +0 -0
  300. {warp_lang-0.10.1.dist-info → warp_lang-0.11.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,611 @@
1
+ import math
2
+
3
+ import warp as wp
4
+ import numpy as np
5
+
6
+ from warp.fem.polynomial import Polynomial, quadrature_1d, lagrange_scales, is_closed
7
+ from warp.fem.types import Coords
8
+ from warp.fem import cache
9
+
10
+ from .triangle_shape_function import Triangle2DPolynomialShapeFunctions
11
+
12
+
13
class SquareBipolynomialShapeFunctions:
    """Tensor-product Lagrange shape functions of a given degree on a square element.

    An element carries ``(degree + 1) ** 2`` nodes. A flat node index ``n`` is split
    into two 1D indices, ``n // (degree + 1)`` for the first coordinate and the
    remainder for the second. The ``make_*`` methods return functions built through
    ``warp.fem.cache`` and specialized for this degree and polynomial family.
    """

    def __init__(self, degree: int, family: Polynomial):
        """Precompute the constants captured by the generated functions.

        Args:
            degree: polynomial degree along each axis
            family: polynomial family forwarded to ``quadrature_1d`` to obtain the 1D nodes
        """
        self.family = family

        points_per_side = degree + 1

        self.ORDER = wp.constant(degree)
        self.NODES_PER_ELEMENT = wp.constant(points_per_side * points_per_side)
        self.NODES_PER_SIDE = wp.constant(points_per_side)

        # 1D node positions and weights, and the scale factors applied to the node polynomial products
        coords_1d, weights_1d = quadrature_1d(point_count=points_per_side, family=family)
        scales_1d = lagrange_scales(coords_1d)

        NodeVec = wp.types.vector(length=points_per_side, dtype=wp.float32)
        self.LOBATTO_COORDS = wp.constant(NodeVec(coords_1d))
        self.LOBATTO_WEIGHT = wp.constant(NodeVec(weights_1d))
        self.LAGRANGE_SCALE = wp.constant(NodeVec(scales_1d))
        self.ORDER_PLUS_ONE = wp.constant(self.ORDER + 1)

    @property
    def name(self) -> str:
        """Identifier built from the degree and family; used as suffix for the generated functions."""
        return f"Square_Q{self.ORDER}_{self.family}"

    def make_node_coords_in_element(self):
        """Return a function mapping a node index in the element to the node's ``Coords``."""
        LOBATTO_COORDS = self.LOBATTO_COORDS
        ORDER = self.ORDER

        @cache.dynamic_func(suffix=self.name)
        def node_coords_in_element(
            node_index_in_elt: int,
        ):
            # Split the flat index into the two 1D node indices
            node_i = node_index_in_elt // (ORDER + 1)
            node_j = node_index_in_elt - (ORDER + 1) * node_i
            return Coords(LOBATTO_COORDS[node_i], LOBATTO_COORDS[node_j], 0.0)

        return node_coords_in_element

    def make_node_quadrature_weight(self):
        """Return a function giving the quadrature weight associated with a node of the element."""
        LOBATTO_WEIGHT = self.LOBATTO_WEIGHT
        ORDER = self.ORDER

        def node_quadrature_weight(
            node_index_in_elt: int,
        ):
            # Product of the 1D weights along each axis
            node_i = node_index_in_elt // (ORDER + 1)
            node_j = node_index_in_elt - (ORDER + 1) * node_i
            return LOBATTO_WEIGHT[node_i] * LOBATTO_WEIGHT[node_j]

        def node_quadrature_weight_linear(
            node_index_in_elt: int,
        ):
            # Degree 1: the four nodes share the same constant weight
            return 0.25

        selected = node_quadrature_weight_linear if ORDER == 1 else node_quadrature_weight
        return cache.get_func(selected, self.name)

    @wp.func
    def _vertex_coords_f(vidx_in_cell: int):
        # Vertex index -> (x, y) with both components in {0, 1}; x is the high bit
        x = vidx_in_cell // 2
        y = vidx_in_cell - 2 * x
        return wp.vec2(float(x), float(y))

    def make_trace_node_quadrature_weight(self):
        """Return a function giving the quadrature weight of a node on the element boundary.

        Open polynomial families get a function that always returns zero.
        """
        LOBATTO_WEIGHT = self.LOBATTO_WEIGHT
        ORDER = self.ORDER

        def trace_node_quadrature_weight(
            node_index_in_elt: int,
        ):
            # A boundary node is either strictly inside a side or at a vertex:
            # at most one of its two 1D indices is interior.
            # Use the interior index when there is one; at a vertex either index gives an end weight.
            node_i = node_index_in_elt // (ORDER + 1)
            if node_i > 0 and node_i < ORDER:
                return LOBATTO_WEIGHT[node_i]

            node_j = node_index_in_elt - (ORDER + 1) * node_i
            return LOBATTO_WEIGHT[node_j]

        def trace_node_quadrature_weight_linear(
            node_index_in_elt: int,
        ):
            return 0.5

        def trace_node_quadrature_weight_open(
            node_index_in_elt: int,
        ):
            return 0.0

        # The closedness check takes precedence over the degree-1 shortcut
        if not is_closed(self.family):
            selected = trace_node_quadrature_weight_open
        elif ORDER == 1:
            selected = trace_node_quadrature_weight_linear
        else:
            selected = trace_node_quadrature_weight

        return cache.get_func(selected, self.name)

    def make_element_inner_weight(self):
        """Return a function evaluating the shape function of a node at given element coordinates."""
        LAGRANGE_SCALE = self.LAGRANGE_SCALE
        LOBATTO_COORDS = self.LOBATTO_COORDS
        ORDER_PLUS_ONE = self.ORDER_PLUS_ONE

        def element_inner_weight(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_i = node_index_in_elt // ORDER_PLUS_ONE
            node_j = node_index_in_elt - ORDER_PLUS_ONE * node_i

            # Accumulate the product of (coordinate - other node position) along both axes
            w = float(1.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    w *= coords[0] - LOBATTO_COORDS[k]
                if k != node_j:
                    w *= coords[1] - LOBATTO_COORDS[k]

            w *= LAGRANGE_SCALE[node_i] * LAGRANGE_SCALE[node_j]

            return w

        def element_inner_weight_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            # Bilinear closed form: each factor is c or (1 - c) depending on the vertex position
            v = SquareBipolynomialShapeFunctions._vertex_coords_f(node_index_in_elt)

            wx = (1.0 - coords[0]) * (1.0 - v[0]) + v[0] * coords[0]
            wy = (1.0 - coords[1]) * (1.0 - v[1]) + v[1] * coords[1]
            return wx * wy

        use_linear = self.ORDER == 1 and is_closed(self.family)
        selected = element_inner_weight_linear if use_linear else element_inner_weight
        return cache.get_func(selected, self.name)

    def make_element_inner_weight_gradient(self):
        """Return a function evaluating the gradient of a node's shape function w.r.t. element coordinates."""
        LAGRANGE_SCALE = self.LAGRANGE_SCALE
        LOBATTO_COORDS = self.LOBATTO_COORDS
        ORDER_PLUS_ONE = self.ORDER_PLUS_ONE

        def element_inner_weight_gradient(
            coords: Coords,
            node_index_in_elt: int,
        ):
            node_i = node_index_in_elt // ORDER_PLUS_ONE
            node_j = node_index_in_elt - ORDER_PLUS_ONE * node_i

            # prefix_x starts as the product along the second axis (constant w.r.t. x),
            # prefix_y as the product along the first axis (constant w.r.t. y)
            prefix_x = float(1.0)
            prefix_y = float(1.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    prefix_y *= coords[0] - LOBATTO_COORDS[k]
                if k != node_j:
                    prefix_x *= coords[1] - LOBATTO_COORDS[k]

            grad_x = float(0.0)
            grad_y = float(0.0)

            # Product rule applied one factor at a time:
            # d(p * delta) = dp * delta + p, then the running product p absorbs delta
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    delta_x = coords[0] - LOBATTO_COORDS[k]
                    grad_x = grad_x * delta_x + prefix_x
                    prefix_x *= delta_x
                if k != node_j:
                    delta_y = coords[1] - LOBATTO_COORDS[k]
                    grad_y = grad_y * delta_y + prefix_y
                    prefix_y *= delta_y

            grad = LAGRANGE_SCALE[node_i] * LAGRANGE_SCALE[node_j] * wp.vec2(grad_x, grad_y)

            return grad

        def element_inner_weight_gradient_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            v = SquareBipolynomialShapeFunctions._vertex_coords_f(node_index_in_elt)

            wx = (1.0 - coords[0]) * (1.0 - v[0]) + v[0] * coords[0]
            wy = (1.0 - coords[1]) * (1.0 - v[1]) + v[1] * coords[1]

            # Slope of each linear factor: +1 when the vertex component is 1, -1 when it is 0
            dx = 2.0 * v[0] - 1.0
            dy = 2.0 * v[1] - 1.0

            return wp.vec2(dx * wy, dy * wx)

        use_linear = self.ORDER == 1 and is_closed(self.family)
        selected = element_inner_weight_gradient_linear if use_linear else element_inner_weight_gradient
        return cache.get_func(selected, self.name)

    def element_node_triangulation(self):
        """Return the triangulation of the element nodes, as produced by ``grid_to_tris``."""
        from warp.fem.utils import grid_to_tris

        cells_per_side = self.ORDER
        return grid_to_tris(cells_per_side, cells_per_side)
208
+
209
+
210
+ class SquareSerendipityShapeFunctions:
211
+ """
212
+ Serendipity element ~ tensor product space without interior nodes
213
+ Side shape functions are usual Lagrange shape functions times a linear function in the normal direction
214
+ Corner shape functions are bilinear shape functions times a function of (x^{d-1} + y^{d-1})
215
+ """
216
+
217
+ # Node categories
218
+ VERTEX = wp.constant(0)
219
+ EDGE_X = wp.constant(1)
220
+ EDGE_Y = wp.constant(2)
221
+
222
+ def __init__(self, degree: int, family: Polynomial):
223
+ if not is_closed(family):
224
+ raise ValueError("A closed polynomial family is required to define serendipity elements")
225
+
226
+ if degree not in [2, 3]:
227
+ raise NotImplementedError("Serendipity element only implemented for order 2 or 3")
228
+
229
+ self.family = family
230
+
231
+ self.ORDER = wp.constant(degree)
232
+ self.NODES_PER_ELEMENT = wp.constant(4 * degree)
233
+ self.NODES_PER_SIDE = wp.constant(degree + 1)
234
+
235
+ lobatto_coords, lobatto_weight = quadrature_1d(point_count=degree + 1, family=family)
236
+ lagrange_scale = lagrange_scales(lobatto_coords)
237
+
238
+ NodeVec = wp.types.vector(length=degree + 1, dtype=wp.float32)
239
+ self.LOBATTO_COORDS = wp.constant(NodeVec(lobatto_coords))
240
+ self.LOBATTO_WEIGHT = wp.constant(NodeVec(lobatto_weight))
241
+ self.LAGRANGE_SCALE = wp.constant(NodeVec(lagrange_scale))
242
+ self.ORDER_PLUS_ONE = wp.constant(self.ORDER + 1)
243
+
244
+ self.node_type_and_type_index = self._get_node_type_and_type_index()
245
+ self._node_lobatto_indices = self._get_node_lobatto_indices()
246
+
247
+ @property
248
+ def name(self) -> str:
249
+ return f"Square_S{self.ORDER}_{self.family}"
250
+
251
+ def _get_node_type_and_type_index(self):
252
+ @cache.dynamic_func(suffix=self.name)
253
+ def node_type_and_index(
254
+ node_index_in_elt: int,
255
+ ):
256
+ if node_index_in_elt < 4:
257
+ return SquareSerendipityShapeFunctions.VERTEX, node_index_in_elt
258
+
259
+ type_index = (node_index_in_elt - 4) // 2
260
+ side = node_index_in_elt - 4 - 2 * type_index
261
+ return SquareSerendipityShapeFunctions.EDGE_X + side, type_index
262
+
263
+ return node_type_and_index
264
+
265
+ @wp.func
266
+ def side_offset_and_index(type_index: int):
267
+ index_in_side = type_index // 2
268
+ side_offset = type_index - 2 * index_in_side
269
+
270
+ return side_offset, index_in_side
271
+
272
+ def _get_node_lobatto_indices(self):
273
+ ORDER = self.ORDER
274
+
275
+ @cache.dynamic_func(suffix=self.name)
276
+ def node_lobatto_indices(node_type: int, type_index: int):
277
+ if node_type == SquareSerendipityShapeFunctions.VERTEX:
278
+ node_i = type_index // 2
279
+ node_j = type_index - 2 * node_i
280
+ return node_i * ORDER, node_j * ORDER
281
+
282
+ side_offset, index_in_side = SquareSerendipityShapeFunctions.side_offset_and_index(type_index)
283
+
284
+ if node_type == SquareSerendipityShapeFunctions.EDGE_X:
285
+ node_i = 1 + index_in_side
286
+ node_j = side_offset * ORDER
287
+ else:
288
+ node_j = 1 + index_in_side
289
+ node_i = side_offset * ORDER
290
+
291
+ return node_i, node_j
292
+
293
+ return node_lobatto_indices
294
+
295
+ def make_node_coords_in_element(self):
296
+ LOBATTO_COORDS = self.LOBATTO_COORDS
297
+
298
+ @cache.dynamic_func(suffix=self.name)
299
+ def node_coords_in_element(
300
+ node_index_in_elt: int,
301
+ ):
302
+ node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
303
+ node_i, node_j = self._node_lobatto_indices(node_type, type_index)
304
+ return Coords(LOBATTO_COORDS[node_i], LOBATTO_COORDS[node_j], 0.0)
305
+
306
+ return node_coords_in_element
307
+
308
+ def make_node_quadrature_weight(self):
309
+ ORDER = self.ORDER
310
+
311
+ @cache.dynamic_func(suffix=self.name)
312
+ def node_quadrature_weight(
313
+ node_index_in_elt: int,
314
+ ):
315
+ node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
316
+ if node_type == SquareSerendipityShapeFunctions.VERTEX:
317
+ return 0.25 / float(ORDER * ORDER)
318
+
319
+ return (0.25 - 0.25 / float(ORDER * ORDER)) / float(ORDER - 1)
320
+
321
+ return node_quadrature_weight
322
+
323
+ def make_trace_node_quadrature_weight(self):
324
+ LOBATTO_WEIGHT = self.LOBATTO_WEIGHT
325
+
326
+ @cache.dynamic_func(suffix=self.name)
327
+ def trace_node_quadrature_weight(
328
+ node_index_in_elt: int,
329
+ ):
330
+ node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
331
+ if node_type == SquareSerendipityShapeFunctions.VERTEX:
332
+ return LOBATTO_WEIGHT[0]
333
+
334
+ side_offset, index_in_side = SquareSerendipityShapeFunctions.side_offset_and_index(type_index)
335
+ return LOBATTO_WEIGHT[1 + index_in_side]
336
+
337
+ return trace_node_quadrature_weight
338
+
339
+ def make_element_inner_weight(self):
340
+ ORDER = self.ORDER
341
+ ORDER_PLUS_ONE = self.ORDER_PLUS_ONE
342
+
343
+ LOBATTO_COORDS = self.LOBATTO_COORDS
344
+ LAGRANGE_SCALE = self.LAGRANGE_SCALE
345
+
346
+ DEGREE_3_CIRCLE_RAD = wp.constant(0.5**2 + (0.5 - LOBATTO_COORDS[1]) ** 2)
347
+ DEGREE_3_CIRCLE_SCALE = 1.0 / (0.5 - DEGREE_3_CIRCLE_RAD)
348
+
349
+ @cache.dynamic_func(suffix=self.name)
350
+ def element_inner_weight(
351
+ coords: Coords,
352
+ node_index_in_elt: int,
353
+ ):
354
+ node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
355
+
356
+ node_i, node_j = self._node_lobatto_indices(node_type, type_index)
357
+
358
+ if node_type == SquareSerendipityShapeFunctions.VERTEX:
359
+ cx = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
360
+ cy = wp.select(node_j == 0, coords[1], 1.0 - coords[1])
361
+
362
+ w = cx * cy
363
+
364
+ if ORDER == 2:
365
+ w *= cx + cy - 2.0 + LOBATTO_COORDS[1]
366
+ return w * LAGRANGE_SCALE[0]
367
+ if ORDER == 3:
368
+ w *= (cx - 0.5) * (cx - 0.5) + (cy - 0.5) * (cy - 0.5) - DEGREE_3_CIRCLE_RAD
369
+ return w * DEGREE_3_CIRCLE_SCALE
370
+
371
+ w = float(1.0)
372
+ if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
373
+ w *= wp.select(node_i == 0, coords[0], 1.0 - coords[0])
374
+ else:
375
+ for k in range(ORDER_PLUS_ONE):
376
+ if k != node_i:
377
+ w *= coords[0] - LOBATTO_COORDS[k]
378
+
379
+ w *= LAGRANGE_SCALE[node_i]
380
+
381
+ if node_type == SquareSerendipityShapeFunctions.EDGE_X:
382
+ w *= wp.select(node_j == 0, coords[1], 1.0 - coords[1])
383
+ else:
384
+ for k in range(ORDER_PLUS_ONE):
385
+ if k != node_j:
386
+ w *= coords[1] - LOBATTO_COORDS[k]
387
+ w *= LAGRANGE_SCALE[node_j]
388
+
389
+ return w
390
+
391
+ return element_inner_weight
392
+
393
def make_element_inner_weight_gradient(self):
    """Build the Warp function returning the gradient of a node's shape function.

    Returns:
        The function created through ``cache.dynamic_func`` (suffixed with
        ``self.name``). It takes reference ``coords`` and a
        ``node_index_in_elt`` and returns a ``wp.vec2`` holding the partial
        derivatives with respect to ``coords[0]`` and ``coords[1]``.
    """
    ORDER = self.ORDER
    ORDER_PLUS_ONE = self.ORDER_PLUS_ONE
    LOBATTO_COORDS = self.LOBATTO_COORDS
    LAGRANGE_SCALE = self.LAGRANGE_SCALE

    # Squared distance between the square center (0.5, 0.5) and the point
    # (0, LOBATTO_COORDS[1]); the cubic vertex bracket below vanishes on the
    # circle of that squared radius centered at (0.5, 0.5).
    DEGREE_3_CIRCLE_RAD = wp.constant(0.5**2 + (0.5 - LOBATTO_COORDS[1]) ** 2)
    # The bracket equals (0.5 - DEGREE_3_CIRCLE_RAD) when both linear factors are 1,
    # so this scale normalizes the cubic vertex function there.
    DEGREE_3_CIRCLE_SCALE = 1.0 / (0.5 - DEGREE_3_CIRCLE_RAD)

    @cache.dynamic_func(suffix=self.name)
    def element_inner_weight_gradient(
        coords: Coords,
        node_index_in_elt: int,
    ):
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
        node_i, node_j = self._node_lobatto_indices(node_type, type_index)

        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            # Linear factor along each axis and its constant slope.
            # wp.select(cond, a, b) evaluates to b when cond is true.
            lin_x = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
            slope_x = wp.select(node_i == 0, 1.0, -1.0)

            lin_y = wp.select(node_j == 0, coords[1], 1.0 - coords[1])
            slope_y = wp.select(node_j == 0, 1.0, -1.0)

            if ORDER == 2:
                # Product rule on lin_x * lin_y * bracket, where d(bracket)/d(lin) = 1
                bracket = lin_x + lin_y - 2.0 + LOBATTO_COORDS[1]
                dw_dx = lin_y * slope_x * (bracket + lin_x)
                dw_dy = lin_x * slope_y * (bracket + lin_y)

                return wp.vec2(dw_dx, dw_dy) * LAGRANGE_SCALE[0]

            if ORDER == 3:
                # Product rule on lin_x * lin_y * bracket with a quadratic bracket
                bracket = (lin_x - 0.5) * (lin_x - 0.5) + (lin_y - 0.5) * (lin_y - 0.5) - DEGREE_3_CIRCLE_RAD

                dbracket_dlx = 2.0 * lin_x - 1.0
                dbracket_dly = 2.0 * lin_y - 1.0
                dw_dx = lin_y * slope_x * (bracket + lin_x * dbracket_dlx)
                dw_dy = lin_x * slope_y * (bracket + lin_y * dbracket_dly)

                return wp.vec2(dw_dx, dw_dy) * DEGREE_3_CIRCLE_SCALE

        # ---- derivative along coords[0] ----
        # y_part gathers everything that depends on coords[1] only
        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            y_part = wp.select(node_j == 0, coords[1], 1.0 - coords[1])
        else:
            y_part = LAGRANGE_SCALE[node_j]
            for k in range(ORDER_PLUS_ONE):
                if k != node_j:
                    y_part *= coords[1] - LOBATTO_COORDS[k]

        if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
            # Linear in coords[0]: the derivative is just the signed slope
            dw_dx = wp.select(node_i == 0, 1.0, -1.0) * y_part
        else:
            # Incremental product rule over the Lagrange factors: after each
            # factor, dw_dx is the derivative of the partial product and
            # y_part carries the partial product itself.
            y_part *= LAGRANGE_SCALE[node_i]
            dw_dx = float(0.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    offset_x = coords[0] - LOBATTO_COORDS[k]
                    dw_dx = dw_dx * offset_x + y_part
                    y_part *= offset_x

        # ---- derivative along coords[1] ----
        # x_part gathers everything that depends on coords[0] only
        if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
            x_part = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
        else:
            x_part = LAGRANGE_SCALE[node_i]
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    x_part *= coords[0] - LOBATTO_COORDS[k]

        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            # Linear in coords[1]: the derivative is just the signed slope
            dw_dy = wp.select(node_j == 0, 1.0, -1.0) * x_part
        else:
            # Same incremental product rule as above, along coords[1]
            x_part *= LAGRANGE_SCALE[node_j]
            dw_dy = float(0.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_j:
                    offset_y = coords[1] - LOBATTO_COORDS[k]
                    dw_dy = dw_dy * offset_y + x_part
                    x_part *= offset_y

        return wp.vec2(dw_dx, dw_dy)

    return element_inner_weight_gradient
477
+
478
def element_node_triangulation(self):
    """Return a triangulation of the element expressed with element-local node indices.

    Returns:
        A freshly built list of ``[a, b, c]`` index triplets: six triangles
        over nodes 0..7 when ``self.ORDER == 2``, otherwise ten triangles
        over nodes 0..11.
    """
    # NOTE(review): the node numbering is defined outside this method; confirm
    # that every corner triangle pairs a vertex with its two nearest edge nodes
    # (vertices 1 and 2 are paired differently in the two tables below).
    if self.ORDER == 2:
        return [
            [0, 4, 5],
            [5, 4, 6],
            [5, 6, 1],
            [4, 2, 7],
            [4, 7, 6],
            [6, 7, 3],
        ]

    # Every other order falls back to the 12-node table
    return [
        [0, 4, 5],
        [2, 7, 8],
        [3, 10, 11],
        [1, 9, 6],
        [5, 6, 9],
        [5, 4, 6],
        [8, 11, 10],
        [8, 7, 11],
        [4, 8, 10],
        [4, 10, 6],
    ]
503
+
504
+
505
class SquareNonConformingPolynomialShapeFunctions:
    """Triangle polynomial shape functions embedded in the reference square.

    All node positions, weights and gradients are delegated to a
    ``Triangle2DPolynomialShapeFunctions`` instance and carried over to the
    square through the affine map
    ``square_xy = _tri_to_square * (u, v) + _TRI_OFFSET``.
    """

    # embeds the largest equilateral triangle centered at (0.5, 0.5) into the reference square
    _tri_height = 0.75
    _tri_side = 2.0 / math.sqrt(3.0) * _tri_height
    # Linear part of the affine map; its columns are the square-space images of
    # the two triangle parameter directions.
    _tri_to_square = np.array(
        [
            [_tri_side, _tri_side / 2.0],
            [0.0, _tri_height],
        ]
    )

    # Square-space position of the triangle point with parameters (0, 0)
    _TRI_OFFSET = wp.constant(wp.vec2(0.5 - 0.5 * _tri_side, 0.5 - _tri_height / 3.0))

    def __init__(self, degree: int):
        """Wrap a triangle shape of the given polynomial ``degree``."""
        tri_shape = Triangle2DPolynomialShapeFunctions(degree=degree)

        self._tri_shape = tri_shape
        self.ORDER = tri_shape.ORDER
        self.NODES_PER_ELEMENT = tri_shape.NODES_PER_ELEMENT

        # The triangulation is reused unchanged from the wrapped triangle shape
        self.element_node_triangulation = tri_shape.element_node_triangulation

    @property
    def name(self) -> str:
        """Identifier of this shape, also used as suffix for the generated functions."""
        return f"Square_P{self.ORDER}d"

    def make_node_coords_in_element(self):
        """Build the function returning the square coordinates of a node.

        Returns:
            A function taking ``node_index_in_elt`` and returning ``Coords``
            whose first two components are the mapped position and whose third
            component is zero.
        """
        tri_node_coords = self._tri_shape.make_node_coords_in_element()

        TRI_TO_SQUARE = wp.constant(wp.mat22(self._tri_to_square))

        @cache.dynamic_func(suffix=self.name)
        def node_coords_in_element(
            node_index_in_elt: int,
        ):
            bary = tri_node_coords(node_index_in_elt)
            # Only the last two triangle coordinates parameterize the affine map
            scaled = TRI_TO_SQUARE * wp.vec2(bary[1], bary[2])
            square_pos = scaled + SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
            return Coords(square_pos[0], square_pos[1], 0.0)

        return node_coords_in_element

    def make_node_quadrature_weight(self):
        """Build the function returning the quadrature weight attached to a node.

        Order 2 uses dedicated weights that differ between vertex and
        non-vertex nodes; every other order uses the uniform weight
        ``1 / NODES_PER_ELEMENT``.
        """
        if self.ORDER != 2:
            NODES_PER_ELEMENT = self.NODES_PER_ELEMENT

            @cache.dynamic_func(suffix=self.name)
            def node_uniform_quadrature_weight(
                node_index_in_elt: int,
            ):
                return 1.0 / float(NODES_PER_ELEMENT)

            return node_uniform_quadrature_weight

        # Intrinsic quadrature (order 2)
        # The two constants are close to 5/27 and 4/27.
        @cache.dynamic_func(suffix=self.name)
        def node_quadrature_weight_quadratic(
            node_index_in_elt: int,
        ):
            node_type, type_index = self._tri_shape.node_type_and_type_index(node_index_in_elt)
            if node_type == Triangle2DPolynomialShapeFunctions.VERTEX:
                return 0.18518521
            return 0.14814811

        return node_quadrature_weight_quadratic

    def make_trace_node_quadrature_weight(self):
        """Build the function returning the node quadrature weight on element sides (always zero)."""
        # Non-conforming, zero measure on sides

        @wp.func
        def zero(node_index_in_elt: int):
            return 0.0

        return zero

    def make_element_inner_weight(self):
        """Build the function evaluating a node's shape function at square coordinates.

        Returns:
            A function taking ``coords`` and ``node_index_in_elt``; it maps the
            square position back to triangle coordinates and forwards to the
            wrapped triangle's weight function.
        """
        tri_weight = self._tri_shape.make_element_inner_weight()

        SQUARE_TO_TRI = wp.constant(wp.mat22(np.linalg.inv(self._tri_to_square)))

        @cache.dynamic_func(suffix=self.name)
        def element_inner_weight(
            coords: Coords,
            node_index_in_elt: int,
        ):
            # Invert the affine embedding: remove the offset, then apply the inverse matrix
            centered = wp.vec2(coords[0], coords[1]) - SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
            uv = SQUARE_TO_TRI * centered
            tri_coords = Coords(1.0 - uv[0] - uv[1], uv[0], uv[1])

            return tri_weight(tri_coords, node_index_in_elt)

        return element_inner_weight

    def make_element_inner_weight_gradient(self):
        """Build the function evaluating a node's shape function gradient at square coordinates.

        Returns:
            A function taking ``coords`` and ``node_index_in_elt``; it
            evaluates the wrapped triangle's gradient at the mapped triangle
            coordinates and multiplies it by the transpose of the
            square-to-triangle matrix.
        """
        tri_weight_gradient = self._tri_shape.make_element_inner_weight_gradient()

        SQUARE_TO_TRI = wp.constant(wp.mat22(np.linalg.inv(self._tri_to_square)))

        @cache.dynamic_func(suffix=self.name)
        def element_inner_weight_gradient(
            coords: Coords,
            node_index_in_elt: int,
        ):
            # Invert the affine embedding: remove the offset, then apply the inverse matrix
            centered = wp.vec2(coords[0], coords[1]) - SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
            uv = SQUARE_TO_TRI * centered
            tri_coords = Coords(1.0 - uv[0] - uv[1], uv[0], uv[1])

            # Chain rule through the affine map
            # (presumably the triangle gradient is expressed in the (u, v) parameters; confirm)
            tri_grad = tri_weight_gradient(tri_coords, node_index_in_elt)
            return wp.transpose(SQUARE_TO_TRI) * tri_grad

        return element_inner_weight_gradient