warp-lang 0.9.0__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of warp-lang might be problematic. Click here for more details.

Files changed (315) hide show
  1. warp/__init__.py +15 -7
  2. warp/__init__.pyi +1 -0
  3. warp/bin/warp-clang.dll +0 -0
  4. warp/bin/warp.dll +0 -0
  5. warp/build.py +22 -443
  6. warp/build_dll.py +384 -0
  7. warp/builtins.py +998 -488
  8. warp/codegen.py +1307 -739
  9. warp/config.py +5 -3
  10. warp/constants.py +6 -0
  11. warp/context.py +1291 -548
  12. warp/dlpack.py +31 -31
  13. warp/fabric.py +326 -0
  14. warp/fem/__init__.py +27 -0
  15. warp/fem/cache.py +389 -0
  16. warp/fem/dirichlet.py +181 -0
  17. warp/fem/domain.py +263 -0
  18. warp/fem/field/__init__.py +101 -0
  19. warp/fem/field/field.py +149 -0
  20. warp/fem/field/nodal_field.py +299 -0
  21. warp/fem/field/restriction.py +21 -0
  22. warp/fem/field/test.py +181 -0
  23. warp/fem/field/trial.py +183 -0
  24. warp/fem/geometry/__init__.py +19 -0
  25. warp/fem/geometry/closest_point.py +70 -0
  26. warp/fem/geometry/deformed_geometry.py +271 -0
  27. warp/fem/geometry/element.py +744 -0
  28. warp/fem/geometry/geometry.py +186 -0
  29. warp/fem/geometry/grid_2d.py +373 -0
  30. warp/fem/geometry/grid_3d.py +435 -0
  31. warp/fem/geometry/hexmesh.py +953 -0
  32. warp/fem/geometry/partition.py +376 -0
  33. warp/fem/geometry/quadmesh_2d.py +532 -0
  34. warp/fem/geometry/tetmesh.py +840 -0
  35. warp/fem/geometry/trimesh_2d.py +577 -0
  36. warp/fem/integrate.py +1616 -0
  37. warp/fem/operator.py +191 -0
  38. warp/fem/polynomial.py +213 -0
  39. warp/fem/quadrature/__init__.py +2 -0
  40. warp/fem/quadrature/pic_quadrature.py +245 -0
  41. warp/fem/quadrature/quadrature.py +294 -0
  42. warp/fem/space/__init__.py +292 -0
  43. warp/fem/space/basis_space.py +489 -0
  44. warp/fem/space/collocated_function_space.py +105 -0
  45. warp/fem/space/dof_mapper.py +236 -0
  46. warp/fem/space/function_space.py +145 -0
  47. warp/fem/space/grid_2d_function_space.py +267 -0
  48. warp/fem/space/grid_3d_function_space.py +306 -0
  49. warp/fem/space/hexmesh_function_space.py +352 -0
  50. warp/fem/space/partition.py +350 -0
  51. warp/fem/space/quadmesh_2d_function_space.py +369 -0
  52. warp/fem/space/restriction.py +160 -0
  53. warp/fem/space/shape/__init__.py +15 -0
  54. warp/fem/space/shape/cube_shape_function.py +738 -0
  55. warp/fem/space/shape/shape_function.py +103 -0
  56. warp/fem/space/shape/square_shape_function.py +611 -0
  57. warp/fem/space/shape/tet_shape_function.py +567 -0
  58. warp/fem/space/shape/triangle_shape_function.py +429 -0
  59. warp/fem/space/tetmesh_function_space.py +292 -0
  60. warp/fem/space/topology.py +295 -0
  61. warp/fem/space/trimesh_2d_function_space.py +221 -0
  62. warp/fem/types.py +77 -0
  63. warp/fem/utils.py +495 -0
  64. warp/native/array.h +164 -55
  65. warp/native/builtin.h +150 -174
  66. warp/native/bvh.cpp +75 -328
  67. warp/native/bvh.cu +406 -23
  68. warp/native/bvh.h +37 -45
  69. warp/native/clang/clang.cpp +136 -24
  70. warp/native/crt.cpp +1 -76
  71. warp/native/crt.h +111 -104
  72. warp/native/cuda_crt.h +1049 -0
  73. warp/native/cuda_util.cpp +15 -3
  74. warp/native/cuda_util.h +3 -1
  75. warp/native/cutlass/tools/library/scripts/conv2d_operation.py +463 -0
  76. warp/native/cutlass/tools/library/scripts/conv3d_operation.py +321 -0
  77. warp/native/cutlass/tools/library/scripts/gemm_operation.py +988 -0
  78. warp/native/cutlass/tools/library/scripts/generator.py +4625 -0
  79. warp/native/cutlass/tools/library/scripts/library.py +799 -0
  80. warp/native/cutlass/tools/library/scripts/manifest.py +402 -0
  81. warp/native/cutlass/tools/library/scripts/pycutlass/docs/source/conf.py +96 -0
  82. warp/native/cutlass/tools/library/scripts/pycutlass/profile/conv/conv2d_f16_sm80.py +106 -0
  83. warp/native/cutlass/tools/library/scripts/pycutlass/profile/gemm/gemm_f32_sm80.py +91 -0
  84. warp/native/cutlass/tools/library/scripts/pycutlass/setup.py +80 -0
  85. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/__init__.py +48 -0
  86. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/arguments.py +118 -0
  87. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/c_types.py +241 -0
  88. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/compiler.py +432 -0
  89. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/conv2d_operation.py +631 -0
  90. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/epilogue.py +1026 -0
  91. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/frontend.py +104 -0
  92. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/gemm_operation.py +1276 -0
  93. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/library.py +744 -0
  94. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/memory_manager.py +74 -0
  95. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/operation.py +110 -0
  96. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/parser.py +619 -0
  97. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/reduction_operation.py +398 -0
  98. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/tensor_ref.py +70 -0
  99. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/__init__.py +4 -0
  100. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/conv2d_testbed.py +646 -0
  101. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_grouped_testbed.py +235 -0
  102. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_testbed.py +557 -0
  103. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/profiler.py +70 -0
  104. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/type_hint.py +39 -0
  105. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/__init__.py +1 -0
  106. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/device.py +76 -0
  107. warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/reference_model.py +255 -0
  108. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/__init__.py +0 -0
  109. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +201 -0
  110. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +177 -0
  111. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +98 -0
  112. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +95 -0
  113. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_few_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +163 -0
  114. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_fixed_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +187 -0
  115. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +309 -0
  116. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +54 -0
  117. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  118. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  119. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +253 -0
  120. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +97 -0
  121. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +242 -0
  122. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
  123. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
  124. warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/run_all_tests.py +10 -0
  125. warp/native/cutlass/tools/library/scripts/pycutlass/test/frontend/test_frontend.py +146 -0
  126. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/__init__.py +0 -0
  127. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_bf16_sm80.py +96 -0
  128. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f16_sm80.py +447 -0
  129. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f32_sm80.py +146 -0
  130. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f64_sm80.py +102 -0
  131. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_grouped_sm80.py +203 -0
  132. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_s8_sm80.py +229 -0
  133. warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/run_all_tests.py +9 -0
  134. warp/native/cutlass/tools/library/scripts/pycutlass/test/unit/test_sm80.py +453 -0
  135. warp/native/cutlass/tools/library/scripts/rank_2k_operation.py +398 -0
  136. warp/native/cutlass/tools/library/scripts/rank_k_operation.py +387 -0
  137. warp/native/cutlass/tools/library/scripts/rt.py +796 -0
  138. warp/native/cutlass/tools/library/scripts/symm_operation.py +400 -0
  139. warp/native/cutlass/tools/library/scripts/trmm_operation.py +407 -0
  140. warp/native/cutlass_gemm.cu +5 -3
  141. warp/native/exports.h +1240 -949
  142. warp/native/fabric.h +228 -0
  143. warp/native/hashgrid.cpp +4 -4
  144. warp/native/hashgrid.h +22 -2
  145. warp/native/initializer_array.h +2 -2
  146. warp/native/intersect.h +22 -7
  147. warp/native/intersect_adj.h +8 -8
  148. warp/native/intersect_tri.h +13 -16
  149. warp/native/marching.cu +157 -161
  150. warp/native/mat.h +119 -19
  151. warp/native/matnn.h +2 -2
  152. warp/native/mesh.cpp +108 -83
  153. warp/native/mesh.cu +243 -6
  154. warp/native/mesh.h +1547 -458
  155. warp/native/nanovdb/NanoVDB.h +1 -1
  156. warp/native/noise.h +272 -329
  157. warp/native/quat.h +51 -8
  158. warp/native/rand.h +45 -35
  159. warp/native/range.h +6 -2
  160. warp/native/reduce.cpp +157 -0
  161. warp/native/reduce.cu +348 -0
  162. warp/native/runlength_encode.cpp +62 -0
  163. warp/native/runlength_encode.cu +46 -0
  164. warp/native/scan.cu +11 -13
  165. warp/native/scan.h +1 -0
  166. warp/native/solid_angle.h +442 -0
  167. warp/native/sort.cpp +13 -0
  168. warp/native/sort.cu +9 -1
  169. warp/native/sparse.cpp +338 -0
  170. warp/native/sparse.cu +545 -0
  171. warp/native/spatial.h +2 -2
  172. warp/native/temp_buffer.h +30 -0
  173. warp/native/vec.h +126 -24
  174. warp/native/volume.h +120 -0
  175. warp/native/warp.cpp +658 -53
  176. warp/native/warp.cu +660 -68
  177. warp/native/warp.h +112 -12
  178. warp/optim/__init__.py +1 -0
  179. warp/optim/linear.py +922 -0
  180. warp/optim/sgd.py +92 -0
  181. warp/render/render_opengl.py +392 -152
  182. warp/render/render_usd.py +11 -11
  183. warp/sim/__init__.py +2 -2
  184. warp/sim/articulation.py +385 -185
  185. warp/sim/collide.py +21 -8
  186. warp/sim/import_mjcf.py +297 -106
  187. warp/sim/import_urdf.py +389 -210
  188. warp/sim/import_usd.py +198 -97
  189. warp/sim/inertia.py +17 -18
  190. warp/sim/integrator_euler.py +14 -8
  191. warp/sim/integrator_xpbd.py +161 -19
  192. warp/sim/model.py +795 -291
  193. warp/sim/optimizer.py +2 -6
  194. warp/sim/render.py +65 -3
  195. warp/sim/utils.py +3 -0
  196. warp/sparse.py +1227 -0
  197. warp/stubs.py +665 -223
  198. warp/tape.py +66 -15
  199. warp/tests/__main__.py +3 -6
  200. warp/tests/assets/curlnoise_golden.npy +0 -0
  201. warp/tests/assets/pnoise_golden.npy +0 -0
  202. warp/tests/assets/torus.usda +105 -105
  203. warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
  204. warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
  205. warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
  206. warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
  207. warp/tests/aux_test_unresolved_func.py +14 -0
  208. warp/tests/aux_test_unresolved_symbol.py +14 -0
  209. warp/tests/disabled_kinematics.py +239 -0
  210. warp/tests/run_coverage_serial.py +31 -0
  211. warp/tests/test_adam.py +103 -106
  212. warp/tests/test_arithmetic.py +128 -74
  213. warp/tests/test_array.py +1497 -211
  214. warp/tests/test_array_reduce.py +150 -0
  215. warp/tests/test_atomic.py +64 -28
  216. warp/tests/test_bool.py +99 -0
  217. warp/tests/test_builtins_resolution.py +1292 -0
  218. warp/tests/test_bvh.py +75 -43
  219. warp/tests/test_closest_point_edge_edge.py +54 -57
  220. warp/tests/test_codegen.py +233 -128
  221. warp/tests/test_compile_consts.py +28 -20
  222. warp/tests/test_conditional.py +108 -24
  223. warp/tests/test_copy.py +10 -12
  224. warp/tests/test_ctypes.py +112 -88
  225. warp/tests/test_dense.py +21 -14
  226. warp/tests/test_devices.py +98 -0
  227. warp/tests/test_dlpack.py +136 -108
  228. warp/tests/test_examples.py +277 -0
  229. warp/tests/test_fabricarray.py +955 -0
  230. warp/tests/test_fast_math.py +15 -11
  231. warp/tests/test_fem.py +1271 -0
  232. warp/tests/test_fp16.py +53 -19
  233. warp/tests/test_func.py +187 -74
  234. warp/tests/test_generics.py +194 -49
  235. warp/tests/test_grad.py +180 -116
  236. warp/tests/test_grad_customs.py +176 -0
  237. warp/tests/test_hash_grid.py +52 -37
  238. warp/tests/test_import.py +10 -23
  239. warp/tests/test_indexedarray.py +577 -24
  240. warp/tests/test_intersect.py +18 -9
  241. warp/tests/test_large.py +141 -0
  242. warp/tests/test_launch.py +251 -15
  243. warp/tests/test_lerp.py +64 -65
  244. warp/tests/test_linear_solvers.py +154 -0
  245. warp/tests/test_lvalue.py +493 -0
  246. warp/tests/test_marching_cubes.py +12 -13
  247. warp/tests/test_mat.py +508 -2778
  248. warp/tests/test_mat_lite.py +115 -0
  249. warp/tests/test_mat_scalar_ops.py +2889 -0
  250. warp/tests/test_math.py +103 -9
  251. warp/tests/test_matmul.py +305 -69
  252. warp/tests/test_matmul_lite.py +410 -0
  253. warp/tests/test_mesh.py +71 -14
  254. warp/tests/test_mesh_query_aabb.py +41 -25
  255. warp/tests/test_mesh_query_point.py +325 -34
  256. warp/tests/test_mesh_query_ray.py +39 -22
  257. warp/tests/test_mlp.py +30 -22
  258. warp/tests/test_model.py +92 -89
  259. warp/tests/test_modules_lite.py +39 -0
  260. warp/tests/test_multigpu.py +88 -114
  261. warp/tests/test_noise.py +12 -11
  262. warp/tests/test_operators.py +16 -20
  263. warp/tests/test_options.py +11 -11
  264. warp/tests/test_pinned.py +17 -18
  265. warp/tests/test_print.py +32 -11
  266. warp/tests/test_quat.py +275 -129
  267. warp/tests/test_rand.py +18 -16
  268. warp/tests/test_reload.py +38 -34
  269. warp/tests/test_rounding.py +50 -43
  270. warp/tests/test_runlength_encode.py +190 -0
  271. warp/tests/test_smoothstep.py +9 -11
  272. warp/tests/test_snippet.py +143 -0
  273. warp/tests/test_sparse.py +460 -0
  274. warp/tests/test_spatial.py +276 -243
  275. warp/tests/test_streams.py +110 -85
  276. warp/tests/test_struct.py +331 -85
  277. warp/tests/test_tape.py +39 -21
  278. warp/tests/test_torch.py +118 -89
  279. warp/tests/test_transient_module.py +12 -13
  280. warp/tests/test_types.py +614 -0
  281. warp/tests/test_utils.py +494 -0
  282. warp/tests/test_vec.py +354 -1987
  283. warp/tests/test_vec_lite.py +73 -0
  284. warp/tests/test_vec_scalar_ops.py +2099 -0
  285. warp/tests/test_volume.py +457 -293
  286. warp/tests/test_volume_write.py +124 -134
  287. warp/tests/unittest_serial.py +35 -0
  288. warp/tests/unittest_suites.py +341 -0
  289. warp/tests/unittest_utils.py +568 -0
  290. warp/tests/unused_test_misc.py +71 -0
  291. warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
  292. warp/thirdparty/appdirs.py +36 -45
  293. warp/thirdparty/unittest_parallel.py +549 -0
  294. warp/torch.py +72 -30
  295. warp/types.py +1744 -713
  296. warp/utils.py +360 -350
  297. warp_lang-0.11.0.dist-info/LICENSE.md +36 -0
  298. warp_lang-0.11.0.dist-info/METADATA +238 -0
  299. warp_lang-0.11.0.dist-info/RECORD +332 -0
  300. {warp_lang-0.9.0.dist-info → warp_lang-0.11.0.dist-info}/WHEEL +1 -1
  301. warp/bin/warp-clang.exp +0 -0
  302. warp/bin/warp-clang.lib +0 -0
  303. warp/bin/warp.exp +0 -0
  304. warp/bin/warp.lib +0 -0
  305. warp/tests/test_all.py +0 -215
  306. warp/tests/test_array_scan.py +0 -60
  307. warp/tests/test_base.py +0 -208
  308. warp/tests/test_unresolved_func.py +0 -7
  309. warp/tests/test_unresolved_symbol.py +0 -7
  310. warp_lang-0.9.0.dist-info/METADATA +0 -20
  311. warp_lang-0.9.0.dist-info/RECORD +0 -177
  312. /warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
  313. /warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
  314. /warp/tests/{test_square.py → aux_test_square.py} +0 -0
  315. {warp_lang-0.9.0.dist-info → warp_lang-0.11.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,611 @@
1
+ import math
2
+
3
+ import warp as wp
4
+ import numpy as np
5
+
6
+ from warp.fem.polynomial import Polynomial, quadrature_1d, lagrange_scales, is_closed
7
+ from warp.fem.types import Coords
8
+ from warp.fem import cache
9
+
10
+ from .triangle_shape_function import Triangle2DPolynomialShapeFunctions
11
+
12
+
13
class SquareBipolynomialShapeFunctions:
    """Tensor-product Lagrange shape functions on a square element.

    An element of degree ``d`` carries ``(d + 1) * (d + 1)`` nodes located on the
    grid spanned by the 1D points returned by ``quadrature_1d`` for ``family``.
    A flat node index ``n`` is decoded as ``i = n // (d + 1)`` for the first
    coordinate and ``j = n - (d + 1) * i`` for the second one.

    The ``make_*`` methods build, through ``cache.dynamic_func`` /
    ``cache.get_func``, the Warp functions evaluating node positions, nodal
    quadrature weights, and shape function values and gradients.
    """

    def __init__(self, degree: int, family: Polynomial):
        """Precompute the 1D node data captured by the generated functions.

        Args:
            degree: Polynomial degree along each axis.
            family: Polynomial family passed to ``quadrature_1d`` to place the
                ``degree + 1`` nodes of each axis.
        """
        self.family = family

        nodes_1d = degree + 1
        self.ORDER = wp.constant(degree)
        self.NODES_PER_ELEMENT = wp.constant(nodes_1d * nodes_1d)
        self.NODES_PER_SIDE = wp.constant(nodes_1d)

        # 1D node positions and weights, plus the per-node factor that multiplies
        # the product of (x - x_k) terms when evaluating a shape function
        coords_1d, weights_1d = quadrature_1d(point_count=nodes_1d, family=family)
        scales_1d = lagrange_scales(coords_1d)

        NodeVec = wp.types.vector(length=nodes_1d, dtype=wp.float32)
        self.LOBATTO_COORDS = wp.constant(NodeVec(coords_1d))
        self.LOBATTO_WEIGHT = wp.constant(NodeVec(weights_1d))
        self.LAGRANGE_SCALE = wp.constant(NodeVec(scales_1d))
        self.ORDER_PLUS_ONE = wp.constant(self.ORDER + 1)

    @property
    def name(self) -> str:
        """Identifier built from the degree and family; used as cache suffix."""
        order, family = self.ORDER, self.family
        return f"Square_Q{order}_{family}"

    def make_node_coords_in_element(self):
        """Build the Warp function mapping a node index to its element coordinates."""
        LOBATTO_COORDS = self.LOBATTO_COORDS
        ORDER = self.ORDER

        @cache.dynamic_func(suffix=self.name)
        def node_coords_in_element(
            node_index_in_elt: int,
        ):
            # Decode the flat node index into one 1D node index per axis
            idx_0 = node_index_in_elt // (ORDER + 1)
            idx_1 = node_index_in_elt - (ORDER + 1) * idx_0
            return Coords(LOBATTO_COORDS[idx_0], LOBATTO_COORDS[idx_1], 0.0)

        return node_coords_in_element

    def make_node_quadrature_weight(self):
        """Build the Warp function returning the quadrature weight of a node.

        Degree 1 uses a constant-weight variant; higher degrees use the product
        of the 1D weights of the node along each axis.
        """
        LOBATTO_WEIGHT = self.LOBATTO_WEIGHT
        ORDER = self.ORDER

        def node_quadrature_weight(
            node_index_in_elt: int,
        ):
            idx_0 = node_index_in_elt // (ORDER + 1)
            idx_1 = node_index_in_elt - (ORDER + 1) * idx_0
            return LOBATTO_WEIGHT[idx_0] * LOBATTO_WEIGHT[idx_1]

        def node_quadrature_weight_linear(
            node_index_in_elt: int,
        ):
            # Same weight for each of the four nodes
            return 0.25

        weight_func = node_quadrature_weight_linear if ORDER == 1 else node_quadrature_weight
        return cache.get_func(weight_func, self.name)

    @wp.func
    def _vertex_coords_f(vidx_in_cell: int):
        # Corner index 0..3 -> (0,0), (0,1), (1,0), (1,1) as floating-point coordinates
        corner_x = vidx_in_cell // 2
        corner_y = vidx_in_cell - 2 * corner_x
        return wp.vec2(float(corner_x), float(corner_y))

    def make_trace_node_quadrature_weight(self):
        """Build the Warp function returning the weight of a node on the element boundary.

        Families that are not closed get a function returning zero, degree 1 a
        constant ``0.5``, and other degrees a lookup in the 1D weights.
        """
        LOBATTO_WEIGHT = self.LOBATTO_WEIGHT
        ORDER = self.ORDER

        def trace_node_quadrature_weight(
            node_index_in_elt: int,
        ):
            # A boundary node has at least one of its two 1D indices at an extremum.
            # Use the weight of the index that is strictly inside the side when there
            # is one; at a vertex both indices are extremal and the second is used.
            idx_0 = node_index_in_elt // (ORDER + 1)
            if idx_0 > 0 and idx_0 < ORDER:
                return LOBATTO_WEIGHT[idx_0]

            idx_1 = node_index_in_elt - (ORDER + 1) * idx_0
            return LOBATTO_WEIGHT[idx_1]

        def trace_node_quadrature_weight_linear(
            node_index_in_elt: int,
        ):
            return 0.5

        def trace_node_quadrature_weight_open(
            node_index_in_elt: int,
        ):
            return 0.0

        if not is_closed(self.family):
            trace_func = trace_node_quadrature_weight_open
        elif ORDER == 1:
            trace_func = trace_node_quadrature_weight_linear
        else:
            trace_func = trace_node_quadrature_weight

        return cache.get_func(trace_func, self.name)

    def make_element_inner_weight(self):
        """Build the Warp function evaluating a node's shape function at given coordinates.

        A closed family of degree 1 gets the bilinear closed form; every other
        case evaluates the product of the two 1D Lagrange polynomials.
        """
        ORDER_PLUS_ONE = self.ORDER_PLUS_ONE
        LOBATTO_COORDS = self.LOBATTO_COORDS
        LAGRANGE_SCALE = self.LAGRANGE_SCALE

        def element_inner_weight(
            coords: Coords,
            node_index_in_elt: int,
        ):
            idx_0 = node_index_in_elt // ORDER_PLUS_ONE
            idx_1 = node_index_in_elt - ORDER_PLUS_ONE * idx_0

            # Accumulate the (x - x_k) factors of both 1D polynomials, skipping the node's own index
            value = float(1.0)
            for k in range(ORDER_PLUS_ONE):
                if k != idx_0:
                    value *= coords[0] - LOBATTO_COORDS[k]
                if k != idx_1:
                    value *= coords[1] - LOBATTO_COORDS[k]

            value *= LAGRANGE_SCALE[idx_0] * LAGRANGE_SCALE[idx_1]

            return value

        def element_inner_weight_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            corner = SquareBipolynomialShapeFunctions._vertex_coords_f(node_index_in_elt)

            # Per-axis linear weight: (1 - x) for a corner at 0, x for a corner at 1
            wx = (1.0 - coords[0]) * (1.0 - corner[0]) + corner[0] * coords[0]
            wy = (1.0 - coords[1]) * (1.0 - corner[1]) + corner[1] * coords[1]
            return wx * wy

        use_linear = self.ORDER == 1 and is_closed(self.family)
        weight_func = element_inner_weight_linear if use_linear else element_inner_weight
        return cache.get_func(weight_func, self.name)

    def make_element_inner_weight_gradient(self):
        """Build the Warp function evaluating the gradient of a node's shape function.

        The variant is selected exactly as in ``make_element_inner_weight``.
        """
        ORDER_PLUS_ONE = self.ORDER_PLUS_ONE
        LOBATTO_COORDS = self.LOBATTO_COORDS
        LAGRANGE_SCALE = self.LAGRANGE_SCALE

        def element_inner_weight_gradient(
            coords: Coords,
            node_index_in_elt: int,
        ):
            idx_0 = node_index_in_elt // ORDER_PLUS_ONE
            idx_1 = node_index_in_elt - ORDER_PLUS_ONE * idx_0

            # Seed each accumulator with the full polynomial of the *other* axis:
            # acc_x starts as the second-axis product, acc_y as the first-axis product
            acc_x = float(1.0)
            acc_y = float(1.0)
            for k in range(ORDER_PLUS_ONE):
                if k != idx_0:
                    acc_y *= coords[0] - LOBATTO_COORDS[k]
                if k != idx_1:
                    acc_x *= coords[1] - LOBATTO_COORDS[k]

            d_0 = float(0.0)
            d_1 = float(0.0)

            # Product rule applied factor by factor: the derivative absorbs the new
            # factor and gains the product accumulated so far
            for k in range(ORDER_PLUS_ONE):
                if k != idx_0:
                    diff_0 = coords[0] - LOBATTO_COORDS[k]
                    d_0 = d_0 * diff_0 + acc_x
                    acc_x *= diff_0
                if k != idx_1:
                    diff_1 = coords[1] - LOBATTO_COORDS[k]
                    d_1 = d_1 * diff_1 + acc_y
                    acc_y *= diff_1

            return LAGRANGE_SCALE[idx_0] * LAGRANGE_SCALE[idx_1] * wp.vec2(d_0, d_1)

        def element_inner_weight_gradient_linear(
            coords: Coords,
            node_index_in_elt: int,
        ):
            corner = SquareBipolynomialShapeFunctions._vertex_coords_f(node_index_in_elt)

            wx = (1.0 - coords[0]) * (1.0 - corner[0]) + corner[0] * coords[0]
            wy = (1.0 - coords[1]) * (1.0 - corner[1]) + corner[1] * coords[1]

            # Slope of the per-axis linear weight: -1 for a corner at 0, +1 for a corner at 1
            slope_x = 2.0 * corner[0] - 1.0
            slope_y = 2.0 * corner[1] - 1.0

            return wp.vec2(slope_x * wy, slope_y * wx)

        use_linear = self.ORDER == 1 and is_closed(self.family)
        gradient_func = element_inner_weight_gradient_linear if use_linear else element_inner_weight_gradient
        return cache.get_func(gradient_func, self.name)

    def element_node_triangulation(self):
        """Return ``grid_to_tris`` applied to an ``ORDER`` x ``ORDER`` grid."""
        from warp.fem.utils import grid_to_tris

        order = self.ORDER
        return grid_to_tris(order, order)
208
+
209
+
210
+ class SquareSerendipityShapeFunctions:
211
+ """
212
+ Serendipity element ~ tensor product space without interior nodes
213
+ Side shape functions are usual Lagrange shape functions times a linear function in the normal direction
214
+ Corner shape functions are bilinear shape functions times a function of (x^{d-1} + y^{d-1})
215
+ """
216
+
217
+ # Node categories
218
+ VERTEX = wp.constant(0)
219
+ EDGE_X = wp.constant(1)
220
+ EDGE_Y = wp.constant(2)
221
+
222
def __init__(self, degree: int, family: Polynomial):
    """Validate the arguments and precompute the data captured by the generated functions.

    Args:
        degree: Polynomial degree; only 2 and 3 are accepted.
        family: Polynomial family used to place the 1D nodes; must be closed.

    Raises:
        ValueError: If ``family`` is not closed according to ``is_closed``.
        NotImplementedError: If ``degree`` is neither 2 nor 3.
    """
    if not is_closed(family):
        raise ValueError("A closed polynomial family is required to define serendipity elements")

    if degree not in (2, 3):
        raise NotImplementedError("Serendipity element only implemented for order 2 or 3")

    self.family = family

    nodes_1d = degree + 1
    self.ORDER = wp.constant(degree)
    self.NODES_PER_ELEMENT = wp.constant(4 * degree)
    self.NODES_PER_SIDE = wp.constant(nodes_1d)

    # 1D node positions and weights, plus the per-node factor that multiplies
    # the product of (x - x_k) terms when evaluating a 1D Lagrange polynomial
    coords_1d, weights_1d = quadrature_1d(point_count=nodes_1d, family=family)
    scales_1d = lagrange_scales(coords_1d)

    NodeVec = wp.types.vector(length=nodes_1d, dtype=wp.float32)
    self.LOBATTO_COORDS = wp.constant(NodeVec(coords_1d))
    self.LOBATTO_WEIGHT = wp.constant(NodeVec(weights_1d))
    self.LAGRANGE_SCALE = wp.constant(NodeVec(scales_1d))
    self.ORDER_PLUS_ONE = wp.constant(self.ORDER + 1)

    # Index-decoding helpers; both read self.name, so they are built last
    self.node_type_and_type_index = self._get_node_type_and_type_index()
    self._node_lobatto_indices = self._get_node_lobatto_indices()
246
+
247
@property
def name(self) -> str:
    """Identifier built from the degree and family; used as cache suffix."""
    order, family = self.ORDER, self.family
    return f"Square_S{order}_{family}"
250
+
251
def _get_node_type_and_type_index(self):
    """Build the Warp function splitting a node index into (node category, index within category)."""

    @cache.dynamic_func(suffix=self.name)
    def node_type_and_index(
        node_index_in_elt: int,
    ):
        # The first four nodes are the vertices
        if node_index_in_elt < 4:
            return SquareSerendipityShapeFunctions.VERTEX, node_index_in_elt

        # Remaining nodes alternate between the two edge categories:
        # even offsets map to EDGE_X, odd offsets to EDGE_X + 1
        edge_node = node_index_in_elt - 4
        type_index = edge_node // 2
        side = edge_node - 2 * type_index
        return SquareSerendipityShapeFunctions.EDGE_X + side, type_index

    return node_type_and_index
264
+
265
@wp.func
def side_offset_and_index(type_index: int):
    # Split an edge-category index into (parity, half):
    # the parity is returned first as the side offset, the half as the index within the side
    half = type_index // 2
    parity = type_index - 2 * half

    return parity, half
271
+
272
def _get_node_lobatto_indices(self):
    """Build the Warp function mapping (node category, category index) to the pair of 1D node indices."""
    ORDER = self.ORDER

    @cache.dynamic_func(suffix=self.name)
    def node_lobatto_indices(node_type: int, type_index: int):
        # Vertices: each index is either the first (0) or the last (ORDER) 1D node
        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            node_i = type_index // 2
            node_j = type_index - 2 * node_i
            return node_i * ORDER, node_j * ORDER

        side_offset, index_in_side = SquareSerendipityShapeFunctions.side_offset_and_index(type_index)

        # Edge nodes: one index runs over the 1D nodes starting at 1,
        # the other is pinned to 0 or ORDER depending on the side offset
        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            node_i = 1 + index_in_side
            node_j = side_offset * ORDER
        else:
            node_j = 1 + index_in_side
            node_i = side_offset * ORDER

        return node_i, node_j

    return node_lobatto_indices
294
+
295
def make_node_coords_in_element(self):
    """Build the Warp function mapping a node index to its element coordinates."""
    LOBATTO_COORDS = self.LOBATTO_COORDS

    @cache.dynamic_func(suffix=self.name)
    def node_coords_in_element(
        node_index_in_elt: int,
    ):
        # Decode the node index into its pair of 1D node indices, then look up the positions
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
        node_i, node_j = self._node_lobatto_indices(node_type, type_index)
        return Coords(LOBATTO_COORDS[node_i], LOBATTO_COORDS[node_j], 0.0)

    return node_coords_in_element
307
+
308
def make_node_quadrature_weight(self):
    """Build the Warp function returning the quadrature weight of a node.

    Vertices receive ``0.25 / ORDER**2`` each; every other node receives an
    equal share of what remains, so the ``4 * ORDER`` weights sum to one.
    """
    ORDER = self.ORDER

    @cache.dynamic_func(suffix=self.name)
    def node_quadrature_weight(
        node_index_in_elt: int,
    ):
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            return 0.25 / float(ORDER * ORDER)

        # Edge node
        return (0.25 - 0.25 / float(ORDER * ORDER)) / float(ORDER - 1)

    return node_quadrature_weight
322
+
323
def make_trace_node_quadrature_weight(self):
    """Build the Warp function returning the weight of a node on the element boundary."""
    LOBATTO_WEIGHT = self.LOBATTO_WEIGHT

    @cache.dynamic_func(suffix=self.name)
    def trace_node_quadrature_weight(
        node_index_in_elt: int,
    ):
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

        # Vertices use the weight of the first 1D node
        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            return LOBATTO_WEIGHT[0]

        # Edge nodes use the 1D weight at their position within the side
        side_offset, index_in_side = SquareSerendipityShapeFunctions.side_offset_and_index(type_index)
        return LOBATTO_WEIGHT[1 + index_in_side]

    return trace_node_quadrature_weight
338
+
339
def make_element_inner_weight(self):
    """Build the Warp function evaluating a node's shape function at given coordinates.

    Vertex functions are a bilinear term multiplied by a degree-dependent
    correction. Edge functions are a 1D Lagrange polynomial along one axis
    multiplied by a linear term along the other axis.
    """
    ORDER = self.ORDER
    ORDER_PLUS_ONE = self.ORDER_PLUS_ONE

    LOBATTO_COORDS = self.LOBATTO_COORDS
    LAGRANGE_SCALE = self.LAGRANGE_SCALE

    # Constants of the degree-3 vertex correction, derived from the second 1D node position
    second_node_offset = 0.5 - LOBATTO_COORDS[1]
    DEGREE_3_CIRCLE_RAD = wp.constant(0.5**2 + second_node_offset**2)
    DEGREE_3_CIRCLE_SCALE = 1.0 / (0.5 - DEGREE_3_CIRCLE_RAD)

    @cache.dynamic_func(suffix=self.name)
    def element_inner_weight(
        coords: Coords,
        node_index_in_elt: int,
    ):
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)

        node_i, node_j = self._node_lobatto_indices(node_type, type_index)

        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            # Per-axis linear term: (1 - x) for a vertex at index 0, x otherwise
            cx = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
            cy = wp.select(node_j == 0, coords[1], 1.0 - coords[1])

            w = cx * cy

            if ORDER == 2:
                w *= cx + cy - 2.0 + LOBATTO_COORDS[1]
                return w * LAGRANGE_SCALE[0]
            if ORDER == 3:
                w *= (cx - 0.5) * (cx - 0.5) + (cy - 0.5) * (cy - 0.5) - DEGREE_3_CIRCLE_RAD
                return w * DEGREE_3_CIRCLE_SCALE

        w = float(1.0)

        # Factor along the first coordinate: linear for EDGE_Y nodes, 1D Lagrange polynomial otherwise
        if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
            w *= wp.select(node_i == 0, coords[0], 1.0 - coords[0])
        else:
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    w *= coords[0] - LOBATTO_COORDS[k]

            w *= LAGRANGE_SCALE[node_i]

        # Factor along the second coordinate: linear for EDGE_X nodes, 1D Lagrange polynomial otherwise
        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            w *= wp.select(node_j == 0, coords[1], 1.0 - coords[1])
        else:
            for k in range(ORDER_PLUS_ONE):
                if k != node_j:
                    w *= coords[1] - LOBATTO_COORDS[k]
            w *= LAGRANGE_SCALE[node_j]

        return w

    return element_inner_weight
392
+
393
def make_element_inner_weight_gradient(self):
    """Create the function evaluating the gradient of a node's weight inside an element.

    The instance constants ``ORDER``, ``ORDER_PLUS_ONE``, ``LOBATTO_COORDS`` and
    ``LAGRANGE_SCALE`` are captured by the generated function.

    Returns:
        The function produced by ``cache.dynamic_func`` (suffixed with
        ``self.name``). It takes element coordinates ``coords`` and a node
        index ``node_index_in_elt`` and returns a ``wp.vec2`` holding the
        derivatives of that node's weight with respect to ``coords[0]`` and
        ``coords[1]``.
    """
    ORDER = self.ORDER
    ORDER_PLUS_ONE = self.ORDER_PLUS_ONE
    LOBATTO_COORDS = self.LOBATTO_COORDS
    LAGRANGE_SCALE = self.LAGRANGE_SCALE

    # Constants of the quadratic correction factor applied to vertex nodes when ORDER == 3
    DEGREE_3_CIRCLE_RAD = wp.constant(0.5**2 + (0.5 - LOBATTO_COORDS[1]) ** 2)
    DEGREE_3_CIRCLE_SCALE = 1.0 / (0.5 - DEGREE_3_CIRCLE_RAD)

    @cache.dynamic_func(suffix=self.name)
    def element_inner_weight_gradient(
        coords: Coords,
        node_index_in_elt: int,
    ):
        node_type, type_index = self.node_type_and_type_index(node_index_in_elt)
        node_i, node_j = self._node_lobatto_indices(node_type, type_index)

        if node_type == SquareSerendipityShapeFunctions.VERTEX:
            # wp.select(cond, a, b) evaluates to a when cond is false and to b when it is true,
            # so cx is (1 - coords[0]) for node_i == 0 and coords[0] otherwise (same for cy).
            cx = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
            cy = wp.select(node_j == 0, coords[1], 1.0 - coords[1])

            # Derivatives of cx and cy with respect to coords[0] and coords[1]
            sign_x = wp.select(node_i == 0, 1.0, -1.0)
            sign_y = wp.select(node_j == 0, 1.0, -1.0)

            if ORDER == 2:
                # Weight is cx * cy * corr; the derivative of corr w.r.t. cx (or cy) is 1
                corr = cx + cy - 2.0 + LOBATTO_COORDS[1]
                grad_x = cy * sign_x * (corr + cx)
                grad_y = cx * sign_y * (corr + cy)
                return wp.vec2(grad_x, grad_y) * LAGRANGE_SCALE[0]

            if ORDER == 3:
                # Weight is cx * cy * circle; the derivative of circle w.r.t. cx is 2 * cx - 1
                circle = (cx - 0.5) * (cx - 0.5) + (cy - 0.5) * (cy - 0.5) - DEGREE_3_CIRCLE_RAD
                grad_x = cy * sign_x * (circle + cx * (2.0 * cx - 1.0))
                grad_y = cx * sign_y * (circle + cy * (2.0 * cy - 1.0))
                return wp.vec2(grad_x, grad_y) * DEGREE_3_CIRCLE_SCALE

        # Remaining nodes: the weight is a product of one factor in coords[0] and one
        # factor in coords[1]. A factor is either linear (wp.select form) or a scaled
        # product of (coord - LOBATTO_COORDS[k]) terms.

        # --- derivative along coords[1] ---
        # x_part starts as the factor depending on coords[0] only
        if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
            x_part = wp.select(node_i == 0, coords[0], 1.0 - coords[0])
        else:
            x_part = LAGRANGE_SCALE[node_i]
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    x_part *= coords[0] - LOBATTO_COORDS[k]

        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            # The coords[1] factor is linear, its derivative is +1 or -1
            grad_y = wp.select(node_j == 0, 1.0, -1.0) * x_part
        else:
            # Product rule accumulated term by term over the (coords[1] - LOBATTO_COORDS[k]) factors
            x_part *= LAGRANGE_SCALE[node_j]
            grad_y = float(0.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_j:
                    dy = coords[1] - LOBATTO_COORDS[k]
                    grad_y = grad_y * dy + x_part
                    x_part *= dy

        # --- derivative along coords[0] ---
        # y_part starts as the factor depending on coords[1] only
        if node_type == SquareSerendipityShapeFunctions.EDGE_X:
            y_part = wp.select(node_j == 0, coords[1], 1.0 - coords[1])
        else:
            y_part = LAGRANGE_SCALE[node_j]
            for k in range(ORDER_PLUS_ONE):
                if k != node_j:
                    y_part *= coords[1] - LOBATTO_COORDS[k]

        if node_type == SquareSerendipityShapeFunctions.EDGE_Y:
            # The coords[0] factor is linear, its derivative is +1 or -1
            grad_x = wp.select(node_i == 0, 1.0, -1.0) * y_part
        else:
            # Product rule accumulated term by term over the (coords[0] - LOBATTO_COORDS[k]) factors
            y_part *= LAGRANGE_SCALE[node_i]
            grad_x = float(0.0)
            for k in range(ORDER_PLUS_ONE):
                if k != node_i:
                    dx = coords[0] - LOBATTO_COORDS[k]
                    grad_x = grad_x * dx + y_part
                    y_part *= dx

        return wp.vec2(grad_x, grad_y)

    return element_inner_weight_gradient
477
+
478
def element_node_triangulation(self):
    """Return the triangles splitting one element along its nodes.

    Returns:
        A list of ``[a, b, c]`` triples of in-element node indices: six
        triangles when ``self.ORDER`` is 2, ten triangles otherwise.
    """
    if self.ORDER != 2:
        # Twelve-node layout (indices 0-11)
        return [
            [0, 4, 5],
            [2, 7, 8],
            [3, 10, 11],
            [1, 9, 6],
            [5, 6, 9],
            [5, 4, 6],
            [8, 11, 10],
            [8, 7, 11],
            [4, 8, 10],
            [4, 10, 6],
        ]

    # Eight-node layout (indices 0-7)
    return [
        [0, 4, 5],
        [5, 4, 6],
        [5, 6, 1],
        [4, 2, 7],
        [4, 7, 6],
        [6, 7, 3],
    ]
503
+
504
+
505
class SquareNonConformingPolynomialShapeFunctions:
    """Shape functions on the reference square built from an embedded triangle.

    The class-level constants describe the affine map from triangle parameters
    to square coordinates: multiply by ``_tri_to_square`` and add ``_TRI_OFFSET``.
    """

    # Embeds the largest equilateral triangle centered at (0.5, 0.5) into the reference square
    _tri_height = 0.75
    _tri_side = 2.0 / math.sqrt(3.0) * _tri_height

    # Linear part of the map from triangle parameters to square coordinates
    _tri_to_square = np.array(
        [
            [_tri_side, _tri_side / 2.0],
            [0.0, _tri_height],
        ]
    )

    # Translation part of the map: square position of the triangle parameter origin
    _TRI_OFFSET = wp.constant(wp.vec2(0.5 - 0.5 * _tri_side, 0.5 - _tri_height / 3.0))
512
+
513
def __init__(self, degree: int):
    """Wrap triangle polynomial shape functions of the requested degree.

    Args:
        degree: forwarded to ``Triangle2DPolynomialShapeFunctions``.
    """
    tri_shape = Triangle2DPolynomialShapeFunctions(degree=degree)
    self._tri_shape = tri_shape

    # Order and node count are taken as-is from the wrapped triangle shape
    self.ORDER = tri_shape.ORDER
    self.NODES_PER_ELEMENT = tri_shape.NODES_PER_ELEMENT

    # The node triangulation is delegated to the wrapped triangle shape
    self.element_node_triangulation = tri_shape.element_node_triangulation
519
+
520
@property
def name(self) -> str:
    """Identifier of this shape function set, built from ``self.ORDER``."""
    return f"Square_P{self.ORDER}d"
523
+
524
def make_node_coords_in_element(self):
    """Create the function giving the position of a node inside the reference square.

    Returns:
        The function produced by ``cache.dynamic_func`` (suffixed with
        ``self.name``). It takes ``node_index_in_elt`` and returns ``Coords``
        whose first two components are the node position in the square and
        whose third component is 0.
    """
    tri_node_coords = self._tri_shape.make_node_coords_in_element()

    TRI_TO_SQUARE = wp.constant(wp.mat22(self._tri_to_square))

    @cache.dynamic_func(suffix=self.name)
    def node_coords_in_element(
        node_index_in_elt: int,
    ):
        # Components 1 and 2 of the triangle coordinates are used as the two triangle parameters
        bary = tri_node_coords(node_index_in_elt)
        tri_param = wp.vec2(bary[1], bary[2])

        # Affine map from triangle parameters to the square
        square_pos = (TRI_TO_SQUARE * tri_param) + SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
        return Coords(square_pos[0], square_pos[1], 0.0)

    return node_coords_in_element
540
+
541
def make_node_quadrature_weight(self):
    """Create the function giving the quadrature weight attached to a node.

    Returns:
        For ``self.ORDER == 2``, a function returning one constant for vertex
        nodes of the wrapped triangle shape and another for all other nodes.
        For any other order, a function returning the same weight
        ``1 / NODES_PER_ELEMENT`` for every node.
    """
    if self.ORDER != 2:
        NODES_PER_ELEMENT = self.NODES_PER_ELEMENT

        @cache.dynamic_func(suffix=self.name)
        def node_uniform_quadrature_weight(
            node_index_in_elt: int,
        ):
            return 1.0 / float(NODES_PER_ELEMENT)

        return node_uniform_quadrature_weight

    # Intrinsic quadrature (order 2)
    @cache.dynamic_func(suffix=self.name)
    def node_quadrature_weight_quadratic(
        node_index_in_elt: int,
    ):
        node_type, type_index = self._tri_shape.node_type_and_type_index(node_index_in_elt)

        # The two literals are close to 5/27 (vertices) and 4/27 (other nodes)
        if node_type == Triangle2DPolynomialShapeFunctions.VERTEX:
            return 0.18518521
        return 0.14814811

    return node_quadrature_weight_quadratic
564
+
565
def make_trace_node_quadrature_weight(self):
    """Create the function giving the quadrature weight of a node on the element sides.

    Returns:
        A ``wp.func`` that ignores ``node_index_in_elt`` and always returns 0.0.
    """

    # Non-conforming, zero measure on sides
    @wp.func
    def zero(node_index_in_elt: int):
        return 0.0

    return zero
573
+
574
def make_element_inner_weight(self):
    """Create the function evaluating a node's weight at a point of the reference square.

    Returns:
        The function produced by ``cache.dynamic_func`` (suffixed with
        ``self.name``). It maps the square coordinates ``coords`` back to
        triangle coordinates and evaluates the wrapped triangle shape's weight
        for ``node_index_in_elt`` there.
    """
    tri_weight = self._tri_shape.make_element_inner_weight()

    # Inverse of the linear part of the triangle-to-square map
    SQUARE_TO_TRI = wp.constant(wp.mat22(np.linalg.inv(self._tri_to_square)))

    @cache.dynamic_func(suffix=self.name)
    def element_inner_weight(
        coords: Coords,
        node_index_in_elt: int,
    ):
        # Undo the translation, then the linear part of the embedding
        shifted = wp.vec2(coords[0], coords[1]) - SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
        uv = SQUARE_TO_TRI * shifted

        # First component is the complement so that the three components sum to 1
        bary = Coords(1.0 - uv[0] - uv[1], uv[0], uv[1])
        return tri_weight(bary, node_index_in_elt)

    return element_inner_weight
592
+
593
def make_element_inner_weight_gradient(self):
    """Create the function evaluating the gradient of a node's weight in the reference square.

    Returns:
        The function produced by ``cache.dynamic_func`` (suffixed with
        ``self.name``). It maps the square coordinates ``coords`` back to
        triangle coordinates, evaluates the wrapped triangle shape's gradient
        for ``node_index_in_elt`` there, and multiplies it by the transpose of
        the square-to-triangle matrix.
    """
    tri_weight_gradient = self._tri_shape.make_element_inner_weight_gradient()

    # Inverse of the linear part of the triangle-to-square map
    SQUARE_TO_TRI = wp.constant(wp.mat22(np.linalg.inv(self._tri_to_square)))

    @cache.dynamic_func(suffix=self.name)
    def element_inner_weight_gradient(
        coords: Coords,
        node_index_in_elt: int,
    ):
        # Undo the translation, then the linear part of the embedding
        shifted = wp.vec2(coords[0], coords[1]) - SquareNonConformingPolynomialShapeFunctions._TRI_OFFSET
        uv = SQUARE_TO_TRI * shifted

        # First component is the complement so that the three components sum to 1
        bary = Coords(1.0 - uv[0] - uv[1], uv[0], uv[1])

        # Chain rule: the triangle-space gradient is pulled back through the linear map
        tri_grad = tri_weight_gradient(bary, node_index_in_elt)
        return wp.transpose(SQUARE_TO_TRI) * tri_grad

    return element_inner_weight_gradient