ngsolve 6.2.2501.post16.dev1__cp313-cp313-macosx_10_15_universal2.whl → 6.2.2501.post34.dev1__cp313-cp313-macosx_10_15_universal2.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of ngsolve might be problematic. Click here for more details.

Files changed (286) hide show
  1. ngsolve/webgui.py +1 -1
  2. {ngsolve-6.2.2501.post16.dev1.dist-info → ngsolve-6.2.2501.post34.dev1.dist-info}/METADATA +2 -2
  3. ngsolve-6.2.2501.post34.dev1.dist-info/RECORD +25 -0
  4. netgen/include/arnoldi.hpp +0 -55
  5. netgen/include/bandmatrix.hpp +0 -334
  6. netgen/include/basematrix.hpp +0 -957
  7. netgen/include/basevector.hpp +0 -1268
  8. netgen/include/bdbequations.hpp +0 -2752
  9. netgen/include/bdbintegrator.hpp +0 -1659
  10. netgen/include/bessel.hpp +0 -1064
  11. netgen/include/bilinearform.hpp +0 -963
  12. netgen/include/bla.hpp +0 -29
  13. netgen/include/blockalloc.hpp +0 -95
  14. netgen/include/blockjacobi.hpp +0 -316
  15. netgen/include/bspline.hpp +0 -114
  16. netgen/include/calcinverse.hpp +0 -141
  17. netgen/include/cg.hpp +0 -368
  18. netgen/include/chebyshev.hpp +0 -44
  19. netgen/include/cholesky.hpp +0 -720
  20. netgen/include/clapack.h +0 -7254
  21. netgen/include/code_generation.hpp +0 -296
  22. netgen/include/coefficient.hpp +0 -2006
  23. netgen/include/coefficient_impl.hpp +0 -18
  24. netgen/include/coefficient_stdmath.hpp +0 -157
  25. netgen/include/commutingAMG.hpp +0 -106
  26. netgen/include/comp.hpp +0 -79
  27. netgen/include/compatibility.hpp +0 -41
  28. netgen/include/complex_wrapper.hpp +0 -73
  29. netgen/include/compressedfespace.hpp +0 -110
  30. netgen/include/contact.hpp +0 -231
  31. netgen/include/diagonalmatrix.hpp +0 -154
  32. netgen/include/differentialoperator.hpp +0 -276
  33. netgen/include/diffop.hpp +0 -1286
  34. netgen/include/diffop_impl.hpp +0 -326
  35. netgen/include/discontinuous.hpp +0 -84
  36. netgen/include/dump.hpp +0 -949
  37. netgen/include/eigen.hpp +0 -60
  38. netgen/include/eigensystem.hpp +0 -18
  39. netgen/include/elasticity_equations.hpp +0 -595
  40. netgen/include/elementbyelement.hpp +0 -195
  41. netgen/include/elementtopology.hpp +0 -1760
  42. netgen/include/elementtransformation.hpp +0 -339
  43. netgen/include/evalfunc.hpp +0 -405
  44. netgen/include/expr.hpp +0 -1655
  45. netgen/include/facetfe.hpp +0 -175
  46. netgen/include/facetfespace.hpp +0 -178
  47. netgen/include/facethofe.hpp +0 -111
  48. netgen/include/facetsurffespace.hpp +0 -112
  49. netgen/include/fe_interfaces.hpp +0 -32
  50. netgen/include/fem.hpp +0 -87
  51. netgen/include/fesconvert.hpp +0 -14
  52. netgen/include/fespace.hpp +0 -1445
  53. netgen/include/finiteelement.hpp +0 -286
  54. netgen/include/globalinterfacespace.hpp +0 -77
  55. netgen/include/globalspace.hpp +0 -115
  56. netgen/include/gridfunction.hpp +0 -525
  57. netgen/include/h1amg.hpp +0 -41
  58. netgen/include/h1hofe.hpp +0 -188
  59. netgen/include/h1hofe_impl.hpp +0 -1262
  60. netgen/include/h1hofefo.hpp +0 -148
  61. netgen/include/h1hofefo_impl.hpp +0 -185
  62. netgen/include/h1hofespace.hpp +0 -167
  63. netgen/include/h1lofe.hpp +0 -1237
  64. netgen/include/h1lumping.hpp +0 -35
  65. netgen/include/hcurl_equations.hpp +0 -1352
  66. netgen/include/hcurlcurlfe.hpp +0 -2221
  67. netgen/include/hcurlcurlfespace.hpp +0 -78
  68. netgen/include/hcurlfe.hpp +0 -259
  69. netgen/include/hcurlfe_utils.hpp +0 -107
  70. netgen/include/hcurlhdiv_dshape.hpp +0 -857
  71. netgen/include/hcurlhdivfes.hpp +0 -308
  72. netgen/include/hcurlhofe.hpp +0 -175
  73. netgen/include/hcurlhofe_impl.hpp +0 -1871
  74. netgen/include/hcurlhofespace.hpp +0 -193
  75. netgen/include/hcurllofe.hpp +0 -1146
  76. netgen/include/hdiv_equations.hpp +0 -865
  77. netgen/include/hdivdivfe.hpp +0 -2923
  78. netgen/include/hdivdivsurfacespace.hpp +0 -76
  79. netgen/include/hdivfe.hpp +0 -206
  80. netgen/include/hdivfe_utils.hpp +0 -716
  81. netgen/include/hdivfes.hpp +0 -75
  82. netgen/include/hdivhofe.hpp +0 -447
  83. netgen/include/hdivhofe_impl.hpp +0 -1107
  84. netgen/include/hdivhofefo.hpp +0 -229
  85. netgen/include/hdivhofespace.hpp +0 -175
  86. netgen/include/hdivhosurfacefespace.hpp +0 -106
  87. netgen/include/hdivlofe.hpp +0 -773
  88. netgen/include/hidden.hpp +0 -74
  89. netgen/include/householder.hpp +0 -181
  90. netgen/include/hypre_ams_precond.hpp +0 -123
  91. netgen/include/hypre_precond.hpp +0 -73
  92. netgen/include/integrator.hpp +0 -2024
  93. netgen/include/integratorcf.hpp +0 -253
  94. netgen/include/interpolate.hpp +0 -49
  95. netgen/include/intrule.hpp +0 -2541
  96. netgen/include/irspace.hpp +0 -49
  97. netgen/include/jacobi.hpp +0 -136
  98. netgen/include/l2hofe.hpp +0 -193
  99. netgen/include/l2hofe_impl.hpp +0 -564
  100. netgen/include/l2hofefo.hpp +0 -542
  101. netgen/include/l2hofespace.hpp +0 -344
  102. netgen/include/la.hpp +0 -38
  103. netgen/include/linearform.hpp +0 -266
  104. netgen/include/matrix.hpp +0 -2140
  105. netgen/include/memusage.hpp +0 -41
  106. netgen/include/meshaccess.hpp +0 -1358
  107. netgen/include/mgpre.hpp +0 -204
  108. netgen/include/mptools.hpp +0 -2145
  109. netgen/include/multigrid.hpp +0 -42
  110. netgen/include/multivector.hpp +0 -447
  111. netgen/include/mumpsinverse.hpp +0 -187
  112. netgen/include/mycomplex.hpp +0 -361
  113. netgen/include/ng_lapack.hpp +0 -1661
  114. netgen/include/ngblas.hpp +0 -1099
  115. netgen/include/ngs_defines.hpp +0 -30
  116. netgen/include/ngs_stdcpp_include.hpp +0 -106
  117. netgen/include/ngs_utils.hpp +0 -121
  118. netgen/include/ngsobject.hpp +0 -1019
  119. netgen/include/ngsstream.hpp +0 -113
  120. netgen/include/ngstd.hpp +0 -72
  121. netgen/include/nodalhofe.hpp +0 -96
  122. netgen/include/nodalhofe_impl.hpp +0 -141
  123. netgen/include/normalfacetfe.hpp +0 -223
  124. netgen/include/normalfacetfespace.hpp +0 -98
  125. netgen/include/normalfacetsurfacefespace.hpp +0 -84
  126. netgen/include/order.hpp +0 -251
  127. netgen/include/parallel_matrices.hpp +0 -222
  128. netgen/include/paralleldofs.hpp +0 -340
  129. netgen/include/parallelngs.hpp +0 -23
  130. netgen/include/parallelvector.hpp +0 -269
  131. netgen/include/pardisoinverse.hpp +0 -200
  132. netgen/include/periodic.hpp +0 -125
  133. netgen/include/plateaufespace.hpp +0 -25
  134. netgen/include/pml.hpp +0 -275
  135. netgen/include/pmltrafo.hpp +0 -631
  136. netgen/include/postproc.hpp +0 -142
  137. netgen/include/precomp.hpp +0 -60
  138. netgen/include/preconditioner.hpp +0 -602
  139. netgen/include/prolongation.hpp +0 -235
  140. netgen/include/python_comp.hpp +0 -107
  141. netgen/include/python_fem.hpp +0 -89
  142. netgen/include/python_linalg.hpp +0 -58
  143. netgen/include/python_ngstd.hpp +0 -385
  144. netgen/include/recursive_pol.hpp +0 -4844
  145. netgen/include/recursive_pol_tet.hpp +0 -395
  146. netgen/include/recursive_pol_trig.hpp +0 -492
  147. netgen/include/reorderedfespace.hpp +0 -81
  148. netgen/include/sample_sort.hpp +0 -105
  149. netgen/include/scalarfe.hpp +0 -335
  150. netgen/include/shapefunction_utils.hpp +0 -113
  151. netgen/include/simd_complex.hpp +0 -284
  152. netgen/include/smoother.hpp +0 -253
  153. netgen/include/solve.hpp +0 -89
  154. netgen/include/sparsecholesky.hpp +0 -313
  155. netgen/include/sparsematrix.hpp +0 -1038
  156. netgen/include/sparsematrix_dyn.hpp +0 -91
  157. netgen/include/sparsematrix_impl.hpp +0 -920
  158. netgen/include/special_matrix.hpp +0 -461
  159. netgen/include/specialelement.hpp +0 -125
  160. netgen/include/statushandler.hpp +0 -33
  161. netgen/include/stringops.hpp +0 -12
  162. netgen/include/superluinverse.hpp +0 -136
  163. netgen/include/symbolicintegrator.hpp +0 -849
  164. netgen/include/symmetricmatrix.hpp +0 -144
  165. netgen/include/tangentialfacetfe.hpp +0 -224
  166. netgen/include/tangentialfacetfespace.hpp +0 -106
  167. netgen/include/tensor.hpp +0 -522
  168. netgen/include/tensorcoefficient.hpp +0 -446
  169. netgen/include/tensorproductintegrator.hpp +0 -113
  170. netgen/include/thcurlfe.hpp +0 -128
  171. netgen/include/thcurlfe_impl.hpp +0 -380
  172. netgen/include/thdivfe.hpp +0 -80
  173. netgen/include/thdivfe_impl.hpp +0 -426
  174. netgen/include/tpdiffop.hpp +0 -461
  175. netgen/include/tpfes.hpp +0 -133
  176. netgen/include/tpintrule.hpp +0 -224
  177. netgen/include/triangular.hpp +0 -465
  178. netgen/include/tscalarfe.hpp +0 -245
  179. netgen/include/tscalarfe_impl.hpp +0 -1029
  180. netgen/include/umfpackinverse.hpp +0 -148
  181. netgen/include/vector.hpp +0 -1219
  182. netgen/include/voxelcoefficientfunction.hpp +0 -41
  183. netgen/include/vtkoutput.hpp +0 -198
  184. netgen/include/vvector.hpp +0 -208
  185. netgen/include/webgui.hpp +0 -92
  186. netgen/libngbla.dylib +0 -0
  187. netgen/libngcomp.dylib +0 -0
  188. netgen/libngfem.dylib +0 -0
  189. netgen/libngla.dylib +0 -0
  190. netgen/libngsolve.dylib +0 -0
  191. netgen/libngstd.dylib +0 -0
  192. ngsolve/__init__.pyi +0 -231
  193. ngsolve/bla.pyi +0 -1139
  194. ngsolve/bvp.pyi +0 -32
  195. ngsolve/cmake/NGSolveConfig.cmake +0 -102
  196. ngsolve/cmake/ngsolve-targets-release.cmake +0 -69
  197. ngsolve/cmake/ngsolve-targets.cmake +0 -163
  198. ngsolve/comp/__init__.pyi +0 -5382
  199. ngsolve/comp/pml.pyi +0 -89
  200. ngsolve/config/__init__.py +0 -1
  201. ngsolve/config/__init__.pyi +0 -43
  202. ngsolve/config/__main__.py +0 -4
  203. ngsolve/config/config.py +0 -60
  204. ngsolve/config/config.pyi +0 -45
  205. ngsolve/demos/TensorProduct/__init__.py +0 -0
  206. ngsolve/demos/TensorProduct/tp_dg_1d_1d.py +0 -80
  207. ngsolve/demos/TensorProduct/tp_dg_1d_2d.py +0 -73
  208. ngsolve/demos/TensorProduct/tp_dg_2d_1d.py +0 -72
  209. ngsolve/demos/TensorProduct/tp_dg_2d_2d.py +0 -66
  210. ngsolve/demos/__init__.py +0 -0
  211. ngsolve/demos/howto/__init__.py +0 -0
  212. ngsolve/demos/howto/hhj.py +0 -44
  213. ngsolve/demos/howto/hybrid_dg.py +0 -53
  214. ngsolve/demos/howto/mixed.py +0 -30
  215. ngsolve/demos/howto/nonlin.py +0 -29
  216. ngsolve/demos/howto/pickling.py +0 -26
  217. ngsolve/demos/howto/pml.py +0 -31
  218. ngsolve/demos/howto/taskmanager.py +0 -20
  219. ngsolve/demos/howto/tdnns.py +0 -47
  220. ngsolve/demos/howto/timeDG-skeleton.py +0 -45
  221. ngsolve/demos/howto/timeDG.py +0 -38
  222. ngsolve/demos/howto/timeDGlap.py +0 -42
  223. ngsolve/demos/howto/timeDGwave.py +0 -61
  224. ngsolve/demos/intro/__init__.py +0 -0
  225. ngsolve/demos/intro/adaptive.py +0 -123
  226. ngsolve/demos/intro/cmagnet.py +0 -62
  227. ngsolve/demos/intro/elasticity.py +0 -76
  228. ngsolve/demos/intro/navierstokes.py +0 -74
  229. ngsolve/demos/intro/poisson.ipynb +0 -170
  230. ngsolve/demos/intro/poisson.py +0 -41
  231. ngsolve/demos/mpi/__init__.py +0 -0
  232. ngsolve/demos/mpi/mpi_cmagnet.py +0 -87
  233. ngsolve/demos/mpi/mpi_navierstokes.py +0 -117
  234. ngsolve/demos/mpi/mpi_poisson.py +0 -89
  235. ngsolve/demos/mpi/mpi_timeDG.py +0 -82
  236. ngsolve/directsolvers.pyi +0 -18
  237. ngsolve/eigenvalues.pyi +0 -30
  238. ngsolve/fem.pyi +0 -1707
  239. ngsolve/krylovspace.pyi +0 -309
  240. ngsolve/la.pyi +0 -1218
  241. ngsolve/ngslib.so +0 -0
  242. ngsolve/ngstd.pyi +0 -58
  243. ngsolve/nonlinearsolvers.pyi +0 -98
  244. ngsolve/preconditioners.pyi +0 -6
  245. ngsolve/solve.pyi +0 -108
  246. ngsolve/solvers.pyi +0 -14
  247. ngsolve/timestepping.pyi +0 -34
  248. ngsolve/timing.pyi +0 -57
  249. ngsolve/utils.pyi +0 -279
  250. ngsolve-6.2.2501.post16.dev1.data/data/Netgen.icns +0 -0
  251. ngsolve-6.2.2501.post16.dev1.data/data/bin/ngscxx +0 -17
  252. ngsolve-6.2.2501.post16.dev1.data/data/bin/ngsld +0 -13
  253. ngsolve-6.2.2501.post16.dev1.data/data/bin/ngsolve.tcl +0 -648
  254. ngsolve-6.2.2501.post16.dev1.data/data/bin/ngspy +0 -2
  255. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/beam.geo +0 -17
  256. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/beam.vol +0 -240
  257. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/chip.in2d +0 -41
  258. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/chip.vol +0 -614
  259. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/coil.geo +0 -12
  260. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/coil.vol +0 -2560
  261. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/coilshield.geo +0 -24
  262. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/coilshield.vol +0 -3179
  263. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/cube.geo +0 -19
  264. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/cube.vol +0 -1832
  265. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d10_DGdoubleglazing.pde +0 -50
  266. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d11_chip_nitsche.pde +0 -40
  267. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d1_square.pde +0 -43
  268. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d2_chip.pde +0 -35
  269. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d3_helmholtz.pde +0 -22
  270. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d4_cube.pde +0 -46
  271. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d5_beam.pde +0 -74
  272. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d6_shaft.pde +0 -73
  273. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d7_coil.pde +0 -50
  274. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d8_coilshield.pde +0 -49
  275. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/d9_hybridDG.pde +0 -72
  276. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/doubleglazing.in2d +0 -27
  277. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/doubleglazing.vol +0 -737
  278. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/piezo2d40round4.vol.gz +0 -0
  279. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/shaft.geo +0 -73
  280. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/shaft.vol +0 -4291
  281. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/square.in2d +0 -17
  282. ngsolve-6.2.2501.post16.dev1.data/data/share/ngsolve/square.vol +0 -149
  283. ngsolve-6.2.2501.post16.dev1.dist-info/RECORD +0 -304
  284. {ngsolve-6.2.2501.post16.dev1.dist-info → ngsolve-6.2.2501.post34.dev1.dist-info}/LICENSE +0 -0
  285. {ngsolve-6.2.2501.post16.dev1.dist-info → ngsolve-6.2.2501.post34.dev1.dist-info}/WHEEL +0 -0
  286. {ngsolve-6.2.2501.post16.dev1.dist-info → ngsolve-6.2.2501.post34.dev1.dist-info}/top_level.txt +0 -0
@@ -1,857 +0,0 @@
1
- #ifndef FILE_HCURLHDIV_DSHAPE
2
- #define FILE_HCURLHDIV_DSHAPE
3
-
4
-
5
- #include "finiteelement.hpp"
6
- #include "diffop.hpp"
7
-
8
- namespace ngfem
9
- {
10
-
11
- /** calculates [du1/dx1 du2/dx1 (du3/dx1) du1/dx2 du2/dx2 (du3/dx2) (du1/dx3 du2/dx3 du3/dx3)] */
12
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS>
13
- void CalcDShapeFE(const FEL & fel, const MappedIntegrationPoint<DIM,DIMSPACE>& mip,
14
- BareSliceMatrix<> bmatu, LocalHeap& lh, double eps = 1e-4)
15
- {
16
- HeapReset hr(lh);
17
- // bmatu = 0;
18
- // evaluate dshape by numerical diff
19
- //fel, eltrans, mip, returnval, lh
20
- int nd_u = fel.GetNDof();
21
- const IntegrationPoint& ip = mip.IP();//volume_ir[i];
22
- const ElementTransformation & eltrans = mip.GetTransformation();
23
- FlatMatrixFixWidth<DIM_STRESS> shape_ul(nd_u, lh);
24
- FlatMatrixFixWidth<DIM_STRESS> shape_ur(nd_u, lh);
25
- FlatMatrixFixWidth<DIM_STRESS> shape_ull(nd_u, lh);
26
- FlatMatrixFixWidth<DIM_STRESS> shape_urr(nd_u, lh);
27
- FlatMatrixFixWidth<DIM_STRESS> dshape_u_ref(nd_u, lh);//(shape_ur); ///saves "reserved lh-memory"
28
-
29
- FlatMatrixFixWidth<DIM> dshape_u_ref_comp(nd_u, lh);
30
- FlatMatrixFixWidth<DIMSPACE> dshape_u(nd_u, lh);//(shape_ul);///saves "reserved lh-memory"
31
-
32
- for (int j = 0; j < DIM; j++) // d / dxj
33
- {
34
- IntegrationPoint ipl(ip);
35
- ipl(j) -= eps;
36
- IntegrationPoint ipr(ip);
37
- ipr(j) += eps;
38
- IntegrationPoint ipll(ip);
39
- ipll(j) -= 2*eps;
40
- IntegrationPoint iprr(ip);
41
- iprr(j) += 2*eps;
42
-
43
- MappedIntegrationPoint<DIM,DIMSPACE> mipl(ipl, eltrans);
44
- MappedIntegrationPoint<DIM,DIMSPACE> mipr(ipr, eltrans);
45
- MappedIntegrationPoint<DIM,DIMSPACE> mipll(ipll, eltrans);
46
- MappedIntegrationPoint<DIM,DIMSPACE> miprr(iprr, eltrans);
47
-
48
- fel.CalcMappedShape (mipl, shape_ul);
49
- fel.CalcMappedShape (mipr, shape_ur);
50
- fel.CalcMappedShape (mipll, shape_ull);
51
- fel.CalcMappedShape (miprr, shape_urr);
52
-
53
- dshape_u_ref = (1.0/(12.0*eps)) * (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
54
- for (int l = 0; l < DIM_STRESS; l++)
55
- bmatu.Col(j*DIM_STRESS+l) = dshape_u_ref.Col(l);
56
- }
57
-
58
- for (int j = 0; j < DIM_STRESS; j++)
59
- {
60
- for (int k = 0; k < nd_u; k++)
61
- for (int l = 0; l < DIM; l++)
62
- dshape_u_ref_comp(k,l) = bmatu(k, l*DIM_STRESS+j);
63
-
64
- dshape_u = dshape_u_ref_comp * mip.GetJacobianInverse();
65
-
66
- for (int k = 0; k < nd_u; k++)
67
- for (int l = 0; l < DIMSPACE; l++)
68
- bmatu(k, l*DIM_STRESS+j) = dshape_u(k,l);
69
- }
70
- }
71
-
72
-
73
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS, class TVX, class TVY>
74
- void ApplyDShapeFE(const FEL & fel, const MappedIntegrationPoint<DIM,DIMSPACE>& mip, const TVX & x, TVY & y, LocalHeap& lh, double eps = 1e-4)
75
- {
76
- const IntegrationPoint& ip = mip.IP();
77
- const ElementTransformation & eltrans = mip.GetTransformation();
78
- Mat<DIM_STRESS,1> shape_ul;
79
- Mat<DIM_STRESS,1> shape_ur;
80
- Mat<DIM_STRESS,1> shape_ull;
81
- Mat<DIM_STRESS,1> shape_urr;
82
- Mat<DIM_STRESS,1> dshape_u_ref;
83
-
84
- Vec<DIM> dshape_u_ref_comp;
85
- Vec<DIMSPACE> dshape_u;
86
-
87
- for (int j = 0; j < DIM; j++) // d / dxj
88
- {
89
- IntegrationPoint ipl(ip);
90
- ipl(j) -= eps;
91
- IntegrationPoint ipr(ip);
92
- ipr(j) += eps;
93
- IntegrationPoint ipll(ip);
94
- ipll(j) -= 2*eps;
95
- IntegrationPoint iprr(ip);
96
- iprr(j) += 2*eps;
97
-
98
- MappedIntegrationPoint<DIM,DIMSPACE> mipl(ipl, eltrans);
99
- MappedIntegrationPoint<DIM,DIMSPACE> mipr(ipr, eltrans);
100
- MappedIntegrationPoint<DIM,DIMSPACE> mipll(ipll, eltrans);
101
- MappedIntegrationPoint<DIM,DIMSPACE> miprr(iprr, eltrans);
102
-
103
- fel.EvaluateMappedShape (mipl, x, shape_ul);
104
- fel.EvaluateMappedShape (mipr, x, shape_ur);
105
- fel.EvaluateMappedShape (mipll, x, shape_ull);
106
- fel.EvaluateMappedShape (miprr, x, shape_urr);
107
-
108
- dshape_u_ref = (1.0/(12.0*eps)) * (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
109
-
110
- for (int l = 0; l < DIM_STRESS; l++)
111
- y(j*DIM_STRESS+l) = dshape_u_ref(l);
112
- }
113
-
114
- for (int j = 0; j < DIM_STRESS; j++)
115
- {
116
- for (int l = 0; l < DIM; l++)
117
- dshape_u_ref_comp(l) = y(l*DIM_STRESS+j);
118
-
119
- dshape_u = Trans(mip.GetJacobianInverse()) * dshape_u_ref_comp;
120
-
121
- for (int l = 0; l < DIMSPACE; l++)
122
- y(l*DIM_STRESS+j) = dshape_u(l);
123
- }
124
- }
125
-
126
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS, class TVX, class TVY>
127
- void ApplyTransDShapeFE(const FEL & fel_u, const MappedIntegrationPoint<DIM,DIMSPACE>& mip, const TVX & x, TVY & by, LocalHeap & lh, double eps = 1e-4)
128
- {
129
- typedef typename TVX::TSCAL TSCALX;
130
-
131
- HeapReset hr(lh);
132
- int nd_u = fel_u.GetNDof();
133
- FlatMatrixFixWidth<DIM_STRESS*DIMSPACE> bmatu(nd_u,lh);
134
-
135
- auto y = by.Range(0, nd_u);
136
- const IntegrationPoint& ip = mip.IP();
137
- const ElementTransformation & eltrans = mip.GetTransformation();
138
- FlatMatrixFixWidth<DIM_STRESS> shape_ul(nd_u, lh);
139
- FlatMatrixFixWidth<DIM_STRESS> shape_ur(nd_u, lh);
140
- FlatMatrixFixWidth<DIM_STRESS> shape_ull(nd_u, lh);
141
- FlatMatrixFixWidth<DIM_STRESS> shape_urr(nd_u, lh);
142
- FlatMatrixFixWidth<DIM_STRESS> dshape_u_ref(nd_u, lh);
143
- FlatMatrixFixWidth<DIM_STRESS> dshape_u(nd_u, lh);
144
-
145
- FlatMatrix<TSCALX> hx(DIMSPACE,DIM_STRESS,&x(0));
146
- Mat<DIM,DIM_STRESS,TSCALX> tx = mip.GetJacobianInverse() * hx;
147
-
148
- y = 0;
149
- for (int j = 0; j < DIM; j++) // d / dxj
150
- {
151
- IntegrationPoint ipts[4];
152
-
153
- ipts[0] = ip;
154
- ipts[0](j) -= eps;
155
- ipts[1] = ip;
156
- ipts[1](j) += eps;
157
- ipts[2] = ip;
158
- ipts[2](j) -= 2*eps;
159
- ipts[3] = ip;
160
- ipts[3](j) += 2*eps;
161
-
162
- IntegrationRule ir(4, ipts);
163
- MappedIntegrationRule<DIM,DIMSPACE> mirl(ir, eltrans, lh);
164
-
165
- fel_u.CalcMappedShape (mirl[0], shape_ul);
166
- fel_u.CalcMappedShape (mirl[1], shape_ur);
167
- fel_u.CalcMappedShape (mirl[2], shape_ull);
168
- fel_u.CalcMappedShape (mirl[3], shape_urr);
169
-
170
- dshape_u_ref = (1.0/(12.0*eps)) * (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
171
- y += dshape_u_ref * tx.Row(j);
172
- }
173
- }
174
-
175
-
176
-
177
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS>
178
- void CalcSIMDDShapeFE(const FEL & fel, const SIMD_MappedIntegrationRule<DIM,DIMSPACE>& mir, BareSliceMatrix<SIMD<double>> mat, double eps = 1e-4)
179
- {
180
- size_t nd_u = fel.GetNDof();
181
-
182
- STACK_ARRAY(SIMD<double>, mem1, 2*DIM_STRESS*nd_u);
183
- FlatMatrix<SIMD<double>> shape_u_tmp(nd_u*DIM_STRESS, 1, &mem1[0]);
184
-
185
- FlatMatrix<SIMD<double>> dshape_u_ref(nd_u*DIM_STRESS, 1, &mem1[DIM_STRESS*nd_u]);
186
-
187
- LocalHeapMem<10000> lh("diffopgrad-lh");
188
-
189
- auto & ir = mir.IR();
190
- for (size_t i = 0; i < mir.Size(); i++)
191
- {
192
- const SIMD<IntegrationPoint> & ip = ir[i];
193
- const ElementTransformation & eltrans = mir[i].GetTransformation();
194
-
195
- for (int j = 0; j < DIM; j++) // d / dxj
196
- {
197
- HeapReset hr(lh);
198
- SIMD<IntegrationPoint> ipts[4];
199
- ipts[0] = ip;
200
- ipts[0](j) -= eps;
201
- ipts[1] = ip;
202
- ipts[1](j) += eps;
203
- ipts[2] = ip;
204
- ipts[2](j) -= 2*eps;
205
- ipts[3] = ip;
206
- ipts[3](j) += 2*eps;
207
-
208
- SIMD_IntegrationRule ir(4, ipts);
209
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirl(ir, eltrans, lh);
210
-
211
- fel.CalcMappedShape (mirl[2], shape_u_tmp);
212
- dshape_u_ref = 1.0/(12.0*eps) * shape_u_tmp;
213
- fel.CalcMappedShape (mirl[3], shape_u_tmp);
214
- dshape_u_ref -= 1.0/(12.0*eps) * shape_u_tmp;
215
- fel.CalcMappedShape (mirl[0], shape_u_tmp);
216
- dshape_u_ref -= 8.0/(12.0*eps) * shape_u_tmp;
217
- fel.CalcMappedShape (mirl[1], shape_u_tmp);
218
- dshape_u_ref += 8.0/(12.0*eps) * shape_u_tmp;
219
-
220
- // dshape_u_ref = (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
221
- for (size_t l = 0; l < DIM_STRESS; l++)
222
- for (size_t k = 0; k < nd_u; k++)
223
- mat(k*DIM_STRESS*DIM+j*DIM_STRESS+l, i) = dshape_u_ref(k*DIM_STRESS+l, 0);
224
- }
225
-
226
- for (size_t j = 0; j < DIM_STRESS; j++)
227
- for (size_t k = 0; k < nd_u; k++)
228
- {
229
- Vec<DIM,SIMD<double>> dshape_u_ref, dshape_u;
230
- for (size_t l = 0; l < DIM; l++)
231
- dshape_u_ref(l) = mat(k*DIM_STRESS*DIM+l*DIM+j, i);
232
-
233
- dshape_u = Trans(mir[i].GetJacobianInverse()) * dshape_u_ref;
234
-
235
- for (size_t l = 0; l < DIMSPACE; l++)
236
- mat(k*DIM_STRESS*DIMSPACE+l*DIM_STRESS+j, i) = dshape_u(l);
237
- }
238
- }
239
- }
240
-
241
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS>
242
- void ApplySIMDDShapeFE (const FEL & fel_u, const SIMD_BaseMappedIntegrationRule & bmir,
243
- BareSliceVector<double> x, BareSliceMatrix<SIMD<double>> y, double eps = 1e-4)
244
- {
245
- constexpr size_t BS = 64; // number of simd-points
246
- size_t maxnp = min2(BS, bmir.Size());
247
- size_t size = (maxnp+1)*SIMD<double>::Size()*500 + 5*DIM_STRESS*BS*sizeof(SIMD<double>);
248
- STACK_ARRAY(char, data, size);
249
- LocalHeap lh(data, size);
250
-
251
- auto & mir = static_cast<const SIMD_MappedIntegrationRule<DIM,DIMSPACE>&> (bmir);
252
- auto & ir = mir.IR();
253
- const ElementTransformation & trafo = mir.GetTransformation();
254
-
255
- for (int k = 0; k < mir.Size(); k++)
256
- for (int m = 0; m < DIM_STRESS*DIMSPACE; m++)
257
- y(m, k) = SIMD<double> (0.0);
258
-
259
- for (size_t base = 0; base < ir.Size(); base += BS)
260
- {
261
- HeapReset hr(lh);
262
- size_t num = min2(BS, ir.Size()-base);
263
-
264
- FlatMatrix<SIMD<double>> hxl(DIM_STRESS, num, lh);
265
- FlatMatrix<SIMD<double>> hxr(DIM_STRESS, num, lh);
266
- FlatMatrix<SIMD<double>> hxll(DIM_STRESS, num, lh);
267
- FlatMatrix<SIMD<double>> hxrr(DIM_STRESS, num, lh);
268
- FlatMatrix<SIMD<double>> hx(DIM_STRESS, num, lh);
269
-
270
- for (int j = 0; j < DIM; j++)
271
- {
272
- // hx = (F^-1 * x).Row(j)
273
- {
274
- HeapReset hr(lh);
275
- SIMD_IntegrationRule irl(num*SIMD<double>::Size(), lh);
276
- for (int k = 0; k < irl.Size(); k++)
277
- {
278
- irl[k] = ir[base+k];
279
- irl[k](j) -= eps;
280
- }
281
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirl(irl, trafo, lh);
282
- fel_u.Evaluate (mirl, x, hxl);
283
- }
284
- {
285
- HeapReset hr(lh);
286
- SIMD_IntegrationRule irr(num*SIMD<double>::Size(), lh);
287
- for (int k = 0; k < irr.Size(); k++)
288
- {
289
- irr[k] = ir[base+k];
290
- irr[k](j) += eps;
291
- }
292
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirr(irr, trafo, lh);
293
- fel_u.Evaluate (mirr, x, hxr);
294
- }
295
- {
296
- HeapReset hr(lh);
297
- SIMD_IntegrationRule irll(num*SIMD<double>::Size(), lh);
298
- for (int k = 0; k < irll.Size(); k++)
299
- {
300
- irll[k] = ir[base+k];
301
- irll[k](j) -= 2*eps;
302
- }
303
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirll(irll, trafo, lh);
304
- fel_u.Evaluate (mirll, x, hxll);
305
- }
306
- {
307
- HeapReset hr(lh);
308
- SIMD_IntegrationRule irrr(num*SIMD<double>::Size(), lh);
309
- for (int k = 0; k < irrr.Size(); k++)
310
- {
311
- irrr[k] = ir[base+k];
312
- irrr[k](j) += 2*eps;
313
- }
314
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirrr(irrr, trafo, lh);
315
- fel_u.Evaluate (mirrr, x, hxrr);
316
- }
317
- // hx = 1.0/(2*eps) * (hxr-hxl);
318
- hx = 1.0/(12*eps) * (8*hxr-8*hxl-hxrr+hxll);
319
- for (int k = 0; k < num; k++)
320
- {
321
- auto jacinv = mir[base+k].GetJacobianInverse();
322
- for (int l = 0; l < DIM_STRESS; l++)
323
- {
324
- for (int m = 0; m < DIMSPACE; m++)
325
- y(m*DIM_STRESS+l, base+k) += jacinv(j,m) * hx(l, k);
326
- }
327
- }
328
- }
329
- }
330
- }
331
-
332
-
333
-
334
-
335
- template<typename FEL, int DIMSPACE, int DIM, int DIM_STRESS>
336
- void AddTransSIMDDShapeFE (const FEL & fel_u, const SIMD_BaseMappedIntegrationRule & bmir,
337
- BareSliceMatrix<SIMD<double>> x, BareSliceVector<double> y, double eps = 1e-4)
338
- {
339
- constexpr size_t BS = 64; // number of simd-points
340
- size_t maxnp = min2(BS, bmir.Size());
341
- size_t size = (maxnp+1)*SIMD<double>::Size()*500;
342
-
343
- STACK_ARRAY(char, data, size);
344
- LocalHeap lh(data, size);
345
-
346
- auto & mir = static_cast<const SIMD_MappedIntegrationRule<DIM,DIMSPACE>&> (bmir);
347
- auto & ir = mir.IR();
348
- const ElementTransformation & trafo = mir.GetTransformation();
349
-
350
- for (size_t base = 0; base < ir.Size(); base += BS)
351
- {
352
- HeapReset hr(lh);
353
- size_t num = min2(BS, ir.Size()-base);
354
-
355
- FlatMatrix<SIMD<double>> hx1(DIM_STRESS, num, lh);
356
- FlatMatrix<SIMD<double>> hx2(DIM_STRESS, num, lh);
357
-
358
- for (size_t j = 0; j < DIM; j++)
359
- {
360
- // hx = (F^-1 * x).Row(j)
361
- for (size_t k = 0; k < num; k++)
362
- {
363
- auto jacinv = mir[base+k].GetJacobianInverse();
364
- for (int l = 0; l < DIM_STRESS; l++)
365
- {
366
- SIMD<double> sum = 0;
367
- for (int m = 0; m < DIMSPACE; m++)
368
- sum += jacinv(j,m) * x(m*DIM_STRESS+l, base+k);
369
-
370
- hx1(l,k) = (-(8/(12*eps)) * sum).Data();
371
- hx2(l,k) = ( (1/(12*eps)) * sum).Data();
372
- }
373
- }
374
-
375
- {
376
- HeapReset hr(lh);
377
- SIMD_IntegrationRule irl(num*SIMD<double>::Size(), lh);
378
- for (size_t k = 0; k < irl.Size(); k++)
379
- {
380
- irl[k] = ir[base+k];
381
- irl[k](j) -= eps;
382
- }
383
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirl(irl, trafo, lh);
384
- fel_u.AddTrans (mirl, hx1, y);
385
- irl.NothingToDelete();
386
- }
387
- {
388
- HeapReset hr(lh);
389
- hx1 *= -1;
390
- SIMD_IntegrationRule irr(num*SIMD<double>::Size(), lh);
391
- for (int k = 0; k < irr.Size(); k++)
392
- {
393
- irr[k] = ir[base+k];
394
- irr[k](j) += eps;
395
- }
396
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirr(irr, trafo, lh);
397
- fel_u.AddTrans (mirr, hx1, y);
398
- }
399
- {
400
- HeapReset hr(lh);
401
- SIMD_IntegrationRule irl(num*SIMD<double>::Size(), lh);
402
- for (int k = 0; k < irl.Size(); k++)
403
- {
404
- irl[k] = ir[base+k];
405
- irl[k](j) -= 2*eps;
406
- }
407
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirl(irl, trafo, lh);
408
- fel_u.AddTrans (mirl, hx2, y);
409
- }
410
- {
411
- HeapReset hr(lh);
412
- hx2 *= -1;
413
- SIMD_IntegrationRule irr(num*SIMD<double>::Size(), lh);
414
- for (int k = 0; k < irr.Size(); k++)
415
- {
416
- irr[k] = ir[base+k];
417
- irr[k](j) += 2*eps;
418
- }
419
- SIMD_MappedIntegrationRule<DIM,DIMSPACE> mirr(irr, trafo, lh);
420
- fel_u.AddTrans (mirr, hx2, y);
421
- }
422
- }
423
- }
424
- }
425
-
426
-
427
-
428
- template <typename ME, typename ORIG, typename FEL>
429
- class NumDiffGradient : public DiffOp<ME>
430
- {
431
- typedef DiffOp<ME> BASE;
432
- public:
433
/// Step width of the finite-difference stencils; added to / subtracted from
/// integration-point coordinates.
static constexpr double eps()
{
  return 1.0e-4;
}
434
-
435
- static constexpr int DIM = ORIG::DIM;
436
- static constexpr int DIM_SPACE = ORIG::DIM_SPACE;
437
- static constexpr int DIM_ELEMENT = ORIG::DIM_ELEMENT;
438
- static constexpr int DIM_DMAT = ORIG::DIM_DMAT*ORIG::DIM_SPACE;
439
- static constexpr int DIFFORDER = ORIG::DIFFORDER+1;
440
-
441
-
442
- template <typename AFEL, typename SIP, typename MAT,
443
- typename std::enable_if<!std::is_convertible<MAT,BareSliceMatrix<double,ColMajor>>::value, int>::type = 0>
444
- static void GenerateMatrix (const AFEL & fel, const SIP & sip,
445
- MAT & mat, LocalHeap & lh)
446
- {
447
- cout << "nicht gut" << endl;
448
- cout << "type(fel) = " << typeid(fel).name() << ", sip = " << typeid(sip).name()
449
- << ", mat = " << typeid(mat).name() << endl;
450
- }
451
-
452
-
453
- static int DimRef() { return DIM_DMAT + ORIG::DIM_DMAT; } // grad(u), u
454
-
455
- template <typename IP, typename MAT>
456
- static void GenerateMatrixRef (const FiniteElement & fel, const IP & ip,
457
- MAT && mat, LocalHeap & lh)
458
- {
459
- int nd_u = fel.GetNDof();
460
-
461
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ul(nd_u, lh);
462
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ur(nd_u, lh);
463
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ull(nd_u, lh);
464
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_urr(nd_u, lh);
465
- FlatMatrixFixWidth<ORIG::DIM_DMAT> dshape_u_ref(nd_u, lh);
466
-
467
- FlatMatrixFixWidth<DIM_ELEMENT> dshape_u_ref_comp(nd_u, lh);
468
- FlatMatrixFixWidth<DIM_SPACE> dshape_u(nd_u, lh);
469
-
470
- for (int j = 0; j < DIM_ELEMENT; j++) // d / dxj
471
- {
472
- IntegrationPoint ipl(ip);
473
- ipl(j) -= eps();
474
- IntegrationPoint ipr(ip);
475
- ipr(j) += eps();
476
- IntegrationPoint ipll(ip);
477
- ipll(j) -= 2*eps();
478
- IntegrationPoint iprr(ip);
479
- iprr(j) += 2*eps();
480
-
481
-
482
- ORIG::GenerateMatrixRef (fel, ipl, Trans(shape_ul), lh);
483
- ORIG::GenerateMatrixRef (fel, ipr, Trans(shape_ur), lh);
484
- ORIG::GenerateMatrixRef (fel, ipll, Trans(shape_ull), lh);
485
- ORIG::GenerateMatrixRef (fel, iprr, Trans(shape_urr), lh);
486
-
487
- dshape_u_ref = (1.0/(12.0*eps())) * (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
488
- for (int l = 0; l < ORIG::DIM_DMAT; l++)
489
- mat.Row(j*ORIG::DIM_DMAT+l) = dshape_u_ref.Col(l);
490
- }
491
-
492
- ORIG::GenerateMatrixRef (fel, ip, mat.Rows(DIM_DMAT, DIM_DMAT+ORIG::DIM_DMAT), lh);
493
- }
494
-
495
-
496
-
497
- template <typename MIP, typename MAT>
498
- static void CalcTransformationMatrix (const MIP & mip,
499
- MAT & mat, LocalHeap & lh)
500
- {
501
- auto matgrad = Trans(static_cast<const MappedIntegrationPoint<DIM_SPACE,DIM_SPACE>&>(mip).GetJacobianInverse());
502
- Mat<DIM_SPACE,DIM_SPACE> matshape;
503
- ORIG::CalcTransformationMatrix (mip, matshape, lh);
504
-
505
- // input: du0/dx0, du1/dx0, du2/dx0, d0/dx1, ....
506
- // output du0/dx0, du1/dx0, du2/dx0 ...
507
- for (int i = 0; i < DIM_SPACE; i++)
508
- for (int j = 0; j < DIM_SPACE; j++)
509
- for (int k = 0; k < DIM_SPACE; k++)
510
- for (int l = 0; l < DIM_SPACE; l++)
511
- mat(k*DIM_SPACE+i, l*DIM_SPACE+j) = matshape(i,j) * matgrad(k,l);
512
-
513
-
514
- // numerical diff of ORIG::CalcTransformationMatrix (mip, matshape, lh);
515
-
516
- for (int i = 0; i < DIM_SPACE; i++)
517
- for (int j = 0; j < DIM_SPACE; j++)
518
- for (int k = 0; k < DIM_SPACE; k++)
519
- mat(k*DIM_SPACE+i, DIM_SPACE*DIM_SPACE+j) = 0.0;
520
-
521
- Mat<DIM_SPACE,DIM_SPACE> dmatshape_dxj;
522
- const IntegrationPoint& ip = mip.IP();
523
- const ElementTransformation & eltrans = mip.GetTransformation();
524
- for (int j = 0; j < DIM_ELEMENT; j++) // d / dxj
525
- {
526
- IntegrationPoint ipl(ip);
527
- ipl(j) -= eps();
528
- IntegrationPoint ipr(ip);
529
- ipr(j) += eps();
530
- IntegrationPoint ipll(ip);
531
- ipll(j) -= 2*eps();
532
- IntegrationPoint iprr(ip);
533
- iprr(j) += 2*eps();
534
-
535
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipl(ipl, eltrans);
536
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipr(ipr, eltrans);
537
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipll(ipll, eltrans);
538
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> miprr(iprr, eltrans);
539
-
540
- Mat<DIM_SPACE,DIM_SPACE> dml, dmll, dmr, dmrr;
541
- ORIG::CalcTransformationMatrix (mipl, dml, lh);
542
- ORIG::CalcTransformationMatrix (mipr, dmr, lh);
543
- ORIG::CalcTransformationMatrix (mipll, dmll, lh);
544
- ORIG::CalcTransformationMatrix (miprr, dmrr, lh);
545
-
546
- dmatshape_dxj = (1.0/(12.0*eps())) * (8.0*dmr-8.0*dml-dmrr+dmll);
547
-
548
- for (int i = 0; i < DIM_SPACE; i++)
549
- for (int l = 0; l < DIM_SPACE; l++)
550
- for (int k = 0; k < DIM_SPACE; k++)
551
- mat(k*DIM_SPACE+i, DIM_SPACE*DIM_SPACE+l) += matgrad(k,j) * dmatshape_dxj(i,l);
552
- }
553
-
554
-
555
- }
556
-
557
-
558
-
559
-
560
- template <typename AFEL, typename MIP, typename MAT,
561
- typename std::enable_if<std::is_convertible<MAT,BareSliceMatrix<double,ColMajor>>::value, int>::type = 0>
562
- static void GenerateMatrix (const AFEL & bfel, const MIP & mip,
563
- MAT mat, LocalHeap & lh)
564
- {
565
- // CalcDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>
566
- // (static_cast<const FEL&>(fel), mip, Trans(mat), lh, eps());
567
-
568
- HeapReset hr(lh);
569
-
570
- int nd_u = bfel.GetNDof();
571
- const IntegrationPoint& ip = mip.IP();
572
- const ElementTransformation & eltrans = mip.GetTransformation();
573
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ul(nd_u, lh);
574
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ur(nd_u, lh);
575
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_ull(nd_u, lh);
576
- FlatMatrixFixWidth<ORIG::DIM_DMAT> shape_urr(nd_u, lh);
577
- FlatMatrixFixWidth<ORIG::DIM_DMAT> dshape_u_ref(nd_u, lh);
578
-
579
- FlatMatrixFixWidth<DIM_ELEMENT> dshape_u_ref_comp(nd_u, lh);
580
- FlatMatrixFixWidth<DIM_SPACE> dshape_u(nd_u, lh);
581
-
582
- for (int j = 0; j < DIM_ELEMENT; j++) // d / dxj
583
- {
584
- IntegrationPoint ipl(ip);
585
- ipl(j) -= eps();
586
- IntegrationPoint ipr(ip);
587
- ipr(j) += eps();
588
- IntegrationPoint ipll(ip);
589
- ipll(j) -= 2*eps();
590
- IntegrationPoint iprr(ip);
591
- iprr(j) += 2*eps();
592
-
593
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipl(ipl, eltrans);
594
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipr(ipr, eltrans);
595
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> mipll(ipll, eltrans);
596
- MappedIntegrationPoint<DIM_ELEMENT,DIM_SPACE> miprr(iprr, eltrans);
597
-
598
- ORIG::GenerateMatrix (bfel, mipl, Trans(shape_ul), lh);
599
- ORIG::GenerateMatrix (bfel, mipr, Trans(shape_ur), lh);
600
- ORIG::GenerateMatrix (bfel, mipll, Trans(shape_ull), lh);
601
- ORIG::GenerateMatrix (bfel, miprr, Trans(shape_urr), lh);
602
-
603
- dshape_u_ref = (1.0/(12.0*eps())) * (8.0*shape_ur-8.0*shape_ul-shape_urr+shape_ull);
604
- for (int l = 0; l < ORIG::DIM_DMAT; l++)
605
- mat.Row(j*ORIG::DIM_DMAT+l) = dshape_u_ref.Col(l);
606
- }
607
-
608
- for (int j = 0; j < ORIG::DIM_DMAT; j++)
609
- {
610
- for (int k = 0; k < nd_u; k++)
611
- for (int l = 0; l < DIM_ELEMENT; l++)
612
- dshape_u_ref_comp(k,l) = mat(l*ORIG::DIM_DMAT+j, k);
613
-
614
- dshape_u = dshape_u_ref_comp * mip.GetJacobianInverse();
615
-
616
- for (int k = 0; k < nd_u; k++)
617
- for (int l = 0; l < DIM_SPACE; l++)
618
- mat(l*ORIG::DIM_DMAT+j, k) = dshape_u(k,l);
619
- }
620
- }
621
-
622
-
623
-
624
- /*
625
- template <typename AFEL, typename MIP, typename MAT,
626
- typename std::enable_if<std::is_convertible<MAT,SliceMatrix<double,ColMajor>>::value, int>::type = 0>
627
- static void GenerateMatrix (const AFEL & fel, const MIP & mip,
628
- MAT mat, LocalHeap & lh)
629
- {
630
- CalcDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>
631
- (static_cast<const FEL&>(fel), mip, Trans(mat), lh, eps());
632
- }
633
-
634
- template <typename AFEL, typename MIP, class TVX, class TVY>
635
- static void Apply (const AFEL & fel, const MIP & mip,
636
- const TVX & x, TVY && y,
637
- LocalHeap & lh)
638
- {
639
- HeapReset hr(lh);
640
- FlatMatrixFixWidth<DIM_SPACE*ORIG::DIM_DMAT> hm(fel.GetNDof(),lh);
641
- CalcDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>
642
- (static_cast<const FEL&>(fel), mip, hm, lh, eps());
643
- y = Trans(hm)*x;
644
- }
645
-
646
- template <typename AFEL, typename MIP, class TVX, class TVY>
647
- static void ApplyTrans (const AFEL & fel, const MIP & mip,
648
- const TVX & x, TVY & by,
649
- LocalHeap & lh)
650
- {
651
- ApplyTransDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>
652
- (static_cast<const FEL&>(fel), mip, x, by, lh, eps());
653
- }
654
- */
655
-
656
-
657
- static void GenerateMatrixSIMDIR (const FiniteElement & bfel,
658
- const SIMD_BaseMappedIntegrationRule & bmir, BareSliceMatrix<SIMD<double>> mat)
659
- {
660
- /*
661
- CalcSIMDDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>
662
- (static_cast<const FEL&>(bfel), static_cast<const SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE> &>(bmir), mat, eps());
663
- return;
664
- */
665
-
666
- auto & mir = static_cast<const SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE>&> (bmir);
667
- // auto & fel_u = static_cast<const FEL&>(bfel);
668
- size_t nd_u = bfel.GetNDof();
669
-
670
- STACK_ARRAY(SIMD<double>, mem1, 5*ORIG::DIM_DMAT*nd_u);
671
- FlatMatrix<SIMD<double>> shape_u_tmp(nd_u*ORIG::DIM_DMAT, 4, &mem1[0]);
672
- FlatMatrix<SIMD<double>> dshape_u_ref(nd_u*ORIG::DIM_DMAT, 1, &mem1[4*ORIG::DIM_DMAT*nd_u]);
673
-
674
- LocalHeapMem<10000> lh("diffopgrad-lh");
675
-
676
- auto & ir = mir.IR();
677
- for (size_t i = 0; i < mir.Size(); i++)
678
- {
679
- const SIMD<IntegrationPoint> & ip = ir[i];
680
- const ElementTransformation & eltrans = mir[i].GetTransformation();
681
-
682
- double dist[] = { 1, -1, 2, -2 };
683
- double weight[] = { 8/12., -8/12., -1/12., 1/12. };
684
-
685
- for (int j = 0; j < DIM_ELEMENT; j++) // d / dxj
686
- {
687
- HeapReset hr(lh);
688
- SIMD<IntegrationPoint> ipts[4];
689
- for (int i = 0; i < 4; i++)
690
- {
691
- ipts[i] = ip;
692
- ipts[i](j) += dist[i]*eps();
693
- }
694
- SIMD_IntegrationRule ir(4, ipts);
695
- SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE> mirl(ir, eltrans, lh);
696
- ORIG::GenerateMatrixSIMDIR (bfel, mirl, shape_u_tmp);
697
-
698
- dshape_u_ref.Col(0) =
699
- weight[0]/eps() * shape_u_tmp.Col(0) +
700
- weight[1]/eps() * shape_u_tmp.Col(1) +
701
- weight[2]/eps() * shape_u_tmp.Col(2) +
702
- weight[3]/eps() * shape_u_tmp.Col(3);
703
-
704
- for (size_t l = 0; l < ORIG::DIM_DMAT; l++)
705
- for (size_t k = 0; k < nd_u; k++)
706
- mat(k*ORIG::DIM_DMAT*DIM_ELEMENT+j*ORIG::DIM_DMAT+l, i) = dshape_u_ref(k*ORIG::DIM_DMAT+l, 0);
707
- }
708
-
709
- for (size_t j = 0; j < ORIG::DIM_DMAT; j++)
710
- for (size_t k = 0; k < nd_u; k++)
711
- {
712
- Vec<DIM_ELEMENT,SIMD<double>> dshape_u_ref;
713
- Vec<DIM_SPACE,SIMD<double>> dshape_u;
714
-
715
- for (size_t l = 0; l < DIM_ELEMENT; l++)
716
- dshape_u_ref(l) = mat(k*ORIG::DIM_DMAT*DIM_ELEMENT+l*DIM_ELEMENT+j, i);
717
-
718
- dshape_u = Trans(mir[i].GetJacobianInverse()) * dshape_u_ref;
719
-
720
- for (size_t l = 0; l < DIM_SPACE; l++)
721
- mat(k*ORIG::DIM_DMAT*DIM_SPACE+l*ORIG::DIM_DMAT+j, i) = dshape_u(l);
722
- }
723
- }
724
- }
725
-
726
-
727
-
728
- using BASE::ApplySIMDIR;
729
- static void ApplySIMDIR (const FiniteElement & fel, const SIMD_BaseMappedIntegrationRule & bmir,
730
- BareSliceVector<double> x, BareSliceMatrix<SIMD<double>> y)
731
- {
732
- // ApplySIMDDShapeFE<FEL,ORIG::DIM_SPACE,ORIG::DIM_ELEMENT,ORIG::DIM_DMAT>(static_cast<const FEL&>(fel), bmir, x, y, eps());
733
- // return;
734
-
735
- constexpr size_t BS = 16; // number of simd-points
736
- size_t maxnp = min2(BS, bmir.Size());
737
- size_t size = (maxnp+1)*SIMD<double>::Size()*500 + 5*ORIG::DIM_DMAT*BS*sizeof(SIMD<double>);
738
- size *= 4;
739
- STACK_ARRAY(char, data, size);
740
- LocalHeap lh(data, size);
741
-
742
- auto & mir = static_cast<const SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE>&> (bmir);
743
- auto & ir = mir.IR();
744
- const ElementTransformation & trafo = mir.GetTransformation();
745
-
746
- y.AddSize(ORIG::DIM_DMAT*DIM_SPACE, mir.Size()) = SIMD<double>(0.);
747
- for (size_t base = 0; base < ir.Size(); base += BS)
748
- {
749
- HeapReset hr(lh);
750
- size_t num = std::min(BS, ir.Size()-base);
751
- FlatMatrix<SIMD<double>> hxi(ORIG::DIM_DMAT, 4*num, lh);
752
-
753
- static constexpr double dist[] = { 1, -1, 2, -2 };
754
- static constexpr double weight[] = { 8/12., -8/12., -1/12., 1/12. };
755
-
756
- for (int j = 0; j < DIM_ELEMENT; j++)
757
- {
758
- HeapReset hr(lh);
759
-
760
- SIMD_IntegrationRule iri(4*num*SIMD<double>::Size(), lh);
761
-
762
- for (int k = 0; k < num; k++)
763
- for (int i = 0; i < 4; i++)
764
- {
765
- iri[4*k+i] = ir[base+k];
766
- iri[4*k+i](j) += dist[i]*eps();
767
- }
768
-
769
- SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE> mir2(iri, trafo, lh);
770
- ORIG::ApplySIMDIR (fel, mir2, x, hxi);
771
-
772
- for (int k = 0; k < num; k++)
773
- {
774
- Vec<ORIG::DIM_DMAT, SIMD<double>> hxk =
775
- weight[0]/eps() * hxi.Col(4*k) +
776
- weight[1]/eps() * hxi.Col(4*k+1) +
777
- weight[2]/eps() * hxi.Col(4*k+2) +
778
- weight[3]/eps() * hxi.Col(4*k+3);
779
-
780
- auto jacinv = mir[base+k].GetJacobianInverse();
781
- for (int l = 0; l < ORIG::DIM_DMAT; l++)
782
- for (int m = 0; m < DIM_SPACE; m++)
783
- y(m*ORIG::DIM_DMAT+l, base+k) += jacinv(j,m) * hxk(l); // , k);
784
- }
785
- }
786
- }
787
- }
788
-
789
-
790
-
791
-
792
- using BASE::AddTransSIMDIR;
793
- static void AddTransSIMDIR (const FiniteElement & fel, const SIMD_BaseMappedIntegrationRule & bmir,
794
- BareSliceMatrix<SIMD<double>> x, BareSliceVector<double> y)
795
- {
796
- // AddTransSIMDDShapeFE<FEL,DIM_SPACE,DIM_ELEMENT,ORIG::DIM_DMAT>(static_cast<const FEL&>(fel), bmir, x, y, eps());
797
- // return;
798
-
799
- // auto & fel_u = static_cast<const FEL&>(fel);
800
- constexpr size_t BS = 64; // number of simd-points
801
- size_t maxnp = std::min(BS, bmir.Size());
802
- size_t size = (maxnp+1)*SIMD<double>::Size()*500;
803
-
804
- STACK_ARRAY(char, data, size);
805
- LocalHeap lh(data, size);
806
-
807
- auto & mir = static_cast<const SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE>&> (bmir);
808
- auto & ir = mir.IR();
809
- const ElementTransformation & trafo = mir.GetTransformation();
810
-
811
- for (size_t base = 0; base < ir.Size(); base += BS)
812
- {
813
- HeapReset hr(lh);
814
- size_t num = min2(BS, ir.Size()-base);
815
-
816
- FlatMatrix<SIMD<double>> hx1(ORIG::DIM_DMAT, num, lh);
817
- FlatMatrix<SIMD<double>> hx(ORIG::DIM_DMAT, num, lh);
818
-
819
- for (size_t j = 0; j < DIM_ELEMENT; j++)
820
- {
821
- // hx = (F^-1 * x).Row(j)
822
- for (size_t k = 0; k < num; k++)
823
- {
824
- auto jacinv = mir[base+k].GetJacobianInverse();
825
- for (int l = 0; l < ORIG::DIM_DMAT; l++)
826
- {
827
- SIMD<double> sum = 0;
828
- for (int m = 0; m < DIM_SPACE; m++)
829
- sum += jacinv(j,m) * x(m*ORIG::DIM_DMAT+l, base+k);
830
- hx(l,k) = sum;
831
- }
832
- }
833
-
834
- double dist[] = { 1, -1, 2, -2 };
835
- double weight[] = { 8/12., -8/12., -1/12., 1/12. };
836
- for (int i = 0; i < 4; i++)
837
- {
838
- HeapReset hr(lh);
839
- SIMD_IntegrationRule irl(num*SIMD<double>::Size(), lh);
840
- for (size_t k = 0; k < irl.Size(); k++)
841
- {
842
- irl[k] = ir[base+k];
843
- irl[k](j) += dist[i]*eps();
844
- }
845
- SIMD_MappedIntegrationRule<DIM_ELEMENT,DIM_SPACE> mirl(irl, trafo, lh);
846
- hx1 = weight[i]/eps() * hx;
847
- // fel_u.AddTrans (mirl, hx1, y);
848
- ORIG::AddTransSIMDIR(fel, mirl, hx1, y);
849
- irl.NothingToDelete();
850
- }
851
- }
852
- }
853
- }
854
- };
855
- }
856
-
857
- #endif