ngsolve 6.2.2501.post21.dev1__cp313-cp313-macosx_10_15_universal2.whl → 6.2.2501.post37.dev1__cp313-cp313-macosx_10_15_universal2.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of ngsolve might be problematic. Click here for more details.

Files changed (286) hide show
  1. ngsolve/webgui.py +1 -1
  2. {ngsolve-6.2.2501.post21.dev1.dist-info → ngsolve-6.2.2501.post37.dev1.dist-info}/METADATA +2 -2
  3. ngsolve-6.2.2501.post37.dev1.dist-info/RECORD +25 -0
  4. netgen/include/arnoldi.hpp +0 -55
  5. netgen/include/bandmatrix.hpp +0 -334
  6. netgen/include/basematrix.hpp +0 -957
  7. netgen/include/basevector.hpp +0 -1268
  8. netgen/include/bdbequations.hpp +0 -2752
  9. netgen/include/bdbintegrator.hpp +0 -1659
  10. netgen/include/bessel.hpp +0 -1064
  11. netgen/include/bilinearform.hpp +0 -963
  12. netgen/include/bla.hpp +0 -29
  13. netgen/include/blockalloc.hpp +0 -95
  14. netgen/include/blockjacobi.hpp +0 -316
  15. netgen/include/bspline.hpp +0 -114
  16. netgen/include/calcinverse.hpp +0 -141
  17. netgen/include/cg.hpp +0 -368
  18. netgen/include/chebyshev.hpp +0 -44
  19. netgen/include/cholesky.hpp +0 -720
  20. netgen/include/clapack.h +0 -7254
  21. netgen/include/code_generation.hpp +0 -296
  22. netgen/include/coefficient.hpp +0 -2006
  23. netgen/include/coefficient_impl.hpp +0 -18
  24. netgen/include/coefficient_stdmath.hpp +0 -157
  25. netgen/include/commutingAMG.hpp +0 -106
  26. netgen/include/comp.hpp +0 -79
  27. netgen/include/compatibility.hpp +0 -41
  28. netgen/include/complex_wrapper.hpp +0 -73
  29. netgen/include/compressedfespace.hpp +0 -110
  30. netgen/include/contact.hpp +0 -231
  31. netgen/include/diagonalmatrix.hpp +0 -154
  32. netgen/include/differentialoperator.hpp +0 -276
  33. netgen/include/diffop.hpp +0 -1286
  34. netgen/include/diffop_impl.hpp +0 -326
  35. netgen/include/discontinuous.hpp +0 -84
  36. netgen/include/dump.hpp +0 -949
  37. netgen/include/eigen.hpp +0 -60
  38. netgen/include/eigensystem.hpp +0 -18
  39. netgen/include/elasticity_equations.hpp +0 -595
  40. netgen/include/elementbyelement.hpp +0 -195
  41. netgen/include/elementtopology.hpp +0 -1760
  42. netgen/include/elementtransformation.hpp +0 -339
  43. netgen/include/evalfunc.hpp +0 -405
  44. netgen/include/expr.hpp +0 -1655
  45. netgen/include/facetfe.hpp +0 -175
  46. netgen/include/facetfespace.hpp +0 -178
  47. netgen/include/facethofe.hpp +0 -111
  48. netgen/include/facetsurffespace.hpp +0 -112
  49. netgen/include/fe_interfaces.hpp +0 -32
  50. netgen/include/fem.hpp +0 -87
  51. netgen/include/fesconvert.hpp +0 -14
  52. netgen/include/fespace.hpp +0 -1445
  53. netgen/include/finiteelement.hpp +0 -286
  54. netgen/include/globalinterfacespace.hpp +0 -77
  55. netgen/include/globalspace.hpp +0 -115
  56. netgen/include/gridfunction.hpp +0 -525
  57. netgen/include/h1amg.hpp +0 -41
  58. netgen/include/h1hofe.hpp +0 -188
  59. netgen/include/h1hofe_impl.hpp +0 -1262
  60. netgen/include/h1hofefo.hpp +0 -148
  61. netgen/include/h1hofefo_impl.hpp +0 -185
  62. netgen/include/h1hofespace.hpp +0 -167
  63. netgen/include/h1lofe.hpp +0 -1237
  64. netgen/include/h1lumping.hpp +0 -35
  65. netgen/include/hcurl_equations.hpp +0 -1352
  66. netgen/include/hcurlcurlfe.hpp +0 -2221
  67. netgen/include/hcurlcurlfespace.hpp +0 -78
  68. netgen/include/hcurlfe.hpp +0 -259
  69. netgen/include/hcurlfe_utils.hpp +0 -107
  70. netgen/include/hcurlhdiv_dshape.hpp +0 -857
  71. netgen/include/hcurlhdivfes.hpp +0 -308
  72. netgen/include/hcurlhofe.hpp +0 -175
  73. netgen/include/hcurlhofe_impl.hpp +0 -1871
  74. netgen/include/hcurlhofespace.hpp +0 -193
  75. netgen/include/hcurllofe.hpp +0 -1146
  76. netgen/include/hdiv_equations.hpp +0 -865
  77. netgen/include/hdivdivfe.hpp +0 -2923
  78. netgen/include/hdivdivsurfacespace.hpp +0 -76
  79. netgen/include/hdivfe.hpp +0 -206
  80. netgen/include/hdivfe_utils.hpp +0 -716
  81. netgen/include/hdivfes.hpp +0 -75
  82. netgen/include/hdivhofe.hpp +0 -447
  83. netgen/include/hdivhofe_impl.hpp +0 -1107
  84. netgen/include/hdivhofefo.hpp +0 -229
  85. netgen/include/hdivhofespace.hpp +0 -175
  86. netgen/include/hdivhosurfacefespace.hpp +0 -106
  87. netgen/include/hdivlofe.hpp +0 -773
  88. netgen/include/hidden.hpp +0 -74
  89. netgen/include/householder.hpp +0 -181
  90. netgen/include/hypre_ams_precond.hpp +0 -123
  91. netgen/include/hypre_precond.hpp +0 -73
  92. netgen/include/integrator.hpp +0 -2024
  93. netgen/include/integratorcf.hpp +0 -253
  94. netgen/include/interpolate.hpp +0 -49
  95. netgen/include/intrule.hpp +0 -2541
  96. netgen/include/irspace.hpp +0 -49
  97. netgen/include/jacobi.hpp +0 -136
  98. netgen/include/l2hofe.hpp +0 -193
  99. netgen/include/l2hofe_impl.hpp +0 -564
  100. netgen/include/l2hofefo.hpp +0 -542
  101. netgen/include/l2hofespace.hpp +0 -344
  102. netgen/include/la.hpp +0 -38
  103. netgen/include/linearform.hpp +0 -266
  104. netgen/include/matrix.hpp +0 -2140
  105. netgen/include/memusage.hpp +0 -41
  106. netgen/include/meshaccess.hpp +0 -1358
  107. netgen/include/mgpre.hpp +0 -204
  108. netgen/include/mptools.hpp +0 -2145
  109. netgen/include/multigrid.hpp +0 -42
  110. netgen/include/multivector.hpp +0 -447
  111. netgen/include/mumpsinverse.hpp +0 -187
  112. netgen/include/mycomplex.hpp +0 -361
  113. netgen/include/ng_lapack.hpp +0 -1661
  114. netgen/include/ngblas.hpp +0 -1099
  115. netgen/include/ngs_defines.hpp +0 -30
  116. netgen/include/ngs_stdcpp_include.hpp +0 -106
  117. netgen/include/ngs_utils.hpp +0 -121
  118. netgen/include/ngsobject.hpp +0 -1019
  119. netgen/include/ngsstream.hpp +0 -113
  120. netgen/include/ngstd.hpp +0 -72
  121. netgen/include/nodalhofe.hpp +0 -96
  122. netgen/include/nodalhofe_impl.hpp +0 -141
  123. netgen/include/normalfacetfe.hpp +0 -223
  124. netgen/include/normalfacetfespace.hpp +0 -98
  125. netgen/include/normalfacetsurfacefespace.hpp +0 -84
  126. netgen/include/order.hpp +0 -251
  127. netgen/include/parallel_matrices.hpp +0 -222
  128. netgen/include/paralleldofs.hpp +0 -340
  129. netgen/include/parallelngs.hpp +0 -23
  130. netgen/include/parallelvector.hpp +0 -269
  131. netgen/include/pardisoinverse.hpp +0 -200
  132. netgen/include/periodic.hpp +0 -125
  133. netgen/include/plateaufespace.hpp +0 -25
  134. netgen/include/pml.hpp +0 -275
  135. netgen/include/pmltrafo.hpp +0 -631
  136. netgen/include/postproc.hpp +0 -142
  137. netgen/include/precomp.hpp +0 -60
  138. netgen/include/preconditioner.hpp +0 -602
  139. netgen/include/prolongation.hpp +0 -235
  140. netgen/include/python_comp.hpp +0 -107
  141. netgen/include/python_fem.hpp +0 -89
  142. netgen/include/python_linalg.hpp +0 -58
  143. netgen/include/python_ngstd.hpp +0 -385
  144. netgen/include/recursive_pol.hpp +0 -4844
  145. netgen/include/recursive_pol_tet.hpp +0 -395
  146. netgen/include/recursive_pol_trig.hpp +0 -492
  147. netgen/include/reorderedfespace.hpp +0 -81
  148. netgen/include/sample_sort.hpp +0 -105
  149. netgen/include/scalarfe.hpp +0 -335
  150. netgen/include/shapefunction_utils.hpp +0 -113
  151. netgen/include/simd_complex.hpp +0 -284
  152. netgen/include/smoother.hpp +0 -253
  153. netgen/include/solve.hpp +0 -89
  154. netgen/include/sparsecholesky.hpp +0 -313
  155. netgen/include/sparsematrix.hpp +0 -1038
  156. netgen/include/sparsematrix_dyn.hpp +0 -91
  157. netgen/include/sparsematrix_impl.hpp +0 -920
  158. netgen/include/special_matrix.hpp +0 -461
  159. netgen/include/specialelement.hpp +0 -125
  160. netgen/include/statushandler.hpp +0 -33
  161. netgen/include/stringops.hpp +0 -12
  162. netgen/include/superluinverse.hpp +0 -136
  163. netgen/include/symbolicintegrator.hpp +0 -849
  164. netgen/include/symmetricmatrix.hpp +0 -144
  165. netgen/include/tangentialfacetfe.hpp +0 -224
  166. netgen/include/tangentialfacetfespace.hpp +0 -106
  167. netgen/include/tensor.hpp +0 -522
  168. netgen/include/tensorcoefficient.hpp +0 -446
  169. netgen/include/tensorproductintegrator.hpp +0 -113
  170. netgen/include/thcurlfe.hpp +0 -128
  171. netgen/include/thcurlfe_impl.hpp +0 -380
  172. netgen/include/thdivfe.hpp +0 -80
  173. netgen/include/thdivfe_impl.hpp +0 -426
  174. netgen/include/tpdiffop.hpp +0 -461
  175. netgen/include/tpfes.hpp +0 -133
  176. netgen/include/tpintrule.hpp +0 -224
  177. netgen/include/triangular.hpp +0 -465
  178. netgen/include/tscalarfe.hpp +0 -245
  179. netgen/include/tscalarfe_impl.hpp +0 -1029
  180. netgen/include/umfpackinverse.hpp +0 -148
  181. netgen/include/vector.hpp +0 -1219
  182. netgen/include/voxelcoefficientfunction.hpp +0 -41
  183. netgen/include/vtkoutput.hpp +0 -198
  184. netgen/include/vvector.hpp +0 -208
  185. netgen/include/webgui.hpp +0 -92
  186. netgen/libngbla.dylib +0 -0
  187. netgen/libngcomp.dylib +0 -0
  188. netgen/libngfem.dylib +0 -0
  189. netgen/libngla.dylib +0 -0
  190. netgen/libngsolve.dylib +0 -0
  191. netgen/libngstd.dylib +0 -0
  192. ngsolve/__init__.pyi +0 -231
  193. ngsolve/bla.pyi +0 -1139
  194. ngsolve/bvp.pyi +0 -32
  195. ngsolve/cmake/NGSolveConfig.cmake +0 -102
  196. ngsolve/cmake/ngsolve-targets-release.cmake +0 -69
  197. ngsolve/cmake/ngsolve-targets.cmake +0 -163
  198. ngsolve/comp/__init__.pyi +0 -5382
  199. ngsolve/comp/pml.pyi +0 -89
  200. ngsolve/config/__init__.py +0 -1
  201. ngsolve/config/__init__.pyi +0 -43
  202. ngsolve/config/__main__.py +0 -4
  203. ngsolve/config/config.py +0 -60
  204. ngsolve/config/config.pyi +0 -45
  205. ngsolve/demos/TensorProduct/__init__.py +0 -0
  206. ngsolve/demos/TensorProduct/tp_dg_1d_1d.py +0 -80
  207. ngsolve/demos/TensorProduct/tp_dg_1d_2d.py +0 -73
  208. ngsolve/demos/TensorProduct/tp_dg_2d_1d.py +0 -72
  209. ngsolve/demos/TensorProduct/tp_dg_2d_2d.py +0 -66
  210. ngsolve/demos/__init__.py +0 -0
  211. ngsolve/demos/howto/__init__.py +0 -0
  212. ngsolve/demos/howto/hhj.py +0 -44
  213. ngsolve/demos/howto/hybrid_dg.py +0 -53
  214. ngsolve/demos/howto/mixed.py +0 -30
  215. ngsolve/demos/howto/nonlin.py +0 -29
  216. ngsolve/demos/howto/pickling.py +0 -26
  217. ngsolve/demos/howto/pml.py +0 -31
  218. ngsolve/demos/howto/taskmanager.py +0 -20
  219. ngsolve/demos/howto/tdnns.py +0 -47
  220. ngsolve/demos/howto/timeDG-skeleton.py +0 -45
  221. ngsolve/demos/howto/timeDG.py +0 -38
  222. ngsolve/demos/howto/timeDGlap.py +0 -42
  223. ngsolve/demos/howto/timeDGwave.py +0 -61
  224. ngsolve/demos/intro/__init__.py +0 -0
  225. ngsolve/demos/intro/adaptive.py +0 -123
  226. ngsolve/demos/intro/cmagnet.py +0 -62
  227. ngsolve/demos/intro/elasticity.py +0 -76
  228. ngsolve/demos/intro/navierstokes.py +0 -74
  229. ngsolve/demos/intro/poisson.ipynb +0 -170
  230. ngsolve/demos/intro/poisson.py +0 -41
  231. ngsolve/demos/mpi/__init__.py +0 -0
  232. ngsolve/demos/mpi/mpi_cmagnet.py +0 -87
  233. ngsolve/demos/mpi/mpi_navierstokes.py +0 -117
  234. ngsolve/demos/mpi/mpi_poisson.py +0 -89
  235. ngsolve/demos/mpi/mpi_timeDG.py +0 -82
  236. ngsolve/directsolvers.pyi +0 -18
  237. ngsolve/eigenvalues.pyi +0 -30
  238. ngsolve/fem.pyi +0 -1707
  239. ngsolve/krylovspace.pyi +0 -309
  240. ngsolve/la.pyi +0 -1218
  241. ngsolve/ngslib.so +0 -0
  242. ngsolve/ngstd.pyi +0 -58
  243. ngsolve/nonlinearsolvers.pyi +0 -98
  244. ngsolve/preconditioners.pyi +0 -6
  245. ngsolve/solve.pyi +0 -108
  246. ngsolve/solvers.pyi +0 -14
  247. ngsolve/timestepping.pyi +0 -34
  248. ngsolve/timing.pyi +0 -57
  249. ngsolve/utils.pyi +0 -279
  250. ngsolve-6.2.2501.post21.dev1.data/data/Netgen.icns +0 -0
  251. ngsolve-6.2.2501.post21.dev1.data/data/bin/ngscxx +0 -17
  252. ngsolve-6.2.2501.post21.dev1.data/data/bin/ngsld +0 -13
  253. ngsolve-6.2.2501.post21.dev1.data/data/bin/ngsolve.tcl +0 -648
  254. ngsolve-6.2.2501.post21.dev1.data/data/bin/ngspy +0 -2
  255. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/beam.geo +0 -17
  256. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/beam.vol +0 -240
  257. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/chip.in2d +0 -41
  258. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/chip.vol +0 -614
  259. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/coil.geo +0 -12
  260. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/coil.vol +0 -2560
  261. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/coilshield.geo +0 -24
  262. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/coilshield.vol +0 -3179
  263. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/cube.geo +0 -19
  264. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/cube.vol +0 -1832
  265. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d10_DGdoubleglazing.pde +0 -50
  266. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d11_chip_nitsche.pde +0 -40
  267. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d1_square.pde +0 -43
  268. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d2_chip.pde +0 -35
  269. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d3_helmholtz.pde +0 -22
  270. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d4_cube.pde +0 -46
  271. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d5_beam.pde +0 -74
  272. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d6_shaft.pde +0 -73
  273. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d7_coil.pde +0 -50
  274. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d8_coilshield.pde +0 -49
  275. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/d9_hybridDG.pde +0 -72
  276. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/doubleglazing.in2d +0 -27
  277. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/doubleglazing.vol +0 -737
  278. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/piezo2d40round4.vol.gz +0 -0
  279. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/shaft.geo +0 -73
  280. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/shaft.vol +0 -4291
  281. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/square.in2d +0 -17
  282. ngsolve-6.2.2501.post21.dev1.data/data/share/ngsolve/square.vol +0 -149
  283. ngsolve-6.2.2501.post21.dev1.dist-info/RECORD +0 -304
  284. {ngsolve-6.2.2501.post21.dev1.dist-info → ngsolve-6.2.2501.post37.dev1.dist-info}/LICENSE +0 -0
  285. {ngsolve-6.2.2501.post21.dev1.dist-info → ngsolve-6.2.2501.post37.dev1.dist-info}/WHEEL +0 -0
  286. {ngsolve-6.2.2501.post21.dev1.dist-info → ngsolve-6.2.2501.post37.dev1.dist-info}/top_level.txt +0 -0
netgen/include/dump.hpp DELETED
@@ -1,949 +0,0 @@
1
- #ifndef FILE_NGS_DUMP
2
- #define FILE_NGS_DUMP
3
-
4
- /*********************************************************************/
5
- /* File: dump.hpp */
6
- /* Author: Lukas Kogler */
7
- /* Date: Sep. 2014 */
8
- /*********************************************************************/
9
-
10
- namespace ngstd
11
- {
12
-
13
- template <NODE_TYPE NT>
14
- class key_trait { };
15
-
16
- template <>
17
- class key_trait<NT_VERTEX>
18
- {
19
- public:
20
- typedef int TKEY;
21
- };
22
-
23
- template <>
24
- class key_trait<NT_EDGE>
25
- {
26
- public:
27
- typedef IVec<2> TKEY;
28
- };
29
-
30
- template <>
31
- class key_trait<NT_FACE>
32
- {
33
- public:
34
- typedef IVec<3> TKEY;
35
- };
36
-
37
- template <>
38
- class key_trait<NT_CELL>
39
- {
40
- public:
41
- typedef IVec<4> TKEY;
42
- };
43
-
44
-
45
- template <int N>
46
- bool operator < (IVec<N> a, IVec<N> b)
47
- {
48
- for (int i = 0; i < N; i++)
49
- {
50
- if (a[i] < b[i]) return true;
51
- if (a[i] > b[i]) return false;
52
- }
53
- return false;
54
- }
55
-
56
- /*
57
- bool operator < (IVec<2> & nodea, IVec<2> & nodeb)
58
- {
59
- if(nodea[0] < nodeb[0])
60
- return true;
61
- else if(nodea[0] == nodeb[0] && nodea[1] < nodeb[1])
62
- return true;
63
- return false;
64
- }
65
-
66
- bool operator < (IVec<3> & nodea, IVec<3> & nodeb)
67
- {
68
- if(nodea[0] < nodeb[0])
69
- return true;
70
- else if(nodea[0] == nodeb[0])
71
- {
72
- if(nodea[1] < nodeb[1])
73
- return true;
74
- else if(nodea[1] == nodeb[1])
75
- if(nodea[2] < nodeb[2])
76
- return true;
77
- }
78
- return false;
79
- }
80
-
81
- bool operator < (IVec<4> & nodea, IVec<4> & nodeb)
82
- {
83
- if(nodea[0] < nodeb[0])
84
- return true;
85
- else if(nodea[0] == nodeb[0])
86
- {
87
- if(nodea[1] < nodeb[1])
88
- return true;
89
- else if(nodea[1] == nodeb[1])
90
- {
91
- if(nodea[2] < nodeb[2])
92
- return true;
93
- else if(nodea[2] == nodeb[2])
94
- {
95
- if(nodea[3] < nodeb[3])
96
- return true;
97
- }
98
- }
99
- }
100
- return false;
101
- }
102
- */
103
-
104
-
105
-
106
- /*
107
- template <NODE_TYPE NT>
108
- auto GetGlobalNodeId (const MeshAccess & ma, int nr) -> typename key_trait<NT>::TKEY { ; }
109
- */
110
-
111
- template <NODE_TYPE NT>
112
- inline auto GetGlobalNodeId (const MeshAccess & ma, int nr) -> typename key_trait<NT>::TKEY
113
- {
114
- cout << "called base GetGlobalNodeId!!" << endl;
115
- return 1;
116
- }
117
-
118
- template <>
119
- inline auto GetGlobalNodeId<NT_VERTEX> (const MeshAccess & ma, int nr)
120
- -> typename key_trait<NT_VERTEX>::TKEY
121
- {
122
- cout << "GetGlobalNodeId<vertex>" << endl;
123
- return ma.GetGlobalVertexNum (nr);
124
- }
125
-
126
- template <>
127
- inline auto GetGlobalNodeId<NT_EDGE> (const MeshAccess & ma, int nr) -> typename key_trait<NT_EDGE>::TKEY
128
- {
129
- // int pi1,pi2;
130
- // ma.GetEdgePNums (nr, pi1, pi2);
131
- auto pts = ma.GetEdgePNums(nr);
132
- int pi1 = pts[0], pi2 = pts[1];
133
- cout << "GetGlobalNodeId<edge>" << endl;
134
- return IVec<2> (ma.GetGlobalVertexNum (pi1),
135
- ma.GetGlobalVertexNum (pi2));
136
- }
137
-
138
- template <>
139
- inline auto GetGlobalNodeId<NT_FACE> (const MeshAccess & ma, int nr) -> typename key_trait<NT_FACE>::TKEY
140
- {
141
- // Array<int> edges (3);
142
- Array<int> verts;
143
- // ma.GetFaceEdges(nr, edges);
144
- auto edges = ma.GetFaceEdges(nr);
145
- for(int k=0;k<3;k++)
146
- {
147
- // int p1, p2;
148
- // ma.GetEdgePNums(edges[k], p1, p2);
149
- auto pts = ma.GetEdgePNums(edges[k]);
150
- int p1 = pts[0], p2 = pts[1];
151
-
152
- if(verts.Contains(p1)==0)
153
- verts.Append(p1);
154
- if(verts.Contains(p2)==0)
155
- verts.Append(p2);
156
- }
157
- QuickSort(verts);
158
- return IVec<3> (verts[0], verts[1], verts[2]);
159
- }
160
-
161
- template <>
162
- inline auto GetGlobalNodeId<NT_CELL> (const MeshAccess & ma, int nr) -> typename key_trait<NT_CELL>::TKEY
163
- {
164
- // Array<int> faces(4);
165
- Array<int> verts;
166
- // ma.GetElFacets(nr, faces);
167
- auto faces = ma.GetElFacets(ElementId(VOL,nr));
168
- for(int k=0;k<4;k++)
169
- {
170
- // Array<int> edges(3);
171
- // ma.GetFaceEdges(faces[k], edges);
172
- auto edges = ma.GetFaceEdges(faces[k]);
173
- //cout << "edges: " << edges << endl;
174
- for(int j=0;j<3;j++)
175
- {
176
- // int p1, p2;
177
- // ma.GetEdgePNums(edges[j], p1, p2);
178
- auto pts = ma.GetEdgePNums(edges[j]);
179
- int p1 = pts[0], p2 = pts[1];
180
- if(verts.Contains(p1)==0)
181
- verts.Append(p1);
182
- if(verts.Contains(p2)==0)
183
- verts.Append(p2);
184
- }
185
- }
186
- QuickSort(verts);
187
- return IVec<4> (verts[0], verts[1], verts[2], verts[3]);
188
- }
189
-
190
- /*
191
- template <NODE_TYPE NT>
192
- void SetMPIType(MPI_Datatype * type)
193
- {
194
- int sz = 1;
195
- switch (NT)
196
- {
197
- case NT_VERTEX:
198
- sz = 1;
199
- break;
200
- case NT_EDGE:
201
- sz = 2;
202
- break;
203
- case NT_FACE:
204
- sz = 3;
205
- break;
206
- case NT_CELL:
207
- sz = 4;
208
- break;
209
- }
210
- MPI_Type_contiguous(sz, MPI_INT, type);
211
- MPI_Type_commit(type);
212
- }
213
- */
214
-
215
- /*
216
- template <typename DT> struct MPIT {};
217
- template<> struct MPIT<double> {static MPI_Datatype mpi_type;};
218
- MPI_Datatype MPIT<double> :: mpi_type = MPI_DOUBLE;
219
- template <> struct MPIT<int> {static MPI_Datatype mpi_type;};
220
- MPI_Datatype MPIT<int> :: mpi_type = MPI_INT;
221
- template <> struct MPIT<unsigned char> {static MPI_Datatype mpi_type;};
222
- MPI_Datatype MPIT<unsigned char> :: mpi_type = MPI_BYTE;
223
- template <> struct MPIT<IVec<2,unsigned char>> { static MPI_Datatype mpi_type;};
224
- MPI_Datatype MPIT<IVec<2,unsigned char>> :: mpi_type;
225
- template <> struct MPIT<IVec<3,unsigned char>> { static MPI_Datatype mpi_type;};
226
- MPI_Datatype MPIT<IVec<3,unsigned char>> :: mpi_type;
227
-
228
- class class_init_mpi_types
229
- {
230
- public:
231
- class_init_mpi_types()
232
- {
233
- MPI_Type_contiguous ( 2, MPI_BYTE, &MPIT<IVec<2,unsigned char>>::mpi_type);
234
- MPI_Type_commit ( &MPIT<IVec<2,unsigned char>>::mpi_type );
235
-
236
- MPI_Type_contiguous ( 3, MPI_BYTE, &MPIT<IVec<3,unsigned char>>::mpi_type);
237
- MPI_Type_commit ( &MPIT<IVec<3,unsigned char>>::mpi_type );
238
-
239
- }
240
- };
241
- static class_init_mpi_types init_mpi_types;
242
- */
243
-
244
- //provides the place in merge-tree
245
- inline void find_SRRMS (int rank, int np, int* p1, int* p2, int* p3, bool ignore_in, bool ignore_out);
246
- inline void find_ROMS (int rank, int np, int* p1, int* p2);
247
-
248
-
249
- template<typename DT, NODE_TYPE NT>
250
- void packaged_buffered_send(int rank, int np, DT* a, typename key_trait<NT>::TKEY* b, int n, int pkg_size, int p,
251
- NgMPI_Requests & requests)
252
- {
253
- // NG_MPI_Datatype mpi_type_array = MPIT<DT>::mpi_type;
254
- NG_MPI_Datatype mpi_type_array = GetMPIType<DT>();
255
-
256
- //get type for keys
257
- // NG_MPI_Datatype mpi_type_key;
258
- // SetMPIType<NT>(&mpi_type_key);
259
- typedef typename key_trait<NT>::TKEY tkey;
260
- NG_MPI_Datatype mpi_type_key = GetMPIType<tkey>();
261
-
262
- bool has_extra = n%pkg_size;
263
- int n_packages = n/pkg_size + (has_extra ? 1 : 0);
264
-
265
- //send size
266
- NG_MPI_Send ( &n, 1, NG_MPI_INT, p, 700001, NG_MPI_COMM_WORLD);
267
-
268
- for(int k=0;k<n_packages - has_extra?1:0;k++)
269
- {
270
- // NG_MPI_Send ( a+k*pkg_size, pkg_size, mpi_type_array, p, 700001, NG_MPI_COMM_WORLD);
271
- // NG_MPI_Send ( b+k*pkg_size, pkg_size, mpi_type_key, p, 700001, NG_MPI_COMM_WORLD);
272
- NG_MPI_Request requ;
273
- NG_MPI_Isend ( a+k*pkg_size, pkg_size, mpi_type_array, p, 700001, NG_MPI_COMM_WORLD, &requ);
274
- requests += requ;
275
- NG_MPI_Isend ( b+k*pkg_size, pkg_size, mpi_type_key, p, 700001, NG_MPI_COMM_WORLD, &requ);
276
- requests += requ;
277
- }
278
- //copy last part into new memory so full package can be sent - for simplicity!!
279
- if(has_extra)
280
- {
281
- DT *a_ext = (DT*) malloc(pkg_size * sizeof(DT)); // I know, it is leaking ...
282
- tkey *b_ext = (tkey*) malloc(pkg_size * sizeof(tkey));
283
- for(int k=0;k<n%pkg_size;k++)
284
- {
285
- //a and b already point to last part
286
- a_ext[n%pkg_size-k-1] = a[n-1-k];
287
- b_ext[n%pkg_size-k-1] = b[n-1-k];
288
- }
289
- // NG_MPI_Send ( a_ext, pkg_size, mpi_type_array, p, 700001, NG_MPI_COMM_WORLD);
290
- // NG_MPI_Send ( b_ext, pkg_size, mpi_type_key, p, 700001, NG_MPI_COMM_WORLD);
291
-
292
- NG_MPI_Request requ;
293
- NG_MPI_Isend ( a_ext, pkg_size, mpi_type_array, p, 700001, NG_MPI_COMM_WORLD, &requ);
294
- requests += requ;
295
- NG_MPI_Isend ( b_ext, pkg_size, mpi_type_key, p, 700001, NG_MPI_COMM_WORLD, &requ);
296
- requests += requ;
297
- }
298
- }
299
-
300
- template<typename DT, NODE_TYPE NT>
301
- void merge_own_in_out (int rank, int size, int pkg_size, DT* array, typename key_trait<NT>::TKEY *array_dnrs, int n, int p_in, int p_out)
302
- {
303
- NgMPI_Comm comm(NG_MPI_COMM_WORLD);
304
-
305
- typedef typename key_trait<NT>::TKEY TKEY;
306
-
307
- int base_array_size = n;
308
-
309
- //in-buffer
310
- int n_in = 0;
311
- NG_MPI_Recv( &n_in, 1, NG_MPI_INT, p_in, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
312
-
313
- int in_buf_size = 2 * pkg_size; //do not change this for now!!
314
-
315
- Array<DT> in_buf(in_buf_size);
316
- Array<TKEY> in_dnrs(in_buf_size);
317
-
318
- int index_in = 0;
319
- int index_own = 0;
320
-
321
- //out-buffer
322
- int n_out = base_array_size + n_in;
323
-
324
- NG_MPI_Send(&n_out, 1, NG_MPI_INT, p_out, 700001, NG_MPI_COMM_WORLD);
325
- int out_buf_size = pkg_size;
326
-
327
- Array<DT> out_buf(out_buf_size);
328
- Array<TKEY> out_dnrs(out_buf_size);
329
-
330
- IntRange r1 (0, pkg_size);
331
- IntRange r2 (pkg_size, 2*pkg_size);
332
-
333
- int index_out = 0;
334
- bool has_extra = (n_out%pkg_size)?1:0;
335
-
336
- if(n_in)
337
- {
338
- //get 1st halve
339
- comm.Recv (in_buf[r1], p_in, 700001);
340
- comm.Recv (in_dnrs[r1], p_in, 700001);
341
-
342
- if(n_in>pkg_size)
343
- {
344
- //get 2nd halve
345
- comm.Recv (in_buf[r2], p_in, 700001);
346
- comm.Recv (in_dnrs[r2], p_in, 700001);
347
- }
348
- }
349
-
350
- bool have1[2];
351
- have1[0] = true;
352
- have1[1] = true;
353
-
354
- // int packages_sent = 0;
355
-
356
-
357
- int iib; //index in buf
358
- while (index_in<n_in && index_own<base_array_size)
359
- {
360
- iib = index_in%in_buf_size;
361
- if(iib == pkg_size && index_in+pkg_size<n_in && !have1[0]) //is at first of 2nd halve - replace first halve
362
- {
363
- comm.Recv (in_buf[r1], p_in, 700001);
364
- comm.Recv (in_dnrs[r1], p_in, 700001);
365
- have1[0] = true;
366
- }
367
- if(iib == 0 && index_in!=0 && index_in+pkg_size<n_in && !have1[1] ) //is at last of 2nd halve - set to 0 and replace 2nd halve
368
- {
369
- comm.Recv (in_buf[r2], p_in, 700001);
370
- comm.Recv (in_dnrs[r2], p_in, 700001);
371
- have1[1] = true;
372
- }
373
- if(in_dnrs[iib] < array_dnrs[index_own])
374
- {
375
- out_buf[index_out] = in_buf[iib];
376
- out_dnrs[index_out++] = in_dnrs[iib];
377
- index_in++;
378
- if(index_in%in_buf_size == 0)
379
- have1[1] = false;
380
- else if(index_in%in_buf_size == pkg_size)
381
- have1[0] = false;
382
- }
383
- else
384
- {
385
- out_buf[index_out] = array[index_own];
386
- out_dnrs[index_out++] = array_dnrs[index_own++];
387
- }
388
- if(index_out == pkg_size)
389
- {
390
- index_out = 0;
391
- comm.Send (out_buf, p_out, 700001);
392
- comm.Send (out_dnrs, p_out, 700001);
393
- // packages_sent++;
394
- }
395
- }
396
- while(index_in<n_in)
397
- {
398
- iib = index_in%in_buf_size;
399
- if(iib == pkg_size && index_in+pkg_size<n_in && !have1[0]) //is at first of 2nd halve - replace first halve
400
- {
401
- comm.Recv (in_buf[r1], p_in, 700001);
402
- comm.Recv (in_dnrs[r1], p_in, 700001);
403
- have1[0] = true;
404
- }
405
- if(iib == 0 && index_in!= 0 && index_in+pkg_size<n_in && !have1[1]) //is at last of 2nd halve - set to 0 and replace 2nd halve
406
- {
407
- comm.Recv (in_buf[r2], p_in, 700001);
408
- comm.Recv (in_dnrs[r2], p_in, 700001);
409
- have1[1] = true;
410
- }
411
- out_buf[index_out] = in_buf[iib];
412
- out_dnrs[index_out++] = in_dnrs[iib];
413
- index_in++;
414
- if(index_in%in_buf_size == 0)
415
- have1[1] = false;
416
- else if(index_in%in_buf_size == pkg_size)
417
- have1[0] = false;
418
- if(index_out == pkg_size)
419
- {
420
- index_out = 0;
421
- comm.Send (out_buf, p_out, 700001);
422
- comm.Send (out_dnrs, p_out, 700001);
423
- // packages_sent++;
424
- }
425
- }
426
- while(index_own<base_array_size)
427
- {
428
- out_buf[index_out] = array[index_own];
429
- out_dnrs[index_out++] = array_dnrs[index_own++];
430
- if(index_out == pkg_size)
431
- {
432
- index_out = 0;
433
- comm.Send (out_buf, p_out, 700001);
434
- comm.Send (out_dnrs, p_out, 700001);
435
- // packages_sent++;
436
- }
437
- }
438
- if(has_extra)
439
- {
440
- comm.Send (out_buf, p_out, 700001);
441
- comm.Send (out_dnrs, p_out, 700001);
442
- // packages_sent++;
443
- }
444
- }
445
-
446
- template<typename DT, NODE_TYPE NT>
447
- void merge_in_in_out (int pkg_size, int rank, int np, int p1, int p2, int p_out)
448
- {
449
- // NG_MPI_Datatype mpi_type_array = MPIT<DT>::mpi_type;
450
- NG_MPI_Datatype mpi_type_array = GetMPIType<DT>();
451
- //get type for keys
452
- // NG_MPI_Datatype mpi_type_key;
453
- // SetMPIType<NT>(&mpi_type_key);
454
- typedef typename key_trait<NT>::TKEY tkey;
455
- NG_MPI_Datatype mpi_type_key = GetMPIType<tkey>();
456
-
457
- int in_buf_size = pkg_size * 2;
458
- DT* a1 = (DT*) malloc (sizeof(DT) * in_buf_size);
459
- tkey* b1 = (tkey*) malloc (sizeof(tkey) * in_buf_size);
460
- DT* a2 = (DT*) malloc (sizeof(DT) * in_buf_size);
461
- tkey* b2 = (tkey*) malloc (sizeof(tkey) * in_buf_size);
462
-
463
- int out_buf_size = pkg_size;
464
- DT* a3 = (DT*) malloc (sizeof(DT) * out_buf_size);
465
- tkey* b3 = (tkey*) malloc (sizeof(tkey) * out_buf_size);
466
-
467
- for(int k=0;k<in_buf_size;k++)
468
- {
469
- a1[k] = a2[k] = -1;
470
- b1[k] = b2[k] = -1;
471
- }
472
- for(int k=0;k<out_buf_size;k++)
473
- {
474
- a3[k] = -1;
475
- b3[k] = -1;
476
- }
477
-
478
- //Communicate sizes
479
- int n_in1, n_in2;
480
- int n_out;
481
- NG_MPI_Recv( &n_in1, 1, NG_MPI_INT, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
482
- NG_MPI_Recv( &n_in2, 1, NG_MPI_INT, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
483
-
484
- n_out = n_in1 + n_in2;
485
- NG_MPI_Send( &n_out, 1, NG_MPI_INT, p_out, 700001, NG_MPI_COMM_WORLD);
486
-
487
-
488
- //initial filling of buffer
489
- if(n_in1)
490
- {
491
- //1st halve, p1
492
- NG_MPI_Recv(a1, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
493
- NG_MPI_Recv(b1, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
494
- if(n_in1>pkg_size)
495
- {
496
- //2nd halve, p1
497
- NG_MPI_Recv(a1+pkg_size, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
498
- NG_MPI_Recv(b1+pkg_size, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
499
- }
500
- }
501
- if(n_in2)
502
- {
503
- //1st halve, p2
504
- NG_MPI_Recv(a2, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
505
- NG_MPI_Recv(b2, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
506
- if(n_in2>pkg_size)
507
- {
508
- //2nd halve, p2
509
- NG_MPI_Recv(a2+pkg_size, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
510
- NG_MPI_Recv(b2+pkg_size, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
511
- }
512
- }
513
-
514
-
515
- // int got_from_p1 = 2;
516
- // int got_from_p2 = 2;
517
- // int packages_sent = 0;
518
- int index1, index2, i3;
519
- index1 = index2 = i3 = 0;
520
-
521
- bool have1[2];
522
- have1[0] = have1[1] = true;
523
- bool have2[2];
524
- have2[0] = have2[1] = true;
525
-
526
-
527
- while(index1<n_in1 && index2<n_in2)
528
- {
529
- int i1 = index1%in_buf_size;
530
- int i2 = index2%in_buf_size;
531
- if(i1==pkg_size && index1+pkg_size<n_in1 && !have1[0]) //replace 1st halve
532
- {
533
- //1st halve, p1
534
- NG_MPI_Recv(a1, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
535
- NG_MPI_Recv(b1, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
536
- have1[0] = true;
537
- // got_from_p1++;
538
- }
539
- else if (i1 == 0 && index1 !=0 && index1+pkg_size<n_in1 && !have1[1]) //replace 2nd halve
540
- {
541
- //2nd halve, p1
542
- NG_MPI_Recv(a1+pkg_size, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
543
- NG_MPI_Recv(b1+pkg_size, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
544
- have1[1] = true;
545
- // got_from_p1++;
546
- }
547
- else if(i2==pkg_size && index2+pkg_size<n_in2 && !have2[0]) //replace 1st halve
548
- {
549
- //1st halve, p2
550
- NG_MPI_Recv(a2, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
551
- NG_MPI_Recv(b2, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
552
- have2[0] = true;
553
- // got_from_p2++;
554
- }
555
- else if (i2 == 0 && index2 !=0 && index2+pkg_size<n_in2 && !have2[1]) //replace 2nd halve
556
- {
557
- have2[1] = true;
558
- NG_MPI_Recv(a2+pkg_size, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
559
- NG_MPI_Recv(b2+pkg_size, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
560
- // got_from_p2++;
561
- }
562
-
563
- if(b1[i1]<b2[i2])
564
- {
565
- b3[i3] = b1[i1];
566
- a3[i3++] = a1[i1];
567
- index1++;
568
- if(index1%in_buf_size == 0)
569
- have1[1] = false;
570
- else if(index1%in_buf_size == pkg_size)
571
- have1[0] = false;
572
- }
573
- else
574
- {
575
- b3[i3] = b2[i2];
576
- a3[i3++] = a2[i2];
577
- index2++;
578
- if(index2%in_buf_size == 0)
579
- have2[1] = false;
580
- else if(index2%in_buf_size == pkg_size)
581
- have2[0] = false;
582
- }
583
-
584
- if(i3==pkg_size)
585
- {
586
- i3 = 0;
587
- NG_MPI_Send(a3, pkg_size, mpi_type_array, p_out, 700001, NG_MPI_COMM_WORLD);
588
- NG_MPI_Send(b3, pkg_size, mpi_type_key, p_out, 700001, NG_MPI_COMM_WORLD);
589
- // packages_sent++;
590
- }
591
-
592
- }
593
- while(index1<n_in1)
594
- {
595
- int i1 = index1%in_buf_size;
596
- if(i1==pkg_size && index1+pkg_size<n_in1 && have1[0] == false) //replace 1st halve
597
- {
598
- //1st halve, p1
599
- NG_MPI_Recv(a1, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
600
- NG_MPI_Recv(b1, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
601
- have1[0] = true;
602
- // got_from_p1++;
603
- }
604
- else if (i1 == 0 && index1 !=0 && index1+pkg_size<n_in1 && have1[1] == false) //replace 2nd halve
605
- {
606
- //2nd halve, p1
607
- NG_MPI_Recv(a1+pkg_size, pkg_size, mpi_type_array, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
608
- NG_MPI_Recv(b1+pkg_size, pkg_size, mpi_type_key, p1, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
609
- have1[1] = true;
610
- // got_from_p1++;
611
- }
612
- b3[i3] = b1[i1];
613
- a3[i3++] = a1[i1];
614
- index1++;
615
- if(index1%in_buf_size == 0)
616
- have1[1] = false;
617
- else if(index1%in_buf_size == pkg_size)
618
- have1[0] = false;
619
- if(i3==pkg_size)
620
- {
621
- i3 = 0;
622
- NG_MPI_Send(a3, pkg_size, mpi_type_array, p_out, 700001, NG_MPI_COMM_WORLD);
623
- NG_MPI_Send(b3, pkg_size, mpi_type_key, p_out, 700001, NG_MPI_COMM_WORLD);
624
- // packages_sent++;
625
- }
626
- }
627
- while(index2<n_in2)
628
- {
629
- int i2 = index2%in_buf_size;
630
- if(i2==pkg_size && index2+pkg_size<n_in2 && have2[0] == false) //replace 1st halve
631
- {
632
- //1st halve, p2
633
- NG_MPI_Recv(a2, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
634
- NG_MPI_Recv(b2, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
635
- have2[0] = true;
636
- // got_from_p2++;
637
- }
638
- else if (i2 == 0 && index2 !=0 && index2+pkg_size<n_in2 && have2[1] == false) //replace 2nd halve
639
- {
640
- NG_MPI_Recv(a2+pkg_size, pkg_size, mpi_type_array, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
641
- NG_MPI_Recv(b2+pkg_size, pkg_size, mpi_type_key, p2, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
642
- have2[1] = true;
643
- // got_from_p2++;
644
- }
645
- b3[i3] = b2[i2];
646
- a3[i3++] = a2[i2];
647
- index2++;
648
- if(index2%in_buf_size == 0)
649
- have2[1] = false;
650
- else if(index2%in_buf_size == pkg_size)
651
- have2[0] = false;
652
- if(i3==pkg_size)
653
- {
654
- i3 = 0;
655
- NG_MPI_Send(a3, pkg_size, mpi_type_array, p_out, 700001, NG_MPI_COMM_WORLD);
656
- NG_MPI_Send(b3, pkg_size, mpi_type_key, p_out, 700001, NG_MPI_COMM_WORLD);
657
- // packages_sent++;
658
- }
659
- }
660
- if(i3!=0)
661
- {
662
- i3 = 0;
663
- NG_MPI_Send(a3, pkg_size, mpi_type_array, p_out, 700001, NG_MPI_COMM_WORLD);
664
- NG_MPI_Send(b3, pkg_size, mpi_type_key, p_out, 700001, NG_MPI_COMM_WORLD);
665
- // packages_sent++;
666
- }
667
-
668
- free(a1);
669
- free(a2);
670
- free(a3);
671
- free(b1);
672
- free(b2);
673
- free(b3);
674
- }
675
-
676
-
677
- void find_ROMS (int rank, int np, int* p1, int* p2)
678
- {
679
- //cout << "rank " << rank << " called _roms " << endl;
680
- int p_in, p_out;
681
- p_in = rank - 1;
682
- if(rank%4==1 && rank+1<np)
683
- p_out = rank+1;
684
- else if(rank%4==1)
685
- {
686
- int q1, q2, q3;
687
- find_SRRMS(rank+1, np, &q1, &q2, &q3, true, false);
688
- p_out = q3;
689
- }
690
- else
691
- p_out = rank-1;
692
- *p1 = p_in;
693
- *p2 = p_out;
694
- //cout << "rank " << rank << " _roms " << p_in << "/" << p_out << endl;
695
-
696
- }
697
-
698
//send, recv+recv, send
//
// Communication partners of a "receive two streams, merge, send" rank.
//
//   rank       : rank whose partners are requested (may be >= np when the
//                function recurses through non-existent ranks)
//   np         : number of ranks
//   p1, p2     : out - the two ranks to receive from
//   p3         : out - the rank to send the merged stream to
//   ignore_in  : if true, input partners >= np are NOT redirected
//   ignore_out : if true, an output partner >= np is NOT redirected
//
// Terminal case (odd rank, or rank <= 0): *p1 = rank-1, *p2 = rank, *p3 = 0.
//
// Otherwise write rank = first_active * m with first_active a power of two
// and m odd, and let block_size = 2*first_active. Then
//   inputs : rank - block_size/4 and rank + block_size/4
//   output : 0                    if block_size >= np,
//            rank + block_size/2  if (rank/block_size) is even,
//            rank - block_size/2  otherwise.
// Partners beyond np-1 are replaced by recursing into that non-existent rank:
// its first input stands in for a missing input (the left input is examined
// first, and only one of the two is redirected), its output stands in for a
// missing output.
//
// first_active is computed directly as the lowest set bit of rank. The former
// trial search only terminated for even ranks in (0, 2*np); for any other
// even rank it doubled its counters until signed overflow.
void find_SRRMS (int rank, int np, int* p1, int* p2, int* p3, bool ignore_in, bool ignore_out)
{
  // Non-positive ranks have no lowest set bit to derive a block size from;
  // they are handled like the odd ranks so the function always terminates.
  if (rank % 2 != 0 || rank <= 0)
    {
      *p1 = rank - 1;
      *p2 = rank;
      *p3 = 0;
      return;
    }

  const int first_active = rank & -rank;   // lowest set bit, >= 2 here
  const int block_size = 2 * first_active;

  int p_in1 = rank - block_size/4;
  int p_in2 = rank + block_size/4;

  int p_out;
  if (block_size >= np)                    // send to 0
    p_out = 0;
  else if ((rank/block_size) % 2 == 0)
    p_out = rank + block_size/2;
  else
    p_out = rank - block_size/2;

  if (!ignore_in)                          // look up, prioritize left
    {
      if (p_in1 > np-1)
        {
          int q1, q2, q3;
          find_SRRMS(p_in1, np, &q1, &q2, &q3, false, true);
          p_in1 = q1;
        }
      else if (p_in2 > np-1)
        {
          int q1, q2, q3;
          find_SRRMS(p_in2, np, &q1, &q2, &q3, false, true);
          p_in2 = q1;
        }
    }

  if (!ignore_out && p_out > np-1)         // look down
    {
      int q1, q2, q3;
      find_SRRMS(p_out, np, &q1, &q2, &q3, true, false);
      p_out = q3;
    }

  *p1 = p_in1;
  *p2 = p_in2;
  *p3 = p_out;
}
779
-
780
- template<typename DT, NODE_TYPE NT, typename TSIZEFUNC, typename TFUNC>
781
- void streamed_key_merge_templated (DT* array,
782
- typename key_trait<NT>::TKEY* array_keys,
783
- int base_array_size, int pkg_size,
784
- TSIZEFUNC sf, TFUNC f)
785
- {
786
- // NG_MPI_Datatype mpi_type_array = MyGetMPIType<DT>();
787
- typedef typename key_trait<NT>::TKEY tkey;
788
- // NG_MPI_Datatype mpi_type_key = MyGetMPIType<tkey>();
789
-
790
- NgMPI_Comm comm(NG_MPI_COMM_WORLD);
791
- int rank = comm.Rank();
792
- int np = comm.Size();
793
- /*
794
- int rank, np;
795
- NG_MPI_Comm_rank(NG_MPI_COMM_WORLD, &rank);
796
- NG_MPI_Comm_size(NG_MPI_COMM_WORLD, &np);
797
- */
798
- bool even = 1-rank%2;
799
- //first step
800
-
801
- if(rank == 0)
802
- {
803
- NgMPI_Requests requests;
804
- //packaged_send
805
- packaged_buffered_send<DT,NT>(rank, np, array, array_keys, base_array_size, pkg_size, 1, requests);
806
-
807
- int n;
808
- NG_MPI_Recv(&n, 1, NG_MPI_INT, NG_MPI_ANY_SOURCE, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
809
- int n_pkg = n/pkg_size + ( (n%pkg_size)?1:0);
810
-
811
- sf(n);
812
-
813
- /*
814
- DT* end = (DT*) malloc(pkg_size * sizeof(DT));
815
- tkey* end_keys = (tkey*) malloc(pkg_size * sizeof(tkey));
816
- */
817
- Array<DT> end(pkg_size);
818
- Array<tkey> end_keys(pkg_size);
819
-
820
- for(int k=0;k<n_pkg-1;k++)
821
- {
822
- // NG_MPI_Recv(&end[0] , pkg_size, mpi_type_array, NG_MPI_ANY_SOURCE, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
823
- // NG_MPI_Recv(&end_keys[0], pkg_size, mpi_type_key , NG_MPI_ANY_SOURCE, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
824
-
825
- comm.Recv(end, NG_MPI_ANY_SOURCE, 700001);
826
- comm.Recv(end_keys, NG_MPI_ANY_SOURCE, 700001);
827
-
828
- //cout << "0 received pkg " << k << "/" << n_pkg << endl;
829
- for(int j = 0; j < pkg_size; j++)
830
- f(end_keys[j], end[j]);
831
- }
832
- // NG_MPI_Recv(&end[0] , pkg_size, mpi_type_array, NG_MPI_ANY_SOURCE, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
833
- // NG_MPI_Recv(&end_keys[0], pkg_size, mpi_type_key , NG_MPI_ANY_SOURCE, 700001, NG_MPI_COMM_WORLD, NG_MPI_STATUS_IGNORE);
834
- comm.Recv(end, NG_MPI_ANY_SOURCE, 700001);
835
- comm.Recv(end_keys, NG_MPI_ANY_SOURCE, 700001);
836
-
837
- for(int j=0;(n_pkg-1)*pkg_size+j < n;j++)
838
- f(end_keys[j], end[j]);
839
- requests.WaitAll();
840
- // free(end);
841
- // free(end_keys);
842
- }
843
- else if(even)
844
- {
845
- // -> RRM
846
- int p_in1, p_in2, p_out;
847
- find_SRRMS (rank, np, &p_in1, &p_in2, &p_out, false, false);
848
- if(np-1 == rank) //is on right border
849
- {
850
- //cout << "rank " << rank << " (irregularly) gets from " << p_in1 << " and sends to " << p_out << endl;
851
- merge_own_in_out <DT,NT> (rank, np, pkg_size, array, array_keys, base_array_size, p_in1, p_out);
852
- }
853
- else //regular
854
- {
855
- //cout << "rank " << rank << " sends to " << rank+1 << " then gets from " << p_in1 << "/" << p_in2 << " and sends to " << p_out << endl;
856
- NgMPI_Requests requests;
857
- packaged_buffered_send<DT,NT>(rank, np, array, array_keys, base_array_size, pkg_size, rank+1, requests);
858
- merge_in_in_out<DT,NT>(pkg_size, rank, np, p_in1, p_in2, p_out);
859
- requests.WaitAll();
860
- }
861
- }
862
- else
863
- {
864
- // ROM ->
865
- int p_in,p_out;
866
- find_ROMS(rank, np, &p_in, &p_out);
867
- //cout << "rank " << rank << " gets from " << p_in << " and sends to " << p_out << endl;
868
- merge_own_in_out<DT,NT>(rank, np, pkg_size, array, array_keys, base_array_size, p_in, p_out);
869
- }
870
- }
871
-
872
- template <class T>
873
- void MyQuickSortI (FlatArray<T> data, FlatArray<int> index)
874
- {
875
- if (index.Size() <= 1) return;
876
-
877
- int i = 0;
878
- int j = index.Size()-1;
879
-
880
- int midval = index[ (i+j)/2 ];
881
-
882
- do
883
- {
884
- while (data[index[i]] < data[midval]) i++;
885
- while (data[midval] < data[index[j]]) j--;
886
- /*
887
- while (less (data[index[i]],data[midval]) ) i++;
888
- while (less (data[midval], data[index[j]])) j--;
889
- */
890
-
891
- if (i <= j)
892
- {
893
- Swap (index[i], index[j]);
894
- i++; j--;
895
- }
896
- }
897
- while (i <= j);
898
-
899
- MyQuickSortI (data, index.Range (0, j+1));
900
- MyQuickSortI (data, index.Range (i, index.Size()));
901
- }
902
-
903
-
904
-
905
-
906
-
907
-
908
- template <NODE_TYPE NT, typename T, typename TSIZEFUNC, typename TFUNC>
909
- void GatherNodalData (const MeshAccess & ma, FlatArray<T> data,
910
- TSIZEFUNC sf, TFUNC f)
911
- {
912
- typedef typename key_trait<NT>::TKEY TKEY;
913
-
914
- Array<T> local_data;
915
- Array<TKEY> global_keys;
916
-
917
- // gather local data where I am master
918
- auto comm = ma.GetCommunicator();
919
- int myid = comm.Rank();
920
- for (int i = 0; i < ma.GetNNodes(NT); i++)
921
- {
922
- bool ismaster = true;
923
- for (int p : ma.GetDistantProcs (Node(NT,i)))
924
- if (p < myid) ismaster = false;
925
-
926
- if (ismaster)
927
- {
928
- local_data.Append (data[i]);
929
- TKEY key1 = GetGlobalNodeId<NT>(ma,i);
930
- global_keys.Append (key1);
931
- }
932
- }
933
-
934
- Array<int> index (local_data.Size());
935
- for (int k = 0; k < index.Size(); k++) index[k] = k;
936
-
937
- MyQuickSortI (global_keys, index);
938
-
939
- local_data = Array<T> (local_data[index]);
940
- global_keys = Array<TKEY> (global_keys[index]);
941
-
942
-
943
- streamed_key_merge_templated<T,NT> (&local_data[0], &global_keys[0], local_data.Size(), 10000, sf, f);
944
- }
945
-
946
-
947
-
948
- }
949
- #endif