ngsolve 6.2.2506.post75.dev0__cp314-cp314-manylinux_2_28_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of ngsolve might be problematic. Click here for more details.
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngs_nvcc +14 -0
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngs_nvlink +14 -0
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngscxx +15 -0
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngsld +11 -0
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngsolve.tcl +648 -0
- ngsolve-6.2.2506.post75.dev0.data/data/bin/ngspy +2 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/analytic_integrals.hpp +10 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/arnoldi.hpp +55 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bandmatrix.hpp +334 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/basematrix.hpp +957 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/basevector.hpp +1268 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bdbequations.hpp +2805 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bdbintegrator.hpp +1660 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bem_diffops.hpp +475 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bessel.hpp +1064 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bilinearform.hpp +963 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bla.hpp +29 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/blockalloc.hpp +95 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/blockjacobi.hpp +328 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/bspline.hpp +116 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/calcinverse.hpp +141 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cg.hpp +368 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/chebyshev.hpp +44 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cholesky.hpp +720 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/clapack.h +7254 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/code_generation.hpp +296 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/coefficient.hpp +2033 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/coefficient_impl.hpp +19 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/coefficient_stdmath.hpp +167 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/commutingAMG.hpp +106 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/comp.hpp +79 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/compatibility.hpp +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/complex_wrapper.hpp +73 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/compressedfespace.hpp +110 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/contact.hpp +235 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cuda_linalg.hpp +175 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cuda_ngbla.hpp +226 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cuda_ngstd.hpp +527 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/cuda_profiler.hpp +240 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/diagonalmatrix.hpp +154 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/differentialoperator.hpp +276 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/diffop.hpp +1286 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/diffop_impl.hpp +328 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/diffopwithfactor.hpp +123 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/discontinuous.hpp +84 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/dump.hpp +949 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ectypes.hpp +121 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/eigen.hpp +60 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/eigensystem.hpp +18 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/elasticity_equations.hpp +595 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/elementbyelement.hpp +195 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/elementtopology.hpp +1760 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/elementtransformation.hpp +339 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/evalfunc.hpp +405 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/expr.hpp +1686 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/facetfe.hpp +175 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/facetfespace.hpp +180 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/facethofe.hpp +111 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/facetsurffespace.hpp +112 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/fe_interfaces.hpp +32 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/fem.hpp +87 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/fesconvert.hpp +14 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/fespace.hpp +1449 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/finiteelement.hpp +286 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/globalinterfacespace.hpp +77 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/globalspace.hpp +115 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/gridfunction.hpp +525 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1amg.hpp +124 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1hofe.hpp +188 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1hofe_impl.hpp +1262 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1hofefo.hpp +148 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1hofefo_impl.hpp +185 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1hofespace.hpp +167 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1lofe.hpp +1240 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/h1lumping.hpp +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurl_equations.hpp +1381 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlcurlfe.hpp +2241 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlcurlfespace.hpp +78 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlfe.hpp +259 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlfe_utils.hpp +107 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlhdiv_dshape.hpp +857 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlhdivfes.hpp +308 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlhofe.hpp +175 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlhofe_impl.hpp +1871 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurlhofespace.hpp +193 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hcurllofe.hpp +1146 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdiv_equations.hpp +880 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivdivfe.hpp +2923 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivdivsurfacespace.hpp +76 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivfe.hpp +206 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivfe_utils.hpp +717 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivfes.hpp +75 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivhofe.hpp +447 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivhofe_impl.hpp +1107 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivhofefo.hpp +229 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivhofespace.hpp +177 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivhosurfacefespace.hpp +106 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hdivlofe.hpp +773 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hidden.hpp +74 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/householder.hpp +181 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hypre_ams_precond.hpp +123 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/hypre_precond.hpp +73 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/integrator.hpp +2012 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/integratorcf.hpp +253 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/interpolate.hpp +49 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/intrule.hpp +2542 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/intrules_SauterSchwab.hpp +25 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/irspace.hpp +49 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/jacobi.hpp +153 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/kernels.hpp +762 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/l2hofe.hpp +194 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/l2hofe_impl.hpp +564 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/l2hofefo.hpp +542 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/l2hofespace.hpp +344 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/la.hpp +38 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/linalg_kernels.hpp +102 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/linearform.hpp +266 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/matrix.hpp +2140 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/memusage.hpp +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/meshaccess.hpp +1359 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/mgpre.hpp +204 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/mp_coefficient.hpp +145 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/mptools.hpp +2281 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/multigrid.hpp +42 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/multivector.hpp +447 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/mumpsinverse.hpp +187 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/mycomplex.hpp +361 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ng_lapack.hpp +1661 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngblas.hpp +1232 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngs_defines.hpp +30 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngs_stdcpp_include.hpp +106 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngs_utils.hpp +121 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngsobject.hpp +1019 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngsstream.hpp +113 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/ngstd.hpp +72 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/nodalhofe.hpp +96 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/nodalhofe_impl.hpp +141 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/normalfacetfe.hpp +223 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/normalfacetfespace.hpp +98 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/normalfacetsurfacefespace.hpp +84 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/order.hpp +251 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/parallel_matrices.hpp +222 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/paralleldofs.hpp +340 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/parallelngs.hpp +23 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/parallelvector.hpp +269 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/pardisoinverse.hpp +200 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/periodic.hpp +129 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/plateaufespace.hpp +25 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/pml.hpp +275 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/pmltrafo.hpp +631 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/postproc.hpp +142 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/potentialtools.hpp +22 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/precomp.hpp +60 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/preconditioner.hpp +602 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/prolongation.hpp +377 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/python_comp.hpp +107 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/python_fem.hpp +89 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/python_linalg.hpp +58 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/python_ngstd.hpp +386 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/recursive_pol.hpp +4896 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/recursive_pol_tet.hpp +395 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/recursive_pol_trig.hpp +492 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/reorderedfespace.hpp +81 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/sample_sort.hpp +105 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/scalarfe.hpp +335 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/shapefunction_utils.hpp +113 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/simd_complex.hpp +329 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/smoother.hpp +253 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/solve.hpp +89 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/sparsecholesky.hpp +313 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/sparsematrix.hpp +1038 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/sparsematrix_dyn.hpp +90 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/sparsematrix_impl.hpp +1013 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/special_matrix.hpp +463 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/specialelement.hpp +125 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/statushandler.hpp +33 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/stringops.hpp +12 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/superluinverse.hpp +136 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/symbolicintegrator.hpp +850 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/symmetricmatrix.hpp +144 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tangentialfacetfe.hpp +224 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tangentialfacetfespace.hpp +91 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tensor.hpp +522 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tensorcoefficient.hpp +446 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tensorproductintegrator.hpp +113 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/thcurlfe.hpp +128 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/thcurlfe_impl.hpp +380 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/thdivfe.hpp +80 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/thdivfe_impl.hpp +492 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tpdiffop.hpp +461 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tpfes.hpp +133 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tpintrule.hpp +224 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/triangular.hpp +465 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tscalarfe.hpp +245 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/tscalarfe_impl.hpp +1029 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/umfpackinverse.hpp +148 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/unifiedvector.hpp +103 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/vector.hpp +1273 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/voxelcoefficientfunction.hpp +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/vtkoutput.hpp +198 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/vvector.hpp +208 -0
- ngsolve-6.2.2506.post75.dev0.data/data/include/netgen/webgui.hpp +92 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/cmake/ngsolve/NGSolveConfig.cmake +102 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/cmake/ngsolve/ngsolve-targets-release.cmake +89 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/cmake/ngsolve/ngsolve-targets.cmake +173 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngbla.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngcomp.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngfem.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngla.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngsbem.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngscudalib.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngsolve.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/netgen_mesher.libs/libngstd.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/TensorProductTools.py +210 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/__console.py +94 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/__expr.py +181 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/__init__.py +148 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/_scikit_build_core_dependencies.py +30 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/bvp.py +78 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/config/__init__.py +1 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/config/__main__.py +4 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/config/config.py +60 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/TensorProduct/__init__.py +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/TensorProduct/tp_dg_1d_1d.py +80 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/TensorProduct/tp_dg_1d_2d.py +73 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/TensorProduct/tp_dg_2d_1d.py +72 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/TensorProduct/tp_dg_2d_2d.py +66 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/__init__.py +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/__init__.py +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/hhj.py +44 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/hybrid_dg.py +53 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/mixed.py +30 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/nonlin.py +29 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/pickling.py +26 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/pml.py +31 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/taskmanager.py +20 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/tdnns.py +47 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/timeDG-skeleton.py +45 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/timeDG.py +38 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/timeDGlap.py +42 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/howto/timeDGwave.py +61 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/__init__.py +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/adaptive.py +123 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/cmagnet.py +59 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/elasticity.py +76 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/navierstokes.py +74 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/poisson.ipynb +170 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/intro/poisson.py +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/mpi/__init__.py +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/mpi/mpi_cmagnet.py +87 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/mpi/mpi_navierstokes.py +117 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/mpi/mpi_poisson.py +89 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/demos/mpi/mpi_timeDG.py +82 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/directsolvers.py +26 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/eigenvalues.py +364 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/internal.py +89 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/krylovspace.py +1013 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/meshes.py +748 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/ngs2petsc.py +310 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/ngscuda.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/ngscxx.py +42 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/ngslib.so +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/nonlinearsolvers.py +203 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/preconditioners.py +11 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/solve_implementation.py +168 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/solvers.py +7 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/timestepping.py +185 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/timing.py +108 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/utils.py +167 -0
- ngsolve-6.2.2506.post75.dev0.data/data/lib/python3.14/site-packages/ngsolve/webgui.py +670 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/beam.geo +17 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/beam.vol +240 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/chip.in2d +41 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/chip.vol +614 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/coil.geo +12 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/coil.vol +2560 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/coilshield.geo +24 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/coilshield.vol +3179 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/cube.geo +19 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/cube.vol +1832 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d10_DGdoubleglazing.pde +50 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d11_chip_nitsche.pde +40 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d1_square.pde +43 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d2_chip.pde +35 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d3_helmholtz.pde +22 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d4_cube.pde +46 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d5_beam.pde +74 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d6_shaft.pde +73 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d7_coil.pde +50 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d8_coilshield.pde +49 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/d9_hybridDG.pde +72 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/doubleglazing.in2d +27 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/doubleglazing.vol +737 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/piezo2d40round4.vol.gz +0 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/shaft.geo +73 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/shaft.vol +4291 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/square.in2d +17 -0
- ngsolve-6.2.2506.post75.dev0.data/data/share/ngsolve/square.vol +149 -0
- ngsolve-6.2.2506.post75.dev0.dist-info/METADATA +14 -0
- ngsolve-6.2.2506.post75.dev0.dist-info/RECORD +303 -0
- ngsolve-6.2.2506.post75.dev0.dist-info/WHEEL +5 -0
- ngsolve-6.2.2506.post75.dev0.dist-info/licenses/LICENSE +504 -0
- ngsolve-6.2.2506.post75.dev0.dist-info/top_level.txt +1 -0
|
@@ -0,0 +1,527 @@
|
|
|
1
|
+
#ifndef CUDA_NGSTD_HPP
|
|
2
|
+
#define CUDA_NGSTD_HPP
|
|
3
|
+
|
|
4
|
+
#include <cuda_runtime.h>
|
|
5
|
+
#include <ngstd.hpp>
|
|
6
|
+
|
|
7
|
+
#include "cuda_profiler.hpp"
|
|
8
|
+
|
|
9
|
+
namespace ngs_cuda
|
|
10
|
+
{
|
|
11
|
+
using namespace ngstd;
|
|
12
|
+
|
|
13
|
+
// from CUDA C++ Programming Guide:
|
|
14
|
+
// https://docs.nvidia.com/cuda/cuda-c-programming-guide/index.html#atomic-functions
|
|
15
|
+
#ifdef __CUDA_ARCH__
|
|
16
|
+
#if __CUDA_ARCH__ < 600
|
|
17
|
+
// Double-precision atomicAdd built on top of the 64-bit atomicCAS.
// Adds val to *address and returns the value that was stored there before
// the addition took effect.
inline __device__ double atomicAdd(double* address, double val)
{
  unsigned long long int * const bits = (unsigned long long int*)address;
  unsigned long long int observed = *bits;
  unsigned long long int expected;

  do
    {
      // Try to publish (expected + val); atomicCAS hands back whatever was
      // actually stored, which equals `expected` only if the swap succeeded.
      expected = observed;
      observed = atomicCAS(bits, expected,
                           __double_as_longlong(val + __longlong_as_double(expected)));

      // Note: uses integer comparison to avoid hang in case of NaN (since NaN != NaN)
    }
  while (expected != observed);

  return __longlong_as_double(observed);
}
|
|
34
|
+
#endif
|
|
35
|
+
#endif
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
extern int gpu_clock;
|
|
39
|
+
void InitCUDA (int verbose = 2);
|
|
40
|
+
|
|
41
|
+
|
|
42
|
+
/**
   A value of type T that is addressed through a device pointer.

   Malloc() obtains storage with cudaMalloc. The host-side D2H / H2D helpers
   pass &data to cudaMemcpy as the device-side address, so they are meant to
   be called through pointers obtained from Malloc(). The members marked
   __device__ read and write data directly.
*/
template <typename T>
class Dev
{
public:
  T data;

  /// Allocates size*sizeof(T) bytes with cudaMalloc.
  /// Throws Exception carrying the CUDA error code if the allocation fails.
  static Dev<T> * Malloc(size_t size)
  {
    Dev<T> * ptr;
    if (auto err = cudaMalloc (&ptr, size*sizeof(T)))
      throw Exception("cudaMalloc error, ec="+ToString(err));
    return ptr;
  }

  /// Releases memory obtained from Malloc().
  /// The cudaFree result is deliberately not turned into an exception,
  /// because this function is called from destructors.
  static void Free(Dev<T> * data)
  {
    cudaFree (data);
  }

  /// Copies this single value to the host and returns it.
  /// Throws Exception if the copy fails (instead of returning an
  /// uninitialized value).
  T D2H() const
  {
    T res;
    if (auto err = cudaMemcpy (&res, &data, sizeof(T), cudaMemcpyDeviceToHost))
      throw Exception("cudaMemcpy D2H error, ec="+ToString(err));
    return res;
  }

  /// Copies the host value val into this single value.
  /// Throws Exception if the copy fails.
  void H2D (T val)
  {
    if (auto err = cudaMemcpy (&data, &val, sizeof(T), cudaMemcpyHostToDevice))
      throw Exception("cudaMemcpy H2D error, ec="+ToString(err));
  }

  /// Copies hosta.Size() consecutive values, starting at this one, into the
  /// host array hosta. Throws Exception if the copy fails.
  void D2H (FlatArray<T> hosta)
  {
    if (auto err = cudaMemcpy (hosta.Data(), &data, hosta.Size()*sizeof(T), cudaMemcpyDeviceToHost))
      throw Exception("cudaMemcpy D2H error, ec="+ToString(err));
  }

  /// Copies the host array hosta into hosta.Size() consecutive values
  /// starting at this one. Throws Exception if the copy fails.
  void H2D (FlatArray<T> hosta)
  {
    if (auto err = cudaMemcpy (&data, hosta.Data(), hosta.Size()*sizeof(T), cudaMemcpyHostToDevice))
      throw Exception("cudaMemcpy H2D error, ec="+ToString(err));
  }

  // Device-side access: assignment from and conversion to the wrapped type.
  __device__ Dev<T> & operator= (T d2) { data = d2; return *this; }
  __device__ operator T() const { return data; }

  // Device-side compound assignments, forwarded to the wrapped value.
  template <typename T2>
  __device__ auto & operator+= (T2 other) { data += other; return *this; }
  template <typename T2>
  __device__ auto & operator-= (T2 other) { data -= other; return *this; }
  template <typename T2>
  __device__ auto & operator*= (T2 other) { data *= other; return *this; }
};
|
|
94
|
+
|
|
95
|
+
}
|
|
96
|
+
|
|
97
|
+
namespace ngcore {
|
|
98
|
+
// IsSafe specialization for Dev<...>: an object of this trait type converts
// to true in constant expressions.
// NOTE(review): what "safe" implies is defined by the primary IsSafe template
// in ngcore, which is not visible here -- confirm there.
template <typename ElementT>
struct IsSafe<ngs_cuda::Dev<ElementT>>
{
  constexpr operator bool() const
  {
    return true;
  }
};
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
|
|
105
|
+
namespace ngs_cuda
|
|
106
|
+
{
|
|
107
|
+
|
|
108
|
+
/*
|
|
109
|
+
template <typename T>
|
|
110
|
+
class DevVar
|
|
111
|
+
{
|
|
112
|
+
T * ptr;
|
|
113
|
+
public:
|
|
114
|
+
DevVar()
|
|
115
|
+
{
|
|
116
|
+
cudaMalloc (&ptr, sizeof(T));
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
DevVar(T val)
|
|
120
|
+
{
|
|
121
|
+
cudaMalloc (&ptr, sizeof(T));
|
|
122
|
+
cudaMemcpy (ptr, &val, sizeof(T), cudaMemcpyHostToDevice);
|
|
123
|
+
}
|
|
124
|
+
|
|
125
|
+
operator T () const
|
|
126
|
+
{
|
|
127
|
+
T tmp;
|
|
128
|
+
cudaMemcpy (&tmp, ptr, sizeof(T), cudaMemcpyDeviceToHost);
|
|
129
|
+
return tmp;
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
T * DevPtr() const { return ptr; }
|
|
133
|
+
T & DevRef() const { return *ptr; }
|
|
134
|
+
|
|
135
|
+
};
|
|
136
|
+
|
|
137
|
+
template <typename T>
|
|
138
|
+
inline ostream & operator<< (ostream & ost, DevVar<T> & var)
|
|
139
|
+
{
|
|
140
|
+
ost << T(var);
|
|
141
|
+
return ost;
|
|
142
|
+
}
|
|
143
|
+
*/
|
|
144
|
+
|
|
145
|
+
// TODO: Resize + error checking
|
|
146
|
+
/**
   One block of memory obtained from cudaMalloc, handed out in stack order.

   Alloc() returns the current stack pointer and advances it; Free() moves
   the stack pointer back to the given address. No capacity is stored, so
   requests are not checked against the size of the block.

   The data members are kept exactly as before (two pointers) so that the
   object layout does not change.
*/
class DevStackMemory
{
  char * data = nullptr;      // start of the block, nullptr if allocation failed
  char * stackptr = nullptr;  // next address handed out by Alloc()
public:
  /// Allocates a block of s bytes.
  /// A failed cudaMalloc is not reported here; it leaves the object without
  /// backing memory, which Alloc() reports on first use.
  // NOTE(review): the default 512*1024*1025 looks like a typo for
  // 512*1024*1024 -- confirm before changing it.
  DevStackMemory (size_t s = 512*1024*1025)
  {
    if (cudaMalloc (&data, s) != cudaSuccess)
      data = nullptr;   // do not rely on what cudaMalloc leaves in data on failure
    stackptr = data;
  }

  /// Releases the block; cudaFree is called with nullptr if allocation failed.
  ~DevStackMemory ()
  {
    cudaFree (data);
  }

  /// Reserves room for s objects of type T and returns the start address.
  /// The reserved byte count is rounded up to a multiple of 256.
  /// Throws Exception if the constructor could not allocate the block.
  template <typename T>
  T * Alloc (size_t s)
  {
    if (!data)
      throw Exception("DevStackMemory: device memory block was not allocated");

    char * tmp = stackptr;
    s *= sizeof(T);
    s = (s+255) & size_t(-256);   // round up to the next multiple of 256
    stackptr += s;
    return reinterpret_cast<T*>(tmp);
  }

  /// Moves the stack pointer back to ptr, which must have been returned by
  /// Alloc(); everything handed out after ptr is given up as well.
  void Free (void * ptr)
  {
    stackptr = reinterpret_cast<char*> (ptr);
  }
};
|
|
177
|
+
|
|
178
|
+
extern DevStackMemory stackmemory;
|
|
179
|
+
|
|
180
|
+
/**
   FlatArray of Dev<T> whose storage is taken from the global stackmemory.

   The constructor reserves room for s elements via stackmemory.Alloc, the
   destructor passes the start address back to stackmemory.Free.
*/
template <typename T>
class DevStackArray : public FlatArray<Dev<T>>
{
public:
  /// Reserves s elements from stackmemory.
  DevStackArray (size_t s)
    : FlatArray<Dev<T>> (s, (Dev<T>*)stackmemory.Alloc<T>(s))
  { }

  /// Returns the storage to stackmemory.
  ~DevStackArray ()
  {
    stackmemory.Free(this->data);
  }

  /// The element storage viewed as a plain T pointer.
  T * DevData () const
  {
    return (T*)this->data;
  }
};
|
|
193
|
+
}
|
|
194
|
+
|
|
195
|
+
namespace std {
|
|
196
|
+
// Dev<T> reports the same is_integral result as the wrapped type T.
// Deriving from integral_constant supplies value together with the members
// a type trait is expected to have (type, value_type, conversion to bool),
// instead of value alone.
// NOTE(review): the C++ standard does not permit user specializations of
// std::is_integral; a project-owned trait would be the conforming
// alternative -- confirm which callers rely on this specialization.
template <typename T>
struct is_integral<ngs_cuda::Dev<T>>
  : integral_constant<bool, is_integral<T>::value>
{
};
|
|
200
|
+
}
|
|
201
|
+
|
|
202
|
+
|
|
203
|
+
|
|
204
|
+
namespace ngcore
|
|
205
|
+
{
|
|
206
|
+
using ngs_cuda::Dev;
|
|
207
|
+
template <typename T>
|
|
208
|
+
class Array<Dev<T>> : public FlatArray<Dev<T>>
|
|
209
|
+
{
|
|
210
|
+
public:
|
|
211
|
+
Array() = default;
|
|
212
|
+
Array (size_t s)
|
|
213
|
+
: FlatArray<Dev<T>>(s, Dev<T>::Malloc(s)) { } ;
|
|
214
|
+
Array (FlatArray<T> a2)
|
|
215
|
+
: Array(a2.Size())
|
|
216
|
+
{
|
|
217
|
+
this->data->H2D(a2);
|
|
218
|
+
}
|
|
219
|
+
|
|
220
|
+
Array& operator= (Array<Dev<T>> && a2)
|
|
221
|
+
{
|
|
222
|
+
Swap (this->data, a2.data);
|
|
223
|
+
Swap (this->size, a2.size);
|
|
224
|
+
return *this;
|
|
225
|
+
}
|
|
226
|
+
|
|
227
|
+
Array& operator= (FlatArray<T> a2)
|
|
228
|
+
{
|
|
229
|
+
SetSize(a2.Size());
|
|
230
|
+
this->data->H2D(a2);
|
|
231
|
+
return *this;
|
|
232
|
+
}
|
|
233
|
+
|
|
234
|
+
void SetSize(size_t s)
|
|
235
|
+
{
|
|
236
|
+
if (this->Size() != s)
|
|
237
|
+
{
|
|
238
|
+
Dev<T>::Free(this->data);
|
|
239
|
+
this->data = Dev<T>::Malloc(s);
|
|
240
|
+
this->size = s;
|
|
241
|
+
}
|
|
242
|
+
}
|
|
243
|
+
|
|
244
|
+
~Array()
|
|
245
|
+
{
|
|
246
|
+
Dev<T>::Free(this->data);
|
|
247
|
+
}
|
|
248
|
+
};
|
|
249
|
+
}
|
|
250
|
+
|
|
251
|
+
|
|
252
|
+
namespace ngs_cuda
|
|
253
|
+
{
|
|
254
|
+
// use Array<Dev<T>> instead
|
|
255
|
+
template <typename T>
|
|
256
|
+
class [[deprecated]] DevArray
|
|
257
|
+
{
|
|
258
|
+
int size;
|
|
259
|
+
T * dev_data;
|
|
260
|
+
|
|
261
|
+
public:
|
|
262
|
+
DevArray (int asize)
|
|
263
|
+
{
|
|
264
|
+
size = asize;
|
|
265
|
+
cudaMalloc((T**)&dev_data, size*sizeof(T));
|
|
266
|
+
}
|
|
267
|
+
|
|
268
|
+
DevArray (FlatArray<T> a2)
|
|
269
|
+
{
|
|
270
|
+
size = a2.Size();
|
|
271
|
+
cudaMalloc((T**)&dev_data, size*sizeof(T));
|
|
272
|
+
cudaMemcpy (dev_data, &a2[0], sizeof(T)*size, cudaMemcpyHostToDevice);
|
|
273
|
+
}
|
|
274
|
+
|
|
275
|
+
~DevArray ()
|
|
276
|
+
{
|
|
277
|
+
cudaFree (dev_data);
|
|
278
|
+
}
|
|
279
|
+
|
|
280
|
+
T * DevPtr() { return dev_data; }
|
|
281
|
+
|
|
282
|
+
DevArray & operator= (FlatArray<T> a2)
|
|
283
|
+
{
|
|
284
|
+
cudaMemcpy (dev_data, &a2[0], sizeof(T)*size, cudaMemcpyHostToDevice);
|
|
285
|
+
return *this;
|
|
286
|
+
}
|
|
287
|
+
|
|
288
|
+
void D2H (FlatArray<T> a2) const
|
|
289
|
+
{
|
|
290
|
+
cudaMemcpy (&a2[0], dev_data, sizeof(T)*size, cudaMemcpyDeviceToHost);
|
|
291
|
+
}
|
|
292
|
+
|
|
293
|
+
INLINE int Size() const { return size; }
|
|
294
|
+
|
|
295
|
+
/*
|
|
296
|
+
INLINE operator FlatArray<T> ()
|
|
297
|
+
{
|
|
298
|
+
return FlatArray<T> (size, dev_data);
|
|
299
|
+
}
|
|
300
|
+
*/
|
|
301
|
+
INLINE FlatArray<T> Dev() const
|
|
302
|
+
{
|
|
303
|
+
return FlatArray<T> (size, dev_data);
|
|
304
|
+
}
|
|
305
|
+
|
|
306
|
+
explicit INLINE operator Array<T> () const
|
|
307
|
+
{
|
|
308
|
+
Array<T> temp(size);
|
|
309
|
+
#ifdef __CUDA_ARCH__
|
|
310
|
+
temp = FlatArray<T> (*this);
|
|
311
|
+
#else
|
|
312
|
+
D2H (temp);
|
|
313
|
+
#endif
|
|
314
|
+
return temp;
|
|
315
|
+
}
|
|
316
|
+
|
|
317
|
+
INLINE Array<T> Host() const
|
|
318
|
+
{
|
|
319
|
+
return Array<T> (*this);
|
|
320
|
+
}
|
|
321
|
+
|
|
322
|
+
T * DevData() const { return dev_data; }
|
|
323
|
+
};
|
|
324
|
+
|
|
325
|
+
|
|
326
|
+
|
|
327
|
+
template <typename T>
|
|
328
|
+
inline Array<T> D2H (FlatArray<Dev<T>> deva)
|
|
329
|
+
{
|
|
330
|
+
Array<T> hosta(deva.Size());
|
|
331
|
+
cudaMemcpy (hosta.Data(), deva.Data(), sizeof(T)*hosta.Size(), cudaMemcpyDeviceToHost);
|
|
332
|
+
return hosta;
|
|
333
|
+
}
|
|
334
|
+
|
|
335
|
+
template <typename T>
|
|
336
|
+
inline void H2D (FlatArray<Dev<T>> deva, FlatArray<T> hosta)
|
|
337
|
+
{
|
|
338
|
+
cudaMemcpy (deva.Data(), hosta.Data(), sizeof(T)*hosta.Size(), cudaMemcpyHostToDevice);
|
|
339
|
+
}
|
|
340
|
+
|
|
341
|
+
/*
|
|
342
|
+
template <class T>
|
|
343
|
+
class TableWrapper : public Table<T>
|
|
344
|
+
{
|
|
345
|
+
using Table<T>::size;
|
|
346
|
+
using Table<T>::data;
|
|
347
|
+
using Table<T>::index;
|
|
348
|
+
public:
|
|
349
|
+
INLINE TableWrapper (int asize, int * aindex, T * adata)
|
|
350
|
+
// : Table<T> (0,0)
|
|
351
|
+
{
|
|
352
|
+
size = asize;
|
|
353
|
+
index = aindex;
|
|
354
|
+
data = adata;
|
|
355
|
+
}
|
|
356
|
+
|
|
357
|
+
INLINE TableWrapper (const Table<T> & tab)
|
|
358
|
+
// : Table<T> (0,0)
|
|
359
|
+
{
|
|
360
|
+
const TableWrapper<T> & htab = static_cast<const TableWrapper<T>&> (tab);
|
|
361
|
+
size = htab.size;
|
|
362
|
+
data = htab.data;
|
|
363
|
+
index = htab.index;
|
|
364
|
+
}
|
|
365
|
+
INLINE ~TableWrapper ()
|
|
366
|
+
{
|
|
367
|
+
data = NULL;
|
|
368
|
+
index = NULL;
|
|
369
|
+
}
|
|
370
|
+
|
|
371
|
+
INLINE int SizeData() { return index[size]; }
|
|
372
|
+
INLINE int* & Index() { return index; }
|
|
373
|
+
INLINE T* & Data() { return data; }
|
|
374
|
+
|
|
375
|
+
// HD const int * & Index() const { return index; }
|
|
376
|
+
// HD const T * & Data() const { return data; }
|
|
377
|
+
};
|
|
378
|
+
*/
|
|
379
|
+
|
|
380
|
+
|
|
381
|
+
|
|
382
|
+
// only data at device, but index at host
|
|
383
|
+
template <typename T>
|
|
384
|
+
class DevDataTable
|
|
385
|
+
{
|
|
386
|
+
int size;
|
|
387
|
+
size_t * index = nullptr;
|
|
388
|
+
Dev<T> * dev_data = nullptr;
|
|
389
|
+
|
|
390
|
+
public:
|
|
391
|
+
|
|
392
|
+
DevDataTable (FlatTable<T> t2)
|
|
393
|
+
{
|
|
394
|
+
size = t2.Size();
|
|
395
|
+
if (size == 0) return;
|
|
396
|
+
|
|
397
|
+
index = new size_t[size+1];
|
|
398
|
+
for (int i = 0; i <= size; i++)
|
|
399
|
+
index[i] = t2.IndexArray()[i];
|
|
400
|
+
|
|
401
|
+
int sizedata = t2.AsArray().Size();
|
|
402
|
+
dev_data = Dev<T>::Malloc(sizedata);
|
|
403
|
+
cudaMemcpy (dev_data, t2.Data(), sizeof(T)*sizedata, cudaMemcpyHostToDevice);
|
|
404
|
+
}
|
|
405
|
+
|
|
406
|
+
~DevDataTable ()
|
|
407
|
+
{
|
|
408
|
+
Dev<T>::Free (dev_data);
|
|
409
|
+
delete [] index;
|
|
410
|
+
}
|
|
411
|
+
|
|
412
|
+
void D2H (FlatTable<T> & t2) const
|
|
413
|
+
{
|
|
414
|
+
int sizedata = t2.AsArray().Size();
|
|
415
|
+
cudaMemcpy (&t2[0][0], dev_data, sizeof(T)*sizedata, cudaMemcpyDeviceToHost);
|
|
416
|
+
}
|
|
417
|
+
|
|
418
|
+
operator FlatTable<Dev<T>> () const
|
|
419
|
+
{
|
|
420
|
+
return FlatTable<Dev<T>> (size, index, dev_data);
|
|
421
|
+
}
|
|
422
|
+
|
|
423
|
+
auto Index() const { return index; }
|
|
424
|
+
auto DevData() const { return dev_data; }
|
|
425
|
+
|
|
426
|
+
FlatArray<Dev<T>> Row(int i) const { return { index[i+1]-index[i], dev_data+index[i] }; }
|
|
427
|
+
|
|
428
|
+
class Iterator
|
|
429
|
+
{
|
|
430
|
+
const DevDataTable & tab;
|
|
431
|
+
size_t row;
|
|
432
|
+
public:
|
|
433
|
+
Iterator (const DevDataTable & _tab, size_t _row) : tab(_tab), row(_row) { ; }
|
|
434
|
+
Iterator & operator++ () { ++row; return *this; }
|
|
435
|
+
auto operator* () const { return tab.Row(row); }
|
|
436
|
+
bool operator!= (const Iterator & it2) { return row != it2.row; }
|
|
437
|
+
};
|
|
438
|
+
|
|
439
|
+
Iterator begin() const { return Iterator(*this, 0); }
|
|
440
|
+
Iterator end() const { return Iterator(*this, size); }
|
|
441
|
+
};
|
|
442
|
+
|
|
443
|
+
|
|
444
|
+
template <typename T>
|
|
445
|
+
class DevTable
|
|
446
|
+
{
|
|
447
|
+
int size;
|
|
448
|
+
Dev<size_t> * dev_index = nullptr;
|
|
449
|
+
Dev<T> * dev_data = nullptr;
|
|
450
|
+
|
|
451
|
+
public:
|
|
452
|
+
|
|
453
|
+
DevTable (FlatTable<T> t2)
|
|
454
|
+
{
|
|
455
|
+
size = t2.Size();
|
|
456
|
+
if (size == 0) return;
|
|
457
|
+
|
|
458
|
+
cudaMalloc((size_t**)&dev_index, (size+1)*sizeof(size_t));
|
|
459
|
+
cudaMemcpy (dev_index, &t2.IndexArray()[0], sizeof(size_t)*(size+1), cudaMemcpyHostToDevice);
|
|
460
|
+
// cout << "res = " << cudaMemcpy (dev_index, t2.Index(), sizeof(int)*(size+1), cudaMemcpyHostToDevice) << endl;
|
|
461
|
+
|
|
462
|
+
int sizedata = t2.AsArray().Size();
|
|
463
|
+
cudaMalloc((int**)&dev_data, sizedata*sizeof(T));
|
|
464
|
+
cudaMemcpy (dev_data, t2.Data(), sizeof(T)*sizedata, cudaMemcpyHostToDevice);
|
|
465
|
+
}
|
|
466
|
+
|
|
467
|
+
~DevTable ()
|
|
468
|
+
{
|
|
469
|
+
cudaFree (dev_data);
|
|
470
|
+
cudaFree (dev_index);
|
|
471
|
+
}
|
|
472
|
+
|
|
473
|
+
void D2H (FlatTable<T> & t2) const
|
|
474
|
+
{
|
|
475
|
+
int sizedata = t2.AsArray().Size();
|
|
476
|
+
cudaMemcpy (&t2[0][0], dev_data, sizeof(T)*sizedata, cudaMemcpyDeviceToHost);
|
|
477
|
+
}
|
|
478
|
+
|
|
479
|
+
operator FlatTable<T> () const
|
|
480
|
+
{
|
|
481
|
+
return FlatTable<T> (size, (size_t*)dev_index, (T*)dev_data);
|
|
482
|
+
}
|
|
483
|
+
|
|
484
|
+
size_t * DevIndex() const { return (size_t*)dev_index; }
|
|
485
|
+
T * DevData() const { return (T*)dev_data; }
|
|
486
|
+
|
|
487
|
+
FlatArray<Dev<T>> AsArray() const
|
|
488
|
+
{
|
|
489
|
+
return FlatArray<Dev<T>> ( dev_index[size].D2H(), dev_data );
|
|
490
|
+
}
|
|
491
|
+
};
|
|
492
|
+
|
|
493
|
+
|
|
494
|
+
|
|
495
|
+
|
|
496
|
+
|
|
497
|
+
|
|
498
|
+
class DevBitArray
|
|
499
|
+
{
|
|
500
|
+
protected:
|
|
501
|
+
size_t size = 0;
|
|
502
|
+
unsigned char * dev_data = nullptr;
|
|
503
|
+
|
|
504
|
+
public:
|
|
505
|
+
DevBitArray (size_t asize);
|
|
506
|
+
DevBitArray (const ngcore::BitArray & ba);
|
|
507
|
+
|
|
508
|
+
~DevBitArray ();
|
|
509
|
+
|
|
510
|
+
DevBitArray & operator= (const ngcore::BitArray &ba);
|
|
511
|
+
|
|
512
|
+
size_t Size () const { return size; }
|
|
513
|
+
auto Data () const { return dev_data; }
|
|
514
|
+
|
|
515
|
+
void SetSize (size_t asize);
|
|
516
|
+
|
|
517
|
+
private:
|
|
518
|
+
size_t Addr (size_t i) const
|
|
519
|
+
{
|
|
520
|
+
return (i / CHAR_BIT);
|
|
521
|
+
}
|
|
522
|
+
};
|
|
523
|
+
|
|
524
|
+
}
|
|
525
|
+
|
|
526
|
+
|
|
527
|
+
#endif
|