PyPI - warp-lang - Versions diffs - 1.1.0__py3-none-manylinux2014_x86_64.whl → 1.2.1__py3-none-manylinux2014_x86_64.whl - Mend

warp-lang 1.1.0__py3-none-manylinux2014_x86_64.whl → 1.2.1__py3-none-manylinux2014_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of warp-lang might be problematic. Click here for more details.

Files changed (218)

warp/bin/warp-clang.so +0 -0
warp/bin/warp.so +0 -0
warp/build.py +10 -37
warp/build_dll.py +2 -2
warp/builtins.py +274 -6
warp/codegen.py +51 -4
warp/config.py +2 -2
warp/constants.py +4 -0
warp/context.py +422 -203
warp/examples/benchmarks/benchmark_api.py +0 -2
warp/examples/benchmarks/benchmark_cloth_warp.py +0 -1
warp/examples/benchmarks/benchmark_launches.py +0 -2
warp/examples/core/example_dem.py +0 -2
warp/examples/core/example_fluid.py +0 -2
warp/examples/core/example_graph_capture.py +0 -2
warp/examples/core/example_marching_cubes.py +0 -2
warp/examples/core/example_mesh.py +0 -2
warp/examples/core/example_mesh_intersect.py +0 -2
warp/examples/core/example_nvdb.py +0 -2
warp/examples/core/example_raycast.py +0 -2
warp/examples/core/example_raymarch.py +0 -2
warp/examples/core/example_render_opengl.py +0 -2
warp/examples/core/example_sph.py +0 -2
warp/examples/core/example_torch.py +0 -3
warp/examples/core/example_wave.py +0 -2
warp/examples/fem/example_apic_fluid.py +140 -115
warp/examples/fem/example_burgers.py +262 -0
warp/examples/fem/example_convection_diffusion.py +0 -2
warp/examples/fem/example_convection_diffusion_dg.py +0 -2
warp/examples/fem/example_deformed_geometry.py +0 -2
warp/examples/fem/example_diffusion.py +0 -2
warp/examples/fem/example_diffusion_3d.py +5 -4
warp/examples/fem/example_diffusion_mgpu.py +0 -2
warp/examples/fem/example_mixed_elasticity.py +0 -2
warp/examples/fem/example_navier_stokes.py +0 -2
warp/examples/fem/example_stokes.py +0 -2
warp/examples/fem/example_stokes_transfer.py +0 -2
warp/examples/optim/example_bounce.py +0 -2
warp/examples/optim/example_cloth_throw.py +0 -2
warp/examples/optim/example_diffray.py +0 -2
warp/examples/optim/example_drone.py +0 -2
warp/examples/optim/example_inverse_kinematics.py +0 -2
warp/examples/optim/example_inverse_kinematics_torch.py +0 -2
warp/examples/optim/example_spring_cage.py +0 -2
warp/examples/optim/example_trajectory.py +0 -2
warp/examples/optim/example_walker.py +0 -2
warp/examples/sim/example_cartpole.py +0 -2
warp/examples/sim/example_cloth.py +0 -2
warp/examples/sim/example_granular.py +0 -2
warp/examples/sim/example_granular_collision_sdf.py +0 -2
warp/examples/sim/example_jacobian_ik.py +0 -2
warp/examples/sim/example_particle_chain.py +0 -2
warp/examples/sim/example_quadruped.py +0 -2
warp/examples/sim/example_rigid_chain.py +0 -2
warp/examples/sim/example_rigid_contact.py +0 -2
warp/examples/sim/example_rigid_force.py +0 -2
warp/examples/sim/example_rigid_gyroscopic.py +0 -2
warp/examples/sim/example_rigid_soft_contact.py +0 -2
warp/examples/sim/example_soft_body.py +0 -2
warp/fem/__init__.py +1 -0
warp/fem/cache.py +3 -1
warp/fem/geometry/__init__.py +1 -0
warp/fem/geometry/element.py +4 -0
warp/fem/geometry/grid_3d.py +0 -4
warp/fem/geometry/nanogrid.py +455 -0
warp/fem/integrate.py +63 -9
warp/fem/space/__init__.py +43 -158
warp/fem/space/basis_space.py +34 -0
warp/fem/space/collocated_function_space.py +1 -1
warp/fem/space/grid_2d_function_space.py +13 -132
warp/fem/space/grid_3d_function_space.py +16 -154
warp/fem/space/hexmesh_function_space.py +37 -134
warp/fem/space/nanogrid_function_space.py +202 -0
warp/fem/space/quadmesh_2d_function_space.py +12 -119
warp/fem/space/restriction.py +4 -1
warp/fem/space/shape/__init__.py +77 -0
warp/fem/space/shape/cube_shape_function.py +5 -15
warp/fem/space/tetmesh_function_space.py +6 -76
warp/fem/space/trimesh_2d_function_space.py +6 -76
warp/native/array.h +12 -3
warp/native/builtin.h +48 -5
warp/native/bvh.cpp +14 -10
warp/native/bvh.cu +23 -15
warp/native/bvh.h +1 -0
warp/native/clang/clang.cpp +2 -1
warp/native/crt.cpp +11 -1
warp/native/crt.h +18 -1
warp/native/exports.h +187 -0
warp/native/mat.h +47 -0
warp/native/mesh.cpp +1 -1
warp/native/mesh.cu +1 -2
warp/native/nanovdb/GridHandle.h +366 -0
warp/native/nanovdb/HostBuffer.h +590 -0
warp/native/nanovdb/NanoVDB.h +3999 -2157
warp/native/nanovdb/PNanoVDB.h +936 -99
warp/native/quat.h +28 -1
warp/native/rand.h +5 -1
warp/native/vec.h +45 -1
warp/native/volume.cpp +335 -103
warp/native/volume.cu +39 -13
warp/native/volume.h +725 -303
warp/native/volume_builder.cu +381 -360
warp/native/volume_builder.h +16 -1
warp/native/volume_impl.h +61 -0
warp/native/warp.cu +8 -2
warp/native/warp.h +15 -7
warp/render/render_opengl.py +191 -52
warp/sim/integrator_featherstone.py +10 -3
warp/sim/integrator_xpbd.py +16 -22
warp/sparse.py +89 -27
warp/stubs.py +83 -0
warp/tests/assets/test_index_grid.nvdb +0 -0
warp/tests/aux_test_dependent.py +0 -2
warp/tests/aux_test_grad_customs.py +0 -2
warp/tests/aux_test_reference.py +0 -2
warp/tests/aux_test_reference_reference.py +0 -2
warp/tests/aux_test_square.py +0 -2
warp/tests/disabled_kinematics.py +0 -2
warp/tests/test_adam.py +0 -2
warp/tests/test_arithmetic.py +0 -36
warp/tests/test_array.py +9 -11
warp/tests/test_array_reduce.py +0 -2
warp/tests/test_async.py +0 -2
warp/tests/test_atomic.py +0 -2
warp/tests/test_bool.py +58 -50
warp/tests/test_builtins_resolution.py +0 -2
warp/tests/test_bvh.py +0 -2
warp/tests/test_closest_point_edge_edge.py +0 -1
warp/tests/test_codegen.py +0 -4
warp/tests/test_compile_consts.py +130 -10
warp/tests/test_conditional.py +0 -2
warp/tests/test_copy.py +0 -2
warp/tests/test_ctypes.py +6 -8
warp/tests/test_dense.py +0 -2
warp/tests/test_devices.py +0 -2
warp/tests/test_dlpack.py +9 -11
warp/tests/test_examples.py +42 -39
warp/tests/test_fabricarray.py +0 -3
warp/tests/test_fast_math.py +0 -2
warp/tests/test_fem.py +75 -54
warp/tests/test_fp16.py +0 -2
warp/tests/test_func.py +0 -2
warp/tests/test_generics.py +27 -2
warp/tests/test_grad.py +147 -8
warp/tests/test_grad_customs.py +0 -2
warp/tests/test_hash_grid.py +1 -3
warp/tests/test_import.py +0 -2
warp/tests/test_indexedarray.py +0 -2
warp/tests/test_intersect.py +0 -2
warp/tests/test_jax.py +0 -2
warp/tests/test_large.py +11 -9
warp/tests/test_launch.py +0 -2
warp/tests/test_lerp.py +10 -54
warp/tests/test_linear_solvers.py +3 -5
warp/tests/test_lvalue.py +0 -2
warp/tests/test_marching_cubes.py +0 -2
warp/tests/test_mat.py +0 -2
warp/tests/test_mat_lite.py +0 -2
warp/tests/test_mat_scalar_ops.py +0 -2
warp/tests/test_math.py +0 -2
warp/tests/test_matmul.py +35 -37
warp/tests/test_matmul_lite.py +29 -31
warp/tests/test_mempool.py +0 -2
warp/tests/test_mesh.py +0 -3
warp/tests/test_mesh_query_aabb.py +0 -2
warp/tests/test_mesh_query_point.py +0 -2
warp/tests/test_mesh_query_ray.py +0 -2
warp/tests/test_mlp.py +0 -2
warp/tests/test_model.py +0 -2
warp/tests/test_module_hashing.py +111 -0
warp/tests/test_modules_lite.py +0 -3
warp/tests/test_multigpu.py +0 -2
warp/tests/test_noise.py +0 -4
warp/tests/test_operators.py +0 -2
warp/tests/test_options.py +0 -2
warp/tests/test_peer.py +0 -2
warp/tests/test_pinned.py +0 -2
warp/tests/test_print.py +0 -2
warp/tests/test_quat.py +0 -2
warp/tests/test_rand.py +41 -5
warp/tests/test_reload.py +0 -10
warp/tests/test_rounding.py +0 -2
warp/tests/test_runlength_encode.py +0 -2
warp/tests/test_sim_grad.py +0 -2
warp/tests/test_sim_kinematics.py +0 -2
warp/tests/test_smoothstep.py +0 -2
warp/tests/test_snippet.py +0 -2
warp/tests/test_sparse.py +0 -2
warp/tests/test_spatial.py +0 -2
warp/tests/test_special_values.py +362 -0
warp/tests/test_streams.py +0 -2
warp/tests/test_struct.py +0 -2
warp/tests/test_tape.py +0 -2
warp/tests/test_torch.py +0 -2
warp/tests/test_transient_module.py +0 -2
warp/tests/test_types.py +0 -2
warp/tests/test_utils.py +0 -2
warp/tests/test_vec.py +0 -2
warp/tests/test_vec_lite.py +0 -2
warp/tests/test_vec_scalar_ops.py +0 -2
warp/tests/test_verify_fp.py +0 -2
warp/tests/test_volume.py +237 -13
warp/tests/test_volume_write.py +86 -3
warp/tests/unittest_serial.py +10 -9
warp/tests/unittest_suites.py +6 -2
warp/tests/unittest_utils.py +2 -171
warp/tests/unused_test_misc.py +0 -2
warp/tests/walkthrough_debug.py +1 -1
warp/thirdparty/unittest_parallel.py +37 -40
warp/types.py +526 -85
{warp_lang-1.1.0.dist-info → warp_lang-1.2.1.dist-info}/METADATA +61 -31
warp_lang-1.2.1.dist-info/RECORD +359 -0
warp/examples/fem/example_convection_diffusion_dg0.py +0 -204
warp/native/nanovdb/PNanoVDBWrite.h +0 -295
warp_lang-1.1.0.dist-info/RECORD +0 -352
{warp_lang-1.1.0.dist-info → warp_lang-1.2.1.dist-info}/LICENSE.md +0 -0
{warp_lang-1.1.0.dist-info → warp_lang-1.2.1.dist-info}/WHEEL +0 -0
{warp_lang-1.1.0.dist-info → warp_lang-1.2.1.dist-info}/top_level.txt +0 -0

warp/fem/space/shape/__init__.py CHANGED Viewed

@@ -1,3 +1,9 @@
+from enum import Enum
+from typing import Optional
+from warp.fem.geometry import element as _element
+from warp.fem.polynomial import Polynomial
 from .cube_shape_function import (
     CubeNonConformingPolynomialShapeFunctions,
     CubeSerendipityShapeFunctions,
@@ -11,3 +17,74 @@ from .square_shape_function import (
 )
 from .tet_shape_function import TetrahedronNonConformingPolynomialShapeFunctions, TetrahedronPolynomialShapeFunctions
 from .triangle_shape_function import Triangle2DNonConformingPolynomialShapeFunctions, Triangle2DPolynomialShapeFunctions
+class ElementBasis(Enum):
+    """Choice of basis function to equip individual elements"""
+    LAGRANGE = 0
+    """Lagrange basis functions :math:`P_k` for simplices, tensor products :math:`Q_k` for squares and cubes"""
+    SERENDIPITY = 1
+    """Serendipity elements :math:`S_k`, corresponding to Lagrange nodes with interior points removed (for degree <= 3)"""
+    NONCONFORMING_POLYNOMIAL = 2
+    """Simplex Lagrange basis functions :math:`P_{kd}` embedded into non conforming reference elements (e.g. squares or cubes). Discontinuous only."""
+def get_shape_function(
+    element: _element.Element,
+    space_dimension: int,
+    degree: int,
+    element_basis: ElementBasis,
+    family: Optional[Polynomial] = None,
+):
+    """
+    Equips a reference element with a shape function basis.
+    Args:
+        element: the reference element on which to build the shape function
+        space_dimension: the dimension of the embedding space
+        degree: polynomial degree of the per-element shape functions
+        element_basis: type of basis function for the individual elements
+        family: Polynomial family used to generate the shape function basis. If not provided, a reasonable basis is chosen.
+    Returns:
+        the corresponding shape function
+    """
+    if degree == 0:
+        return ConstantShapeFunction(element, space_dimension)
+    if family is None:
+        family = Polynomial.LOBATTO_GAUSS_LEGENDRE
+    if isinstance(element, _element.Square):
+        if element_basis == ElementBasis.NONCONFORMING_POLYNOMIAL:
+            return SquareNonConformingPolynomialShapeFunctions(degree=degree)
+        if element_basis == ElementBasis.SERENDIPITY and degree > 1:
+            return SquareSerendipityShapeFunctions(degree=degree, family=family)
+        return SquareBipolynomialShapeFunctions(degree=degree, family=family)
+    if isinstance(element, _element.Triangle):
+        if element_basis == ElementBasis.NONCONFORMING_POLYNOMIAL:
+            return Triangle2DNonConformingPolynomialShapeFunctions(degree=degree)
+        if element_basis == ElementBasis.SERENDIPITY and degree > 2:
+            raise NotImplementedError("Serendipity variant not implemented yet for Triangle elements")
+        return Triangle2DPolynomialShapeFunctions(degree=degree)
+    if isinstance(element, _element.Cube):
+        if element_basis == ElementBasis.NONCONFORMING_POLYNOMIAL:
+            return CubeNonConformingPolynomialShapeFunctions(degree=degree)
+        if element_basis == ElementBasis.SERENDIPITY and degree > 1:
+            return CubeSerendipityShapeFunctions(degree=degree, family=family)
+        return CubeTripolynomialShapeFunctions(degree=degree, family=family)
+    if isinstance(element, _element.Tetrahedron):
+        if element_basis == ElementBasis.NONCONFORMING_POLYNOMIAL:
+            return TetrahedronNonConformingPolynomialShapeFunctions(degree=degree)
+        if element_basis == ElementBasis.SERENDIPITY and degree > 2:
+            raise NotImplementedError("Serendipity variant not implemented yet for Tet elements")
+        return TetrahedronPolynomialShapeFunctions(degree=degree)
+    return NotImplementedError("Unrecognized element type")

warp/fem/space/shape/cube_shape_function.py CHANGED Viewed

@@ -10,16 +10,6 @@ from warp.fem.types import Coords
 from .tet_shape_function import TetrahedronPolynomialShapeFunctions
-_CUBE_EDGE_INDICES = wp.constant(
-    wp.mat(shape=(3, 4), dtype=int)(
-        [
-            [0, 4, 2, 6],
-            [3, 1, 7, 5],
-            [8, 11, 9, 10],
-        ]
-    )
-)
 class CubeTripolynomialShapeFunctions:
     VERTEX = 0
@@ -96,13 +86,13 @@ class CubeTripolynomialShapeFunctions:
                         return CubeTripolynomialShapeFunctions.VERTEX, type_instance, 0
                     # z edge
-                    type_instance = _CUBE_EDGE_INDICES[2, mi * 2 + mj]
+                    type_instance = 8 + mi * 2 + mj
                     type_index = k - 1
                     return CubeTripolynomialShapeFunctions.EDGE, type_instance, type_index
                 if zk + mk == 1:
                     # y edge
-                    type_instance = _CUBE_EDGE_INDICES[1, mk * 2 + mi]
+                    type_instance = 4 + mk * 2 + mi
                     type_index = j - 1
                     return CubeTripolynomialShapeFunctions.EDGE, type_instance, type_index
@@ -114,7 +104,7 @@ class CubeTripolynomialShapeFunctions:
             if zj + mj == 1:
                 if zk + mk == 1:
                     # x edge
-                    type_instance = _CUBE_EDGE_INDICES[0, mj * 2 + mk]
+                    type_instance = mj * 2 + mk
                     type_index = i - 1
                     return CubeTripolynomialShapeFunctions.EDGE, type_instance, type_index
@@ -399,7 +389,7 @@ class CubeSerendipityShapeFunctions:
     def _edge_coords(type_index: int):
         index_in_side = type_index // 4
         side_offset = type_index - 4 * index_in_side
-        return (wp.vec3i(index_in_side + 1, side_offset // 2, side_offset % 2),)
+        return wp.vec3i(index_in_side + 1, side_offset // 2, side_offset & 1)
     @wp.func
     def _edge_axis(node_type: int):
@@ -410,7 +400,7 @@ class CubeSerendipityShapeFunctions:
         index_in_side = type_index // 4
         side_offset = type_index - 4 * index_in_side
-        return _CUBE_EDGE_INDICES[node_type - CubeSerendipityShapeFunctions.EDGE_X, side_offset], index_in_side
+        return 4 * (node_type - CubeSerendipityShapeFunctions.EDGE_X) + side_offset, index_in_side
     def _get_node_lobatto_indices(self):
         ORDER = self.ORDER

warp/fem/space/tetmesh_function_space.py CHANGED Viewed

@@ -1,16 +1,13 @@
 import warp as wp
 from warp.fem import cache
 from warp.fem.geometry import Tetmesh
-from warp.fem.types import Coords, ElementIndex
+from warp.fem.types import ElementIndex
-from .basis_space import ShapeBasisSpace, TraceBasisSpace
 from .shape import (
-    ConstantShapeFunction,
     ShapeFunction,
-    TetrahedronNonConformingPolynomialShapeFunctions,
     TetrahedronPolynomialShapeFunctions,
 )
-from .topology import DiscontinuousSpaceTopologyMixin, SpaceTopology, forward_base_topology
+from .topology import SpaceTopology, forward_base_topology
 @wp.struct
@@ -130,44 +127,6 @@ class TetmeshSpaceTopology(SpaceTopology):
             tet_face_indices[t1, t1_face] = e
-class TetmeshDiscontinuousSpaceTopology(
-    DiscontinuousSpaceTopologyMixin,
-    SpaceTopology,
-):
-    def __init__(self, mesh: Tetmesh, shape: ShapeFunction):
-        super().__init__(mesh, shape.NODES_PER_ELEMENT)
-class TetmeshBasisSpace(ShapeBasisSpace):
-    def __init__(self, topology: TetmeshSpaceTopology, shape: ShapeFunction):
-        super().__init__(topology, shape)
-        self._mesh: Tetmesh = topology.geometry
-class TetmeshPiecewiseConstantBasis(TetmeshBasisSpace):
-    def __init__(self, mesh: Tetmesh):
-        shape = ConstantShapeFunction(mesh.reference_cell(), space_dimension=3)
-        topology = TetmeshDiscontinuousSpaceTopology(mesh, shape)
-        super().__init__(shape=shape, topology=topology)
-    class Trace(TraceBasisSpace):
-        @wp.func
-        def _node_coords_in_element(
-            side_arg: Tetmesh.SideArg,
-            basis_arg: TetmeshBasisSpace.BasisArg,
-            element_index: ElementIndex,
-            node_index_in_element: int,
-        ):
-            return Coords(1.0 / 3.0, 1.0 / 3.0, 1.0 / 3.0)
-        def make_node_coords_in_element(self):
-            return self._node_coords_in_element
-    def trace(self):
-        return TetmeshPiecewiseConstantBasis.Trace(self)
 class TetmeshPolynomialSpaceTopology(TetmeshSpaceTopology):
     def __init__(self, mesh: Tetmesh, shape: TetrahedronPolynomialShapeFunctions):
         super().__init__(mesh, shape, need_tet_edge_indices=shape.ORDER >= 2, need_tet_face_indices=shape.ORDER >= 3)
@@ -258,37 +217,8 @@ class TetmeshPolynomialSpaceTopology(TetmeshSpaceTopology):
         return element_node_index
-class TetmeshPolynomialBasisSpace(TetmeshBasisSpace):
-    def __init__(
-        self,
-        mesh: Tetmesh,
-        degree: int,
-    ):
-        shape = TetrahedronPolynomialShapeFunctions(degree)
-        topology = forward_base_topology(TetmeshPolynomialSpaceTopology, mesh, shape)
-        super().__init__(topology, shape)
-class TetmeshDGPolynomialBasisSpace(TetmeshBasisSpace):
-    def __init__(
-        self,
-        mesh: Tetmesh,
-        degree: int,
-    ):
-        shape = TetrahedronPolynomialShapeFunctions(degree)
-        topology = TetmeshDiscontinuousSpaceTopology(mesh, shape)
-        super().__init__(topology, shape)
-class TetmeshNonConformingPolynomialBasisSpace(TetmeshBasisSpace):
-    def __init__(
-        self,
-        mesh: Tetmesh,
-        degree: int,
-    ):
-        shape = TetrahedronNonConformingPolynomialShapeFunctions(degree)
-        topology = TetmeshDiscontinuousSpaceTopology(mesh, shape)
+def make_tetmesh_space_topology(mesh: Tetmesh, shape: ShapeFunction):
+    if isinstance(shape, TetrahedronPolynomialShapeFunctions):
+        return forward_base_topology(TetmeshPolynomialSpaceTopology, mesh, shape)
-        super().__init__(topology, shape)
+    raise ValueError(f"Unsupported shape function {shape.name}")

warp/fem/space/trimesh_2d_function_space.py CHANGED Viewed

@@ -1,16 +1,13 @@
 import warp as wp
 from warp.fem import cache
 from warp.fem.geometry import Trimesh2D
-from warp.fem.types import Coords, ElementIndex
+from warp.fem.types import ElementIndex
-from .basis_space import ShapeBasisSpace, TraceBasisSpace
 from .shape import (
-    ConstantShapeFunction,
     ShapeFunction,
-    Triangle2DNonConformingPolynomialShapeFunctions,
     Triangle2DPolynomialShapeFunctions,
 )
-from .topology import DiscontinuousSpaceTopologyMixin, SpaceTopology, forward_base_topology
+from .topology import SpaceTopology, forward_base_topology
 @wp.struct
@@ -95,44 +92,6 @@ class Trimesh2DSpaceTopology(SpaceTopology):
             tri_edge_indices[t1, t1_edge] = e
-class Trimesh2DDiscontinuousSpaceTopology(
-    DiscontinuousSpaceTopologyMixin,
-    SpaceTopology,
-):
-    def __init__(self, mesh: Trimesh2D, shape: ShapeFunction):
-        super().__init__(mesh, shape.NODES_PER_ELEMENT)
-class Trimesh2DBasisSpace(ShapeBasisSpace):
-    def __init__(self, topology: Trimesh2DSpaceTopology, shape: ShapeFunction):
-        super().__init__(topology, shape)
-        self._mesh: Trimesh2D = topology.geometry
-class Trimesh2DPiecewiseConstantBasis(Trimesh2DBasisSpace):
-    def __init__(self, mesh: Trimesh2D):
-        shape = ConstantShapeFunction(mesh.reference_cell(), space_dimension=2)
-        topology = Trimesh2DDiscontinuousSpaceTopology(mesh, shape)
-        super().__init__(shape=shape, topology=topology)
-    class Trace(TraceBasisSpace):
-        @wp.func
-        def _node_coords_in_element(
-            side_arg: Trimesh2D.SideArg,
-            basis_arg: Trimesh2DBasisSpace.BasisArg,
-            element_index: ElementIndex,
-            node_index_in_element: int,
-        ):
-            return Coords(0.5, 0.0, 0.0)
-        def make_node_coords_in_element(self):
-            return self._node_coords_in_element
-    def trace(self):
-        return Trimesh2DPiecewiseConstantBasis.Trace(self)
 class Trimesh2DPolynomialSpaceTopology(Trimesh2DSpaceTopology):
     def __init__(self, mesh: Trimesh2D, shape: Triangle2DPolynomialShapeFunctions):
         super().__init__(mesh, shape)
@@ -187,37 +146,8 @@ class Trimesh2DPolynomialSpaceTopology(Trimesh2DSpaceTopology):
         return element_node_index
-class Trimesh2DPolynomialBasisSpace(Trimesh2DBasisSpace):
-    def __init__(
-        self,
-        mesh: Trimesh2D,
-        degree: int,
-    ):
-        shape = Triangle2DPolynomialShapeFunctions(degree)
-        topology = forward_base_topology(Trimesh2DPolynomialSpaceTopology, mesh, shape)
-        super().__init__(topology, shape)
-class Trimesh2DDGPolynomialBasisSpace(Trimesh2DBasisSpace):
-    def __init__(
-        self,
-        mesh: Trimesh2D,
-        degree: int,
-    ):
-        shape = Triangle2DPolynomialShapeFunctions(degree)
-        topology = Trimesh2DDiscontinuousSpaceTopology(mesh, shape)
-        super().__init__(topology, shape)
-class Trimesh2DNonConformingPolynomialBasisSpace(Trimesh2DBasisSpace):
-    def __init__(
-        self,
-        mesh: Trimesh2D,
-        degree: int,
-    ):
-        shape = Triangle2DNonConformingPolynomialShapeFunctions(degree)
-        topology = Trimesh2DDiscontinuousSpaceTopology(mesh, shape)
+def make_trimesh_2d_space_topology(mesh: Trimesh2D, shape: ShapeFunction):
+    if isinstance(shape, Triangle2DPolynomialShapeFunctions):
+        return forward_base_topology(Trimesh2DPolynomialSpaceTopology, mesh, shape)
-        super().__init__(topology, shape)
+    raise ValueError(f"Unsupported shape function {shape.name}")

warp/native/array.h CHANGED Viewed

@@ -489,7 +489,10 @@ CUDA_CALLABLE inline array_t<T> view(array_t<T>& src, int i)
     assert(i >= 0 && i < src.shape[0]);
     array_t<T> a;
-    a.data = data_at_byte_offset(src, byte_offset(src, i));
+    size_t offset = byte_offset(src, i);
+    a.data = data_at_byte_offset(src, offset);
+    if (src.grad)
+        a.grad = grad_at_byte_offset(src, offset);
     a.shape[0] = src.shape[1];
     a.shape[1] = src.shape[2];
     a.shape[2] = src.shape[3];
@@ -509,7 +512,10 @@ CUDA_CALLABLE inline array_t<T> view(array_t<T>& src, int i, int j)
     assert(j >= 0 && j < src.shape[1]);
     array_t<T> a;
-    a.data = data_at_byte_offset(src, byte_offset(src, i, j));
+    size_t offset = byte_offset(src, i, j);
+    a.data = data_at_byte_offset(src, offset);
+    if (src.grad)
+        a.grad = grad_at_byte_offset(src, offset);
     a.shape[0] = src.shape[2];
     a.shape[1] = src.shape[3];
     a.strides[0] = src.strides[2];
@@ -528,7 +534,10 @@ CUDA_CALLABLE inline array_t<T> view(array_t<T>& src, int i, int j, int k)
     assert(k >= 0 && k < src.shape[2]);
     array_t<T> a;
-    a.data = data_at_byte_offset(src, byte_offset(src, i, j, k));
+    size_t offset = byte_offset(src, i, j, k);
+    a.data = data_at_byte_offset(src, offset);
+    if (src.grad)
+        a.grad = grad_at_byte_offset(src, offset);
     a.shape[0] = src.shape[3];
     a.strides[0] = src.strides[3];
     a.ndim = src.ndim-3;

warp/native/builtin.h CHANGED Viewed

@@ -84,8 +84,17 @@ struct half
     unsigned short u;
-    CUDA_CALLABLE inline bool operator==(const half& h) const { return u == h.u; }
-    CUDA_CALLABLE inline bool operator!=(const half& h) const { return u != h.u; }
+    CUDA_CALLABLE inline bool operator==(const half& h) const
+    {
+        // Use float32 to get IEEE 754 behavior in case of a NaN
+        return float32(h) == float32(*this);
+    }
+    CUDA_CALLABLE inline bool operator!=(const half& h) const
+    {
+        // Use float32 to get IEEE 754 behavior in case of a NaN
+        return float32(h) != float32(*this);
+    }
     CUDA_CALLABLE inline bool operator>(const half& h) const { return half_to_float(*this) > half_to_float(h); }
     CUDA_CALLABLE inline bool operator>=(const half& h) const { return half_to_float(*this) >= half_to_float(h); }
     CUDA_CALLABLE inline bool operator<(const half& h) const { return half_to_float(*this) < half_to_float(h); }
@@ -293,7 +302,9 @@ inline CUDA_CALLABLE T bit_xor(T a, T b) { return a^b; } \
 inline CUDA_CALLABLE T lshift(T a, T b) { return a<<b; } \
 inline CUDA_CALLABLE T rshift(T a, T b) { return a>>b; } \
 inline CUDA_CALLABLE T invert(T x) { return ~x; } \
-inline CUDA_CALLABLE bool isfinite(T x) { return true; } \
+inline CUDA_CALLABLE bool isfinite(T x) { return ::isfinite(double(x)); } \
+inline CUDA_CALLABLE bool isnan(T x) { return ::isnan(double(x)); } \
+inline CUDA_CALLABLE bool isinf(T x) { return ::isinf(double(x)); } \
 inline CUDA_CALLABLE void adj_mul(T a, T b, T& adj_a, T& adj_b, T adj_ret) { } \
 inline CUDA_CALLABLE void adj_div(T a, T b, T ret, T& adj_a, T& adj_b, T adj_ret) { } \
 inline CUDA_CALLABLE void adj_add(T a, T b, T& adj_a, T& adj_b, T adj_ret) { } \
@@ -313,7 +324,10 @@ inline CUDA_CALLABLE void adj_bit_or(T a, T b, T& adj_a, T& adj_b, T adj_ret) {
 inline CUDA_CALLABLE void adj_bit_xor(T a, T b, T& adj_a, T& adj_b, T adj_ret) { } \
 inline CUDA_CALLABLE void adj_lshift(T a, T b, T& adj_a, T& adj_b, T adj_ret) { } \
 inline CUDA_CALLABLE void adj_rshift(T a, T b, T& adj_a, T& adj_b, T adj_ret) { } \
-inline CUDA_CALLABLE void adj_invert(T x, T adj_x, T& adj_ret) { }
+inline CUDA_CALLABLE void adj_invert(T x, T adj_x, T& adj_ret) { } \
+inline CUDA_CALLABLE void adj_isnan(const T&, T&, bool) { } \
+inline CUDA_CALLABLE void adj_isinf(const T&, T&, bool) { } \
+inline CUDA_CALLABLE void adj_isfinite(const T&, T&, bool) { }
 inline CUDA_CALLABLE int8 abs(int8 x) { return ::abs(x); }
 inline CUDA_CALLABLE int16 abs(int16 x) { return ::abs(x); }
@@ -354,7 +368,7 @@ inline CUDA_CALLABLE uint32 sign(uint32 x) { return 1; }
 inline CUDA_CALLABLE uint64 sign(uint64 x) { return 1; }
-// Catch-all for non-float types
+// Catch-all for non-float, non-integer types
 template<typename T>
 inline bool CUDA_CALLABLE isfinite(const T&)
 {
@@ -374,6 +388,32 @@ inline bool CUDA_CALLABLE isfinite(double x)
     return ::isfinite(x);
 }
+inline bool CUDA_CALLABLE isnan(half x)
+{
+    return ::isnan(float(x));
+}
+inline bool CUDA_CALLABLE isnan(float x)
+{
+    return ::isnan(x);
+}
+inline bool CUDA_CALLABLE isnan(double x)
+{
+    return ::isnan(x);
+}
+inline bool CUDA_CALLABLE isinf(half x)
+{
+    return ::isinf(float(x));
+}
+inline bool CUDA_CALLABLE isinf(float x)
+{
+    return ::isinf(x);
+}
+inline bool CUDA_CALLABLE isinf(double x)
+{
+    return ::isinf(x);
+}
 template<typename T>
 inline CUDA_CALLABLE void print(const T&)
 {
@@ -466,6 +506,9 @@ inline CUDA_CALLABLE void adj_div(T a, T b, T ret, T& adj_a, T& adj_b, T adj_ret
         assert(0);\
     })\
 }\
+inline CUDA_CALLABLE void adj_isnan(const T&, T&, bool) { }\
+inline CUDA_CALLABLE void adj_isinf(const T&, T&, bool) { }\
+inline CUDA_CALLABLE void adj_isfinite(const T&, T&, bool) { }
 DECLARE_FLOAT_OPS(float16)
 DECLARE_FLOAT_OPS(float32)

warp/native/bvh.cpp CHANGED Viewed

@@ -339,6 +339,19 @@ void bvh_rem_descriptor(uint64_t id)
 }
+// create in-place given existing descriptor
+void bvh_create_host(vec3* lowers, vec3* uppers, int num_items, BVH& bvh)
+{
+    memset(&bvh, 0, sizeof(BVH));
+    bvh.item_lowers = lowers;
+    bvh.item_uppers = uppers;
+    bvh.num_items = num_items;
+    MedianBVHBuilder builder;
+    builder.build(bvh, lowers, uppers, num_items);
+}
 void bvh_destroy_host(BVH& bvh)
 {
     delete[] bvh.node_lowers;
@@ -360,16 +373,7 @@ void bvh_destroy_host(BVH& bvh)
 uint64_t bvh_create_host(vec3* lowers, vec3* uppers, int num_items)
 {
     BVH* bvh = new BVH();
-    memset(bvh, 0, sizeof(BVH));
-    bvh->context = NULL;
-    bvh->item_lowers = lowers;
-    bvh->item_uppers = uppers;
-    bvh->num_items = num_items;
-    MedianBVHBuilder builder;
-    builder.build(*bvh, lowers, uppers, num_items);
+    wp::bvh_create_host(lowers, uppers, num_items, *bvh);
     return (uint64_t)bvh;
 }

warp/native/bvh.cu CHANGED Viewed

@@ -455,7 +455,28 @@ void LinearBVHBuilderGPU::build(BVH& bvh, const vec3* item_lowers, const vec3* i
 }
-void bvh_destroy_device(wp::BVH& bvh)
+// create in-place given existing descriptor
+void bvh_create_device(void* context, vec3* lowers, vec3* uppers, int num_items, BVH& bvh_host)
+{
+    ContextGuard guard(context);
+    bvh_host.num_items = num_items;
+    bvh_host.max_nodes = 2*num_items;
+    bvh_host.node_lowers = (BVHPackedNodeHalf*)alloc_device(WP_CURRENT_CONTEXT, sizeof(BVHPackedNodeHalf)*bvh_host.max_nodes);
+    bvh_host.node_uppers = (BVHPackedNodeHalf*)alloc_device(WP_CURRENT_CONTEXT, sizeof(BVHPackedNodeHalf)*bvh_host.max_nodes);
+    bvh_host.node_parents = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int)*bvh_host.max_nodes);
+    bvh_host.node_counts = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int)*bvh_host.max_nodes);
+    bvh_host.root = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int));
+    bvh_host.item_lowers = lowers;
+    bvh_host.item_uppers = uppers;
+    bvh_host.context = context ? context : cuda_context_get_current();
+    LinearBVHBuilderGPU builder;
+    builder.build(bvh_host, lowers, uppers, num_items, NULL);
+}
+void bvh_destroy_device(BVH& bvh)
 {
     ContextGuard guard(bvh.context);
@@ -485,20 +506,7 @@ uint64_t bvh_create_device(void* context, wp::vec3* lowers, wp::vec3* uppers, in
     ContextGuard guard(context);
     wp::BVH bvh_host;
-    bvh_host.num_items = num_items;
-    bvh_host.max_nodes = 2*num_items;
-    bvh_host.node_lowers = (wp::BVHPackedNodeHalf*)alloc_device(WP_CURRENT_CONTEXT, sizeof(wp::BVHPackedNodeHalf)*bvh_host.max_nodes);
-    bvh_host.node_uppers = (wp::BVHPackedNodeHalf*)alloc_device(WP_CURRENT_CONTEXT, sizeof(wp::BVHPackedNodeHalf)*bvh_host.max_nodes);
-    bvh_host.node_parents = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int)*bvh_host.max_nodes);
-    bvh_host.node_counts = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int)*bvh_host.max_nodes);
-    bvh_host.root = (int*)alloc_device(WP_CURRENT_CONTEXT, sizeof(int));
-    bvh_host.item_lowers = lowers;
-    bvh_host.item_uppers = uppers;
-    bvh_host.context = context ? context : cuda_context_get_current();
-    wp::LinearBVHBuilderGPU builder;
-    builder.build(bvh_host, lowers, uppers, num_items, NULL);
+    bvh_create_device(WP_CURRENT_CONTEXT, lowers, uppers, num_items, bvh_host);
     // create device-side BVH descriptor
     wp::BVH* bvh_device = (wp::BVH*)alloc_device(WP_CURRENT_CONTEXT, sizeof(wp::BVH));

warp/native/bvh.h CHANGED Viewed

@@ -417,6 +417,7 @@ CUDA_CALLABLE void bvh_rem_descriptor(uint64_t id);
 #if !__CUDA_ARCH__
+void bvh_create_host(vec3* lowers, vec3* uppers, int num_items, BVH& bvh);
 void bvh_destroy_host(wp::BVH& bvh);
 void bvh_refit_host(wp::BVH& bvh);

warp/native/clang/clang.cpp CHANGED Viewed

@@ -413,6 +413,8 @@ WP_API int load_obj(const char* object_file, const char* module_name)
             SYMBOL(memcpy), SYMBOL(memset), SYMBOL(memmove),
             SYMBOL(_wp_assert),
             SYMBOL(_wp_isfinite),
+            SYMBOL(_wp_isnan),
+            SYMBOL(_wp_isinf),
         #if defined(_WIN64)
             // For functions with large stack frames the compiler will emit a call to
             // __chkstk() to linearly touch each memory page. This grows the stack without
@@ -492,4 +494,3 @@ WP_API uint64_t lookup(const char* dll_name, const char* function_name)
 }  // extern "C"
 }  // namespace wp

warp/native/crt.cpp CHANGED Viewed

@@ -17,6 +17,16 @@ extern "C" WP_API int _wp_isfinite(double x)
     return std::isfinite(x);
 }
+extern "C" WP_API int _wp_isnan(double x)
+{
+    return std::isnan(x);
+}
+extern "C" WP_API int _wp_isinf(double x)
+{
+    return std::isinf(x);
+}
 extern "C" WP_API void _wp_assert(const char* expression, const char* file, unsigned int line)
 {
     fflush(stdout);
@@ -29,4 +39,4 @@ extern "C" WP_API void _wp_assert(const char* expression, const char* file, unsi
     // Now invoke the standard assert(), which may abort the program or break
     // into the debugger as decided by the runtime environment.
     assert(false && "assert() failed");
-}
+}

warp/native/crt.h CHANGED Viewed

@@ -38,6 +38,12 @@ extern "C" WP_API void _wp_assert(const char* message, const char* file, unsigne
 // Helper for implementing isfinite()
 extern "C" WP_API int _wp_isfinite(double);
+// Helper for implementing isnan()
+extern "C" WP_API int _wp_isnan(double);
+// Helper for implementing isinf()
+extern "C" WP_API int _wp_isinf(double);
 #endif  // !__CUDA_ARCH__
 #if !defined(WP_NO_CRT)
@@ -124,6 +130,7 @@ enum {
 #define INFINITY   ((float)(DBL_MAX * DBL_MAX))
 #define HUGE_VAL   ((double)INFINITY)
 #define HUGE_VALF  ((float)INFINITY)
+#define NAN        ((float)(0.0 / 0.0))
 /// stdint.h
 typedef signed char      int8_t;
@@ -320,6 +327,16 @@ inline bool isfinite(double x)
     return _wp_isfinite(x);
 }
+inline bool isnan(double x)
+{
+    return _wp_isnan(x);
+}
+inline bool isinf(double x)
+{
+    return _wp_isinf(x);
+}
 // assert.h
 #ifdef NDEBUG
     #define assert(expression) ((void)0)
@@ -332,4 +349,4 @@ inline bool isfinite(double x)
 #endif  // !__CUDACC__
-#endif // WP_NO_CRT
+#endif // WP_NO_CRT