PyPI - warp-lang - Versions diffs - 1.2.2__py3-none-win_amd64.whl → 1.3.1__py3-none-win_amd64.whl - Mend

warp-lang 1.2.2__py3-none-win_amd64.whl → 1.3.1__py3-none-win_amd64.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of warp-lang might be problematic. Click here for more details.

Files changed (194)

warp/__init__.py +8 -6
warp/autograd.py +823 -0
warp/bin/warp-clang.dll +0 -0
warp/bin/warp.dll +0 -0
warp/build.py +6 -2
warp/builtins.py +1412 -888
warp/codegen.py +503 -166
warp/config.py +48 -18
warp/context.py +400 -198
warp/dlpack.py +8 -0
warp/examples/assets/bunny.usd +0 -0
warp/examples/benchmarks/benchmark_cloth_warp.py +1 -1
warp/examples/benchmarks/benchmark_interop_torch.py +158 -0
warp/examples/benchmarks/benchmark_launches.py +1 -1
warp/examples/core/example_cupy.py +78 -0
warp/examples/fem/example_apic_fluid.py +17 -36
warp/examples/fem/example_burgers.py +9 -18
warp/examples/fem/example_convection_diffusion.py +7 -17
warp/examples/fem/example_convection_diffusion_dg.py +27 -47
warp/examples/fem/example_deformed_geometry.py +11 -22
warp/examples/fem/example_diffusion.py +7 -18
warp/examples/fem/example_diffusion_3d.py +24 -28
warp/examples/fem/example_diffusion_mgpu.py +7 -14
warp/examples/fem/example_magnetostatics.py +190 -0
warp/examples/fem/example_mixed_elasticity.py +111 -80
warp/examples/fem/example_navier_stokes.py +30 -34
warp/examples/fem/example_nonconforming_contact.py +290 -0
warp/examples/fem/example_stokes.py +17 -32
warp/examples/fem/example_stokes_transfer.py +12 -21
warp/examples/fem/example_streamlines.py +350 -0
warp/examples/fem/utils.py +936 -0
warp/fabric.py +5 -2
warp/fem/__init__.py +13 -3
warp/fem/cache.py +161 -11
warp/fem/dirichlet.py +37 -28
warp/fem/domain.py +105 -14
warp/fem/field/__init__.py +14 -3
warp/fem/field/field.py +454 -11
warp/fem/field/nodal_field.py +33 -18
warp/fem/geometry/deformed_geometry.py +50 -15
warp/fem/geometry/hexmesh.py +12 -24
warp/fem/geometry/nanogrid.py +106 -31
warp/fem/geometry/quadmesh_2d.py +6 -11
warp/fem/geometry/tetmesh.py +103 -61
warp/fem/geometry/trimesh_2d.py +98 -47
warp/fem/integrate.py +231 -186
warp/fem/operator.py +14 -9
warp/fem/quadrature/pic_quadrature.py +35 -9
warp/fem/quadrature/quadrature.py +119 -32
warp/fem/space/basis_space.py +98 -22
warp/fem/space/collocated_function_space.py +3 -1
warp/fem/space/function_space.py +7 -2
warp/fem/space/grid_2d_function_space.py +3 -3
warp/fem/space/grid_3d_function_space.py +4 -4
warp/fem/space/hexmesh_function_space.py +3 -2
warp/fem/space/nanogrid_function_space.py +12 -14
warp/fem/space/partition.py +45 -47
warp/fem/space/restriction.py +19 -16
warp/fem/space/shape/cube_shape_function.py +91 -3
warp/fem/space/shape/shape_function.py +7 -0
warp/fem/space/shape/square_shape_function.py +32 -0
warp/fem/space/shape/tet_shape_function.py +11 -7
warp/fem/space/shape/triangle_shape_function.py +10 -1
warp/fem/space/topology.py +116 -42
warp/fem/types.py +8 -1
warp/fem/utils.py +301 -83
warp/native/array.h +16 -0
warp/native/builtin.h +0 -15
warp/native/cuda_util.cpp +14 -6
warp/native/exports.h +1348 -1308
warp/native/quat.h +79 -0
warp/native/rand.h +27 -4
warp/native/sparse.cpp +83 -81
warp/native/sparse.cu +381 -453
warp/native/vec.h +64 -0
warp/native/volume.cpp +40 -49
warp/native/volume_builder.cu +2 -3
warp/native/volume_builder.h +12 -17
warp/native/warp.cu +3 -3
warp/native/warp.h +69 -59
warp/render/render_opengl.py +17 -9
warp/sim/articulation.py +117 -17
warp/sim/collide.py +35 -29
warp/sim/model.py +123 -18
warp/sim/render.py +3 -1
warp/sparse.py +867 -203
warp/stubs.py +312 -541
warp/tape.py +29 -1
warp/tests/disabled_kinematics.py +1 -1
warp/tests/test_adam.py +1 -1
warp/tests/test_arithmetic.py +1 -1
warp/tests/test_array.py +58 -1
warp/tests/test_array_reduce.py +1 -1
warp/tests/test_async.py +1 -1
warp/tests/test_atomic.py +1 -1
warp/tests/test_bool.py +1 -1
warp/tests/test_builtins_resolution.py +1 -1
warp/tests/test_bvh.py +6 -1
warp/tests/test_closest_point_edge_edge.py +1 -1
warp/tests/test_codegen.py +91 -1
warp/tests/test_compile_consts.py +1 -1
warp/tests/test_conditional.py +1 -1
warp/tests/test_copy.py +1 -1
warp/tests/test_ctypes.py +1 -1
warp/tests/test_dense.py +1 -1
warp/tests/test_devices.py +1 -1
warp/tests/test_dlpack.py +1 -1
warp/tests/test_examples.py +33 -4
warp/tests/test_fabricarray.py +5 -2
warp/tests/test_fast_math.py +1 -1
warp/tests/test_fem.py +213 -6
warp/tests/test_fp16.py +1 -1
warp/tests/test_func.py +1 -1
warp/tests/test_future_annotations.py +90 -0
warp/tests/test_generics.py +1 -1
warp/tests/test_grad.py +1 -1
warp/tests/test_grad_customs.py +1 -1
warp/tests/test_grad_debug.py +247 -0
warp/tests/test_hash_grid.py +6 -1
warp/tests/test_implicit_init.py +354 -0
warp/tests/test_import.py +1 -1
warp/tests/test_indexedarray.py +1 -1
warp/tests/test_intersect.py +1 -1
warp/tests/test_jax.py +1 -1
warp/tests/test_large.py +1 -1
warp/tests/test_launch.py +1 -1
warp/tests/test_lerp.py +1 -1
warp/tests/test_linear_solvers.py +1 -1
warp/tests/test_lvalue.py +1 -1
warp/tests/test_marching_cubes.py +5 -2
warp/tests/test_mat.py +34 -35
warp/tests/test_mat_lite.py +2 -1
warp/tests/test_mat_scalar_ops.py +1 -1
warp/tests/test_math.py +1 -1
warp/tests/test_matmul.py +20 -16
warp/tests/test_matmul_lite.py +1 -1
warp/tests/test_mempool.py +1 -1
warp/tests/test_mesh.py +5 -2
warp/tests/test_mesh_query_aabb.py +1 -1
warp/tests/test_mesh_query_point.py +1 -1
warp/tests/test_mesh_query_ray.py +1 -1
warp/tests/test_mlp.py +1 -1
warp/tests/test_model.py +1 -1
warp/tests/test_module_hashing.py +77 -1
warp/tests/test_modules_lite.py +1 -1
warp/tests/test_multigpu.py +1 -1
warp/tests/test_noise.py +1 -1
warp/tests/test_operators.py +1 -1
warp/tests/test_options.py +1 -1
warp/tests/test_overwrite.py +542 -0
warp/tests/test_peer.py +1 -1
warp/tests/test_pinned.py +1 -1
warp/tests/test_print.py +1 -1
warp/tests/test_quat.py +15 -1
warp/tests/test_rand.py +1 -1
warp/tests/test_reload.py +1 -1
warp/tests/test_rounding.py +1 -1
warp/tests/test_runlength_encode.py +1 -1
warp/tests/test_scalar_ops.py +95 -0
warp/tests/test_sim_grad.py +1 -1
warp/tests/test_sim_kinematics.py +1 -1
warp/tests/test_smoothstep.py +1 -1
warp/tests/test_sparse.py +82 -15
warp/tests/test_spatial.py +1 -1
warp/tests/test_special_values.py +2 -11
warp/tests/test_streams.py +11 -1
warp/tests/test_struct.py +1 -1
warp/tests/test_tape.py +1 -1
warp/tests/test_torch.py +194 -1
warp/tests/test_transient_module.py +1 -1
warp/tests/test_types.py +1 -1
warp/tests/test_utils.py +1 -1
warp/tests/test_vec.py +15 -63
warp/tests/test_vec_lite.py +2 -1
warp/tests/test_vec_scalar_ops.py +65 -1
warp/tests/test_verify_fp.py +1 -1
warp/tests/test_volume.py +28 -2
warp/tests/test_volume_write.py +1 -1
warp/tests/unittest_serial.py +1 -1
warp/tests/unittest_suites.py +9 -1
warp/tests/walkthrough_debug.py +1 -1
warp/thirdparty/unittest_parallel.py +2 -5
warp/torch.py +103 -41
warp/types.py +341 -224
warp/utils.py +11 -2
{warp_lang-1.2.2.dist-info → warp_lang-1.3.1.dist-info}/METADATA +99 -46
warp_lang-1.3.1.dist-info/RECORD +368 -0
warp/examples/fem/bsr_utils.py +0 -378
warp/examples/fem/mesh_utils.py +0 -133
warp/examples/fem/plot_utils.py +0 -292
warp_lang-1.2.2.dist-info/RECORD +0 -359
{warp_lang-1.2.2.dist-info → warp_lang-1.3.1.dist-info}/LICENSE.md +0 -0
{warp_lang-1.2.2.dist-info → warp_lang-1.3.1.dist-info}/WHEEL +0 -0
{warp_lang-1.2.2.dist-info → warp_lang-1.3.1.dist-info}/top_level.txt +0 -0

warp/dlpack.py CHANGED Viewed

@@ -60,10 +60,18 @@ PyCapsule_SetName.restype = ctypes.c_int
 class _DLPackTensorHolder:
     """Class responsible for deleting DLManagedTensor memory after ownership is transferred from a capsule."""
+    def __new__(cls, *args, **kwargs):
+        instance = super(_DLPackTensorHolder, cls).__new__(cls)
+        instance.mem_ptr = None
+        return instance
     def __init__(self, mem_ptr):
         self.mem_ptr = mem_ptr
     def __del__(self):
+        if not self.mem_ptr:
+            return
         managed_tensor = DLManagedTensor.from_address(self.mem_ptr)
         if managed_tensor.deleter:
             managed_tensor.deleter(self.mem_ptr)

warp/examples/assets/bunny.usd CHANGED Viewed

Binary file

warp/examples/benchmarks/benchmark_cloth_warp.py CHANGED Viewed

@@ -7,7 +7,7 @@
 import warp as wp
-wp.build.clear_kernel_cache()
+wp.clear_kernel_cache()
 @wp.kernel

warp/examples/benchmarks/benchmark_interop_torch.py ADDED Viewed

@@ -0,0 +1,158 @@
+# Copyright (c) 2024 NVIDIA CORPORATION.  All rights reserved.
+# NVIDIA CORPORATION and its licensors retain all intellectual property
+# and proprietary rights in and to this software, related documentation
+# and any modifications thereto.  Any use, reproduction, disclosure or
+# distribution of this software and related documentation without an express
+# license agreement from NVIDIA CORPORATION is strictly prohibited.
+import time
+import torch
+import warp as wp
+def create_simple_kernel(dtype):
+    def simple_kernel(
+        a: wp.array(dtype=dtype),
+        b: wp.array(dtype=dtype),
+        c: wp.array(dtype=dtype),
+        d: wp.array(dtype=dtype),
+        e: wp.array(dtype=dtype),
+    ):
+        pass
+    return wp.Kernel(simple_kernel)
+def test_from_torch(kernel, num_iters, array_size, device, warp_dtype=None):
+    warp_device = wp.get_device(device)
+    torch_device = wp.device_to_torch(warp_device)
+    if hasattr(warp_dtype, "_shape_"):
+        torch_shape = (array_size, *warp_dtype._shape_)
+        torch_dtype = wp.dtype_to_torch(warp_dtype._wp_scalar_type_)
+    else:
+        torch_shape = (array_size,)
+        torch_dtype = torch.float32 if warp_dtype is None else wp.dtype_to_torch(warp_dtype)
+    _a = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _b = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _c = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _d = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _e = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    wp.synchronize()
+    # profiler = Profiler(interval=0.000001)
+    # profiler.start()
+    t1 = time.time_ns()
+    for _ in range(num_iters):
+        a = wp.from_torch(_a, dtype=warp_dtype)
+        b = wp.from_torch(_b, dtype=warp_dtype)
+        c = wp.from_torch(_c, dtype=warp_dtype)
+        d = wp.from_torch(_d, dtype=warp_dtype)
+        e = wp.from_torch(_e, dtype=warp_dtype)
+        wp.launch(kernel, dim=array_size, inputs=[a, b, c, d, e])
+    t2 = time.time_ns()
+    print(f"{(t2 - t1) / 1_000_000 :8.0f} ms  from_torch(...)")
+    # profiler.stop()
+    # profiler.print()
+def test_array_ctype_from_torch(kernel, num_iters, array_size, device, warp_dtype=None):
+    warp_device = wp.get_device(device)
+    torch_device = wp.device_to_torch(warp_device)
+    if hasattr(warp_dtype, "_shape_"):
+        torch_shape = (array_size, *warp_dtype._shape_)
+        torch_dtype = wp.dtype_to_torch(warp_dtype._wp_scalar_type_)
+    else:
+        torch_shape = (array_size,)
+        torch_dtype = torch.float32 if warp_dtype is None else wp.dtype_to_torch(warp_dtype)
+    _a = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _b = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _c = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _d = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _e = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    wp.synchronize()
+    # profiler = Profiler(interval=0.000001)
+    # profiler.start()
+    t1 = time.time_ns()
+    for _ in range(num_iters):
+        a = wp.from_torch(_a, dtype=warp_dtype, return_ctype=True)
+        b = wp.from_torch(_b, dtype=warp_dtype, return_ctype=True)
+        c = wp.from_torch(_c, dtype=warp_dtype, return_ctype=True)
+        d = wp.from_torch(_d, dtype=warp_dtype, return_ctype=True)
+        e = wp.from_torch(_e, dtype=warp_dtype, return_ctype=True)
+        wp.launch(kernel, dim=array_size, inputs=[a, b, c, d, e])
+    t2 = time.time_ns()
+    print(f"{(t2 - t1) / 1_000_000 :8.0f} ms  from_torch(..., return_ctype=True)")
+    # profiler.stop()
+    # profiler.print()
+def test_direct_from_torch(kernel, num_iters, array_size, device, warp_dtype=None):
+    warp_device = wp.get_device(device)
+    torch_device = wp.device_to_torch(warp_device)
+    if hasattr(warp_dtype, "_shape_"):
+        torch_shape = (array_size, *warp_dtype._shape_)
+        torch_dtype = wp.dtype_to_torch(warp_dtype._wp_scalar_type_)
+    else:
+        torch_shape = (array_size,)
+        torch_dtype = torch.float32 if warp_dtype is None else wp.dtype_to_torch(warp_dtype)
+    _a = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _b = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _c = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _d = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    _e = torch.zeros(torch_shape, dtype=torch_dtype, device=torch_device)
+    wp.synchronize()
+    # profiler = Profiler(interval=0.000001)
+    # profiler.start()
+    t1 = time.time_ns()
+    for _ in range(num_iters):
+        wp.launch(kernel, dim=array_size, inputs=[_a, _b, _c, _d, _e])
+    t2 = time.time_ns()
+    print(f"{(t2 - t1) / 1_000_000 :8.0f} ms  direct from torch")
+    # profiler.stop()
+    # profiler.print()
+wp.init()
+params = [
+    # (warp_dtype arg, kernel)
+    (None, create_simple_kernel(wp.float32)),
+    (wp.float32, create_simple_kernel(wp.float32)),
+    (wp.vec3f, create_simple_kernel(wp.vec3f)),
+    (wp.mat22f, create_simple_kernel(wp.mat22f)),
+]
+wp.load_module()
+num_iters = 100000
+for warp_dtype, kernel in params:
+    print(f"\ndtype={wp.context.type_str(warp_dtype)}")
+    test_from_torch(kernel, num_iters, 10, "cuda:0", warp_dtype=warp_dtype)
+    test_array_ctype_from_torch(kernel, num_iters, 10, "cuda:0", warp_dtype=warp_dtype)
+    test_direct_from_torch(kernel, num_iters, 10, "cuda:0", warp_dtype=warp_dtype)

warp/examples/benchmarks/benchmark_launches.py CHANGED Viewed

@@ -128,7 +128,7 @@ def ksz(s: Sz):
     tid = wp.tid()  # noqa: F841
-wp.build.clear_kernel_cache()
+wp.clear_kernel_cache()
 devices = wp.get_devices()
 num_launches = 100000

warp/examples/core/example_cupy.py ADDED Viewed

@@ -0,0 +1,78 @@
+# Copyright (c) 2024 NVIDIA CORPORATION.  All rights reserved.
+# NVIDIA CORPORATION and its licensors retain all intellectual property
+# and proprietary rights in and to this software, related documentation
+# and any modifications thereto.  Any use, reproduction, disclosure or
+# distribution of this software and related documentation without an express
+# license agreement from NVIDIA CORPORATION is strictly prohibited.
+###########################################################################
+# Example CuPy
+#
+# The example demonstrates interoperability with CuPy on CUDA devices
+# and NumPy on CPU devices.
+###########################################################################
+import warp as wp
+@wp.kernel
+def saxpy(x: wp.array(dtype=float), y: wp.array(dtype=float), a: float):
+    i = wp.tid()
+    y[i] = a * x[i] + y[i]
+class Example:
+    def __init__(self):
+        device = wp.get_device()
+        self.n = 10
+        self.a = 1.0
+        if device.is_cuda:
+            # use CuPy arrays on CUDA devices
+            import cupy as cp
+            print(f"Using CuPy on device {device}")
+            # tell CuPy to use the same device
+            with cp.cuda.Device(device.ordinal):
+                self.x = cp.arange(self.n, dtype=cp.float32)
+                self.y = cp.ones(self.n, dtype=cp.float32)
+        else:
+            # use NumPy arrays on CPU
+            import numpy as np
+            print("Using NumPy on CPU")
+            self.x = np.arange(self.n, dtype=np.float32)
+            self.y = np.ones(self.n, dtype=np.float32)
+    def step(self):
+        # Launch a Warp kernel on the pre-allocated arrays.
+        # When running on a CUDA device, these are CuPy arrays.
+        # When running on the CPU, these are NumPy arrays.
+        #
+        # Note that the arrays can be passed to Warp kernels directly.  Under the hood,
+        # Warp uses the __cuda_array_interface__ and __array_interface__ protocols to
+        # access the data.
+        wp.launch(saxpy, dim=self.n, inputs=[self.x, self.y, self.a])
+    def render(self):
+        print(self.y)
+if __name__ == "__main__":
+    import argparse
+    parser = argparse.ArgumentParser(formatter_class=argparse.ArgumentDefaultsHelpFormatter)
+    parser.add_argument("--device", type=str, default=None, help="Override the default Warp device.")
+    parser.add_argument("--num_frames", type=int, default=10, help="Total number of frames.")
+    args = parser.parse_known_args()[0]
+    with wp.ScopedDevice(args.device):
+        example = Example()
+        for _ in range(args.num_frames):
+            example.step()
+            example.render()

warp/examples/fem/example_apic_fluid.py CHANGED Viewed

@@ -15,17 +15,13 @@
 import numpy as np
 import warp as wp
+import warp.examples.fem.utils as fem_example_utils
 import warp.fem as fem
 import warp.sim.render
 from warp.fem import Domain, Field, Sample, at_node, div, grad, integrand
 from warp.sim import Model, State
 from warp.sparse import BsrMatrix, bsr_mm, bsr_mv, bsr_transposed
-try:
-    from .bsr_utils import bsr_cg
-except ImportError:
-    from bsr_utils import bsr_cg
 @wp.func
 def collision_sdf(x: wp.vec3):
@@ -130,7 +126,7 @@ def scale_transposed_divergence_mat(
     tr_divergence_mat_values: wp.array(dtype=wp.mat(shape=(3, 1), dtype=float)),
     inv_fraction_int: wp.array(dtype=float),
 ):
-    # In-place scaling of gradient operator rows wiht inverse mass
+    # In-place scaling of gradient operator rows with inverse mass
     u_i = wp.tid()
     block_beg = tr_divergence_mat_offsets[u_i]
@@ -140,22 +136,24 @@ def scale_transposed_divergence_mat(
         tr_divergence_mat_values[b] = tr_divergence_mat_values[b] * inv_fraction_int[u_i]
-@wp.kernel
-def compute_particle_ijk(positions: wp.array(dtype=wp.vec3), voxel_size: float, ijks: wp.array(dtype=wp.vec3i)):
-    # Index-space coordinates of grid cell containing each particle
-    p = wp.tid()
-    pos = positions[p] / voxel_size
-    ijks[p] = wp.vec3i(int(wp.floor(pos[0])), int(wp.floor(pos[1])), int(wp.floor(pos[2])))
-def solve_incompressibility(divergence_mat: BsrMatrix, inv_volume, pressure, velocity, quiet: bool = False):
+def solve_incompressibility(
+    divergence_mat: BsrMatrix, dirichlet_projector: BsrMatrix, inv_volume, pressure, velocity, quiet: bool = False
+):
     """Solve for divergence-free velocity delta:
     delta_velocity = inv_volume * transpose(divergence_mat) * pressure
     divergence_mat * (velocity + delta_velocity) = 0
+    dirichlet_projector * delta_velocity = 0
     """
+    # Constraint-free divergence -- computed *before* projection of divergence_mat
+    rhs = wp.empty_like(pressure)
+    bsr_mv(A=divergence_mat, x=velocity, y=rhs, alpha=-1.0)
+    # Project matrix to enforce boundary conditions
+    # divergence_matrix -= divergence_matrix * vel_projector
+    bsr_mm(alpha=-1.0, x=divergence_mat, y=dirichlet_projector, z=divergence_mat, beta=1.0)
     # Build transposed gradient matrix, scale with inverse fraction
     transposed_divergence_mat = bsr_transposed(divergence_mat)
     wp.launch(
@@ -171,9 +169,7 @@ def solve_incompressibility(divergence_mat: BsrMatrix, inv_volume, pressure, vel
     # For simplicity, assemble Schur complement and solve with CG
     schur = bsr_mm(divergence_mat, transposed_divergence_mat)
-    rhs = wp.zeros_like(pressure)
-    bsr_mv(A=divergence_mat, x=velocity, y=rhs, alpha=-1.0, beta=0.0)
-    bsr_cg(schur, b=rhs, x=pressure, quiet=quiet, tol=1.0e-6)
+    fem_example_utils.bsr_cg(schur, b=rhs, x=pressure, quiet=quiet, tol=1.0e-6)
     # Apply pressure to velocity
     bsr_mv(A=transposed_divergence_mat, x=pressure, y=velocity, alpha=1.0, beta=1.0)
@@ -249,23 +245,11 @@ class Example:
         self.current_frame = self.current_frame + 1
-        particle_ijk = wp.empty(self.state_0.particle_count, dtype=wp.vec3i)
         with wp.ScopedTimer(f"simulate frame {self.current_frame}", active=True):
             for _s in range(self.sim_substeps):
-                # Compute the voxel coordinates for each particle.
-                # `Volume.allocate_by_voxels` accepts world positions, but allocates
-                # the voxels with the closest origin rather than the enclosing ones
-                # (i.e, it "round"s the positions, while here we eant to "floor" it)
-                wp.launch(
-                    compute_particle_ijk,
-                    dim=particle_ijk.shape,
-                    inputs=[self.state_0.particle_q, self.voxel_size, particle_ijk],
-                )
                 # Allocate the voxels and create the warp.fem geometry
                 volume = wp.Volume.allocate_by_voxels(
-                    voxel_points=particle_ijk,
+                    voxel_points=self.state_0.particle_q,
                     voxel_size=self.voxel_size,
                 )
                 grid = fem.Nanogrid(volume)
@@ -354,13 +338,10 @@ class Example:
                     output_dtype=float,
                 )
-                # Project matrix to enforce boundary conditions
-                # divergence_matrix -= divergence_matrix * vel_projector
-                bsr_mm(alpha=-1.0, x=divergence_matrix, y=vel_projector, z=divergence_matrix, beta=1.0)
                 # Solve unilateral incompressibility
                 solve_incompressibility(
                     divergence_matrix,
+                    vel_projector,
                     inv_volume,
                     pressure_field.dof_values,
                     velocity_field.dof_values,

warp/examples/fem/example_burgers.py CHANGED Viewed

@@ -16,17 +16,8 @@
 ###########################################################################
 import warp as wp
+import warp.examples.fem.utils as fem_example_utils
 import warp.fem as fem
-import warp.sparse as sp
-# Import example utilities
-# Make sure that works both when imported as module and run as standalone file
-try:
-    from .bsr_utils import invert_diagonal_bsr_mass_matrix
-    from .plot_utils import Plot
-except ImportError:
-    from bsr_utils import invert_diagonal_bsr_mass_matrix
-    from plot_utils import Plot
 @fem.integrand
@@ -97,7 +88,7 @@ def slope_limiter(domain: fem.Domain, s: fem.Sample, u: fem.Field, dx: wp.vec2):
     # Assumes regular grid topology
     center_coords = fem.Coords(0.5, 0.5, 0.0)
-    cell_center = fem.types.make_free_sample(s.element_index, center_coords)
+    cell_center = fem.make_free_sample(s.element_index, center_coords)
     center_pos = domain(cell_center)
     u_center = u(cell_center)
@@ -149,19 +140,19 @@ class Example:
         matrix_inertia = fem.integrate(
             vel_mass_form, fields={"u": trial, "v": self._test}, output_dtype=wp.float32, nodal=True
         )
-        self._inv_mass_matrix = sp.bsr_copy(matrix_inertia)
-        invert_diagonal_bsr_mass_matrix(self._inv_mass_matrix)
+        self._inv_mass_matrix = wp.sparse.bsr_copy(matrix_inertia)
+        fem_example_utils.invert_diagonal_bsr_matrix(self._inv_mass_matrix)
         # Initial condition
         self.velocity_field = vector_space.make_field()
         fem.interpolate(initial_condition, dest=self.velocity_field)
-        # Velocity nor field -- for visualization purposes
+        # Velocity norm field -- for visualization purposes
         self.velocity_norm_field = scalar_space.make_field()
         fem.interpolate(velocity_norm, dest=self.velocity_norm_field, fields={"u": self.velocity_field})
-        self.renderer = Plot()
-        self.renderer.add_surface("u_norm", self.velocity_norm_field)
+        self.renderer = fem_example_utils.Plot()
+        self.renderer.add_field("u_norm", self.velocity_norm_field)
     def _velocity_delta(self, trial_velocity):
         # Integration on sides
@@ -186,7 +177,7 @@ class Example:
                 alpha=1.0,
                 beta=1.0,
             )
-        return sp.bsr_mv(self._inv_mass_matrix, rhs)
+        return self._inv_mass_matrix @ rhs
     def step(self):
         self.current_frame += 1
@@ -223,7 +214,7 @@ class Example:
     def render(self):
         self.renderer.begin_frame(time=self.current_frame * self.sim_dt)
-        self.renderer.add_surface("u_norm", self.velocity_norm_field)
+        self.renderer.add_field("u_norm", self.velocity_norm_field)
         self.renderer.end_frame()

warp/examples/fem/example_convection_diffusion.py CHANGED Viewed

@@ -15,19 +15,9 @@
 ###########################################################################
 import warp as wp
+import warp.examples.fem.utils as fem_example_utils
 import warp.fem as fem
-# Import example utilities
-# Make sure that works both when imported as module and run as standalone file
-try:
-    from .bsr_utils import bsr_cg
-    from .mesh_utils import gen_trimesh
-    from .plot_utils import Plot
-except ImportError:
-    from bsr_utils import bsr_cg
-    from mesh_utils import gen_trimesh
-    from plot_utils import Plot
 @fem.integrand
 def initial_condition(domain: fem.Domain, s: fem.Sample):
@@ -94,8 +84,8 @@ class Example:
         self.current_frame = 0
         if tri_mesh:
-            positions, tri_vidx = gen_trimesh(res=wp.vec2i(res))
-            geo = fem.Trimesh2D(tri_vertex_indices=tri_vidx, positions=positions)
+            positions, tri_vidx = fem_example_utils.gen_trimesh(res=wp.vec2i(res))
+            geo = fem.Trimesh2D(tri_vertex_indices=tri_vidx, positions=positions, build_bvh=True)
         else:
             geo = fem.Grid2D(res=wp.vec2i(res))
@@ -116,8 +106,8 @@ class Example:
             output_dtype=float,
         )
-        self.renderer = Plot()
-        self.renderer.add_surface("phi", self._phi_field)
+        self.renderer = fem_example_utils.Plot()
+        self.renderer.add_field("phi", self._phi_field)
     def step(self):
         self.current_frame += 1
@@ -131,11 +121,11 @@ class Example:
         )
         # Solve linear system
-        bsr_cg(self._matrix, x=self._phi_field.dof_values, b=rhs, quiet=self._quiet, tol=1.0e-12)
+        fem_example_utils.bsr_cg(self._matrix, x=self._phi_field.dof_values, b=rhs, quiet=self._quiet, tol=1.0e-12)
     def render(self):
         self.renderer.begin_frame(time=self.current_frame * self.sim_dt)
-        self.renderer.add_surface("phi", self._phi_field)
+        self.renderer.add_field("phi", self._phi_field)
         self.renderer.end_frame()

warp/examples/fem/example_convection_diffusion_dg.py CHANGED Viewed

@@ -15,31 +15,14 @@
 ###########################################################################
 import warp as wp
+import warp.examples.fem.utils as fem_example_utils
 import warp.fem as fem
-from warp.sparse import bsr_axpy
-# Import example utilities
-# Make sure that works both when imported as module and run as standalone file
-try:
-    from .bsr_utils import bsr_cg
-    from .example_convection_diffusion import (
-        diffusion_form,
-        inertia_form,
-        initial_condition,
-        velocity,
-    )
-    from .mesh_utils import gen_quadmesh, gen_trimesh
-    from .plot_utils import Plot
-except ImportError:
-    from bsr_utils import bsr_cg
-    from example_convection_diffusion import (
-        diffusion_form,
-        inertia_form,
-        initial_condition,
-        velocity,
-    )
-    from mesh_utils import gen_quadmesh, gen_trimesh
-    from plot_utils import Plot
+from warp.examples.fem.example_convection_diffusion import (
+    diffusion_form,
+    inertia_form,
+    initial_condition,
+    velocity,
+)
 # Standard transport term, on cells' interior
@@ -58,6 +41,10 @@ def upwind_transport_form(s: fem.Sample, domain: fem.Domain, phi: fem.Field, psi
     vel = velocity(pos, ang_vel)
     vel_n = wp.dot(vel, fem.normal(domain, s))
+    if wp.min(pos) <= 0.0 or wp.max(pos) >= 1.0:  # boundary side
+        return phi(s) * (-psi(s) * vel_n + 0.5 * psi(s) * wp.abs(vel_n))
+    # interior side
     return fem.jump(phi, s) * (-fem.average(psi, s) * vel_n + 0.5 * fem.jump(psi, s) * wp.abs(vel_n))
@@ -79,7 +66,7 @@ def sip_diffusion_form(
 class Example:
-    def __init__(self, quiet=False, degree=2, resolution=50, mesh="grid", viscosity=0.001, ang_vel=1.0):
+    def __init__(self, quiet=False, degree=2, resolution=50, mesh="grid", viscosity=0.0001, ang_vel=1.0):
         self._quiet = quiet
         res = resolution
@@ -87,10 +74,10 @@ class Example:
         self.current_frame = 0
         if mesh == "tri":
-            positions, tri_vidx = gen_trimesh(res=wp.vec2i(resolution))
+            positions, tri_vidx = fem_example_utils.gen_trimesh(res=wp.vec2i(resolution))
             geo = fem.Trimesh2D(tri_vertex_indices=tri_vidx, positions=positions)
         elif mesh == "quad":
-            positions, quad_vidx = gen_quadmesh(res=wp.vec2i(resolution))
+            positions, quad_vidx = fem_example_utils.gen_quadmesh(res=wp.vec2i(resolution))
             geo = fem.Quadmesh2D(quad_vertex_indices=quad_vidx, positions=positions)
         else:
             geo = fem.Grid2D(res=wp.vec2i(resolution))
@@ -124,37 +111,30 @@ class Example:
         side_test = fem.make_test(space=scalar_space, domain=sides)
         side_trial = fem.make_trial(space=scalar_space, domain=sides)
-        bsr_axpy(
-            fem.integrate(
-                upwind_transport_form,
-                fields={"phi": side_trial, "psi": side_test},
-                values={"ang_vel": ang_vel},
-            ),
-            y=matrix_transport,
+        matrix_transport += fem.integrate(
+            upwind_transport_form,
+            fields={"phi": side_trial, "psi": side_test},
+            values={"ang_vel": ang_vel},
         )
         matrix_diffusion = fem.integrate(
             diffusion_form,
             fields={"u": trial, "v": self._test},
         )
-        bsr_axpy(
-            fem.integrate(
-                sip_diffusion_form,
-                fields={"phi": side_trial, "psi": side_test},
-            ),
-            y=matrix_diffusion,
+        matrix_diffusion += fem.integrate(
+            sip_diffusion_form,
+            fields={"phi": side_trial, "psi": side_test},
         )
-        self._matrix = matrix_inertia
-        bsr_axpy(x=matrix_transport, y=self._matrix)
-        bsr_axpy(x=matrix_diffusion, y=self._matrix, alpha=viscosity)
+        self._matrix = matrix_inertia + matrix_transport + viscosity * matrix_diffusion
         # Initial condition
         self._phi_field = scalar_space.make_field()
         fem.interpolate(initial_condition, dest=self._phi_field)
-        self.renderer = Plot()
-        self.renderer.add_surface("phi", self._phi_field)
+        self.renderer = fem_example_utils.Plot()
+        self.renderer.add_field("phi", self._phi_field)
     def step(self):
         self.current_frame += 1
@@ -166,13 +146,13 @@ class Example:
         )
         phi = wp.zeros_like(rhs)
-        bsr_cg(self._matrix, b=rhs, x=phi, method="bicgstab", quiet=self._quiet)
+        fem_example_utils.bsr_cg(self._matrix, b=rhs, x=phi, method="bicgstab", quiet=self._quiet)
         wp.utils.array_cast(in_array=phi, out_array=self._phi_field.dof_values)
     def render(self):
         self.renderer.begin_frame(time=self.current_frame * self.sim_dt)
-        self.renderer.add_surface("phi", self._phi_field)
+        self.renderer.add_field("phi", self._phi_field)
         self.renderer.end_frame()