PyPI - warp-lang - Versions diffs - 0.9.0__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl - Mend

warp-lang 0.9.0__py3-none-win_amd64.whl → 0.11.0__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of warp-lang might be problematic. Click here for more details.

Files changed (315) hide show

warp/__init__.py +15 -7
warp/__init__.pyi +1 -0
warp/bin/warp-clang.dll +0 -0
warp/bin/warp.dll +0 -0
warp/build.py +22 -443
warp/build_dll.py +384 -0
warp/builtins.py +998 -488
warp/codegen.py +1307 -739
warp/config.py +5 -3
warp/constants.py +6 -0
warp/context.py +1291 -548
warp/dlpack.py +31 -31
warp/fabric.py +326 -0
warp/fem/__init__.py +27 -0
warp/fem/cache.py +389 -0
warp/fem/dirichlet.py +181 -0
warp/fem/domain.py +263 -0
warp/fem/field/__init__.py +101 -0
warp/fem/field/field.py +149 -0
warp/fem/field/nodal_field.py +299 -0
warp/fem/field/restriction.py +21 -0
warp/fem/field/test.py +181 -0
warp/fem/field/trial.py +183 -0
warp/fem/geometry/__init__.py +19 -0
warp/fem/geometry/closest_point.py +70 -0
warp/fem/geometry/deformed_geometry.py +271 -0
warp/fem/geometry/element.py +744 -0
warp/fem/geometry/geometry.py +186 -0
warp/fem/geometry/grid_2d.py +373 -0
warp/fem/geometry/grid_3d.py +435 -0
warp/fem/geometry/hexmesh.py +953 -0
warp/fem/geometry/partition.py +376 -0
warp/fem/geometry/quadmesh_2d.py +532 -0
warp/fem/geometry/tetmesh.py +840 -0
warp/fem/geometry/trimesh_2d.py +577 -0
warp/fem/integrate.py +1616 -0
warp/fem/operator.py +191 -0
warp/fem/polynomial.py +213 -0
warp/fem/quadrature/__init__.py +2 -0
warp/fem/quadrature/pic_quadrature.py +245 -0
warp/fem/quadrature/quadrature.py +294 -0
warp/fem/space/__init__.py +292 -0
warp/fem/space/basis_space.py +489 -0
warp/fem/space/collocated_function_space.py +105 -0
warp/fem/space/dof_mapper.py +236 -0
warp/fem/space/function_space.py +145 -0
warp/fem/space/grid_2d_function_space.py +267 -0
warp/fem/space/grid_3d_function_space.py +306 -0
warp/fem/space/hexmesh_function_space.py +352 -0
warp/fem/space/partition.py +350 -0
warp/fem/space/quadmesh_2d_function_space.py +369 -0
warp/fem/space/restriction.py +160 -0
warp/fem/space/shape/__init__.py +15 -0
warp/fem/space/shape/cube_shape_function.py +738 -0
warp/fem/space/shape/shape_function.py +103 -0
warp/fem/space/shape/square_shape_function.py +611 -0
warp/fem/space/shape/tet_shape_function.py +567 -0
warp/fem/space/shape/triangle_shape_function.py +429 -0
warp/fem/space/tetmesh_function_space.py +292 -0
warp/fem/space/topology.py +295 -0
warp/fem/space/trimesh_2d_function_space.py +221 -0
warp/fem/types.py +77 -0
warp/fem/utils.py +495 -0
warp/native/array.h +164 -55
warp/native/builtin.h +150 -174
warp/native/bvh.cpp +75 -328
warp/native/bvh.cu +406 -23
warp/native/bvh.h +37 -45
warp/native/clang/clang.cpp +136 -24
warp/native/crt.cpp +1 -76
warp/native/crt.h +111 -104
warp/native/cuda_crt.h +1049 -0
warp/native/cuda_util.cpp +15 -3
warp/native/cuda_util.h +3 -1
warp/native/cutlass/tools/library/scripts/conv2d_operation.py +463 -0
warp/native/cutlass/tools/library/scripts/conv3d_operation.py +321 -0
warp/native/cutlass/tools/library/scripts/gemm_operation.py +988 -0
warp/native/cutlass/tools/library/scripts/generator.py +4625 -0
warp/native/cutlass/tools/library/scripts/library.py +799 -0
warp/native/cutlass/tools/library/scripts/manifest.py +402 -0
warp/native/cutlass/tools/library/scripts/pycutlass/docs/source/conf.py +96 -0
warp/native/cutlass/tools/library/scripts/pycutlass/profile/conv/conv2d_f16_sm80.py +106 -0
warp/native/cutlass/tools/library/scripts/pycutlass/profile/gemm/gemm_f32_sm80.py +91 -0
warp/native/cutlass/tools/library/scripts/pycutlass/setup.py +80 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/__init__.py +48 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/arguments.py +118 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/c_types.py +241 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/compiler.py +432 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/conv2d_operation.py +631 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/epilogue.py +1026 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/frontend.py +104 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/gemm_operation.py +1276 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/library.py +744 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/memory_manager.py +74 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/operation.py +110 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/parser.py +619 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/reduction_operation.py +398 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/tensor_ref.py +70 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/__init__.py +4 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/conv2d_testbed.py +646 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_grouped_testbed.py +235 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/gemm_testbed.py +557 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/test/profiler.py +70 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/type_hint.py +39 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/__init__.py +1 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/device.py +76 -0
warp/native/cutlass/tools/library/scripts/pycutlass/src/pycutlass/utils/reference_model.py +255 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/__init__.py +0 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +201 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +177 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +98 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_dgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +95 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_few_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +163 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_fixed_channels_f16nhwc_f16nhwc_f16nhwc_tensor_op_f32_sm80.py +187 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +309 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +54 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_fprop_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +253 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.py +97 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.py +242 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_f32nhwc_f32nhwc_f32nhwc_simt_f32_sm80.py +96 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/conv2d_wgrad_implicit_gemm_tf32nhwc_tf32nhwc_f32nhwc_tensor_op_f32_sm80.py +107 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/conv/run_all_tests.py +10 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/frontend/test_frontend.py +146 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/__init__.py +0 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_bf16_sm80.py +96 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f16_sm80.py +447 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f32_sm80.py +146 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_f64_sm80.py +102 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_grouped_sm80.py +203 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/gemm_s8_sm80.py +229 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/gemm/run_all_tests.py +9 -0
warp/native/cutlass/tools/library/scripts/pycutlass/test/unit/test_sm80.py +453 -0
warp/native/cutlass/tools/library/scripts/rank_2k_operation.py +398 -0
warp/native/cutlass/tools/library/scripts/rank_k_operation.py +387 -0
warp/native/cutlass/tools/library/scripts/rt.py +796 -0
warp/native/cutlass/tools/library/scripts/symm_operation.py +400 -0
warp/native/cutlass/tools/library/scripts/trmm_operation.py +407 -0
warp/native/cutlass_gemm.cu +5 -3
warp/native/exports.h +1240 -949
warp/native/fabric.h +228 -0
warp/native/hashgrid.cpp +4 -4
warp/native/hashgrid.h +22 -2
warp/native/initializer_array.h +2 -2
warp/native/intersect.h +22 -7
warp/native/intersect_adj.h +8 -8
warp/native/intersect_tri.h +13 -16
warp/native/marching.cu +157 -161
warp/native/mat.h +119 -19
warp/native/matnn.h +2 -2
warp/native/mesh.cpp +108 -83
warp/native/mesh.cu +243 -6
warp/native/mesh.h +1547 -458
warp/native/nanovdb/NanoVDB.h +1 -1
warp/native/noise.h +272 -329
warp/native/quat.h +51 -8
warp/native/rand.h +45 -35
warp/native/range.h +6 -2
warp/native/reduce.cpp +157 -0
warp/native/reduce.cu +348 -0
warp/native/runlength_encode.cpp +62 -0
warp/native/runlength_encode.cu +46 -0
warp/native/scan.cu +11 -13
warp/native/scan.h +1 -0
warp/native/solid_angle.h +442 -0
warp/native/sort.cpp +13 -0
warp/native/sort.cu +9 -1
warp/native/sparse.cpp +338 -0
warp/native/sparse.cu +545 -0
warp/native/spatial.h +2 -2
warp/native/temp_buffer.h +30 -0
warp/native/vec.h +126 -24
warp/native/volume.h +120 -0
warp/native/warp.cpp +658 -53
warp/native/warp.cu +660 -68
warp/native/warp.h +112 -12
warp/optim/__init__.py +1 -0
warp/optim/linear.py +922 -0
warp/optim/sgd.py +92 -0
warp/render/render_opengl.py +392 -152
warp/render/render_usd.py +11 -11
warp/sim/__init__.py +2 -2
warp/sim/articulation.py +385 -185
warp/sim/collide.py +21 -8
warp/sim/import_mjcf.py +297 -106
warp/sim/import_urdf.py +389 -210
warp/sim/import_usd.py +198 -97
warp/sim/inertia.py +17 -18
warp/sim/integrator_euler.py +14 -8
warp/sim/integrator_xpbd.py +161 -19
warp/sim/model.py +795 -291
warp/sim/optimizer.py +2 -6
warp/sim/render.py +65 -3
warp/sim/utils.py +3 -0
warp/sparse.py +1227 -0
warp/stubs.py +665 -223
warp/tape.py +66 -15
warp/tests/__main__.py +3 -6
warp/tests/assets/curlnoise_golden.npy +0 -0
warp/tests/assets/pnoise_golden.npy +0 -0
warp/tests/assets/torus.usda +105 -105
warp/tests/{test_class_kernel.py → aux_test_class_kernel.py} +9 -1
warp/tests/aux_test_conditional_unequal_types_kernels.py +21 -0
warp/tests/{test_dependent.py → aux_test_dependent.py} +2 -2
warp/tests/{test_reference.py → aux_test_reference.py} +1 -1
warp/tests/aux_test_unresolved_func.py +14 -0
warp/tests/aux_test_unresolved_symbol.py +14 -0
warp/tests/disabled_kinematics.py +239 -0
warp/tests/run_coverage_serial.py +31 -0
warp/tests/test_adam.py +103 -106
warp/tests/test_arithmetic.py +128 -74
warp/tests/test_array.py +1497 -211
warp/tests/test_array_reduce.py +150 -0
warp/tests/test_atomic.py +64 -28
warp/tests/test_bool.py +99 -0
warp/tests/test_builtins_resolution.py +1292 -0
warp/tests/test_bvh.py +75 -43
warp/tests/test_closest_point_edge_edge.py +54 -57
warp/tests/test_codegen.py +233 -128
warp/tests/test_compile_consts.py +28 -20
warp/tests/test_conditional.py +108 -24
warp/tests/test_copy.py +10 -12
warp/tests/test_ctypes.py +112 -88
warp/tests/test_dense.py +21 -14
warp/tests/test_devices.py +98 -0
warp/tests/test_dlpack.py +136 -108
warp/tests/test_examples.py +277 -0
warp/tests/test_fabricarray.py +955 -0
warp/tests/test_fast_math.py +15 -11
warp/tests/test_fem.py +1271 -0
warp/tests/test_fp16.py +53 -19
warp/tests/test_func.py +187 -74
warp/tests/test_generics.py +194 -49
warp/tests/test_grad.py +180 -116
warp/tests/test_grad_customs.py +176 -0
warp/tests/test_hash_grid.py +52 -37
warp/tests/test_import.py +10 -23
warp/tests/test_indexedarray.py +577 -24
warp/tests/test_intersect.py +18 -9
warp/tests/test_large.py +141 -0
warp/tests/test_launch.py +251 -15
warp/tests/test_lerp.py +64 -65
warp/tests/test_linear_solvers.py +154 -0
warp/tests/test_lvalue.py +493 -0
warp/tests/test_marching_cubes.py +12 -13
warp/tests/test_mat.py +508 -2778
warp/tests/test_mat_lite.py +115 -0
warp/tests/test_mat_scalar_ops.py +2889 -0
warp/tests/test_math.py +103 -9
warp/tests/test_matmul.py +305 -69
warp/tests/test_matmul_lite.py +410 -0
warp/tests/test_mesh.py +71 -14
warp/tests/test_mesh_query_aabb.py +41 -25
warp/tests/test_mesh_query_point.py +325 -34
warp/tests/test_mesh_query_ray.py +39 -22
warp/tests/test_mlp.py +30 -22
warp/tests/test_model.py +92 -89
warp/tests/test_modules_lite.py +39 -0
warp/tests/test_multigpu.py +88 -114
warp/tests/test_noise.py +12 -11
warp/tests/test_operators.py +16 -20
warp/tests/test_options.py +11 -11
warp/tests/test_pinned.py +17 -18
warp/tests/test_print.py +32 -11
warp/tests/test_quat.py +275 -129
warp/tests/test_rand.py +18 -16
warp/tests/test_reload.py +38 -34
warp/tests/test_rounding.py +50 -43
warp/tests/test_runlength_encode.py +190 -0
warp/tests/test_smoothstep.py +9 -11
warp/tests/test_snippet.py +143 -0
warp/tests/test_sparse.py +460 -0
warp/tests/test_spatial.py +276 -243
warp/tests/test_streams.py +110 -85
warp/tests/test_struct.py +331 -85
warp/tests/test_tape.py +39 -21
warp/tests/test_torch.py +118 -89
warp/tests/test_transient_module.py +12 -13
warp/tests/test_types.py +614 -0
warp/tests/test_utils.py +494 -0
warp/tests/test_vec.py +354 -1987
warp/tests/test_vec_lite.py +73 -0
warp/tests/test_vec_scalar_ops.py +2099 -0
warp/tests/test_volume.py +457 -293
warp/tests/test_volume_write.py +124 -134
warp/tests/unittest_serial.py +35 -0
warp/tests/unittest_suites.py +341 -0
warp/tests/unittest_utils.py +568 -0
warp/tests/unused_test_misc.py +71 -0
warp/tests/{test_debug.py → walkthough_debug.py} +3 -17
warp/thirdparty/appdirs.py +36 -45
warp/thirdparty/unittest_parallel.py +549 -0
warp/torch.py +72 -30
warp/types.py +1744 -713
warp/utils.py +360 -350
warp_lang-0.11.0.dist-info/LICENSE.md +36 -0
warp_lang-0.11.0.dist-info/METADATA +238 -0
warp_lang-0.11.0.dist-info/RECORD +332 -0
{warp_lang-0.9.0.dist-info → warp_lang-0.11.0.dist-info}/WHEEL +1 -1
warp/bin/warp-clang.exp +0 -0
warp/bin/warp-clang.lib +0 -0
warp/bin/warp.exp +0 -0
warp/bin/warp.lib +0 -0
warp/tests/test_all.py +0 -215
warp/tests/test_array_scan.py +0 -60
warp/tests/test_base.py +0 -208
warp/tests/test_unresolved_func.py +0 -7
warp/tests/test_unresolved_symbol.py +0 -7
warp_lang-0.9.0.dist-info/METADATA +0 -20
warp_lang-0.9.0.dist-info/RECORD +0 -177
/warp/tests/{test_compile_consts_dummy.py → aux_test_compile_consts_dummy.py} +0 -0
/warp/tests/{test_reference_reference.py → aux_test_reference_reference.py} +0 -0
/warp/tests/{test_square.py → aux_test_square.py} +0 -0
{warp_lang-0.9.0.dist-info → warp_lang-0.11.0.dist-info}/top_level.txt +0 -0

warp/tests/test_linear_solvers.py ADDED Viewed

@@ -0,0 +1,154 @@
+import unittest
+import numpy as np
+import warp as wp
+import unittest
+from warp.optim.linear import preconditioner, cg, bicgstab, gmres
+from warp.tests.unittest_utils import *
+wp.init()
+def _check_linear_solve(test, A, b, func, *args, **kwargs):
+    """Solve ``A x = b`` with ``func`` from a cold and a warm start and check convergence.
+
+    ``func`` is called as ``func(A, b, x, *args, use_cuda_graph=..., **kwargs)`` and
+    must return a ``(niter, err, atol)`` triple. The first call starts from a zero
+    guess; the second call reuses the same ``x`` and must need fewer iterations.
+    Finally the true residual ``A x - b`` is recomputed with NumPy and compared
+    against the reported tolerance with a dtype-dependent slack factor.
+    """
+    # Cold start: zero initial guess
+    x = wp.zeros_like(b)
+    with wp.ScopedDevice(A.device):
+        cold_iters, cold_err, cold_atol = func(A, b, x, *args, use_cuda_graph=True, **kwargs)
+    test.assertLessEqual(cold_err, cold_atol)
+    # Warm start: x is reused from the previous solve
+    with wp.ScopedDevice(A.device):
+        warm_iters, warm_err, warm_atol = func(A, b, x, *args, use_cuda_graph=False, **kwargs)
+    test.assertLessEqual(warm_err, warm_atol)
+    test.assertLess(warm_iters, cold_iters)
+    # In CG and BiCGSTAB the residual norm is evaluated from the running residual
+    # rather than being computed from scratch as Ax - b.
+    # This can lead to accumulated inaccuracies over iterations, especially in float32,
+    # hence the looser bound for anything that is not float64.
+    slack = 2.0 if A.dtype == wp.float64 else 32.0
+    true_err = np.linalg.norm(A.numpy() @ x.numpy() - b.numpy())
+    test.assertLessEqual(true_err, slack * warm_atol)
+def _least_square_system(rng, n: int):
+    """Build the normal equations ``(C C^T) x = C f`` of a random least-squares problem.
+
+    ``C`` (n x n) and ``f`` (n,) are drawn uniformly from [-100, 100) using ``rng``,
+    in that order. Returns the pair ``(C @ C.T, C @ f)``; the matrix is symmetric
+    by construction.
+    """
+    lo, hi = -100, 100
+    C = rng.uniform(low=lo, high=hi, size=(n, n))
+    f = rng.uniform(low=lo, high=hi, size=(n,))
+    return C @ C.T, C @ f
+def _make_spd_system(n: int, seed: int, dtype, device):
+    """Create a seeded random symmetric system and upload it as Warp arrays.
+
+    The matrix and right-hand side come from ``_least_square_system``; both are
+    converted to ``wp.array`` with the requested ``dtype`` on ``device``.
+    """
+    A_np, b_np = _least_square_system(np.random.default_rng(seed), n)
+    A = wp.array(A_np, dtype=dtype, device=device)
+    b = wp.array(b_np, dtype=dtype, device=device)
+    return A, b
+def _make_nonsymmetric_system(n: int, seed: int, dtype, device, spd=False):
+    """Create a seeded random nonsymmetric system and upload it as Warp arrays.
+
+    A symmetric matrix from ``_least_square_system`` is right-multiplied by a
+    random positive diagonal (entries in [0.1, 10)), which breaks its symmetry.
+    The ``spd`` argument is accepted but not used by this function.
+    """
+    rng = np.random.default_rng(seed)
+    # The column scales are drawn before the system so the random stream order is fixed.
+    col_scale = rng.uniform(low=0.1, high=10, size=(n,))
+    A_sym, b_np = _least_square_system(rng, n)
+    A_np = A_sym @ np.diag(col_scale)
+    A = wp.array(A_np, dtype=dtype, device=device)
+    b = wp.array(b_np, dtype=dtype, device=device)
+    return A, b
+def _make_indefinite_system(n: int, seed: int, dtype, device, spd=False):
+    """Create a seeded random system for the "indefinite" BiCGSTAB case.
+
+    A symmetric matrix from ``_least_square_system`` is right-multiplied by a
+    random diagonal with entries in [0.1, 10) and uploaded as Warp arrays.
+    The ``spd`` argument is accepted but not used by this function.
+
+    NOTE(review): this body performs the same steps as ``_make_nonsymmetric_system``,
+    and the diagonal scaling is strictly positive, so the resulting matrix does not
+    look indefinite despite the function name -- confirm the intended construction.
+    """
+    rng = np.random.default_rng(seed)
+    # The column scales are drawn before the system so the random stream order is fixed.
+    col_scale = rng.uniform(low=0.1, high=10, size=(n,))
+    A_sym, b_np = _least_square_system(rng, n)
+    A_np = A_sym @ np.diag(col_scale)
+    A = wp.array(A_np, dtype=dtype, device=device)
+    b = wp.array(b_np, dtype=dtype, device=device)
+    return A, b
+def test_cg(test, device):
+    """Check ``cg`` with and without a diagonal preconditioner on two symmetric systems.
+
+    Covers a 64x64 float64 system and a 16x16 float32 system.
+    """
+    cases = (
+        (64, 123, wp.float64),
+        (16, 321, wp.float32),
+    )
+    for n, seed, dtype in cases:
+        A, b = _make_spd_system(n=n, seed=seed, device=device, dtype=dtype)
+        M = preconditioner(A, "diag")
+        _check_linear_solve(test, A, b, cg, maxiter=1000)
+        _check_linear_solve(test, A, b, cg, M=M, maxiter=1000)
+def test_bicgstab(test, device):
+    """Check ``bicgstab`` unpreconditioned and with right/left diagonal preconditioning.
+
+    Runs on two systems from ``_make_nonsymmetric_system`` (64x64 float64 and
+    16x16 float32) and one from ``_make_indefinite_system`` (64x64 float64).
+    """
+    cases = (
+        (_make_nonsymmetric_system, 64, 123, wp.float64),
+        (_make_nonsymmetric_system, 16, 321, wp.float32),
+        (_make_indefinite_system, 64, 121, wp.float64),
+    )
+    for make_system, n, seed, dtype in cases:
+        A, b = make_system(n=n, seed=seed, device=device, dtype=dtype)
+        M = preconditioner(A, "diag")
+        _check_linear_solve(test, A, b, bicgstab, maxiter=1000)
+        _check_linear_solve(test, A, b, bicgstab, M=M, maxiter=1000)
+        _check_linear_solve(test, A, b, bicgstab, M=M, maxiter=1000, is_left_preconditioner=True)
+def test_gmres(test, device):
+    """Check ``gmres`` unpreconditioned and with right/left diagonal preconditioning.
+
+    Runs on two 64x64 float64 nonsymmetric systems that differ only in their seed.
+    The unpreconditioned solve uses ``tol=1.0e-3``; preconditioned solves use ``1.0e-5``.
+
+    NOTE(review): unlike the CG and BiCGSTAB tests, no float32 system is covered
+    here -- confirm whether that is intentional.
+    """
+    for seed in (456, 654):
+        A, b = _make_nonsymmetric_system(n=64, seed=seed, device=device, dtype=wp.float64)
+        M = preconditioner(A, "diag")
+        _check_linear_solve(test, A, b, gmres, maxiter=1000, tol=1.0e-3)
+        _check_linear_solve(test, A, b, gmres, M=M, maxiter=1000, tol=1.0e-5)
+        _check_linear_solve(test, A, b, gmres, M=M, maxiter=1000, tol=1.0e-5, is_left_preconditioner=True)
+class TestLinearSolvers(unittest.TestCase):
+    """Container test case; its test methods are attached later via ``add_function_test``."""
+# Candidate devices for the solver tests; CUDA devices may be filtered out below.
+devices = get_test_devices()
+# runtime.core provides the build-capability queries used in the two checks below.
+from warp.context import runtime
+# Without CUTLASS support in this build, keep only non-CUDA devices.
+if not runtime.core.is_cutlass_enabled():
+    devices = [d for d in devices if not d.is_cuda]
+    print("Skipping CUDA linear solver tests because CUTLASS is not supported in this build")
+# Debug builds also drop CUDA devices (both messages print if both conditions hold).
+if runtime.core.is_debug_enabled():
+    # cutlass-based matmul is *very* slow in debug mode -- skip
+    devices = [d for d in devices if not d.is_cuda]
+    print("Skipping CUDA linear solver tests in debug mode")
+# Attach the module-level test functions to the test case for the remaining devices.
+add_function_test(TestLinearSolvers, "test_cg", test_cg, devices=devices)
+add_function_test(TestLinearSolvers, "test_bicgstab", test_bicgstab, devices=devices)
+add_function_test(TestLinearSolvers, "test_gmres", test_gmres, devices=devices)
+# When run as a script: clear the kernel cache first, then run the tests verbosely.
+if __name__ == "__main__":
+    wp.build.clear_kernel_cache()
+    unittest.main(verbosity=2)

warp/tests/test_lvalue.py ADDED Viewed

@@ -0,0 +1,493 @@
+# Copyright (c) 2023 NVIDIA CORPORATION.  All rights reserved.
+# NVIDIA CORPORATION and its licensors retain all intellectual property
+# and proprietary rights in and to this software, related documentation
+# and any modifications thereto.  Any use, reproduction, disclosure or
+# distribution of this software and related documentation without an express
+# license agreement from NVIDIA CORPORATION is strictly prohibited.
+import unittest
+import warp as wp
+from warp.tests.unittest_utils import *
+wp.init()
+# Read-modify-write on an array element: each thread adds 1 to the element
+# at its own thread index.
+@wp.kernel
+def rmw_array_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    foos[i] += wp.uint32(1)
+def test_rmw_array(test, device):
+    """Launch ``rmw_array_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=rmw_array_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Single-field struct used as the array element type for the struct
+# read-modify-write test.
+@wp.struct
+class RmwFoo:
+    # the counter incremented by rmw_array_struct_kernel
+    field: wp.uint32
+# Read-modify-write on a struct member of an array element: each thread adds 1
+# to `field` of the element at its own thread index.
+@wp.kernel
+def rmw_array_struct_kernel(foos: wp.array(dtype=RmwFoo)):
+    i = wp.tid()
+    foos[i].field += wp.uint32(1)
+def test_rmw_array_struct(test, device):
+    """Launch ``rmw_array_struct_kernel`` on ten zeroed structs and require ``field == 1``."""
+    shape = (10,)
+    foos = wp.zeros(shape, dtype=RmwFoo, device=device)
+    wp.launch(kernel=rmw_array_struct_kernel, dim=shape, inputs=[foos], device=device)
+    wp.synchronize()
+    # Reference value every element is compared against
+    expected = RmwFoo()
+    expected.field = 1
+    for f in foos.list():
+        if f.field == expected.field:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+# Device function returning the array element at `index`.
+@wp.func
+def lookup(foos: wp.array(dtype=wp.uint32), index: int):
+    return foos[index]
+# Each thread reads its element through lookup() and writes back that value plus 1.
+@wp.kernel
+def lookup_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    x = lookup(foos, i)
+    foos[i] = x + wp.uint32(1)
+def test_lookup(test, device):
+    """Launch ``lookup_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=lookup_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Device function returning the float32 array element at `index`.
+@wp.func
+def lookup3(foos: wp.array(dtype=wp.float32), index: int):
+    return foos[index]
+# Computes bars[i] = foos[i] * i + 1, reading foos[i] through lookup3().
+@wp.kernel
+def grad_kernel(foos: wp.array(dtype=wp.float32), bars: wp.array(dtype=wp.float32)):
+    i = wp.tid()
+    x = lookup3(foos, i)
+    bars[i] = x * wp.float32(i) + 1.0
+def test_grad(test, device):
+    """Record ``grad_kernel`` on a tape and check forward values and input gradients.
+
+    With ``bars[i] = foos[i] * i + 1`` and an all-ones output gradient, the forward
+    result for element ``i`` must equal ``data[i] * i + 1`` and the gradient of the
+    input at element ``i`` must equal ``i``.
+    """
+    num = 10
+    data = np.linspace(20, 20 + num, num, endpoint=False, dtype=np.float32)
+    src = wp.array(data, device=device, requires_grad=True)
+    output = wp.zeros(num, dtype=wp.float32, device=device)
+    # Seed gradient of the output used for the backward pass
+    ones = wp.array(np.ones(len(output)), dtype=wp.float32, device=device)
+    tape = wp.Tape()
+    with tape:
+        wp.launch(kernel=grad_kernel, dim=(num,), inputs=[src], outputs=[output], device=device)
+    tape.backward(grads={output: ones})
+    wp.synchronize()
+    # test forward results
+    for i, f in enumerate(output.list()):
+        expected = data[i] * i + 1
+        if f == expected:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+    # test backward results
+    for i, f in enumerate(tape.gradients[src].list()):
+        expected = i
+        if f == expected:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+# Device function with two return paths: for even indices the element is read
+# into a local that is then overwritten with 0 and returned; for odd indices the
+# array element itself is returned.
+@wp.func
+def lookup2(foos: wp.array(dtype=wp.uint32), index: int):
+    if index % 2 == 0:
+        x = foos[index]
+        x = wp.uint32(0)
+        return x
+    else:
+        return foos[index]
+# Each thread reads a value through lookup2() and writes back that value plus 1.
+@wp.kernel
+def lookup2_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    x = lookup2(foos, i)
+    foos[i] = x + wp.uint32(1)
+def test_lookup2(test, device):
+    """Launch ``lookup2_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=lookup2_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Applies a unary minus to a value read from an array element: the element is
+# first set to uint32(-1), then its negation is stored back. The host-side test
+# expects the stored result to be 1.
+@wp.kernel
+def unary_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    foos[i] = wp.uint32(-1)
+    x = -foos[i]
+    foos[i] = x
+def test_unary(test, device):
+    """Launch ``unary_kernel`` on ten elements and require every element to end up as 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=unary_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Uses an array element as an rvalue in a comparison: elements smaller than 1
+# are set to 1.
+@wp.kernel
+def rvalue_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    if foos[i] < wp.uint32(1):
+        foos[i] = wp.uint32(1)
+def test_rvalue(test, device):
+    """Launch ``rvalue_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=rvalue_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Tests, among other things, that assigning a reference to a new variable does
+# not create a reference
+# The element is copied into the local `x`, `x` is incremented, and the result is
+# written back explicitly.
+@wp.kernel
+def intermediate_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    x = foos[i]
+    x = x + wp.uint32(1)
+    foos[i] = x
+def test_intermediate(test, device):
+    """Launch ``intermediate_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=intermediate_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Plain assignment to an array element: each thread stores 1 at its own thread index.
+@wp.kernel
+def array_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    foos[i] = wp.uint32(1)
+def test_array_assign(test, device):
+    """Launch ``array_kernel`` on ten zeros and require every element to become 1."""
+    shape = (10,)
+    values = wp.zeros(shape, dtype=wp.uint32, device=device)
+    wp.launch(kernel=array_kernel, dim=shape, inputs=[values], device=device)
+    wp.synchronize()
+    for f in values.list():
+        if f == 1:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Device function returning its argument plus 1.
+@wp.func
+def increment(arg: wp.uint32):
+    return arg + wp.uint32(1)
+# Passes an array element to increment() and assigns the result back to the
+# same element.
+@wp.kernel
+def array_call_kernel(foos: wp.array(dtype=wp.uint32)):
+    i = wp.tid()
+    foos[i] = increment(foos[i])
+def test_array_call_assign(test, device):
+    """Launch ``array_call_kernel`` on ten zeros and require every element to become 1.
+
+    The kernel assigns ``increment(foos[i])`` back to ``foos[i]``, so starting from
+    zero each element must end up as 1.
+    """
+    arr = wp.zeros((10,), dtype=wp.uint32, device=device)
+    wp.launch(
+        # Launch the call-assign kernel itself; launching ``array_kernel`` here would
+        # only repeat ``test_array_assign`` and leave ``array_call_kernel`` unexercised.
+        kernel=array_call_kernel,
+        dim=(10,),
+        inputs=[arr],
+        device=device,
+    )
+    wp.synchronize()
+    for f in arr.list():
+        if f != 1:
+            raise AssertionError(f"Unexpected result, got: {f} expected: {1}")
+# Single-field struct used as the array element type for the struct assignment test.
+@wp.struct
+class Foo:
+    # the member written by array_struct_kernel
+    field: wp.uint32
+# Plain assignment to a struct member of an array element: each thread stores 1
+# in `field` of the element at its own thread index.
+@wp.kernel
+def array_struct_kernel(foos: wp.array(dtype=Foo)):
+    i = wp.tid()
+    foos[i].field = wp.uint32(1)
+def test_array_struct_assign(test, device):
+    """Launch ``array_struct_kernel`` on ten zeroed structs and require ``field == 1``."""
+    shape = (10,)
+    foos = wp.zeros(shape, dtype=Foo, device=device)
+    wp.launch(kernel=array_struct_kernel, dim=shape, inputs=[foos], device=device)
+    wp.synchronize()
+    # Reference value every element is compared against
+    expected = Foo()
+    expected.field = 1
+    for f in foos.list():
+        if f.field == expected.field:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+# Inner struct of the nested-struct assignment test.
+@wp.struct
+class Bar:
+    # the member written by array_struct_struct_kernel
+    field: wp.uint32
+# Outer struct holding a Bar; used as the array element type.
+@wp.struct
+class Baz:
+    # nested struct member
+    bar: Bar
+# Assignment through two levels of struct members on an array element: each
+# thread stores 1 in `bar.field` of the element at its own thread index.
+@wp.kernel
+def array_struct_struct_kernel(foos: wp.array(dtype=Baz)):
+    i = wp.tid()
+    foos[i].bar.field = wp.uint32(1)
+def test_array_struct_struct_assign(test, device):
+    """Launch ``array_struct_struct_kernel`` on ten zeroed structs and require ``bar.field == 1``."""
+    shape = (10,)
+    foos = wp.zeros(shape, dtype=Baz, device=device)
+    wp.launch(kernel=array_struct_struct_kernel, dim=shape, inputs=[foos], device=device)
+    wp.synchronize()
+    # Reference value every element is compared against
+    expected = Baz()
+    expected.bar.field = 1
+    for f in foos.list():
+        if f.bar.field == expected.bar.field:
+            continue
+        raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+# Inner struct of the mixed read-modify-write / assignment test.
+@wp.struct
+class S:
+    # assigned from the outer struct's `y` by complex_kernel
+    a: wp.uint32
+    # incremented by 3.0 by complex_kernel
+    b: wp.float32
+# Outer struct used as the array element type; mixes scalar members with a nested S.
+@wp.struct
+class F:
+    # incremented by 1.0 by complex_kernel
+    x: wp.float32
+    # nested struct member
+    s: S
+    # assigned 2 by complex_kernel
+    y: wp.int32
+# Mixes in-place updates and plain assignments on direct and nested struct
+# members of an array element, including reading one member (`y`) back to
+# initialise another (`s.a`).
+@wp.kernel
+def complex_kernel(foos: wp.array(dtype=F)):
+    i = wp.tid()
+    foos[i].x += wp.float32(1.0)
+    foos[i].y = wp.int32(2)
+    foos[i].s.b += wp.float32(3.0)
+    foos[i].s.a = wp.uint32(foos[i].y)
+def test_complex(test, device):
+    """Launch ``complex_kernel`` on ten zeroed ``F`` structs and compare every member.
+
+    Starting from zero, each element must end with ``x == 1.0``, ``y == 2``,
+    ``s.b == 3.0`` and ``s.a == y``.
+    """
+    shape = (10,)
+    foos = wp.zeros(shape, dtype=F, device=device)
+    wp.launch(kernel=complex_kernel, dim=shape, inputs=[foos], device=device)
+    wp.synchronize()
+    # Reference value, built with the same member updates the kernel applies
+    expected = F()
+    expected.x = 1.0
+    expected.y = 2
+    expected.s.b = 3.0
+    expected.s.a = expected.y
+    for f in foos.list():
+        mismatch = f.x != expected.x or f.y != expected.y or f.s.a != expected.s.a or f.s.b != expected.s.b
+        if mismatch:
+            raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+# Inner struct of the vector-component ("swizzle") assignment test.
+@wp.struct
+class Svec:
+    # assigned from the outer struct's `y` by swizzle_kernel
+    a: wp.uint32
+    # vector member whose components are written individually by swizzle_kernel
+    b: wp.vec2f
+# Outer struct used as the array element type; holds a vector, a nested Svec and an int.
+@wp.struct
+class Fvec:
+    # incremented by (1.0, 2.0) by swizzle_kernel
+    x: wp.vec2f
+    # nested struct member
+    s: Svec
+    # assigned 3 by swizzle_kernel
+    y: wp.int32
+# Exercises whole-vector updates and per-component (.x / .y) writes on vector
+# members of direct and nested structs stored in an array, including reading one
+# vector component (`x.y`) to initialise another (`s.b.x`).
+@wp.kernel
+def swizzle_kernel(foos: wp.array(dtype=Fvec)):
+    i = wp.tid()
+    foos[i].x += wp.vec2f(1.0, 2.0)
+    foos[i].y = wp.int32(3)
+    foos[i].s.b = wp.vec2f(4.0, 5.0)
+    foos[i].s.b.y = wp.float32(6.0)
+    foos[i].s.b.x = foos[i].x.y
+    foos[i].s.a = wp.uint32(foos[i].y)
+def test_swizzle(test, device):
+    """Launch ``swizzle_kernel`` on ten zeroed ``Fvec`` structs and compare every member.
+
+    The expected value is built on the host with the same sequence of vector and
+    per-component assignments that the kernel performs.
+    """
+    shape = (10,)
+    foos = wp.zeros(shape, dtype=Fvec, device=device)
+    wp.launch(kernel=swizzle_kernel, dim=shape, inputs=[foos], device=device)
+    wp.synchronize()
+    # Reference value, mirroring the kernel's assignments step by step
+    expected = Fvec()
+    expected.x = wp.vec2f(1.0, 2.0)
+    expected.y = 3
+    expected.s.b = wp.vec2f(4.0, 5.0)
+    expected.s.b.y = 6.0
+    expected.s.b.x = expected.x.y
+    expected.s.a = expected.y
+    for f in foos.list():
+        mismatch = f.x != expected.x or f.y != expected.y or f.s.a != expected.s.a or f.s.b != expected.s.b
+        if mismatch:
+            raise AssertionError(f"Unexpected result, got: {f} expected: {expected}")
+devices = get_test_devices()
+class TestLValue(unittest.TestCase):
+    """Test case for lvalue handling; device tests are attached via ``add_function_test``."""
+
+    def test_swizzle_error_invalid_attribute(self):
+        """Reading an unknown attribute of a vector raises; assigning one must not."""
+        v = wp.vec3(1, 2, 3)
+        # Reading an attribute that does not exist must raise with this exact message
+        missing_attr_msg = r"'vec3f' object has no attribute 'foo'$"
+        with self.assertRaisesRegex(AttributeError, missing_attr_msg):
+            v.foo
+        # Assigning a new attribute is expected to succeed; an AttributeError fails the test
+        try:
+            v.bar = 123
+        except AttributeError:
+            self.fail()
+# Attach every device-parameterised test function to TestLValue.
+add_function_test(TestLValue, "test_rmw_array", test_rmw_array, devices=devices)
+add_function_test(TestLValue, "test_rmw_array_struct", test_rmw_array_struct, devices=devices)
+add_function_test(TestLValue, "test_lookup", test_lookup, devices=devices)
+add_function_test(TestLValue, "test_lookup2", test_lookup2, devices=devices)
+add_function_test(TestLValue, "test_grad", test_grad, devices=devices)
+add_function_test(TestLValue, "test_unary", test_unary, devices=devices)
+add_function_test(TestLValue, "test_rvalue", test_rvalue, devices=devices)
+add_function_test(TestLValue, "test_intermediate", test_intermediate, devices=devices)
+add_function_test(TestLValue, "test_array_assign", test_array_assign, devices=devices)
+# test_array_call_assign is defined in this module but was never registered, so it never ran.
+add_function_test(TestLValue, "test_array_call_assign", test_array_call_assign, devices=devices)
+add_function_test(TestLValue, "test_array_struct_assign", test_array_struct_assign, devices=devices)
+add_function_test(TestLValue, "test_array_struct_struct_assign", test_array_struct_struct_assign, devices=devices)
+add_function_test(TestLValue, "test_complex", test_complex, devices=devices)
+add_function_test(TestLValue, "test_swizzle", test_swizzle, devices=devices)
+# When run as a script: clear the kernel cache first, then run the tests verbosely.
+if __name__ == "__main__":
+    wp.build.clear_kernel_cache()
+    unittest.main(verbosity=2)

warp/tests/test_marching_cubes.py CHANGED Viewed

@@ -5,14 +5,12 @@
 # distribution of this software and related documentation without an express
 # license agreement from NVIDIA CORPORATION is strictly prohibited.
-# include parent path
+import unittest
 import numpy as np
-import math
 import warp as wp
-from warp.tests.test_base import *
-import unittest
+from warp.tests.unittest_utils import *
 wp.init()
@@ -39,7 +37,7 @@ def test_marching_cubes(test, device):
     radius = dim / 4.0
-    wp.launch(make_field, dim=field.shape, inputs=[field, wp.vec3(dim / 2, dim / 2, dim / 2), radius], device="cuda")
+    wp.launch(make_field, dim=field.shape, inputs=[field, wp.vec3(dim / 2, dim / 2, dim / 2), radius], device=device)
     iso.surface(field=field, threshold=0.0)
@@ -49,18 +47,19 @@ def test_marching_cubes(test, device):
     test.assertTrue(np.max(error) < 1.0)
+    iso.resize(nx=dim * 2, ny=dim * 2, nz=dim * 2, max_verts=max_verts, max_tris=max_tris)
+devices = get_unique_cuda_test_devices()
-def register(parent):
-    devices = ["cuda"]
-    class TestMarchingCubes(parent):
-        pass
+class TestMarchingCubes(unittest.TestCase):
+    pass
-    add_function_test(TestMarchingCubes, "test_marching_cubes", test_marching_cubes, devices=devices)
-    return TestMarchingCubes
+add_function_test(TestMarchingCubes, "test_marching_cubes", test_marching_cubes, devices=devices)
 if __name__ == "__main__":
-    c = register(unittest.TestCase)
+    wp.build.clear_kernel_cache()
     unittest.main(verbosity=2)