PyPI - warp-lang - Versions diffs - 1.8.1__py3-none-macosx_10_13_universal2.whl → 1.9.1__py3-none-macosx_10_13_universal2.whl - Mend

warp-lang 1.8.1__py3-none-macosx_10_13_universal2.whl → 1.9.1__py3-none-macosx_10_13_universal2.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of warp-lang might be problematic. Click here for more details.

Files changed (141)

warp/__init__.py +282 -103
warp/__init__.pyi +1904 -114
warp/bin/libwarp-clang.dylib +0 -0
warp/bin/libwarp.dylib +0 -0
warp/build.py +93 -30
warp/build_dll.py +331 -101
warp/builtins.py +1244 -160
warp/codegen.py +317 -206
warp/config.py +1 -1
warp/context.py +1465 -789
warp/examples/core/example_marching_cubes.py +1 -0
warp/examples/core/example_render_opengl.py +100 -3
warp/examples/fem/example_apic_fluid.py +98 -52
warp/examples/fem/example_convection_diffusion_dg.py +25 -4
warp/examples/fem/example_diffusion_mgpu.py +8 -3
warp/examples/fem/utils.py +68 -22
warp/examples/interop/example_jax_kernel.py +2 -1
warp/fabric.py +1 -1
warp/fem/cache.py +27 -19
warp/fem/domain.py +2 -2
warp/fem/field/nodal_field.py +2 -2
warp/fem/field/virtual.py +264 -166
warp/fem/geometry/geometry.py +5 -5
warp/fem/integrate.py +129 -51
warp/fem/space/restriction.py +4 -0
warp/fem/space/shape/tet_shape_function.py +3 -10
warp/jax_experimental/custom_call.py +25 -2
warp/jax_experimental/ffi.py +22 -1
warp/jax_experimental/xla_ffi.py +16 -7
warp/marching_cubes.py +708 -0
warp/native/array.h +99 -4
warp/native/builtin.h +86 -9
warp/native/bvh.cpp +64 -28
warp/native/bvh.cu +58 -58
warp/native/bvh.h +2 -2
warp/native/clang/clang.cpp +7 -7
warp/native/coloring.cpp +8 -2
warp/native/crt.cpp +2 -2
warp/native/crt.h +3 -5
warp/native/cuda_util.cpp +41 -10
warp/native/cuda_util.h +10 -4
warp/native/exports.h +1842 -1908
warp/native/fabric.h +2 -1
warp/native/hashgrid.cpp +37 -37
warp/native/hashgrid.cu +2 -2
warp/native/initializer_array.h +1 -1
warp/native/intersect.h +2 -2
warp/native/mat.h +1910 -116
warp/native/mathdx.cpp +43 -43
warp/native/mesh.cpp +24 -24
warp/native/mesh.cu +26 -26
warp/native/mesh.h +4 -2
warp/native/nanovdb/GridHandle.h +179 -12
warp/native/nanovdb/HostBuffer.h +8 -7
warp/native/nanovdb/NanoVDB.h +517 -895
warp/native/nanovdb/NodeManager.h +323 -0
warp/native/nanovdb/PNanoVDB.h +2 -2
warp/native/quat.h +331 -14
warp/native/range.h +7 -1
warp/native/reduce.cpp +10 -10
warp/native/reduce.cu +13 -14
warp/native/runlength_encode.cpp +2 -2
warp/native/runlength_encode.cu +5 -5
warp/native/scan.cpp +3 -3
warp/native/scan.cu +4 -4
warp/native/sort.cpp +10 -10
warp/native/sort.cu +40 -31
warp/native/sort.h +2 -0
warp/native/sparse.cpp +8 -8
warp/native/sparse.cu +13 -13
warp/native/spatial.h +366 -17
warp/native/temp_buffer.h +2 -2
warp/native/tile.h +471 -82
warp/native/vec.h +328 -14
warp/native/volume.cpp +54 -54
warp/native/volume.cu +1 -1
warp/native/volume.h +2 -1
warp/native/volume_builder.cu +30 -37
warp/native/warp.cpp +150 -149
warp/native/warp.cu +377 -216
warp/native/warp.h +227 -226
warp/optim/linear.py +736 -271
warp/render/imgui_manager.py +289 -0
warp/render/render_opengl.py +99 -18
warp/render/render_usd.py +1 -0
warp/sim/graph_coloring.py +2 -2
warp/sparse.py +558 -175
warp/tests/aux_test_module_aot.py +7 -0
warp/tests/cuda/test_async.py +3 -3
warp/tests/cuda/test_conditional_captures.py +101 -0
warp/tests/geometry/test_hash_grid.py +38 -0
warp/tests/geometry/test_marching_cubes.py +233 -12
warp/tests/interop/test_jax.py +608 -28
warp/tests/sim/test_coloring.py +6 -6
warp/tests/test_array.py +58 -5
warp/tests/test_codegen.py +4 -3
warp/tests/test_context.py +8 -15
warp/tests/test_enum.py +136 -0
warp/tests/test_examples.py +2 -2
warp/tests/test_fem.py +49 -6
warp/tests/test_fixedarray.py +229 -0
warp/tests/test_func.py +18 -15
warp/tests/test_future_annotations.py +7 -5
warp/tests/test_linear_solvers.py +30 -0
warp/tests/test_map.py +15 -1
warp/tests/test_mat.py +1518 -378
warp/tests/test_mat_assign_copy.py +178 -0
warp/tests/test_mat_constructors.py +574 -0
warp/tests/test_module_aot.py +287 -0
warp/tests/test_print.py +69 -0
warp/tests/test_quat.py +140 -34
warp/tests/test_quat_assign_copy.py +145 -0
warp/tests/test_reload.py +2 -1
warp/tests/test_sparse.py +71 -0
warp/tests/test_spatial.py +140 -34
warp/tests/test_spatial_assign_copy.py +160 -0
warp/tests/test_struct.py +43 -3
warp/tests/test_tuple.py +96 -0
warp/tests/test_types.py +61 -20
warp/tests/test_vec.py +179 -34
warp/tests/test_vec_assign_copy.py +143 -0
warp/tests/tile/test_tile.py +245 -18
warp/tests/tile/test_tile_cholesky.py +605 -0
warp/tests/tile/test_tile_load.py +169 -0
warp/tests/tile/test_tile_mathdx.py +2 -558
warp/tests/tile/test_tile_matmul.py +1 -1
warp/tests/tile/test_tile_mlp.py +1 -1
warp/tests/tile/test_tile_shared_memory.py +5 -5
warp/tests/unittest_suites.py +6 -0
warp/tests/walkthrough_debug.py +1 -1
warp/thirdparty/unittest_parallel.py +108 -9
warp/types.py +571 -267
warp/utils.py +68 -86
{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/METADATA +29 -69
{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/RECORD +138 -128
warp/native/marching.cpp +0 -19
warp/native/marching.cu +0 -514
warp/native/marching.h +0 -19
{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/WHEEL +0 -0
{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/licenses/LICENSE.md +0 -0
{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/top_level.txt +0 -0

warp/utils.py CHANGED

@@ -131,16 +131,16 @@ def array_scan(in_array, out_array, inclusive=True):
     if in_array.device.is_cpu:
         if in_array.dtype == wp.int32:
-            runtime.core.array_scan_int_host(in_array.ptr, out_array.ptr, in_array.size, inclusive)
+            runtime.core.wp_array_scan_int_host(in_array.ptr, out_array.ptr, in_array.size, inclusive)
         elif in_array.dtype == wp.float32:
-            runtime.core.array_scan_float_host(in_array.ptr, out_array.ptr, in_array.size, inclusive)
+            runtime.core.wp_array_scan_float_host(in_array.ptr, out_array.ptr, in_array.size, inclusive)
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(in_array.dtype)}")
     elif in_array.device.is_cuda:
         if in_array.dtype == wp.int32:
-            runtime.core.array_scan_int_device(in_array.ptr, out_array.ptr, in_array.size, inclusive)
+            runtime.core.wp_array_scan_int_device(in_array.ptr, out_array.ptr, in_array.size, inclusive)
         elif in_array.dtype == wp.float32:
-            runtime.core.array_scan_float_device(in_array.ptr, out_array.ptr, in_array.size, inclusive)
+            runtime.core.wp_array_scan_float_device(in_array.ptr, out_array.ptr, in_array.size, inclusive)
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(in_array.dtype)}")
@@ -173,22 +173,22 @@ def radix_sort_pairs(keys, values, count: int):
     if keys.device.is_cpu:
         if keys.dtype == wp.int32 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_int_host(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_int_host(keys.ptr, values.ptr, count)
         elif keys.dtype == wp.float32 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_float_host(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_float_host(keys.ptr, values.ptr, count)
         elif keys.dtype == wp.int64 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_int64_host(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_int64_host(keys.ptr, values.ptr, count)
         else:
             raise RuntimeError(
                 f"Unsupported keys and values data types: {type_repr(keys.dtype)}, {type_repr(values.dtype)}"
             )
     elif keys.device.is_cuda:
         if keys.dtype == wp.int32 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_int_device(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_int_device(keys.ptr, values.ptr, count)
         elif keys.dtype == wp.float32 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_float_device(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_float_device(keys.ptr, values.ptr, count)
         elif keys.dtype == wp.int64 and values.dtype == wp.int32:
-            runtime.core.radix_sort_pairs_int64_device(keys.ptr, values.ptr, count)
+            runtime.core.wp_radix_sort_pairs_int64_device(keys.ptr, values.ptr, count)
         else:
             raise RuntimeError(
                 f"Unsupported keys and values data types: {type_repr(keys.dtype)}, {type_repr(values.dtype)}"
@@ -256,7 +256,7 @@ def segmented_sort_pairs(
     if keys.device.is_cpu:
         if keys.dtype == wp.int32 and values.dtype == wp.int32:
-            runtime.core.segmented_sort_pairs_int_host(
+            runtime.core.wp_segmented_sort_pairs_int_host(
                 keys.ptr,
                 values.ptr,
                 count,
@@ -265,7 +265,7 @@ def segmented_sort_pairs(
                 num_segments,
             )
         elif keys.dtype == wp.float32 and values.dtype == wp.int32:
-            runtime.core.segmented_sort_pairs_float_host(
+            runtime.core.wp_segmented_sort_pairs_float_host(
                 keys.ptr,
                 values.ptr,
                 count,
@@ -277,7 +277,7 @@ def segmented_sort_pairs(
             raise RuntimeError(f"Unsupported data type: {type_repr(keys.dtype)}")
     elif keys.device.is_cuda:
         if keys.dtype == wp.int32 and values.dtype == wp.int32:
-            runtime.core.segmented_sort_pairs_int_device(
+            runtime.core.wp_segmented_sort_pairs_int_device(
                 keys.ptr,
                 values.ptr,
                 count,
@@ -286,7 +286,7 @@ def segmented_sort_pairs(
                 num_segments,
             )
         elif keys.dtype == wp.float32 and values.dtype == wp.int32:
-            runtime.core.segmented_sort_pairs_float_device(
+            runtime.core.wp_segmented_sort_pairs_float_device(
                 keys.ptr,
                 values.ptr,
                 count,
@@ -356,14 +356,14 @@ def runlength_encode(values, run_values, run_lengths, run_count=None, value_coun
     if values.device.is_cpu:
         if values.dtype == wp.int32:
-            runtime.core.runlength_encode_int_host(
+            runtime.core.wp_runlength_encode_int_host(
                 values.ptr, run_values.ptr, run_lengths.ptr, run_count.ptr, value_count
             )
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(values.dtype)}")
     elif values.device.is_cuda:
         if values.dtype == wp.int32:
-            runtime.core.runlength_encode_int_device(
+            runtime.core.wp_runlength_encode_int_device(
                 values.ptr, run_values.ptr, run_lengths.ptr, run_count.ptr, value_count
             )
         else:
@@ -435,16 +435,16 @@ def array_sum(values, out=None, value_count=None, axis=None):
     if values.device.is_cpu:
         if scalar_type == wp.float32:
-            native_func = runtime.core.array_sum_float_host
+            native_func = runtime.core.wp_array_sum_float_host
         elif scalar_type == wp.float64:
-            native_func = runtime.core.array_sum_double_host
+            native_func = runtime.core.wp_array_sum_double_host
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(values.dtype)}")
     elif values.device.is_cuda:
         if scalar_type == wp.float32:
-            native_func = runtime.core.array_sum_float_device
+            native_func = runtime.core.wp_array_sum_float_device
         elif scalar_type == wp.float64:
-            native_func = runtime.core.array_sum_double_device
+            native_func = runtime.core.wp_array_sum_double_device
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(values.dtype)}")
@@ -543,16 +543,16 @@ def array_inner(a, b, out=None, count=None, axis=None):
     if a.device.is_cpu:
         if scalar_type == wp.float32:
-            native_func = runtime.core.array_inner_float_host
+            native_func = runtime.core.wp_array_inner_float_host
         elif scalar_type == wp.float64:
-            native_func = runtime.core.array_inner_double_host
+            native_func = runtime.core.wp_array_inner_double_host
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(a.dtype)}")
     elif a.device.is_cuda:
         if scalar_type == wp.float32:
-            native_func = runtime.core.array_inner_float_device
+            native_func = runtime.core.wp_array_inner_float_device
         elif scalar_type == wp.float64:
-            native_func = runtime.core.array_inner_double_device
+            native_func = runtime.core.wp_array_inner_double_device
         else:
             raise RuntimeError(f"Unsupported data type: {type_repr(a.dtype)}")
@@ -914,7 +914,6 @@ def map(
     module = None
     out_dtypes = None
-    skip_arg_type_checks = False
     if isinstance(func, wp.Function):
         func_name = func.key
         wp_func = func
@@ -924,72 +923,50 @@ def map(
             raise TypeError("func must be a callable function or a warp.Function")
         wp_func, module = create_warp_function(func)
         func_name = wp_func.key
-        # we created a generic function here (arg types are all Any)
-        skip_arg_type_checks = True
     if module is None:
         module = warp.context.get_module(f"map_{func_name}")
     arg_names = list(wp_func.input_types.keys())
+    if len(inputs) != len(arg_names):
+        raise TypeError(
+            f"Number of input arguments ({len(inputs)}) does not match expected number of function arguments ({len(arg_names)})"
+        )
     # determine output dtype
-    if wp_func.value_func is not None or wp_func.value_type is not None:
-        arg_types = {}
-        arg_values = {}
-        for i, arg_name in enumerate(arg_names):
-            if is_array(inputs[i]):
-                # we will pass an element of the array to the function
-                arg_types[arg_name] = inputs[i].dtype
-                if device is None:
-                    device = inputs[i].device
-            else:
-                # we pass the input value directly to the function
-                arg_types[arg_name] = get_warp_type(inputs[i])
-        func_or_none = wp_func.get_overload(list(arg_types.values()), {})
-        if func_or_none is None:
-            raise TypeError(
-                f"Function {func_name} does not support the provided argument types {', '.join(type_repr(t) for t in arg_types.values())}"
-            )
-        func = func_or_none
-        if func.value_func is not None:
-            out_dtype = func.value_func(arg_types, arg_values)
-        else:
-            out_dtype = func.value_type
-        if isinstance(out_dtype, tuple) or isinstance(out_dtype, list):
-            out_dtypes = out_dtype
+    arg_types = {}
+    arg_values = {}
+    for i, arg_name in enumerate(arg_names):
+        if is_array(inputs[i]):
+            # we will pass an element of the array to the function
+            arg_types[arg_name] = inputs[i].dtype
+            if device is None:
+                device = inputs[i].device
         else:
-            out_dtypes = (out_dtype,)
+            # we pass the input value directly to the function
+            arg_types[arg_name] = get_warp_type(inputs[i])
+    func_or_none = wp_func.get_overload(list(arg_types.values()), {})
+    if func_or_none is None:
+        raise TypeError(
+            f"Function {func_name} does not support the provided argument types {', '.join(type_repr(t) for t in arg_types.values())}"
+        )
+    func = func_or_none
+    if func.value_type is not None:
+        out_dtype = func.value_type
+    elif func.value_func is not None:
+        out_dtype = func.value_func(arg_types, arg_values)
     else:
-        # try to evaluate the function to determine the output type
-        args = []
-        arg_types = wp_func.input_types
-        if len(inputs) != len(arg_types):
-            raise TypeError(
-                f"Number of input arguments ({len(inputs)}) does not match expected number of function arguments ({len(arg_types)})"
-            )
-        for (arg_name, arg_type), input in zip(arg_types.items(), inputs):
-            if is_array(input):
-                if not skip_arg_type_checks and not types_equal(input.dtype, arg_type):
-                    raise TypeError(
-                        f'Incorrect input provided for argument "{arg_name}": received array of dtype {type_repr(input.dtype)}, expected {type_repr(arg_type)}'
-                    )
-                args.append(input.dtype())
-                if device is None:
-                    device = input.device
-            else:
-                if not skip_arg_type_checks and not types_equal(type(input), arg_type):
-                    raise TypeError(
-                        f'Incorrect input provided for argument "{arg_name}": received {type_repr(type(input))}, expected {type_repr(arg_type)}'
-                    )
-                args.append(input)
-        result = wp_func(*args)
-        if result is None:
-            raise TypeError("The provided function must return a value")
-        if isinstance(result, tuple) or isinstance(result, list):
-            out_dtypes = tuple(get_warp_type(r) for r in result)
-        else:
-            out_dtypes = (get_warp_type(result),)
+        func.build(None)
+        out_dtype = func.value_func(arg_types, arg_values)
-    if out_dtypes is None:
-        raise TypeError("Could not determine the output type of the function, make sure it returns a value")
+    if out_dtype is None:
+        raise TypeError("The provided function must return a value")
+    if isinstance(out_dtype, tuple) or isinstance(out_dtype, list):
+        out_dtypes = out_dtype
+    else:
+        out_dtypes = (out_dtype,)
     if out is None:
         requires_grad = any(getattr(a, "requires_grad", False) for a in inputs if is_array(a))
@@ -1514,6 +1491,11 @@ class ScopedCapture:
         if self.active:
             try:
                 self.graph = wp.capture_end(device=self.device, stream=self.stream)
+            except Exception:
+                # Only report this exception if __exit__() was reached without an exception,
+                # otherwise re-raise the original exception.
+                if exc_type is None:
+                    raise
             finally:
                 self.active = False
@@ -1583,7 +1565,7 @@ def timing_begin(cuda_filter: int = TIMING_ALL, synchronize: bool = True) -> Non
     if synchronize:
         warp.synchronize()
-    warp.context.runtime.core.cuda_timing_begin(cuda_filter)
+    warp.context.runtime.core.wp_cuda_timing_begin(cuda_filter)
 def timing_end(synchronize: bool = True) -> list[TimingResult]:
@@ -1600,11 +1582,11 @@ def timing_end(synchronize: bool = True) -> list[TimingResult]:
         warp.synchronize()
     # get result count
-    count = warp.context.runtime.core.cuda_timing_get_result_count()
+    count = warp.context.runtime.core.wp_cuda_timing_get_result_count()
     # get result array from C++
     result_buffer = (timing_result_t * count)()
-    warp.context.runtime.core.cuda_timing_end(ctypes.byref(result_buffer), count)
+    warp.context.runtime.core.wp_cuda_timing_end(ctypes.byref(result_buffer), count)
     # prepare Python result list
     results = []

{warp_lang-1.8.1.dist-info → warp_lang-1.9.1.dist-info}/METADATA RENAMED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: warp-lang
-Version: 1.8.1
+Version: 1.9.1
 Summary: A Python framework for high-performance simulation and graphics programming
 Author-email: NVIDIA Corporation <warp-python@nvidia.com>
 License: Apache-2.0
@@ -55,7 +55,6 @@ Dynamic: license-file
 [![Downloads](https://static.pepy.tech/badge/warp-lang/month)](https://pepy.tech/project/warp-lang)
 [![codecov](https://codecov.io/github/NVIDIA/warp/graph/badge.svg?token=7O1KSM79FG)](https://codecov.io/github/NVIDIA/warp)
 ![GitHub - CI](https://github.com/NVIDIA/warp/actions/workflows/ci.yml/badge.svg)
-[![Discord](https://img.shields.io/badge/Discord-%235865F2.svg?logo=discord&logoColor=white)](https://discord.com/invite/nvidiaomniverse)
 # NVIDIA Warp
@@ -88,19 +87,16 @@ pip install warp-lang
 You can also use `pip install warp-lang[extras]` to install additional dependencies for running examples and USD-related features.
-The binaries hosted on PyPI are currently built with the CUDA 12 runtime and therefore
-require a minimum version of the CUDA driver of 525.60.13 (Linux x86-64) or 528.33 (Windows x86-64).
-If you require GPU support on a system with an older CUDA driver, you can build Warp from source or
-install wheels built with the CUDA 11.8 runtime from the [GitHub Releases](https://github.com/NVIDIA/warp/releases) page.
-Copy the URL of the appropriate wheel file (`warp-lang-{ver}+cu12-py3-none-{platform}.whl`) and pass it to
+The binaries hosted on PyPI are currently built with the CUDA 12 runtime.
+We also provide binaries built with the CUDA 13.0 runtime on the [GitHub Releases](https://github.com/NVIDIA/warp/releases) page.
+Copy the URL of the appropriate wheel file (`warp-lang-{ver}+cu13-py3-none-{platform}.whl`) and pass it to
 the `pip install` command, e.g.
 | Platform        | Install Command                                                                                                               |
 | --------------- | ----------------------------------------------------------------------------------------------------------------------------- |
-| Linux aarch64   | `pip install https://github.com/NVIDIA/warp/releases/download/v1.8.1/warp_lang-1.8.1+cu11-py3-none-manylinux2014_aarch64.whl` |
-| Linux x86-64    | `pip install https://github.com/NVIDIA/warp/releases/download/v1.8.1/warp_lang-1.8.1+cu11-py3-none-manylinux2014_x86_64.whl`  |
-| Windows x86-64  | `pip install https://github.com/NVIDIA/warp/releases/download/v1.8.1/warp_lang-1.8.1+cu11-py3-none-win_amd64.whl`             |
+| Linux aarch64   | `pip install https://github.com/NVIDIA/warp/releases/download/v1.9.1/warp_lang-1.9.1+cu13-py3-none-manylinux_2_34_aarch64.whl` |
+| Linux x86-64    | `pip install https://github.com/NVIDIA/warp/releases/download/v1.9.1/warp_lang-1.9.1+cu13-py3-none-manylinux_2_34_x86_64.whl`  |
+| Windows x86-64  | `pip install https://github.com/NVIDIA/warp/releases/download/v1.9.1/warp_lang-1.9.1+cu13-py3-none-win_amd64.whl`             |
 The `--force-reinstall` option may need to be used to overwrite a previous installation.
@@ -127,8 +123,8 @@ This ensures the index is automatically used for `pip` commands, avoiding the ne
 ### CUDA Requirements
-* Warp packages built with CUDA Toolkit 11.x require NVIDIA driver 470 or newer.
 * Warp packages built with CUDA Toolkit 12.x require NVIDIA driver 525 or newer.
+* Warp packages built with CUDA Toolkit 13.x require NVIDIA driver 580 or newer.
 This applies to pre-built packages distributed on PyPI and GitHub and also when building Warp from source.
@@ -151,66 +147,32 @@ To remedy the situation there are a few options:
 * Install a compatible pre-built Warp package.
 * Build Warp from source using a CUDA Toolkit that's compatible with the installed driver.
-## Getting Started
-An example first program that computes the lengths of random 3D vectors is given below:
-```python
-import warp as wp
-import numpy as np
-num_points = 1024
-@wp.kernel
-def length(points: wp.array(dtype=wp.vec3),
-           lengths: wp.array(dtype=float)):
+## Tutorial Notebooks
-    # thread index
-    tid = wp.tid()
-    # compute distance of each point from origin
-    lengths[tid] = wp.length(points[tid])
-# allocate an array of 3d points
-points = wp.array(np.random.rand(num_points, 3), dtype=wp.vec3)
-lengths = wp.zeros(num_points, dtype=float)
-# launch kernel
-wp.launch(kernel=length,
-          dim=len(points),
-          inputs=[points, lengths])
-print(lengths)
-```
+The [NVIDIA Accelerated Computing Hub](https://github.com/NVIDIA/accelerated-computing-hub) contains the current,
+actively maintained set of Warp tutorials:
-## Running Notebooks
+| Notebook | Colab Link |
+|----------|------------|
+| [Introduction to NVIDIA Warp](https://github.com/NVIDIA/accelerated-computing-hub/blob/9c334fcfcbbaf8d0cff91d012cdb2c11bf0f3dba/Accelerated_Python_User_Guide/notebooks/Chapter_12_Intro_to_NVIDIA_Warp.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/accelerated-computing-hub/blob/9c334fcfcbbaf8d0cff91d012cdb2c11bf0f3dba/Accelerated_Python_User_Guide/notebooks/Chapter_12_Intro_to_NVIDIA_Warp.ipynb) |
+| [GPU-Accelerated Ising Model Simulation in NVIDIA Warp](https://github.com/NVIDIA/accelerated-computing-hub/blob/9c334fcfcbbaf8d0cff91d012cdb2c11bf0f3dba/Accelerated_Python_User_Guide/notebooks/Chapter_12.1_IsingModel_In_Warp.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/accelerated-computing-hub/blob/9c334fcfcbbaf8d0cff91d012cdb2c11bf0f3dba/Accelerated_Python_User_Guide/notebooks/Chapter_12.1_IsingModel_In_Warp.ipynb) |
-A few notebooks are available in the [notebooks](./notebooks/) directory to provide an overview over the key features available in Warp.
+Additionally, several notebooks in the [notebooks](https://github.com/NVIDIA/warp/tree/main/notebooks) directory
+provide additional examples and cover key Warp features:
-To run these notebooks, ``jupyterlab`` is required to be installed using:
-```text
-pip install jupyterlab
-```
-From there, opening the notebooks can be done with the following command:
-```text
-jupyter lab ./notebooks
-```
-* [Warp Core Tutorial: Basics](./notebooks/core_01_basics.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_01_basics.ipynb)
-* [Warp Core Tutorial: Generics](./notebooks/core_02_generics.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_02_generics.ipynb)
-* [Warp Core Tutorial: Points](./notebooks/core_03_points.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_03_points.ipynb)
-* [Warp Core Tutorial: Meshes](./notebooks/core_04_meshes.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_04_meshes.ipynb)
-* [Warp Core Tutorial: Volumes](./notebooks/core_05_volumes.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_05_volumes.ipynb)
-* [Warp PyTorch Tutorial: Basics](./notebooks/pytorch_01_basics.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/pytorch_01_basics.ipynb)
-* [Warp PyTorch Tutorial: Custom Operators](./notebooks/pytorch_02_custom_operators.ipynb) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/pytorch_02_custom_operators.ipynb)
+| Notebook | Colab Link |
+|----------|------------|
+| [Warp Core Tutorial: Basics](https://github.com/NVIDIA/warp/blob/main/notebooks/core_01_basics.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_01_basics.ipynb) |
+| [Warp Core Tutorial: Generics](https://github.com/NVIDIA/warp/blob/main/notebooks/core_02_generics.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_02_generics.ipynb) |
+| [Warp Core Tutorial: Points](https://github.com/NVIDIA/warp/blob/main/notebooks/core_03_points.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_03_points.ipynb) |
+| [Warp Core Tutorial: Meshes](https://github.com/NVIDIA/warp/blob/main/notebooks/core_04_meshes.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_04_meshes.ipynb) |
+| [Warp Core Tutorial: Volumes](https://github.com/NVIDIA/warp/blob/main/notebooks/core_05_volumes.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/core_05_volumes.ipynb) |
+| [Warp PyTorch Tutorial: Basics](https://github.com/NVIDIA/warp/blob/main/notebooks/pytorch_01_basics.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/pytorch_01_basics.ipynb) |
+| [Warp PyTorch Tutorial: Custom Operators](https://github.com/NVIDIA/warp/blob/main/notebooks/pytorch_02_custom_operators.ipynb) | [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/NVIDIA/warp/blob/main/notebooks/pytorch_02_custom_operators.ipynb) |
 ## Running Examples
-The [warp/examples](./warp/examples/) directory contains a number of scripts categorized under subdirectories
+The [warp/examples](https://github.com/NVIDIA/warp/tree/main/warp/examples) directory contains a number of scripts categorized under subdirectories
 that show how to implement various simulation methods using the Warp API.
 Most examples will generate USD files containing time-sampled animations in the current working directory.
 Before running examples, users should ensure that the ``usd-core``, ``matplotlib``, and ``pyglet`` packages are installed using:
@@ -454,7 +416,7 @@ For developers who want to build the library themselves, the following tools are
 * Microsoft Visual Studio 2019 upwards (Windows)
 * GCC 9.4 upwards (Linux)
-* CUDA Toolkit 11.5 or higher
+* CUDA Toolkit 12.0 or higher
 * [Git LFS](https://git-lfs.github.com/) installed
 After cloning the repository, users should run:
@@ -500,9 +462,7 @@ See the [FAQ](https://nvidia.github.io/warp/faq.html) in the Warp documentation.
 Problems, questions, and feature requests can be opened on [GitHub Issues](https://github.com/NVIDIA/warp/issues).
-The Warp team also monitors the **#warp** forum on the public [Omniverse Discord](https://discord.com/invite/nvidiaomniverse) server, come chat with us!
-For inquiries not suited for GitHub Issues or Discord, please email warp-python@nvidia.com.
+For inquiries not suited for GitHub Issues, please email warp-python@nvidia.com.
 ## Versioning