warp-lang 1.9.1__py3-none-win_amd64.whl → 1.10.0rc2__py3-none-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of warp-lang might be problematic. Click here for more details.
- warp/__init__.py +301 -287
- warp/__init__.pyi +794 -305
- warp/_src/__init__.py +14 -0
- warp/_src/autograd.py +1075 -0
- warp/_src/build.py +618 -0
- warp/_src/build_dll.py +640 -0
- warp/{builtins.py → _src/builtins.py} +1382 -377
- warp/_src/codegen.py +4359 -0
- warp/{config.py → _src/config.py} +178 -169
- warp/_src/constants.py +57 -0
- warp/_src/context.py +8294 -0
- warp/_src/dlpack.py +462 -0
- warp/_src/fabric.py +355 -0
- warp/_src/fem/__init__.py +14 -0
- warp/_src/fem/adaptivity.py +508 -0
- warp/_src/fem/cache.py +687 -0
- warp/_src/fem/dirichlet.py +188 -0
- warp/{fem → _src/fem}/domain.py +40 -30
- warp/_src/fem/field/__init__.py +131 -0
- warp/_src/fem/field/field.py +701 -0
- warp/{fem → _src/fem}/field/nodal_field.py +30 -15
- warp/{fem → _src/fem}/field/restriction.py +1 -1
- warp/{fem → _src/fem}/field/virtual.py +53 -27
- warp/_src/fem/geometry/__init__.py +32 -0
- warp/{fem → _src/fem}/geometry/adaptive_nanogrid.py +77 -163
- warp/_src/fem/geometry/closest_point.py +97 -0
- warp/{fem → _src/fem}/geometry/deformed_geometry.py +14 -22
- warp/{fem → _src/fem}/geometry/element.py +32 -10
- warp/{fem → _src/fem}/geometry/geometry.py +48 -20
- warp/{fem → _src/fem}/geometry/grid_2d.py +12 -23
- warp/{fem → _src/fem}/geometry/grid_3d.py +12 -23
- warp/{fem → _src/fem}/geometry/hexmesh.py +40 -63
- warp/{fem → _src/fem}/geometry/nanogrid.py +255 -248
- warp/{fem → _src/fem}/geometry/partition.py +121 -63
- warp/{fem → _src/fem}/geometry/quadmesh.py +26 -45
- warp/{fem → _src/fem}/geometry/tetmesh.py +40 -63
- warp/{fem → _src/fem}/geometry/trimesh.py +26 -45
- warp/{fem → _src/fem}/integrate.py +164 -158
- warp/_src/fem/linalg.py +383 -0
- warp/_src/fem/operator.py +396 -0
- warp/_src/fem/polynomial.py +229 -0
- warp/{fem → _src/fem}/quadrature/pic_quadrature.py +15 -20
- warp/{fem → _src/fem}/quadrature/quadrature.py +95 -47
- warp/_src/fem/space/__init__.py +248 -0
- warp/{fem → _src/fem}/space/basis_function_space.py +20 -11
- warp/_src/fem/space/basis_space.py +679 -0
- warp/{fem → _src/fem}/space/dof_mapper.py +3 -3
- warp/{fem → _src/fem}/space/function_space.py +14 -13
- warp/{fem → _src/fem}/space/grid_2d_function_space.py +4 -7
- warp/{fem → _src/fem}/space/grid_3d_function_space.py +4 -4
- warp/{fem → _src/fem}/space/hexmesh_function_space.py +4 -10
- warp/{fem → _src/fem}/space/nanogrid_function_space.py +3 -9
- warp/{fem → _src/fem}/space/partition.py +117 -60
- warp/{fem → _src/fem}/space/quadmesh_function_space.py +4 -10
- warp/{fem → _src/fem}/space/restriction.py +66 -33
- warp/_src/fem/space/shape/__init__.py +152 -0
- warp/{fem → _src/fem}/space/shape/cube_shape_function.py +9 -9
- warp/{fem → _src/fem}/space/shape/shape_function.py +8 -9
- warp/{fem → _src/fem}/space/shape/square_shape_function.py +6 -6
- warp/{fem → _src/fem}/space/shape/tet_shape_function.py +3 -3
- warp/{fem → _src/fem}/space/shape/triangle_shape_function.py +3 -3
- warp/{fem → _src/fem}/space/tetmesh_function_space.py +3 -9
- warp/_src/fem/space/topology.py +459 -0
- warp/{fem → _src/fem}/space/trimesh_function_space.py +3 -9
- warp/_src/fem/types.py +112 -0
- warp/_src/fem/utils.py +486 -0
- warp/_src/jax.py +186 -0
- warp/_src/jax_experimental/__init__.py +14 -0
- warp/_src/jax_experimental/custom_call.py +387 -0
- warp/_src/jax_experimental/ffi.py +1284 -0
- warp/_src/jax_experimental/xla_ffi.py +656 -0
- warp/_src/marching_cubes.py +708 -0
- warp/_src/math.py +414 -0
- warp/_src/optim/__init__.py +14 -0
- warp/_src/optim/adam.py +163 -0
- warp/_src/optim/linear.py +1606 -0
- warp/_src/optim/sgd.py +112 -0
- warp/_src/paddle.py +406 -0
- warp/_src/render/__init__.py +14 -0
- warp/_src/render/imgui_manager.py +289 -0
- warp/_src/render/render_opengl.py +3636 -0
- warp/_src/render/render_usd.py +937 -0
- warp/_src/render/utils.py +160 -0
- warp/_src/sparse.py +2716 -0
- warp/_src/tape.py +1206 -0
- warp/{thirdparty → _src/thirdparty}/unittest_parallel.py +9 -2
- warp/_src/torch.py +391 -0
- warp/_src/types.py +5870 -0
- warp/_src/utils.py +1693 -0
- warp/autograd.py +12 -1054
- warp/bin/warp-clang.dll +0 -0
- warp/bin/warp.dll +0 -0
- warp/build.py +8 -588
- warp/build_dll.py +6 -721
- warp/codegen.py +6 -4251
- warp/constants.py +6 -39
- warp/context.py +12 -8062
- warp/dlpack.py +6 -444
- warp/examples/distributed/example_jacobi_mpi.py +4 -5
- warp/examples/fem/example_adaptive_grid.py +1 -1
- warp/examples/fem/example_apic_fluid.py +1 -1
- warp/examples/fem/example_burgers.py +8 -8
- warp/examples/fem/example_diffusion.py +1 -1
- warp/examples/fem/example_distortion_energy.py +1 -1
- warp/examples/fem/example_mixed_elasticity.py +2 -2
- warp/examples/fem/example_navier_stokes.py +1 -1
- warp/examples/fem/example_nonconforming_contact.py +7 -7
- warp/examples/fem/example_stokes.py +1 -1
- warp/examples/fem/example_stokes_transfer.py +1 -1
- warp/examples/fem/utils.py +2 -2
- warp/examples/interop/example_jax_callable.py +1 -1
- warp/examples/interop/example_jax_ffi_callback.py +1 -1
- warp/examples/interop/example_jax_kernel.py +1 -1
- warp/examples/tile/example_tile_mcgp.py +191 -0
- warp/fabric.py +6 -337
- warp/fem/__init__.py +159 -97
- warp/fem/adaptivity.py +7 -489
- warp/fem/cache.py +9 -648
- warp/fem/dirichlet.py +6 -184
- warp/fem/field/__init__.py +8 -109
- warp/fem/field/field.py +7 -652
- warp/fem/geometry/__init__.py +7 -18
- warp/fem/geometry/closest_point.py +11 -77
- warp/fem/linalg.py +18 -366
- warp/fem/operator.py +11 -369
- warp/fem/polynomial.py +9 -209
- warp/fem/space/__init__.py +5 -211
- warp/fem/space/basis_space.py +6 -662
- warp/fem/space/shape/__init__.py +41 -118
- warp/fem/space/topology.py +6 -437
- warp/fem/types.py +6 -81
- warp/fem/utils.py +11 -444
- warp/jax.py +8 -165
- warp/jax_experimental/__init__.py +14 -1
- warp/jax_experimental/custom_call.py +8 -365
- warp/jax_experimental/ffi.py +17 -873
- warp/jax_experimental/xla_ffi.py +5 -605
- warp/marching_cubes.py +5 -689
- warp/math.py +16 -393
- warp/native/array.h +385 -37
- warp/native/builtin.h +314 -37
- warp/native/bvh.cpp +43 -9
- warp/native/bvh.cu +62 -27
- warp/native/bvh.h +310 -309
- warp/native/clang/clang.cpp +102 -97
- warp/native/coloring.cpp +0 -1
- warp/native/crt.h +208 -0
- warp/native/exports.h +156 -0
- warp/native/hashgrid.cu +2 -0
- warp/native/intersect.h +24 -1
- warp/native/intersect_tri.h +44 -35
- warp/native/mat.h +1456 -276
- warp/native/mesh.cpp +4 -4
- warp/native/mesh.cu +4 -2
- warp/native/mesh.h +176 -61
- warp/native/quat.h +0 -52
- warp/native/scan.cu +2 -0
- warp/native/sparse.cu +7 -3
- warp/native/spatial.h +12 -0
- warp/native/tile.h +681 -89
- warp/native/tile_radix_sort.h +1 -1
- warp/native/tile_reduce.h +394 -46
- warp/native/tile_scan.h +4 -4
- warp/native/vec.h +469 -0
- warp/native/version.h +23 -0
- warp/native/volume.cpp +1 -1
- warp/native/volume.cu +1 -0
- warp/native/volume.h +1 -1
- warp/native/volume_builder.cu +2 -0
- warp/native/warp.cpp +57 -29
- warp/native/warp.cu +253 -171
- warp/native/warp.h +11 -8
- warp/optim/__init__.py +6 -3
- warp/optim/adam.py +6 -145
- warp/optim/linear.py +14 -1585
- warp/optim/sgd.py +6 -94
- warp/paddle.py +6 -388
- warp/render/__init__.py +8 -4
- warp/render/imgui_manager.py +7 -267
- warp/render/render_opengl.py +6 -3618
- warp/render/render_usd.py +6 -919
- warp/render/utils.py +6 -142
- warp/sparse.py +37 -2563
- warp/tape.py +6 -1188
- warp/tests/__main__.py +1 -1
- warp/tests/cuda/test_async.py +4 -4
- warp/tests/cuda/test_conditional_captures.py +1 -1
- warp/tests/cuda/test_multigpu.py +1 -1
- warp/tests/cuda/test_streams.py +58 -1
- warp/tests/geometry/test_bvh.py +157 -22
- warp/tests/geometry/test_marching_cubes.py +0 -1
- warp/tests/geometry/test_mesh.py +5 -3
- warp/tests/geometry/test_mesh_query_aabb.py +5 -12
- warp/tests/geometry/test_mesh_query_point.py +5 -2
- warp/tests/geometry/test_mesh_query_ray.py +15 -3
- warp/tests/geometry/test_volume_write.py +5 -5
- warp/tests/interop/test_dlpack.py +14 -14
- warp/tests/interop/test_jax.py +772 -49
- warp/tests/interop/test_paddle.py +1 -1
- warp/tests/test_adam.py +0 -1
- warp/tests/test_arithmetic.py +9 -9
- warp/tests/test_array.py +527 -100
- warp/tests/test_array_reduce.py +3 -3
- warp/tests/test_atomic.py +12 -8
- warp/tests/test_atomic_bitwise.py +209 -0
- warp/tests/test_atomic_cas.py +4 -4
- warp/tests/test_bool.py +2 -2
- warp/tests/test_builtins_resolution.py +5 -571
- warp/tests/test_codegen.py +33 -14
- warp/tests/test_conditional.py +1 -1
- warp/tests/test_context.py +6 -6
- warp/tests/test_copy.py +242 -161
- warp/tests/test_ctypes.py +3 -3
- warp/tests/test_devices.py +24 -2
- warp/tests/test_examples.py +16 -84
- warp/tests/test_fabricarray.py +35 -35
- warp/tests/test_fast_math.py +0 -2
- warp/tests/test_fem.py +56 -10
- warp/tests/test_fixedarray.py +3 -3
- warp/tests/test_func.py +8 -5
- warp/tests/test_generics.py +1 -1
- warp/tests/test_indexedarray.py +24 -24
- warp/tests/test_intersect.py +39 -9
- warp/tests/test_large.py +1 -1
- warp/tests/test_lerp.py +3 -1
- warp/tests/test_linear_solvers.py +1 -1
- warp/tests/test_map.py +35 -4
- warp/tests/test_mat.py +52 -62
- warp/tests/test_mat_constructors.py +4 -5
- warp/tests/test_mat_lite.py +1 -1
- warp/tests/test_mat_scalar_ops.py +121 -121
- warp/tests/test_math.py +34 -0
- warp/tests/test_module_aot.py +4 -4
- warp/tests/test_modules_lite.py +28 -2
- warp/tests/test_print.py +11 -11
- warp/tests/test_quat.py +93 -58
- warp/tests/test_runlength_encode.py +1 -1
- warp/tests/test_scalar_ops.py +38 -10
- warp/tests/test_smoothstep.py +1 -1
- warp/tests/test_sparse.py +126 -15
- warp/tests/test_spatial.py +105 -87
- warp/tests/test_special_values.py +6 -6
- warp/tests/test_static.py +7 -7
- warp/tests/test_struct.py +13 -2
- warp/tests/test_triangle_closest_point.py +48 -1
- warp/tests/test_types.py +27 -15
- warp/tests/test_utils.py +52 -52
- warp/tests/test_vec.py +29 -29
- warp/tests/test_vec_constructors.py +5 -5
- warp/tests/test_vec_scalar_ops.py +97 -97
- warp/tests/test_version.py +75 -0
- warp/tests/tile/test_tile.py +178 -0
- warp/tests/tile/test_tile_atomic_bitwise.py +403 -0
- warp/tests/tile/test_tile_cholesky.py +7 -4
- warp/tests/tile/test_tile_load.py +26 -2
- warp/tests/tile/test_tile_mathdx.py +3 -3
- warp/tests/tile/test_tile_matmul.py +1 -1
- warp/tests/tile/test_tile_mlp.py +2 -4
- warp/tests/tile/test_tile_reduce.py +214 -13
- warp/tests/unittest_suites.py +6 -14
- warp/tests/unittest_utils.py +10 -9
- warp/tests/walkthrough_debug.py +3 -1
- warp/torch.py +6 -373
- warp/types.py +29 -5764
- warp/utils.py +10 -1659
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/METADATA +46 -99
- warp_lang-1.10.0rc2.dist-info/RECORD +468 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/Gaia-LICENSE.txt +6 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/appdirs-LICENSE.txt +22 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/asset_pixel_jpg-LICENSE.txt +3 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/cuda-LICENSE.txt +1582 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/dlpack-LICENSE.txt +201 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/fp16-LICENSE.txt +28 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/libmathdx-LICENSE.txt +220 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/llvm-LICENSE.txt +279 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/moller-LICENSE.txt +16 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/nanovdb-LICENSE.txt +2 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/nvrtc-LICENSE.txt +1592 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/svd-LICENSE.txt +23 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/unittest_parallel-LICENSE.txt +21 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/usd-LICENSE.txt +213 -0
- warp_lang-1.10.0rc2.dist-info/licenses/licenses/windingnumber-LICENSE.txt +21 -0
- warp/examples/assets/cartpole.urdf +0 -110
- warp/examples/assets/crazyflie.usd +0 -0
- warp/examples/assets/nv_ant.xml +0 -92
- warp/examples/assets/nv_humanoid.xml +0 -183
- warp/examples/assets/quadruped.urdf +0 -268
- warp/examples/optim/example_bounce.py +0 -266
- warp/examples/optim/example_cloth_throw.py +0 -228
- warp/examples/optim/example_drone.py +0 -870
- warp/examples/optim/example_inverse_kinematics.py +0 -182
- warp/examples/optim/example_inverse_kinematics_torch.py +0 -191
- warp/examples/optim/example_softbody_properties.py +0 -400
- warp/examples/optim/example_spring_cage.py +0 -245
- warp/examples/optim/example_trajectory.py +0 -227
- warp/examples/sim/example_cartpole.py +0 -143
- warp/examples/sim/example_cloth.py +0 -225
- warp/examples/sim/example_cloth_self_contact.py +0 -316
- warp/examples/sim/example_granular.py +0 -130
- warp/examples/sim/example_granular_collision_sdf.py +0 -202
- warp/examples/sim/example_jacobian_ik.py +0 -244
- warp/examples/sim/example_particle_chain.py +0 -124
- warp/examples/sim/example_quadruped.py +0 -203
- warp/examples/sim/example_rigid_chain.py +0 -203
- warp/examples/sim/example_rigid_contact.py +0 -195
- warp/examples/sim/example_rigid_force.py +0 -133
- warp/examples/sim/example_rigid_gyroscopic.py +0 -115
- warp/examples/sim/example_rigid_soft_contact.py +0 -140
- warp/examples/sim/example_soft_body.py +0 -196
- warp/examples/tile/example_tile_walker.py +0 -327
- warp/sim/__init__.py +0 -74
- warp/sim/articulation.py +0 -793
- warp/sim/collide.py +0 -2570
- warp/sim/graph_coloring.py +0 -307
- warp/sim/import_mjcf.py +0 -791
- warp/sim/import_snu.py +0 -227
- warp/sim/import_urdf.py +0 -579
- warp/sim/import_usd.py +0 -898
- warp/sim/inertia.py +0 -357
- warp/sim/integrator.py +0 -245
- warp/sim/integrator_euler.py +0 -2000
- warp/sim/integrator_featherstone.py +0 -2101
- warp/sim/integrator_vbd.py +0 -2487
- warp/sim/integrator_xpbd.py +0 -3295
- warp/sim/model.py +0 -4821
- warp/sim/particles.py +0 -121
- warp/sim/render.py +0 -431
- warp/sim/utils.py +0 -431
- warp/tests/sim/disabled_kinematics.py +0 -244
- warp/tests/sim/test_cloth.py +0 -863
- warp/tests/sim/test_collision.py +0 -743
- warp/tests/sim/test_coloring.py +0 -347
- warp/tests/sim/test_inertia.py +0 -161
- warp/tests/sim/test_model.py +0 -226
- warp/tests/sim/test_sim_grad.py +0 -287
- warp/tests/sim/test_sim_grad_bounce_linear.py +0 -212
- warp/tests/sim/test_sim_kinematics.py +0 -98
- warp/thirdparty/__init__.py +0 -0
- warp_lang-1.9.1.dist-info/RECORD +0 -456
- /warp/{fem → _src/fem}/quadrature/__init__.py +0 -0
- /warp/{tests/sim → _src/thirdparty}/__init__.py +0 -0
- /warp/{thirdparty → _src/thirdparty}/appdirs.py +0 -0
- /warp/{thirdparty → _src/thirdparty}/dlpack.py +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/WHEEL +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/licenses/LICENSE.md +0 -0
- {warp_lang-1.9.1.dist-info → warp_lang-1.10.0rc2.dist-info}/top_level.txt +0 -0
warp/_src/math.py
ADDED
|
@@ -0,0 +1,414 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
from typing import Any
|
|
17
|
+
|
|
18
|
+
import warp as wp
|
|
19
|
+
|
|
20
|
+
"""
|
|
21
|
+
Vector norm functions
|
|
22
|
+
"""
|
|
23
|
+
|
|
24
|
+
__all__ = [
|
|
25
|
+
"norm_huber",
|
|
26
|
+
"norm_l1",
|
|
27
|
+
"norm_l2",
|
|
28
|
+
"norm_pseudo_huber",
|
|
29
|
+
"smooth_normalize",
|
|
30
|
+
"transform_compose",
|
|
31
|
+
"transform_decompose",
|
|
32
|
+
"transform_from_matrix",
|
|
33
|
+
"transform_to_matrix",
|
|
34
|
+
]
|
|
35
|
+
|
|
36
|
+
|
|
37
|
+
@wp.func
|
|
38
|
+
def norm_l1(v: Any):
|
|
39
|
+
"""
|
|
40
|
+
Computes the L1 norm of a vector v.
|
|
41
|
+
|
|
42
|
+
.. math:: \\|v\\|_1 = \\sum_i |v_i|
|
|
43
|
+
|
|
44
|
+
Args:
|
|
45
|
+
v (Vector[Any,Float]): The vector to compute the L1 norm of.
|
|
46
|
+
|
|
47
|
+
Returns:
|
|
48
|
+
float: The L1 norm of the vector.
|
|
49
|
+
"""
|
|
50
|
+
n = float(0.0)
|
|
51
|
+
for i in range(len(v)):
|
|
52
|
+
n += wp.abs(v[i])
|
|
53
|
+
return n
|
|
54
|
+
|
|
55
|
+
|
|
56
|
+
@wp.func
|
|
57
|
+
def norm_l2(v: Any):
|
|
58
|
+
"""
|
|
59
|
+
Computes the L2 norm of a vector v.
|
|
60
|
+
|
|
61
|
+
.. math:: \\|v\\|_2 = \\sqrt{\\sum_i v_i^2}
|
|
62
|
+
|
|
63
|
+
Args:
|
|
64
|
+
v (Vector[Any,Float]): The vector to compute the L2 norm of.
|
|
65
|
+
|
|
66
|
+
Returns:
|
|
67
|
+
float: The L2 norm of the vector.
|
|
68
|
+
"""
|
|
69
|
+
return wp.length(v)
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
@wp.func
|
|
73
|
+
def norm_huber(v: Any, delta: float = 1.0):
|
|
74
|
+
"""
|
|
75
|
+
Computes the Huber norm of a vector v with a given delta.
|
|
76
|
+
|
|
77
|
+
.. math::
|
|
78
|
+
H(v) = \\begin{cases} \\frac{1}{2} \\|v\\|^2 & \\text{if } \\|v\\| \\leq \\delta \\\\ \\delta(\\|v\\| - \\frac{1}{2}\\delta) & \\text{otherwise} \\end{cases}
|
|
79
|
+
|
|
80
|
+
.. image:: /img/norm_huber.svg
|
|
81
|
+
:align: center
|
|
82
|
+
|
|
83
|
+
Args:
|
|
84
|
+
v (Vector[Any,Float]): The vector to compute the Huber norm of.
|
|
85
|
+
delta (float): The threshold value, defaults to 1.0.
|
|
86
|
+
|
|
87
|
+
Returns:
|
|
88
|
+
float: The Huber norm of the vector.
|
|
89
|
+
"""
|
|
90
|
+
a = wp.dot(v, v)
|
|
91
|
+
if a <= delta * delta:
|
|
92
|
+
return 0.5 * a
|
|
93
|
+
return delta * (wp.sqrt(a) - 0.5 * delta)
|
|
94
|
+
|
|
95
|
+
|
|
96
|
+
@wp.func
|
|
97
|
+
def norm_pseudo_huber(v: Any, delta: float = 1.0):
|
|
98
|
+
"""
|
|
99
|
+
Computes the "pseudo" Huber norm of a vector v with a given delta.
|
|
100
|
+
|
|
101
|
+
.. math::
|
|
102
|
+
H^\\prime(v) = \\delta \\sqrt{1 + \\frac{\\|v\\|^2}{\\delta^2}}
|
|
103
|
+
|
|
104
|
+
.. image:: /img/norm_pseudo_huber.svg
|
|
105
|
+
:align: center
|
|
106
|
+
|
|
107
|
+
Args:
|
|
108
|
+
v (Vector[Any,Float]): The vector to compute the Huber norm of.
|
|
109
|
+
delta (float): The threshold value, defaults to 1.0.
|
|
110
|
+
|
|
111
|
+
Returns:
|
|
112
|
+
float: The Huber norm of the vector.
|
|
113
|
+
"""
|
|
114
|
+
a = wp.dot(v, v)
|
|
115
|
+
return delta * wp.sqrt(1.0 + a / (delta * delta))
|
|
116
|
+
|
|
117
|
+
|
|
118
|
+
@wp.func
|
|
119
|
+
def smooth_normalize(v: Any, delta: float = 1.0):
|
|
120
|
+
"""
|
|
121
|
+
Normalizes a vector using the pseudo-Huber norm.
|
|
122
|
+
|
|
123
|
+
See :func:`norm_pseudo_huber`.
|
|
124
|
+
|
|
125
|
+
.. math::
|
|
126
|
+
\\frac{v}{H^\\prime(v)}
|
|
127
|
+
|
|
128
|
+
Args:
|
|
129
|
+
v (Vector[Any,Float]): The vector to normalize.
|
|
130
|
+
delta (float): The threshold value, defaults to 1.0.
|
|
131
|
+
|
|
132
|
+
Returns:
|
|
133
|
+
Vector[Any,Float]: The normalized vector.
|
|
134
|
+
"""
|
|
135
|
+
return v / norm_pseudo_huber(v, delta)
|
|
136
|
+
|
|
137
|
+
|
|
138
|
+
def create_transform_from_matrix_func(dtype):
|
|
139
|
+
mat44 = wp._src.types.matrix((4, 4), dtype)
|
|
140
|
+
vec3 = wp._src.types.vector(3, dtype)
|
|
141
|
+
transform = wp._src.types.transformation(dtype)
|
|
142
|
+
|
|
143
|
+
def transform_from_matrix(mat: mat44) -> transform:
|
|
144
|
+
"""
|
|
145
|
+
Construct a transformation from a 4x4 matrix.
|
|
146
|
+
|
|
147
|
+
.. math::
|
|
148
|
+
M = \\begin{bmatrix}
|
|
149
|
+
R_{00} & R_{01} & R_{02} & p_x \\\\
|
|
150
|
+
R_{10} & R_{11} & R_{12} & p_y \\\\
|
|
151
|
+
R_{20} & R_{21} & R_{22} & p_z \\\\
|
|
152
|
+
0 & 0 & 0 & 1
|
|
153
|
+
\\end{bmatrix}
|
|
154
|
+
|
|
155
|
+
Where:
|
|
156
|
+
|
|
157
|
+
* :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
|
|
158
|
+
* :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
|
|
159
|
+
|
|
160
|
+
Args:
|
|
161
|
+
mat (Matrix[4, 4, Float]): Matrix to convert.
|
|
162
|
+
|
|
163
|
+
Returns:
|
|
164
|
+
Transformation[Float]: The transformation.
|
|
165
|
+
"""
|
|
166
|
+
p = vec3(mat[0][3], mat[1][3], mat[2][3])
|
|
167
|
+
q = wp.quat_from_matrix(mat)
|
|
168
|
+
return transform(p, q)
|
|
169
|
+
|
|
170
|
+
return transform_from_matrix
|
|
171
|
+
|
|
172
|
+
|
|
173
|
+
transform_from_matrix = wp.func(
|
|
174
|
+
create_transform_from_matrix_func(wp.float32),
|
|
175
|
+
name="transform_from_matrix",
|
|
176
|
+
)
|
|
177
|
+
wp.func(
|
|
178
|
+
create_transform_from_matrix_func(wp.float16),
|
|
179
|
+
name="transform_from_matrix",
|
|
180
|
+
)
|
|
181
|
+
wp.func(
|
|
182
|
+
create_transform_from_matrix_func(wp.float64),
|
|
183
|
+
name="transform_from_matrix",
|
|
184
|
+
)
|
|
185
|
+
|
|
186
|
+
|
|
187
|
+
def create_transform_to_matrix_func(dtype):
|
|
188
|
+
mat44 = wp._src.types.matrix((4, 4), dtype)
|
|
189
|
+
transform = wp._src.types.transformation(dtype)
|
|
190
|
+
|
|
191
|
+
def transform_to_matrix(xform: transform) -> mat44:
|
|
192
|
+
"""
|
|
193
|
+
Convert a transformation to a 4x4 matrix.
|
|
194
|
+
|
|
195
|
+
.. math::
|
|
196
|
+
M = \\begin{bmatrix}
|
|
197
|
+
R_{00} & R_{01} & R_{02} & p_x \\\\
|
|
198
|
+
R_{10} & R_{11} & R_{12} & p_y \\\\
|
|
199
|
+
R_{20} & R_{21} & R_{22} & p_z \\\\
|
|
200
|
+
0 & 0 & 0 & 1
|
|
201
|
+
\\end{bmatrix}
|
|
202
|
+
|
|
203
|
+
Where:
|
|
204
|
+
|
|
205
|
+
* :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
|
|
206
|
+
* :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
|
|
207
|
+
|
|
208
|
+
Args:
|
|
209
|
+
xform (Transformation[Float]): Transformation to convert.
|
|
210
|
+
|
|
211
|
+
Returns:
|
|
212
|
+
Matrix[4, 4, Float]: The matrix.
|
|
213
|
+
"""
|
|
214
|
+
p = wp.transform_get_translation(xform)
|
|
215
|
+
q = wp.transform_get_rotation(xform)
|
|
216
|
+
rot = wp.quat_to_matrix(q)
|
|
217
|
+
# fmt: off
|
|
218
|
+
return mat44(
|
|
219
|
+
rot[0][0], rot[0][1], rot[0][2], p[0],
|
|
220
|
+
rot[1][0], rot[1][1], rot[1][2], p[1],
|
|
221
|
+
rot[2][0], rot[2][1], rot[2][2], p[2],
|
|
222
|
+
dtype(0.0), dtype(0.0), dtype(0.0), dtype(1.0),
|
|
223
|
+
)
|
|
224
|
+
# fmt: on
|
|
225
|
+
|
|
226
|
+
return transform_to_matrix
|
|
227
|
+
|
|
228
|
+
|
|
229
|
+
transform_to_matrix = wp.func(
|
|
230
|
+
create_transform_to_matrix_func(wp.float32),
|
|
231
|
+
name="transform_to_matrix",
|
|
232
|
+
)
|
|
233
|
+
wp.func(
|
|
234
|
+
create_transform_to_matrix_func(wp.float16),
|
|
235
|
+
name="transform_to_matrix",
|
|
236
|
+
)
|
|
237
|
+
wp.func(
|
|
238
|
+
create_transform_to_matrix_func(wp.float64),
|
|
239
|
+
name="transform_to_matrix",
|
|
240
|
+
)
|
|
241
|
+
|
|
242
|
+
|
|
243
|
+
def create_transform_compose_func(dtype):
|
|
244
|
+
mat44 = wp._src.types.matrix((4, 4), dtype)
|
|
245
|
+
quat = wp._src.types.quaternion(dtype)
|
|
246
|
+
vec3 = wp._src.types.vector(3, dtype)
|
|
247
|
+
|
|
248
|
+
def transform_compose(position: vec3, rotation: quat, scale: vec3):
|
|
249
|
+
"""
|
|
250
|
+
Compose a 4x4 transformation matrix from a 3D position, quaternion orientation, and 3D scale.
|
|
251
|
+
|
|
252
|
+
.. math::
|
|
253
|
+
M = \\begin{bmatrix}
|
|
254
|
+
s_x R_{00} & s_y R_{01} & s_z R_{02} & p_x \\\\
|
|
255
|
+
s_x R_{10} & s_y R_{11} & s_z R_{12} & p_y \\\\
|
|
256
|
+
s_x R_{20} & s_y R_{21} & s_z R_{22} & p_z \\\\
|
|
257
|
+
0 & 0 & 0 & 1
|
|
258
|
+
\\end{bmatrix}
|
|
259
|
+
|
|
260
|
+
Where:
|
|
261
|
+
|
|
262
|
+
* :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
|
|
263
|
+
* :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
|
|
264
|
+
* :math:`s` is the 3D scale vector :math:`[s_x, s_y, s_z]` of the input transform.
|
|
265
|
+
|
|
266
|
+
Args:
|
|
267
|
+
position (Vector[3, Float]): The 3D position vector.
|
|
268
|
+
rotation (Quaternion[Float]): The quaternion orientation.
|
|
269
|
+
scale (Vector[3, Float]): The 3D scale vector.
|
|
270
|
+
|
|
271
|
+
Returns:
|
|
272
|
+
Matrix[4, 4, Float]: The transformation matrix.
|
|
273
|
+
"""
|
|
274
|
+
R = wp.quat_to_matrix(rotation)
|
|
275
|
+
# fmt: off
|
|
276
|
+
return mat44(
|
|
277
|
+
scale[0] * R[0,0], scale[1] * R[0,1], scale[2] * R[0,2], position[0],
|
|
278
|
+
scale[0] * R[1,0], scale[1] * R[1,1], scale[2] * R[1,2], position[1],
|
|
279
|
+
scale[0] * R[2,0], scale[1] * R[2,1], scale[2] * R[2,2], position[2],
|
|
280
|
+
dtype(0.0), dtype(0.0), dtype(0.0), dtype(1.0),
|
|
281
|
+
)
|
|
282
|
+
# fmt: on
|
|
283
|
+
|
|
284
|
+
return transform_compose
|
|
285
|
+
|
|
286
|
+
|
|
287
|
+
transform_compose = wp.func(
|
|
288
|
+
create_transform_compose_func(wp.float32),
|
|
289
|
+
name="transform_compose",
|
|
290
|
+
)
|
|
291
|
+
wp.func(
|
|
292
|
+
create_transform_compose_func(wp.float16),
|
|
293
|
+
name="transform_compose",
|
|
294
|
+
)
|
|
295
|
+
wp.func(
|
|
296
|
+
create_transform_compose_func(wp.float64),
|
|
297
|
+
name="transform_compose",
|
|
298
|
+
)
|
|
299
|
+
|
|
300
|
+
|
|
301
|
+
def create_transform_decompose_func(dtype):
|
|
302
|
+
mat44 = wp._src.types.matrix((4, 4), dtype)
|
|
303
|
+
vec3 = wp._src.types.vector(3, dtype)
|
|
304
|
+
mat33 = wp._src.types.matrix((3, 3), dtype)
|
|
305
|
+
zero = dtype(0.0)
|
|
306
|
+
|
|
307
|
+
def transform_decompose(m: mat44):
|
|
308
|
+
"""
|
|
309
|
+
Decompose a 4x4 transformation matrix into 3D position, quaternion orientation, and 3D scale.
|
|
310
|
+
|
|
311
|
+
.. math::
|
|
312
|
+
M = \\begin{bmatrix}
|
|
313
|
+
s_x R_{00} & s_y R_{01} & s_z R_{02} & p_x \\\\
|
|
314
|
+
s_x R_{10} & s_y R_{11} & s_z R_{12} & p_y \\\\
|
|
315
|
+
s_x R_{20} & s_y R_{21} & s_z R_{22} & p_z \\\\
|
|
316
|
+
0 & 0 & 0 & 1
|
|
317
|
+
\\end{bmatrix}
|
|
318
|
+
|
|
319
|
+
Where:
|
|
320
|
+
|
|
321
|
+
* :math:`R` is the 3x3 rotation matrix created from the orientation quaternion of the input transform.
|
|
322
|
+
* :math:`p` is the 3D position vector :math:`[p_x, p_y, p_z]` of the input transform.
|
|
323
|
+
* :math:`s` is the 3D scale vector :math:`[s_x, s_y, s_z]` of the input transform.
|
|
324
|
+
|
|
325
|
+
Args:
|
|
326
|
+
m (Matrix[4, 4, Float]): The matrix to decompose.
|
|
327
|
+
|
|
328
|
+
Returns:
|
|
329
|
+
Tuple[Vector[3, Float], Quaternion[Float], Vector[3, Float]]: A tuple containing the position vector, quaternion orientation, and scale vector.
|
|
330
|
+
"""
|
|
331
|
+
# extract position
|
|
332
|
+
position = vec3(m[0, 3], m[1, 3], m[2, 3])
|
|
333
|
+
# extract rotation matrix components
|
|
334
|
+
r00, r01, r02 = m[0, 0], m[0, 1], m[0, 2]
|
|
335
|
+
r10, r11, r12 = m[1, 0], m[1, 1], m[1, 2]
|
|
336
|
+
r20, r21, r22 = m[2, 0], m[2, 1], m[2, 2]
|
|
337
|
+
# get scale magnitudes
|
|
338
|
+
sx = wp.sqrt(r00 * r00 + r10 * r10 + r20 * r20)
|
|
339
|
+
sy = wp.sqrt(r01 * r01 + r11 * r11 + r21 * r21)
|
|
340
|
+
sz = wp.sqrt(r02 * r02 + r12 * r12 + r22 * r22)
|
|
341
|
+
# normalize rotation matrix components
|
|
342
|
+
if sx != zero:
|
|
343
|
+
r00 /= sx
|
|
344
|
+
r10 /= sx
|
|
345
|
+
r20 /= sx
|
|
346
|
+
if sy != zero:
|
|
347
|
+
r01 /= sy
|
|
348
|
+
r11 /= sy
|
|
349
|
+
r21 /= sy
|
|
350
|
+
if sz != zero:
|
|
351
|
+
r02 /= sz
|
|
352
|
+
r12 /= sz
|
|
353
|
+
r22 /= sz
|
|
354
|
+
# extract rotation (quaternion)
|
|
355
|
+
rotation = wp.quat_from_matrix(mat33(r00, r01, r02, r10, r11, r12, r20, r21, r22))
|
|
356
|
+
# extract scale
|
|
357
|
+
scale = vec3(sx, sy, sz)
|
|
358
|
+
return position, rotation, scale
|
|
359
|
+
|
|
360
|
+
return transform_decompose
|
|
361
|
+
|
|
362
|
+
|
|
363
|
+
transform_decompose = wp.func(
|
|
364
|
+
create_transform_decompose_func(wp.float32),
|
|
365
|
+
name="transform_decompose",
|
|
366
|
+
)
|
|
367
|
+
wp.func(
|
|
368
|
+
create_transform_decompose_func(wp.float16),
|
|
369
|
+
name="transform_decompose",
|
|
370
|
+
)
|
|
371
|
+
wp.func(
|
|
372
|
+
create_transform_decompose_func(wp.float64),
|
|
373
|
+
name="transform_decompose",
|
|
374
|
+
)
|
|
375
|
+
|
|
376
|
+
|
|
377
|
+
# register API functions so they appear in the documentation
|
|
378
|
+
|
|
379
|
+
wp._src.context.register_api_function(
|
|
380
|
+
norm_l1,
|
|
381
|
+
group="Vector Math",
|
|
382
|
+
)
|
|
383
|
+
wp._src.context.register_api_function(
|
|
384
|
+
norm_l2,
|
|
385
|
+
group="Vector Math",
|
|
386
|
+
)
|
|
387
|
+
wp._src.context.register_api_function(
|
|
388
|
+
norm_huber,
|
|
389
|
+
group="Vector Math",
|
|
390
|
+
)
|
|
391
|
+
wp._src.context.register_api_function(
|
|
392
|
+
norm_pseudo_huber,
|
|
393
|
+
group="Vector Math",
|
|
394
|
+
)
|
|
395
|
+
wp._src.context.register_api_function(
|
|
396
|
+
smooth_normalize,
|
|
397
|
+
group="Vector Math",
|
|
398
|
+
)
|
|
399
|
+
wp._src.context.register_api_function(
|
|
400
|
+
transform_from_matrix,
|
|
401
|
+
group="Transformations",
|
|
402
|
+
)
|
|
403
|
+
wp._src.context.register_api_function(
|
|
404
|
+
transform_to_matrix,
|
|
405
|
+
group="Transformations",
|
|
406
|
+
)
|
|
407
|
+
wp._src.context.register_api_function(
|
|
408
|
+
transform_compose,
|
|
409
|
+
group="Transformations",
|
|
410
|
+
)
|
|
411
|
+
wp._src.context.register_api_function(
|
|
412
|
+
transform_decompose,
|
|
413
|
+
group="Transformations",
|
|
414
|
+
)
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
warp/_src/optim/adam.py
ADDED
|
@@ -0,0 +1,163 @@
|
|
|
1
|
+
# SPDX-FileCopyrightText: Copyright (c) 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
|
2
|
+
# SPDX-License-Identifier: Apache-2.0
|
|
3
|
+
#
|
|
4
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
5
|
+
# you may not use this file except in compliance with the License.
|
|
6
|
+
# You may obtain a copy of the License at
|
|
7
|
+
#
|
|
8
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
9
|
+
#
|
|
10
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
11
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
12
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
13
|
+
# See the License for the specific language governing permissions and
|
|
14
|
+
# limitations under the License.
|
|
15
|
+
|
|
16
|
+
import warp as wp
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@wp.kernel
|
|
20
|
+
def adam_step_kernel_vec3(
|
|
21
|
+
g: wp.array(dtype=wp.vec3),
|
|
22
|
+
m: wp.array(dtype=wp.vec3),
|
|
23
|
+
v: wp.array(dtype=wp.vec3),
|
|
24
|
+
lr: float,
|
|
25
|
+
beta1: float,
|
|
26
|
+
beta2: float,
|
|
27
|
+
t: float,
|
|
28
|
+
eps: float,
|
|
29
|
+
params: wp.array(dtype=wp.vec3),
|
|
30
|
+
):
|
|
31
|
+
i = wp.tid()
|
|
32
|
+
m[i] = beta1 * m[i] + (1.0 - beta1) * g[i]
|
|
33
|
+
v[i] = beta2 * v[i] + (1.0 - beta2) * wp.cw_mul(g[i], g[i])
|
|
34
|
+
mhat = m[i] / (1.0 - wp.pow(beta1, (t + 1.0)))
|
|
35
|
+
vhat = v[i] / (1.0 - wp.pow(beta2, (t + 1.0)))
|
|
36
|
+
sqrt_vhat = wp.vec3(wp.sqrt(vhat[0]), wp.sqrt(vhat[1]), wp.sqrt(vhat[2]))
|
|
37
|
+
eps_vec3 = wp.vec3(eps, eps, eps)
|
|
38
|
+
params[i] = params[i] - lr * wp.cw_div(mhat, (sqrt_vhat + eps_vec3))
|
|
39
|
+
|
|
40
|
+
|
|
41
|
+
@wp.kernel
|
|
42
|
+
def adam_step_kernel_float(
|
|
43
|
+
g: wp.array(dtype=float),
|
|
44
|
+
m: wp.array(dtype=float),
|
|
45
|
+
v: wp.array(dtype=float),
|
|
46
|
+
lr: float,
|
|
47
|
+
beta1: float,
|
|
48
|
+
beta2: float,
|
|
49
|
+
t: float,
|
|
50
|
+
eps: float,
|
|
51
|
+
params: wp.array(dtype=float),
|
|
52
|
+
):
|
|
53
|
+
i = wp.tid()
|
|
54
|
+
m[i] = beta1 * m[i] + (1.0 - beta1) * g[i]
|
|
55
|
+
v[i] = beta2 * v[i] + (1.0 - beta2) * g[i] * g[i]
|
|
56
|
+
mhat = m[i] / (1.0 - wp.pow(beta1, (t + 1.0)))
|
|
57
|
+
vhat = v[i] / (1.0 - wp.pow(beta2, (t + 1.0)))
|
|
58
|
+
params[i] = params[i] - lr * mhat / (wp.sqrt(vhat) + eps)
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
@wp.kernel
|
|
62
|
+
def adam_step_kernel_half(
|
|
63
|
+
g: wp.array(dtype=wp.float16),
|
|
64
|
+
m: wp.array(dtype=float),
|
|
65
|
+
v: wp.array(dtype=float),
|
|
66
|
+
lr: float,
|
|
67
|
+
beta1: float,
|
|
68
|
+
beta2: float,
|
|
69
|
+
t: float,
|
|
70
|
+
eps: float,
|
|
71
|
+
params: wp.array(dtype=wp.float16),
|
|
72
|
+
):
|
|
73
|
+
i = wp.tid()
|
|
74
|
+
m[i] = beta1 * m[i] + (1.0 - beta1) * float(g[i])
|
|
75
|
+
v[i] = beta2 * v[i] + (1.0 - beta2) * float(g[i]) * float(g[i])
|
|
76
|
+
mhat = m[i] / (1.0 - wp.pow(beta1, (t + 1.0)))
|
|
77
|
+
vhat = v[i] / (1.0 - wp.pow(beta2, (t + 1.0)))
|
|
78
|
+
params[i] = params[i] - wp.float16(lr * mhat / (wp.sqrt(vhat) + eps))
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
class Adam:
|
|
82
|
+
"""An implementation of the Adam Optimizer
|
|
83
|
+
It is designed to mimic Pytorch's version.
|
|
84
|
+
https://pytorch.org/docs/stable/generated/torch.optim.Adam.html#torch.optim.Adam
|
|
85
|
+
"""
|
|
86
|
+
|
|
87
|
+
def __init__(self, params=None, lr=0.001, betas=(0.9, 0.999), eps=1e-08):
|
|
88
|
+
self.m = [] # first moment
|
|
89
|
+
self.v = [] # second moment
|
|
90
|
+
self.set_params(params)
|
|
91
|
+
self.lr = lr
|
|
92
|
+
self.beta1 = betas[0]
|
|
93
|
+
self.beta2 = betas[1]
|
|
94
|
+
self.eps = eps
|
|
95
|
+
self.t = 0
|
|
96
|
+
|
|
97
|
+
def set_params(self, params):
|
|
98
|
+
self.params = params
|
|
99
|
+
if params is not None and isinstance(params, list) and len(params) > 0:
|
|
100
|
+
if len(self.m) != len(params):
|
|
101
|
+
self.m = [None] * len(params) # reset first moment
|
|
102
|
+
if len(self.v) != len(params):
|
|
103
|
+
self.v = [None] * len(params) # reset second moment
|
|
104
|
+
for i in range(len(params)):
|
|
105
|
+
param = params[i]
|
|
106
|
+
|
|
107
|
+
if param.dtype == wp.vec3:
|
|
108
|
+
dtype = wp.vec3
|
|
109
|
+
elif param.dtype == wp.float32:
|
|
110
|
+
dtype = wp.float32
|
|
111
|
+
elif param.dtype == wp.float16:
|
|
112
|
+
dtype = wp.float32 # we always use fp32 for moments, even if params are fp16
|
|
113
|
+
else:
|
|
114
|
+
raise RuntimeError(f"Unsupported dtype for Warp Adam optimizer: {param.dtype}")
|
|
115
|
+
|
|
116
|
+
if self.m[i] is None or self.m[i].shape != param.shape or self.m[i].dtype != param.dtype:
|
|
117
|
+
self.m[i] = wp.zeros(shape=param.shape, dtype=dtype, device=param.device)
|
|
118
|
+
if self.v[i] is None or self.v[i].shape != param.shape or self.v[i].dtype != param.dtype:
|
|
119
|
+
self.v[i] = wp.zeros(shape=param.shape, dtype=dtype, device=param.device)
|
|
120
|
+
|
|
121
|
+
def reset_internal_state(self):
|
|
122
|
+
for m_i in self.m:
|
|
123
|
+
m_i.zero_()
|
|
124
|
+
for v_i in self.v:
|
|
125
|
+
v_i.zero_()
|
|
126
|
+
self.t = 0
|
|
127
|
+
|
|
128
|
+
def step(self, grad):
|
|
129
|
+
assert self.params is not None
|
|
130
|
+
for i in range(len(self.params)):
|
|
131
|
+
Adam.step_detail(
|
|
132
|
+
grad[i], self.m[i], self.v[i], self.lr, self.beta1, self.beta2, self.t, self.eps, self.params[i]
|
|
133
|
+
)
|
|
134
|
+
self.t = self.t + 1
|
|
135
|
+
|
|
136
|
+
@staticmethod
|
|
137
|
+
def step_detail(g, m, v, lr, beta1, beta2, t, eps, params):
|
|
138
|
+
assert params.dtype == g.dtype
|
|
139
|
+
assert params.shape == g.shape
|
|
140
|
+
kernel_inputs = [g, m, v, lr, beta1, beta2, t, eps, params]
|
|
141
|
+
if params.dtype == wp._src.types.float32:
|
|
142
|
+
wp.launch(
|
|
143
|
+
kernel=adam_step_kernel_float,
|
|
144
|
+
dim=len(params),
|
|
145
|
+
inputs=kernel_inputs,
|
|
146
|
+
device=params.device,
|
|
147
|
+
)
|
|
148
|
+
elif params.dtype == wp._src.types.float16:
|
|
149
|
+
wp.launch(
|
|
150
|
+
kernel=adam_step_kernel_half,
|
|
151
|
+
dim=len(params),
|
|
152
|
+
inputs=kernel_inputs,
|
|
153
|
+
device=params.device,
|
|
154
|
+
)
|
|
155
|
+
elif params.dtype == wp._src.types.vec3:
|
|
156
|
+
wp.launch(
|
|
157
|
+
kernel=adam_step_kernel_vec3,
|
|
158
|
+
dim=len(params),
|
|
159
|
+
inputs=kernel_inputs,
|
|
160
|
+
device=params.device,
|
|
161
|
+
)
|
|
162
|
+
else:
|
|
163
|
+
raise RuntimeError("Params data type not supported in Adam step kernels.")
|