PyPI - xax - Versions diffs - 0.1.14__tar.gz → 0.1.16__tar.gz - Mend

xax-0.1.14.tar.gz → xax-0.1.16.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (72)

{xax-0.1.14/xax.egg-info → xax-0.1.16}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: xax
-Version: 0.1.14
+Version: 0.1.16
 Summary: A library for fast Jax experimentation
 Home-page: https://github.com/kscalelabs/xax
 Author: Benjamin Bolte

{xax-0.1.14 → xax-0.1.16}/xax/__init__.py RENAMED Viewed

@@ -12,7 +12,7 @@ and running the update script:
     python -m scripts.update_api --inplace
 """
-__version__ = "0.1.14"
+__version__ = "0.1.16"
 # This list shouldn't be modified by hand; instead, run the update script.
 __all__ = [
@@ -40,6 +40,7 @@ __all__ = [
     "load_eqx_mlp",
     "make_eqx_mlp",
     "save_eqx",
+    "cubic_bezier_interpolation",
     "euler_to_quat",
     "get_projected_gravity_vector_from_quat",
     "quat_to_euler",
@@ -201,6 +202,7 @@ NAME_MAP: dict[str, str] = {
     "load_eqx_mlp": "nn.equinox",
     "make_eqx_mlp": "nn.equinox",
     "save_eqx": "nn.equinox",
+    "cubic_bezier_interpolation": "nn.geom",
     "euler_to_quat": "nn.geom",
     "get_projected_gravity_vector_from_quat": "nn.geom",
     "quat_to_euler": "nn.geom",
@@ -363,6 +365,7 @@ if IMPORT_ALL or TYPE_CHECKING:
         save_eqx,
     )
     from xax.nn.geom import (
+        cubic_bezier_interpolation,
         euler_to_quat,
         get_projected_gravity_vector_from_quat,
         quat_to_euler,

{xax-0.1.14 → xax-0.1.16}/xax/nn/geom.py RENAMED Viewed

@@ -1,10 +1,10 @@
 """Defines geometry functions."""
-import jax
 from jax import numpy as jnp
+from jaxtyping import Array
-def quat_to_euler(quat_4: jax.Array, eps: float = 1e-6) -> jax.Array:
+def quat_to_euler(quat_4: Array, eps: float = 1e-6) -> Array:
     """Normalizes and converts a quaternion (w, x, y, z) to roll, pitch, yaw.
     Args:
@@ -40,7 +40,7 @@ def quat_to_euler(quat_4: jax.Array, eps: float = 1e-6) -> jax.Array:
     return jnp.concatenate([roll, pitch, yaw], axis=-1)
-def euler_to_quat(euler_3: jax.Array) -> jax.Array:
+def euler_to_quat(euler_3: Array) -> Array:
     """Converts roll, pitch, yaw angles to a quaternion (w, x, y, z).
     Args:
@@ -75,7 +75,7 @@ def euler_to_quat(euler_3: jax.Array) -> jax.Array:
     return quat
-def get_projected_gravity_vector_from_quat(quat: jax.Array, eps: float = 1e-6) -> jax.Array:
+def get_projected_gravity_vector_from_quat(quat: Array, eps: float = 1e-6) -> Array:
     """Calculates the gravity vector projected onto the local frame given a quaternion orientation.
     Args:
@@ -101,7 +101,7 @@ def get_projected_gravity_vector_from_quat(quat: jax.Array, eps: float = 1e-6) -
     return jnp.concatenate([gx, gy, -gz], axis=-1)
-def rotate_vector_by_quat(vector: jax.Array, quat: jax.Array, eps: float = 1e-6) -> jax.Array:
+def rotate_vector_by_quat(vector: Array, quat: Array, eps: float = 1e-6) -> Array:
     """Rotates a vector by a quaternion.
     Args:
@@ -156,3 +156,24 @@ def rotate_vector_by_quat(vector: jax.Array, quat: jax.Array, eps: float = 1e-6)
     )
     return jnp.concatenate([xx, yy, zz], axis=-1)
+def cubic_bezier_interpolation(y_start: Array, y_end: Array, x: Array) -> Array:
+    """Cubic bezier interpolation.
+    This is a cubic bezier curve that starts at y_start and ends at y_end,
+    and is controlled by the parameter x. The curve is defined by the following formula:
+    y(x) = y_start + (y_end - y_start) * (x**3 + 3 * (x**2 * (1 - x)))
+    Args:
+        y_start: The start value, shape (*).
+        y_end: The end value, shape (*).
+        x: The interpolation parameter, shape (*).
+    Returns:
+        The interpolated value, shape (*).
+    """
+    y_diff = y_end - y_start
+    bezier = x**3 + 3 * (x**2 * (1 - x))
+    return y_start + y_diff * bezier

{xax-0.1.14 → xax-0.1.16}/xax/task/logger.py RENAMED Viewed

@@ -205,6 +205,12 @@ def as_numpy(array: Array) -> np.ndarray:
     return np.array(array)
+@dataclass(kw_only=True)
+class LogString:
+    value: str
+    secondary: bool
 @dataclass(kw_only=True)
 class LogImage:
     image: PILImage
@@ -223,6 +229,12 @@ class LogVideo:
     fps: int
+@dataclass(kw_only=True)
+class LogScalar:
+    value: Number
+    secondary: bool
 @dataclass(kw_only=True)
 class LogDistribution:
     mean: Number
@@ -243,10 +255,10 @@ class LogHistogram:
 @dataclass(kw_only=True)
 class LogLine:
     state: State
-    scalars: dict[str, dict[str, Number]]
+    scalars: dict[str, dict[str, LogScalar]]
     distributions: dict[str, dict[str, LogDistribution]]
     histograms: dict[str, dict[str, LogHistogram]]
-    strings: dict[str, dict[str, str]]
+    strings: dict[str, dict[str, LogString]]
     images: dict[str, dict[str, LogImage]]
     videos: dict[str, dict[str, LogVideo]]
@@ -515,10 +527,10 @@ class Logger:
     """Defines an intermediate container which holds values to log somewhere else."""
     def __init__(self, default_namespace: str = DEFAULT_NAMESPACE) -> None:
-        self.scalars: dict[str, dict[str, Callable[[], Number]]] = defaultdict(dict)
+        self.scalars: dict[str, dict[str, Callable[[], LogScalar]]] = defaultdict(dict)
         self.distributions: dict[str, dict[str, Callable[[], LogDistribution]]] = defaultdict(dict)
         self.histograms: dict[str, dict[str, Callable[[], LogHistogram]]] = defaultdict(dict)
-        self.strings: dict[str, dict[str, Callable[[], str]]] = defaultdict(dict)
+        self.strings: dict[str, dict[str, Callable[[], LogString]]] = defaultdict(dict)
         self.images: dict[str, dict[str, Callable[[], LogImage]]] = defaultdict(dict)
         self.videos: dict[str, dict[str, Callable[[], LogVideo]]] = defaultdict(dict)
         self.default_namespace = default_namespace
@@ -616,13 +628,23 @@ class Logger:
     def resolve_namespace(self, namespace: str | None = None) -> str:
         return "_".join([self.default_namespace if namespace is None else namespace] + NAMESPACE_STACK)
-    def log_scalar(self, key: str, value: Callable[[], Number] | Number, *, namespace: str | None = None) -> None:
+    def log_scalar(
+        self,
+        key: str,
+        value: Callable[[], Number] | Number,
+        *,
+        namespace: str | None = None,
+        secondary: bool = False,
+    ) -> None:
         """Logs a scalar value.
         Args:
             key: The key being logged
             value: The scalar value being logged
             namespace: An optional logging namespace
+            secondary: If set, treat this as a secondary value (meaning, it is
+                less important than other values, and some downstream loggers
+                will not display it)
         """
         if not self.active:
             raise RuntimeError("The logger is not active")
@@ -632,11 +654,11 @@ class Logger:
             assert value.ndim == 0, f"Scalar must be a 0D array, got shape {value.shape}"
         @functools.lru_cache(maxsize=None)
-        def scalar_future() -> Number:
+        def scalar_future() -> LogScalar:
             with ContextTimer() as timer:
                 value_concrete = value() if callable(value) else value
             logger.debug("Scalar Key: %s, Time: %s", key, timer.elapsed_time)
-            return value_concrete
+            return LogScalar(value=value_concrete, secondary=secondary)
         self.scalars[namespace][key] = scalar_future
@@ -770,21 +792,31 @@ class Logger:
         self.histograms[namespace][key] = histogram_future
-    def log_string(self, key: str, value: Callable[[], str] | str, *, namespace: str | None = None) -> None:
+    def log_string(
+        self,
+        key: str,
+        value: Callable[[], str] | str,
+        *,
+        namespace: str | None = None,
+        secondary: bool = False,
+    ) -> None:
         """Logs a string value.
         Args:
             key: The key being logged
             value: The string value being logged
             namespace: An optional logging namespace
+            secondary: If set, treat this as a secondary value (meaning, it is
+                less important than other values, and some downstream loggers
+                will not display it)
         """
         if not self.active:
             raise RuntimeError("The logger is not active")
         namespace = self.resolve_namespace(namespace)
         @functools.lru_cache(maxsize=None)
-        def value_future() -> str:
-            return value() if callable(value) else value
+        def value_future() -> LogString:
+            return LogString(value=value() if callable(value) else value, secondary=secondary)
         self.strings[namespace][key] = value_future

{xax-0.1.14 → xax-0.1.16}/xax/task/loggers/json.py RENAMED Viewed

@@ -3,11 +3,19 @@
 import json
 import sys
 from dataclasses import asdict
-from typing import Any, Literal, TextIO
+from typing import Any, Literal, Mapping, TextIO
 from jaxtyping import Array
-from xax.task.logger import LogError, LoggerImpl, LogLine, LogPing, LogStatus
+from xax.task.logger import (
+    LogError,
+    LoggerImpl,
+    LogLine,
+    LogPing,
+    LogScalar,
+    LogStatus,
+    LogString,
+)
 def get_json_value(value: Any) -> Any:  # noqa: ANN401
@@ -61,14 +69,14 @@ class JsonLogger(LoggerImpl):
     def get_json(self, line: LogLine) -> str:
         data: dict = {"state": asdict(line.state)}
-        def add_logs(log: dict[str, dict[str, Any]], data: dict) -> None:
+        def add_logs(log: Mapping[str, Mapping[str, LogScalar | LogString]], data: dict) -> None:
             for namespace, values in log.items():
                 if self.remove_unicode_from_namespaces:
                     namespace = namespace.encode("ascii", errors="ignore").decode("ascii").strip()
                 if namespace not in data:
                     data[namespace] = {}
                 for k, v in values.items():
-                    data[namespace][k] = get_json_value(v)
+                    data[namespace][k] = get_json_value(v.value)
         add_logs(line.scalars, data)
         add_logs(line.strings, data)

{xax-0.1.14 → xax-0.1.16}/xax/task/loggers/stdout.py RENAMED Viewed

@@ -4,11 +4,20 @@ import datetime
 import logging
 import sys
 from collections import deque
-from typing import Any, Deque, TextIO
+from typing import Any, Deque, Mapping, TextIO
 from jaxtyping import Array
-from xax.task.logger import LogError, LogErrorSummary, LoggerImpl, LogLine, LogPing, LogStatus
+from xax.task.logger import (
+    LogError,
+    LogErrorSummary,
+    LoggerImpl,
+    LogLine,
+    LogPing,
+    LogScalar,
+    LogStatus,
+    LogString,
+)
 from xax.utils.text import Color, colored, format_timedelta
@@ -95,20 +104,17 @@ class StdoutLogger(LoggerImpl):
     def write_log_window(self, line: LogLine) -> None:
         namespace_to_lines: dict[str, dict[str, str]] = {}
-        def add_logs(log: dict[str, dict[str, Any]], namespace_to_lines: dict[str, dict[str, str]]) -> None:
+        def add_logs(
+            log: Mapping[str, Mapping[str, LogScalar | LogString]],
+            namespace_to_lines: dict[str, dict[str, str]],
+        ) -> None:
             for namespace, values in log.items():
-                if not self.log_timers and namespace.startswith("⌛"):
-                    continue
-                if not self.log_perf and namespace.startswith("🔧"):
-                    continue
-                if not self.log_optim and namespace.startswith("📉"):
-                    continue
-                if not self.log_fp and namespace.startswith("⚖️"):
-                    continue
-                if namespace not in namespace_to_lines:
-                    namespace_to_lines[namespace] = {}
                 for k, v in values.items():
-                    v_str = as_str(v, self.precision)
+                    if v.secondary:
+                        continue
+                    if namespace not in namespace_to_lines:
+                        namespace_to_lines[namespace] = {}
+                    v_str = as_str(v.value, self.precision)
                     namespace_to_lines[namespace][k] = v_str
         add_logs(line.scalars, namespace_to_lines)
@@ -116,9 +122,8 @@ class StdoutLogger(LoggerImpl):
         if not namespace_to_lines:
             return
-        self.write_fp.write("\n")
         for namespace, lines in sorted(namespace_to_lines.items()):
-            self.write_fp.write(f"{colored(namespace, 'cyan', bold=True)}\n")
+            self.write_fp.write(f"\n{colored(namespace, 'cyan', bold=True)}\n")
             for k, v in lines.items():
                 self.write_fp.write(f" ↪ {k}: {v}\n")

{xax-0.1.14 → xax-0.1.16}/xax/task/loggers/tensorboard.py RENAMED Viewed

@@ -158,7 +158,7 @@ class TensorboardLogger(LoggerImpl):
             for scalar_key, scalar_value in scalars.items():
                 writer.add_scalar(
                     f"{namespace}/{scalar_key}",
-                    as_float(scalar_value),
+                    as_float(scalar_value.value),
                     global_step=line.state.num_steps,
                     walltime=walltime,
                 )
@@ -192,7 +192,7 @@ class TensorboardLogger(LoggerImpl):
             for string_key, string_value in strings.items():
                 writer.add_text(
                     f"{namespace}/{string_key}",
-                    string_value,
+                    string_value.value,
                     global_step=line.state.num_steps,
                     walltime=walltime,
                 )

{xax-0.1.14 → xax-0.1.16}/xax/task/mixins/cpu_stats.py RENAMED Viewed

@@ -248,15 +248,15 @@ class CPUStatsMixin(ProcessMixin[Config], LoggerMixin[Config], Generic[Config]):
         stats = monitor.get_if_set() if self.config.cpu_stats.only_log_once else monitor.get()
         if stats is not None:
-            self.logger.log_scalar("child_procs", stats.num_child_procs, namespace="🔧 cpu")
-            self.logger.log_scalar("percent", stats.cpu_percent, namespace="🔧 cpu")
-            self.logger.log_scalar("child_percent", stats.child_cpu_percent, namespace="🔧 cpu")
-            self.logger.log_scalar("percent", stats.mem_percent, namespace="🔧 mem")
-            self.logger.log_scalar("shared", stats.mem_shared, namespace="🔧 mem")
-            self.logger.log_scalar("child_percent", stats.child_mem_percent, namespace="🔧 mem")
-            self.logger.log_scalar("rss/cur", stats.mem_rss, namespace="🔧 mem")
-            self.logger.log_scalar("rss/total", stats.mem_rss_total, namespace="🔧 mem")
-            self.logger.log_scalar("vms/cur", stats.mem_vms, namespace="🔧 mem")
-            self.logger.log_scalar("vms/total", stats.mem_vms_total, namespace="🔧 mem")
+            self.logger.log_scalar("child_procs", stats.num_child_procs, namespace="🔧 cpu", secondary=True)
+            self.logger.log_scalar("percent", stats.cpu_percent, namespace="🔧 cpu", secondary=True)
+            self.logger.log_scalar("child_percent", stats.child_cpu_percent, namespace="🔧 cpu", secondary=True)
+            self.logger.log_scalar("percent", stats.mem_percent, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("shared", stats.mem_shared, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("child_percent", stats.child_mem_percent, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("rss/cur", stats.mem_rss, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("rss/total", stats.mem_rss_total, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("vms/cur", stats.mem_vms, namespace="🔧 mem", secondary=True)
+            self.logger.log_scalar("vms/total", stats.mem_vms_total, namespace="🔧 mem", secondary=True)
         return state

{xax-0.1.14 → xax-0.1.16}/xax/task/mixins/gpu_stats.py RENAMED Viewed

@@ -264,8 +264,8 @@ class GPUStatsMixin(ProcessMixin[Config], LoggerMixin[Config], Generic[Config]):
         for gpu_stat in stats.values():
             if gpu_stat is None:
                 continue
-            self.logger.log_scalar(f"mem/{gpu_stat.index}", gpu_stat.memory_used, namespace="🔧 gpu")
-            self.logger.log_scalar(f"temp/{gpu_stat.index}", gpu_stat.temperature, namespace="🔧 gpu")
-            self.logger.log_scalar(f"util/{gpu_stat.index}", gpu_stat.utilization, namespace="🔧 gpu")
+            self.logger.log_scalar(f"mem/{gpu_stat.index}", gpu_stat.memory_used, namespace="🔧 gpu", secondary=True)
+            self.logger.log_scalar(f"temp/{gpu_stat.index}", gpu_stat.temperature, namespace="🔧 gpu", secondary=True)
+            self.logger.log_scalar(f"util/{gpu_stat.index}", gpu_stat.utilization, namespace="🔧 gpu", secondary=True)
         return state

{xax-0.1.14 → xax-0.1.16}/xax/task/mixins/train.py RENAMED Viewed

@@ -50,8 +50,7 @@ from xax.utils.experiments import (
     TrainingFinishedError,
     diff_configs,
     get_diff_string,
-    get_git_state,
-    get_packages_with_versions,
+    get_state_file_string,
     get_training_code,
 )
 from xax.utils.jax import jit as xax_jit
@@ -219,7 +218,12 @@ class TrainMixin(
         return state.replace(elapsed_time_s=time.time() - state.start_time_s)
     def log_train_step(
-        self, model: PyTree, batch: Batch, output: Output, metrics: FrozenDict[str, Array], state: State
+        self,
+        model: PyTree,
+        batch: Batch,
+        output: Output,
+        metrics: FrozenDict[str, Array],
+        state: State,
     ) -> None:
         """Override this function to do logging during the training phase.
@@ -235,7 +239,12 @@ class TrainMixin(
         """
     def log_valid_step(
-        self, model: PyTree, batch: Batch, output: Output, metrics: FrozenDict[str, Array], state: State
+        self,
+        model: PyTree,
+        batch: Batch,
+        output: Output,
+        metrics: FrozenDict[str, Array],
+        state: State,
     ) -> None:
         """Override this function to do logging during the validation phase.
@@ -253,12 +262,20 @@ class TrainMixin(
     def log_state_timers(self, state: State) -> None:
         timer = self.state_timers[state.phase]
         timer.step(state)
-        for ns, d in timer.log_dict().items():
-            for k, v in d.items():
-                self.logger.log_scalar(k, v, namespace=ns)
+        for k, v in timer.log_dict().items():
+            if isinstance(v, tuple):
+                v, secondary = v
+            else:
+                secondary = False
+            self.logger.log_scalar(k, v, namespace="⌛ timers", secondary=secondary)
     def log_step(
-        self, model: PyTree, batch: Batch, output: Output, metrics: FrozenDict[str, Array], state: State
+        self,
+        model: PyTree,
+        batch: Batch,
+        output: Output,
+        metrics: FrozenDict[str, Array],
+        state: State,
     ) -> None:
         phase = state.phase
@@ -534,9 +551,8 @@ class TrainMixin(
         logger.log(LOG_STATUS, self.task_path)
         logger.log(LOG_STATUS, self.task_name)
         logger.log(LOG_STATUS, "JAX devices: %s", jax.devices())
-        self.logger.log_file("git_state.txt", get_git_state(self))
-        self.logger.log_file("packages.txt", get_packages_with_versions())
-        self.logger.log_file("training_code.txt", get_training_code(self))
+        self.logger.log_file("state.txt", get_state_file_string(self))
+        self.logger.log_file("training_code.py", get_training_code(self))
         self.logger.log_file("config.yaml", self.config_str(self.config, use_cli=False))
     def model_partition_fn(self, item: Any) -> bool:  # noqa: ANN401

{xax-0.1.14 → xax-0.1.16}/xax/utils/experiments.py RENAMED Viewed

@@ -114,28 +114,15 @@ class StateTimer:
         self.sample_timer.step(state.num_samples if state.phase == "train" else state.num_valid_samples, cur_time)
         self.iter_timer.step(cur_time)
-    def log_dict(self) -> dict[str, dict[str, int | float]]:
-        logs: dict[str, dict[str, int | float]] = {}
-        # Logs step statistics.
-        logs["⌛ steps"] = {
-            "total": self.step_timer.steps,
-            "per-second": self.step_timer.steps_per_second,
-        }
-        # Logs sample statistics.
-        logs["⌛ samples"] = {
-            "total": self.sample_timer.steps,
-            "per-second": self.sample_timer.steps_per_second,
-        }
-        # Logs full iteration statistics.
-        logs["⌛ dt"] = {
-            "iter": self.iter_timer.iter_seconds,
+    def log_dict(self) -> dict[str, int | float | tuple[int | float, bool]]:
+        return {
+            "steps": (self.step_timer.steps, True),
+            "steps/second": self.step_timer.steps_per_second,
+            "samples": (self.sample_timer.steps, True),
+            "samples/second": (self.sample_timer.steps_per_second, True),
+            "dt": self.iter_timer.iter_seconds,
         }
-        return logs
 class IntervalTicker:
     def __init__(self, interval: float) -> None:
@@ -479,6 +466,20 @@ def get_packages_with_versions() -> str:
     return "\n".join([f"{key}=={version}" for key, version in sorted(packages)])
+def get_command_line_string() -> str:
+    return " ".join(sys.argv)
+def get_state_file_string(obj: object) -> str:
+    return "\n\n".join(
+        [
+            f"=== Command Line ===\n\n{get_command_line_string()}",
+            f"=== Git State ===\n\n{get_git_state(obj)}",
+            f"=== Packages ===\n\n{get_packages_with_versions()}",
+        ]
+    )
 def get_training_code(obj: object) -> str:
     """Gets the text from the file containing the provided object.

{xax-0.1.14 → xax-0.1.16/xax.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: xax
-Version: 0.1.14
+Version: 0.1.16
 Summary: A library for fast Jax experimentation
 Home-page: https://github.com/kscalelabs/xax
 Author: Benjamin Bolte