neuracore_types-1.0.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,5 @@
+ """Neuracore Types - Shared type definitions for Neuracore."""
+
+ from neuracore_types.neuracore_types import *  # noqa: F403
+
+ __version__ = "1.0.0"
@@ -0,0 +1,1077 @@
+ """Defines the core data structures used throughout Neuracore."""
+
+ import base64
+ import time
+ from datetime import datetime, timezone
+ from enum import Enum
+ from typing import Any, List, NamedTuple, Optional, Tuple, Union
+ from uuid import uuid4
+
+ import numpy as np
+ from pydantic import (
+     BaseModel,
+     ConfigDict,
+     Field,
+     NonNegativeInt,
+     field_serializer,
+     field_validator,
+ )
+
+
+ def _sort_dict_by_keys(data_dict: Optional[dict[str, Any]]) -> Optional[dict[str, Any]]:
+     """Sort a dictionary by its keys to ensure consistent ordering.
+
+     This is a helper function used internally by the data models to ensure
+     consistent dictionary ordering. Use the model's order() or
+     sort_in_place() methods instead of calling this directly.
+
+     Args:
+         data_dict: Dictionary to sort, or None
+
+     Returns:
+         New dictionary with keys sorted alphabetically, or None if input was None
+     """
+     if data_dict is None:
+         return None
+     return {key: data_dict[key] for key in sorted(data_dict.keys())}
+
+
+ class NCData(BaseModel):
+     """Base class for all Neuracore data with automatic timestamping.
+
+     Provides a common base for all data types in the system with automatic
+     timestamp generation for temporal synchronization and data ordering.
+     """
+
+     timestamp: float = Field(default_factory=lambda: time.time())
+
+     def order(self) -> "NCData":
+         """Return a new instance with sorted data.
+
+         This method should be overridden by subclasses to implement specific
+         ordering logic for the data type. The base class implementation does
+         nothing and returns self.
+         """
+         return self
+
+
+ class JointData(NCData):
+     """Robot joint state data including positions, velocities, or torques.
+
+     Represents joint-space data for robotic systems with support for named
+     joints and additional auxiliary values. Used for positions, velocities,
+     torques, and target positions.
+     """
+
+     values: dict[str, float]
+     additional_values: Optional[dict[str, float]] = None
+
+     def order(self) -> "JointData":
+         """Return a new JointData instance with sorted joint names.
+
+         Returns:
+             New JointData with alphabetically sorted joint names.
+         """
+         return JointData(
+             timestamp=self.timestamp,
+             values=_sort_dict_by_keys(self.values) or {},
+             additional_values=_sort_dict_by_keys(self.additional_values),
+         )
+
+     def numpy(self, order: Optional[List[str]] = None) -> np.ndarray:
+         """Convert the joint values to a NumPy array.
+
+         Args:
+             order: The order in which the numpy array is returned.
+
+         Returns:
+             NumPy array of joint values.
+         """
+         if order is not None:
+             values = [self.values[name] for name in order]
+         else:
+             values = list(self.values.values())
+         return np.array(values, dtype=np.float32)
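A quick sketch of why the `order` argument matters for deterministic feature vectors (joint names and values here are illustrative; assumes `JointData` is imported from `neuracore_types`):

```python
from neuracore_types import JointData

jd = JointData(values={"shoulder": 1.1, "elbow": 0.2})
# An explicit order guarantees a stable layout regardless of dict insertion order.
vec = jd.numpy(order=["elbow", "shoulder"])  # array([0.2, 1.1], dtype=float32)
```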
+
+
+ class CameraData(NCData):
+     """Camera sensor data including images and calibration information.
+
+     Contains image data along with camera intrinsic and extrinsic parameters
+     for 3D reconstruction and computer vision applications. The frame field
+     is populated during dataset iteration for efficiency.
+     """
+
+     frame_idx: int = 0  # Needed so we can index video after sync
+     extrinsics: Optional[list[list[float]]] = None
+     intrinsics: Optional[list[list[float]]] = None
+     frame: Optional[Union[Any, str]] = None  # Only filled in when using dataset iter
+
+
+ class PoseData(NCData):
+     """6DOF pose data for objects, end-effectors, or coordinate frames.
+
+     Represents position and orientation information for tracking objects
+     or robot components in 3D space. Poses are stored as dictionaries
+     mapping pose names to [x, y, z, rx, ry, rz] values.
+     """
+
+     pose: dict[str, list[float]]
+
+     def order(self) -> "PoseData":
+         """Return a new PoseData instance with sorted pose coordinates.
+
+         Returns:
+             New PoseData with alphabetically sorted pose coordinate names.
+         """
+         return PoseData(
+             timestamp=self.timestamp, pose=_sort_dict_by_keys(self.pose) or {}
+         )
+
+
+ class EndEffectorData(NCData):
+     """End-effector state data including gripper and tool configurations.
+
+     Contains the state of robot end-effectors such as gripper opening amounts,
+     tool activations, or other end-effector specific parameters.
+     """
+
+     open_amounts: dict[str, float]
+
+     def order(self) -> "EndEffectorData":
+         """Return a new EndEffectorData instance with sorted effector names.
+
+         Returns:
+             New EndEffectorData with alphabetically sorted effector names.
+         """
+         return EndEffectorData(
+             timestamp=self.timestamp,
+             open_amounts=_sort_dict_by_keys(self.open_amounts) or {},
+         )
+
+
+ class EndEffectorPoseData(NCData):
+     """End-effector pose data.
+
+     Contains the pose of end-effectors as a 7-element list containing the
+     position and unit quaternion orientation [x, y, z, qx, qy, qz, qw].
+     """
+
+     poses: dict[str, list[float]]
+
+     def order(self) -> "EndEffectorPoseData":
+         """Return a new EndEffectorPoseData instance with sorted effector names.
+
+         Returns:
+             New EndEffectorPoseData with alphabetically sorted effector names.
+         """
+         return EndEffectorPoseData(
+             timestamp=self.timestamp,
+             poses=_sort_dict_by_keys(self.poses) or {},
+         )
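To illustrate the 7-element convention above (hypothetical effector name and values, identity orientation):

```python
from neuracore_types import EndEffectorPoseData

# [x, y, z, qx, qy, qz, qw]: position plus unit quaternion.
ee = EndEffectorPoseData(poses={"left_gripper": [0.1, 0.0, 0.3, 0.0, 0.0, 0.0, 1.0]})
```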
+
+
+ class ParallelGripperOpenAmountData(NCData):
+     """Open amount data for a parallel end-effector gripper.
+
+     Contains the state of parallel gripper opening amounts.
+     """
+
+     open_amounts: dict[str, float]
+
+     def order(self) -> "ParallelGripperOpenAmountData":
+         """Return a new ParallelGripperOpenAmountData instance with sorted gripper names.
+
+         Returns:
+             New ParallelGripperOpenAmountData with alphabetically sorted gripper names.
+         """
+         return ParallelGripperOpenAmountData(
+             timestamp=self.timestamp,
+             open_amounts=_sort_dict_by_keys(self.open_amounts) or {},
+         )
+
+
+ class PointCloudData(NCData):
+     """3D point cloud data with optional RGB colouring and camera parameters.
+
+     Represents 3D spatial data from depth sensors or LiDAR systems with
+     optional colour information and camera calibration for registration.
+     """
+
+     model_config = ConfigDict(arbitrary_types_allowed=True)
+
+     points: Optional[np.ndarray] = None  # (N, 3) float16
+     rgb_points: Optional[np.ndarray] = None  # (N, 3) uint8
+     extrinsics: Optional[np.ndarray] = None  # (4, 4) float16
+     intrinsics: Optional[np.ndarray] = None  # (3, 3) float16
+
+     @staticmethod
+     def _encode(arr: np.ndarray, dtype: Any) -> str:
+         return base64.b64encode(arr.astype(dtype).tobytes()).decode("utf-8")
+
+     @staticmethod
+     def _decode(data: str, dtype: Any, shape: Tuple[int, ...]) -> np.ndarray:
+         return np.frombuffer(
+             base64.b64decode(data.encode("utf-8")), dtype=dtype
+         ).reshape(*shape)
+
+     @field_validator("points", mode="before")
+     @classmethod
+     def decode_points(cls, v: Union[str, np.ndarray]) -> Optional[np.ndarray]:
+         """Decode base64 string to NumPy array if needed.
+
+         Args:
+             v: Base64 encoded string or NumPy array
+
+         Returns:
+             Decoded NumPy array or None
+         """
+         return cls._decode(v, np.float16, (-1, 3)) if isinstance(v, str) else v
+
+     @field_validator("rgb_points", mode="before")
+     @classmethod
+     def decode_rgb_points(cls, v: Union[str, np.ndarray]) -> Optional[np.ndarray]:
+         """Decode base64 string to NumPy array if needed.
+
+         Args:
+             v: Base64 encoded string or NumPy array
+
+         Returns:
+             Decoded NumPy array or None
+         """
+         return cls._decode(v, np.uint8, (-1, 3)) if isinstance(v, str) else v
+
+     @field_validator("extrinsics", mode="before")
+     @classmethod
+     def decode_extrinsics(cls, v: Union[str, np.ndarray]) -> Optional[np.ndarray]:
+         """Decode base64 string to NumPy array if needed.
+
+         Args:
+             v: Base64 encoded string or NumPy array
+
+         Returns:
+             Decoded NumPy array or None
+         """
+         return cls._decode(v, np.float16, (4, 4)) if isinstance(v, str) else v
+
+     @field_validator("intrinsics", mode="before")
+     @classmethod
+     def decode_intrinsics(cls, v: Union[str, np.ndarray]) -> Optional[np.ndarray]:
+         """Decode base64 string to NumPy array if needed.
+
+         Args:
+             v: Base64 encoded string or NumPy array
+
+         Returns:
+             Decoded NumPy array or None
+         """
+         return cls._decode(v, np.float16, (3, 3)) if isinstance(v, str) else v
+
+     # --- Serializers (encode on dump) ---
+     @field_serializer("points", when_used="json")
+     def serialize_points(self, v: Optional[np.ndarray]) -> Optional[str]:
+         """Encode NumPy array to base64 string if needed.
+
+         Args:
+             v: NumPy array to encode
+
+         Returns:
+             Base64 encoded string or None
+         """
+         return self._encode(v, np.float16) if v is not None else None
+
+     @field_serializer("rgb_points", when_used="json")
+     def serialize_rgb_points(self, v: Optional[np.ndarray]) -> Optional[str]:
+         """Encode NumPy array to base64 string if needed.
+
+         Args:
+             v: NumPy array to encode
+
+         Returns:
+             Base64 encoded string or None
+         """
+         return self._encode(v, np.uint8) if v is not None else None
+
+     @field_serializer("extrinsics", when_used="json")
+     def serialize_extrinsics(self, v: Optional[np.ndarray]) -> Optional[str]:
+         """Encode NumPy array to base64 string if needed.
+
+         Args:
+             v: NumPy array to encode
+
+         Returns:
+             Base64 encoded string or None
+         """
+         return self._encode(v, np.float16) if v is not None else None
+
+     @field_serializer("intrinsics", when_used="json")
+     def serialize_intrinsics(self, v: Optional[np.ndarray]) -> Optional[str]:
+         """Encode NumPy array to base64 string if needed.
+
+         Args:
+             v: NumPy array to encode
+
+         Returns:
+             Base64 encoded string or None
+         """
+         return self._encode(v, np.float16) if v is not None else None
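A sketch of the base64 round trip that these validators and serializers implement together (array contents are arbitrary; assumes `PointCloudData` is imported from `neuracore_types`):

```python
import numpy as np

from neuracore_types import PointCloudData

pc = PointCloudData(points=np.zeros((100, 3), dtype=np.float16))
payload = pc.model_dump_json()  # ndarray fields become base64 strings
restored = PointCloudData.model_validate_json(payload)  # and decode back
assert restored.points.shape == (100, 3)
```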
+
+
+ class LanguageData(NCData):
+     """Natural language instruction or description data.
+
+     Contains text-based information such as task descriptions, voice commands,
+     or other linguistic data associated with robot demonstrations.
+     """
+
+     text: str
+
+
+ class CustomData(NCData):
+     """Generic container for application-specific data types.
+
+     Provides a flexible way to include custom sensor data or application-specific
+     information that doesn't fit into the standard data categories.
+     """
+
+     data: Any
+
+
+ class SyncPoint(BaseModel):
+     """Synchronized collection of all sensor data at a single time point.
+
+     Represents a complete snapshot of robot state and sensor information
+     at a specific timestamp. Used for creating temporally aligned datasets
+     and ensuring consistent data relationships across different sensors.
+     """
+
+     timestamp: float = Field(default_factory=lambda: time.time())
+     joint_positions: Optional[JointData] = None
+     joint_velocities: Optional[JointData] = None
+     joint_torques: Optional[JointData] = None
+     joint_target_positions: Optional[JointData] = None
+     end_effectors: Optional[EndEffectorData] = None
+     end_effector_poses: Optional[EndEffectorPoseData] = None
+     parallel_gripper_open_amounts: Optional[ParallelGripperOpenAmountData] = None
+     poses: Optional[PoseData] = None
+     rgb_images: Optional[dict[str, CameraData]] = None
+     depth_images: Optional[dict[str, CameraData]] = None
+     point_clouds: Optional[dict[str, PointCloudData]] = None
+     language_data: Optional[LanguageData] = None
+     custom_data: Optional[dict[str, CustomData]] = None
+     robot_id: Optional[str] = None
+
+     def order(self) -> "SyncPoint":
+         """Return a new SyncPoint with all dictionary data consistently ordered.
+
+         This method ensures all dictionary keys in the sync point are sorted
+         alphabetically to provide consistent ordering for machine learning models.
+         This is critical for model training and inference as it ensures deterministic
+         input ordering across different sync points.
+
+         The following fields are ordered:
+         - RGB images (by camera name)
+         - Depth images (by camera name)
+         - Point clouds (by sensor name)
+         - Custom data (by data type name)
+         - Joint data values (by joint name)
+         - Pose data (by pose name and pose coordinate names)
+         - End effector data (by effector name)
+
+         Returns:
+             New SyncPoint with all dictionary data consistently ordered.
+
+         Example:
+             >>> sync_point = SyncPoint(
+             ...     rgb_images={"cam_2": data2, "cam_1": data1},
+             ...     joint_positions=JointData(values={"joint_2": 1.0, "joint_1": 0.5})
+             ... )
+             >>> ordered = sync_point.order()
+             >>> list(ordered.rgb_images.keys())
+             ['cam_1', 'cam_2']
+             >>> list(ordered.joint_positions.values.keys())
+             ['joint_1', 'joint_2']
+         """
+         return SyncPoint(
+             timestamp=self.timestamp,
+             # Order joint data using their order() methods
+             joint_positions=(
+                 self.joint_positions.order() if self.joint_positions else None
+             ),
+             joint_velocities=(
+                 self.joint_velocities.order() if self.joint_velocities else None
+             ),
+             joint_torques=(self.joint_torques.order() if self.joint_torques else None),
+             joint_target_positions=(
+                 self.joint_target_positions.order()
+                 if self.joint_target_positions
+                 else None
+             ),
+             # Order end effector data
+             end_effectors=(self.end_effectors.order() if self.end_effectors else None),
+             # Order pose data (both pose names and pose coordinates)
+             poses=self.poses.order() if self.poses else None,
+             # Order end effector pose data
+             end_effector_poses=(
+                 self.end_effector_poses.order() if self.end_effector_poses else None
+             ),
+             # Order parallel gripper open amount data
+             parallel_gripper_open_amounts=(
+                 self.parallel_gripper_open_amounts.order()
+                 if self.parallel_gripper_open_amounts
+                 else None
+             ),
+             # Order camera data by camera/sensor names
+             rgb_images=_sort_dict_by_keys(self.rgb_images),
+             depth_images=_sort_dict_by_keys(self.depth_images),
+             point_clouds=_sort_dict_by_keys(self.point_clouds),
+             # Language data doesn't need ordering (single value)
+             language_data=self.language_data,
+             # Order custom data by data type names
+             custom_data=_sort_dict_by_keys(self.custom_data),
+             robot_id=self.robot_id,
+         )
+
+
+ class SyncedData(BaseModel):
+     """Complete synchronized dataset containing a sequence of data points.
+
+     Represents an entire recording or demonstration as a time-ordered sequence
+     of synchronized data points with start and end timestamps for temporal
+     reference.
+     """
+
+     frames: list[SyncPoint]
+     start_time: float
+     end_time: float
+     robot_id: str
+
+     def order(self) -> "SyncedData":
+         """Return a new SyncedData with all sync points ordered.
+
+         Returns:
+             New SyncedData with all sync points having consistent ordering.
+         """
+         return SyncedData(
+             frames=[frame.order() for frame in self.frames],
+             start_time=self.start_time,
+             end_time=self.end_time,
+             robot_id=self.robot_id,
+         )
+
+
+ class DataType(str, Enum):
+     """Enumeration of supported data types in the Neuracore system.
+
+     Defines the standard data categories used for dataset organization,
+     model training, and data processing pipelines.
+     """
+
+     # Robot state
+     JOINT_POSITIONS = "joint_positions"
+     JOINT_VELOCITIES = "joint_velocities"
+     JOINT_TORQUES = "joint_torques"
+     JOINT_TARGET_POSITIONS = "joint_target_positions"
+     END_EFFECTORS = "end_effectors"
+     END_EFFECTOR_POSES = "end_effector_poses"
+     PARALLEL_GRIPPER_OPEN_AMOUNTS = "parallel_gripper_open_amounts"
+
+     # Vision
+     RGB_IMAGE = "rgb_image"
+     DEPTH_IMAGE = "depth_image"
+     POINT_CLOUD = "point_cloud"
+
+     # Other
+     POSES = "poses"
+     LANGUAGE = "language"
+     CUSTOM = "custom"
+
+
+ class DataItemStats(BaseModel):
+     """Statistical summary of data dimensions and distributions.
+
+     Contains statistical information about data arrays including means,
+     standard deviations, counts, and maximum lengths for normalization
+     and model configuration purposes.
+
+     Attributes:
+         mean: List of means for each data dimension
+         std: List of standard deviations for each data dimension
+         count: List of counts for each data dimension
+         max_len: Maximum length of the data arrays
+         robot_to_ncdata_keys: Mapping of robot ids to their associated
+             data keys for this data type
+     """
+
+     mean: list[float] = Field(default_factory=list)
+     std: list[float] = Field(default_factory=list)
+     count: list[int] = Field(default_factory=list)
+     max_len: int = Field(default_factory=lambda data: len(data["mean"]))
+     robot_to_ncdata_keys: dict[str, list[str]] = Field(default_factory=dict)
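Note that `max_len` uses a `default_factory` that receives the already-validated data, so it defaults to `len(mean)` when not set explicitly; this factory signature requires pydantic >= 2.10. A small illustration (values are made up):

```python
from neuracore_types import DataItemStats

stats = DataItemStats(mean=[0.0, 1.0], std=[1.0, 1.0], count=[5, 5])
assert stats.max_len == 2  # falls back to len(mean)
```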
+
+
+ class DatasetDescription(BaseModel):
+     """Comprehensive description of dataset contents and statistics.
+
+     Provides metadata about a complete dataset including statistical summaries
+     for all data types, maximum counts for variable-length data, and methods
+     for determining which data types are present.
+     """
+
+     # Joint data statistics
+     joint_positions: DataItemStats = Field(default_factory=DataItemStats)
+     joint_velocities: DataItemStats = Field(default_factory=DataItemStats)
+     joint_torques: DataItemStats = Field(default_factory=DataItemStats)
+     joint_target_positions: DataItemStats = Field(default_factory=DataItemStats)
+
+     # End-effector statistics
+     end_effector_states: DataItemStats = Field(default_factory=DataItemStats)
+
+     # End-effector poses statistics
+     end_effector_poses: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Parallel gripper open amount statistics
+     parallel_gripper_open_amounts: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Pose statistics
+     poses: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Visual data counts
+     rgb_images: DataItemStats = Field(default_factory=DataItemStats)
+     depth_images: DataItemStats = Field(default_factory=DataItemStats)
+     point_clouds: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Language data
+     language: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Custom data statistics
+     custom_data: dict[str, DataItemStats] = Field(default_factory=dict)
+
+     def get_data_types(self) -> list[DataType]:
+         """Determine which data types are present in the dataset.
+
+         Analyzes the dataset statistics to identify which data modalities
+         contain actual data (non-zero lengths/counts).
+
+         Returns:
+             List of DataType enums representing the data modalities
+             present in this dataset.
+         """
+         data_types = []
+
+         # Joint data
+         if self.joint_positions.max_len > 0:
+             data_types.append(DataType.JOINT_POSITIONS)
+         if self.joint_velocities.max_len > 0:
+             data_types.append(DataType.JOINT_VELOCITIES)
+         if self.joint_torques.max_len > 0:
+             data_types.append(DataType.JOINT_TORQUES)
+         if self.joint_target_positions.max_len > 0:
+             data_types.append(DataType.JOINT_TARGET_POSITIONS)
+
+         # End-effector data
+         if self.end_effector_states.max_len > 0:
+             data_types.append(DataType.END_EFFECTORS)
+
+         # End effector pose data
+         if self.end_effector_poses.max_len > 0:
+             data_types.append(DataType.END_EFFECTOR_POSES)
+
+         # Parallel gripper open amount data
+         if self.parallel_gripper_open_amounts.max_len > 0:
+             data_types.append(DataType.PARALLEL_GRIPPER_OPEN_AMOUNTS)
+
+         # Pose data
+         if self.poses.max_len > 0:
+             data_types.append(DataType.POSES)
+
+         # Visual data
+         if self.rgb_images.max_len > 0:
+             data_types.append(DataType.RGB_IMAGE)
+         if self.depth_images.max_len > 0:
+             data_types.append(DataType.DEPTH_IMAGE)
+         if self.point_clouds.max_len > 0:
+             data_types.append(DataType.POINT_CLOUD)
+
+         # Language data
+         if self.language.max_len > 0:
+             data_types.append(DataType.LANGUAGE)
+
+         # Custom data
+         if self.custom_data:
+             data_types.append(DataType.CUSTOM)
+
+         return data_types
+
+     def add_custom_data(
+         self, key: str, stats: DataItemStats, max_length: int = 0
+     ) -> None:
+         """Add statistics for a custom data type.
+
+         Args:
+             key: Name of the custom data type
+             stats: Statistical information for the custom data
+             max_length: Maximum length of the custom data arrays (currently unused)
+         """
+         self.custom_data[key] = stats
+
+
+ class RecordingDescription(BaseModel):
+     """Description of a single recording episode with statistics and counts.
+
+     Provides metadata about an individual recording including data statistics,
+     sensor counts, and episode length for analysis and processing.
+     """
+
+     # Joint data statistics
+     joint_positions: DataItemStats = Field(default_factory=DataItemStats)
+     joint_velocities: DataItemStats = Field(default_factory=DataItemStats)
+     joint_torques: DataItemStats = Field(default_factory=DataItemStats)
+     joint_target_positions: DataItemStats = Field(default_factory=DataItemStats)
+
+     # End-effector statistics
+     end_effector_states: DataItemStats = Field(default_factory=DataItemStats)
+
+     # End-effector pose statistics
+     end_effector_poses: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Parallel gripper open amount statistics
+     parallel_gripper_open_amounts: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Pose statistics
+     poses: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Visual data counts
+     rgb_images: DataItemStats = Field(default_factory=DataItemStats)
+     depth_images: DataItemStats = Field(default_factory=DataItemStats)
+     point_clouds: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Language data
+     language: DataItemStats = Field(default_factory=DataItemStats)
+
+     # Episode metadata
+     episode_length: int = 0
+
+     # Custom data statistics
+     custom_data: dict[str, DataItemStats] = Field(default_factory=dict)
+
+     def get_data_types(self) -> list[DataType]:
+         """Determine which data types are present in the recording.
+
+         Analyzes the recording statistics to identify which data modalities
+         contain actual data (non-zero lengths/counts).
+
+         Returns:
+             List of DataType enums representing the data modalities
+             present in this recording.
+         """
+         data_types = []
+
+         # Joint data
+         if self.joint_positions.max_len > 0:
+             data_types.append(DataType.JOINT_POSITIONS)
+         if self.joint_velocities.max_len > 0:
+             data_types.append(DataType.JOINT_VELOCITIES)
+         if self.joint_torques.max_len > 0:
+             data_types.append(DataType.JOINT_TORQUES)
+         if self.joint_target_positions.max_len > 0:
+             data_types.append(DataType.JOINT_TARGET_POSITIONS)
+
+         # End-effector data
+         if self.end_effector_states.max_len > 0:
+             data_types.append(DataType.END_EFFECTORS)
+
+         # End-effector pose data
+         if self.end_effector_poses.max_len > 0:
+             data_types.append(DataType.END_EFFECTOR_POSES)
+
+         # Parallel gripper open amount data
+         if self.parallel_gripper_open_amounts.max_len > 0:
+             data_types.append(DataType.PARALLEL_GRIPPER_OPEN_AMOUNTS)
+
+         # Pose data
+         if self.poses.max_len > 0:
+             data_types.append(DataType.POSES)
+
+         # Visual data
+         if self.rgb_images.max_len > 0:
+             data_types.append(DataType.RGB_IMAGE)
+         if self.depth_images.max_len > 0:
+             data_types.append(DataType.DEPTH_IMAGE)
+         if self.point_clouds.max_len > 0:
+             data_types.append(DataType.POINT_CLOUD)
+
+         # Language data
+         if self.language.max_len > 0:
+             data_types.append(DataType.LANGUAGE)
+
+         # Custom data
+         if self.custom_data:
+             data_types.append(DataType.CUSTOM)
+
+         return data_types
+
+
+ class ModelInitDescription(BaseModel):
+     """Configuration specification for initializing Neuracore models.
+
+     Defines the model architecture requirements including dataset characteristics,
+     input/output data types, and prediction horizons for model initialization
+     and training configuration.
+     """
+
+     dataset_description: DatasetDescription
+     input_data_types: list[DataType]
+     output_data_types: list[DataType]
+     output_prediction_horizon: int = 1
+
+
+ class ModelPrediction(BaseModel):
+     """Model inference output containing predictions and timing information.
+
+     Represents the results of model inference including predicted outputs
+     for each configured data type and optional timing information for
+     performance monitoring.
+     """
+
+     outputs: dict[DataType, Any] = Field(default_factory=dict)
+     prediction_time: Optional[float] = None
+
+
+ class SyncedDataset(BaseModel):
+     """Represents a dataset of robot demonstrations.
+
+     A synchronized dataset groups related robot demonstrations together
+     and maintains metadata about the collection as a whole.
+
+     Attributes:
+         id: Unique identifier for the synced dataset.
+         parent_id: Unique identifier of the corresponding dataset.
+         freq: Frequency at which the dataset was processed.
+         name: Human-readable name for the dataset.
+         created_at: Unix timestamp of dataset creation.
+         modified_at: Unix timestamp of last modification.
+         description: Optional description of the dataset.
+         recording_ids: List of recording IDs in this dataset.
+         num_demonstrations: Total number of demonstrations.
+         total_duration_seconds: Total duration of all demonstrations.
+         is_shared: Whether the dataset is shared with other users.
+         metadata: Additional arbitrary metadata.
+     """
+
+     id: str
+     parent_id: str
+     freq: int
+     name: str
+     created_at: float
+     modified_at: float
+     description: Optional[str] = None
+     recording_ids: list[str] = Field(default_factory=list)
+     num_demonstrations: int = 0
+     num_processed_demonstrations: int = 0
+     total_duration_seconds: float = 0.0
+     is_shared: bool = False
+     metadata: dict[str, Any] = Field(default_factory=dict)
+     dataset_description: DatasetDescription = Field(default_factory=DatasetDescription)
+     all_data_types: dict[DataType, int] = Field(default_factory=dict)
+     common_data_types: dict[DataType, int] = Field(default_factory=dict)
+
+
+ class Dataset(BaseModel):
+     """Represents a dataset of robot demonstrations.
+
+     A dataset groups related robot demonstrations together and maintains metadata
+     about the collection as a whole.
+
+     Attributes:
+         id: Unique identifier for the dataset.
+         name: Human-readable name for the dataset.
+         created_at: Unix timestamp of dataset creation.
+         modified_at: Unix timestamp of last modification.
+         description: Optional description of the dataset.
+         tags: List of tags for categorizing the dataset.
+         recording_ids: List of recording IDs in this dataset.
+         num_demonstrations: Total number of demonstrations.
+         total_duration_seconds: Total duration of all demonstrations.
+         size_bytes: Total size of all demonstrations.
+         is_shared: Whether the dataset is shared with other users.
+         metadata: Additional arbitrary metadata.
+         synced_dataset_ids: Synced dataset IDs for this dataset.
+             They point to synced datasets that synchronized
+             this dataset at a particular frequency.
+     """
+
+     id: str
+     name: str
+     created_at: float
+     modified_at: float
+     description: Optional[str] = None
+     tags: list[str] = Field(default_factory=list)
+     recording_ids: list[str] = Field(default_factory=list)
+     num_demonstrations: int = 0
+     total_duration_seconds: float = 0.0
+     size_bytes: int = 0
+     is_shared: bool = False
+     metadata: dict[str, Any] = Field(default_factory=dict)
+     synced_dataset_ids: dict[str, Any] = Field(default_factory=dict)
+     all_data_types: dict[DataType, int] = Field(default_factory=dict)
+     common_data_types: dict[DataType, int] = Field(default_factory=dict)
+     recording_ids_in_bucket: bool = False
+
+
+ class MessageType(str, Enum):
+     """Enumerates the types of signaling messages for WebRTC handshakes.
+
+     These types are used to identify the purpose of a message sent through
+     the signaling server during connection establishment.
+     """
+
+     SDP_OFFER = "offer"  # Session Description Protocol (SDP) offer from the caller
+     SDP_ANSWER = "answer"  # Session Description Protocol (SDP) answer from the callee
+     ICE_CANDIDATE = "ice"  # Interactive Connectivity Establishment (ICE) candidate
+     OPEN_CONNECTION = "open_connection"  # Request to open a new connection
+
+
+ class HandshakeMessage(BaseModel):
+     """Represents a signaling message for the WebRTC handshake process.
+
+     This message is exchanged between two peers via a signaling server to
+     negotiate the connection details, such as SDP offers/answers and ICE
+     candidates.
+
+     Attributes:
+         from_id: The unique identifier of the sender peer.
+         to_id: The unique identifier of the recipient peer.
+         data: The payload of the message, typically an SDP string or a JSON
+             object with ICE candidate information.
+         connection_id: The unique identifier for the connection session.
+         type: The type of the handshake message, as defined by MessageType.
+         id: A unique identifier for the message itself.
+     """
+
+     from_id: str
+     to_id: str
+     data: str
+     connection_id: str
+     type: MessageType
+     id: str = Field(default_factory=lambda: uuid4().hex)
+
+
+ class VideoFormat(str, Enum):
+     """Enumerates video format styles over a WebRTC connection."""
+
+     # Uses a standard video track with a negotiated codec; this is more efficient.
+     WEB_RTC_NEGOTIATED = "WEB_RTC_NEGOTIATED"
+     # Uses Neuracore's data URI format over a custom data channel.
+     NEURACORE_CUSTOM = "NEURACORE_CUSTOM"
+
+
+ class OpenConnectionRequest(BaseModel):
+     """Represents a request to open a new WebRTC connection.
+
+     Attributes:
+         from_id: The unique identifier of the consumer peer.
+         to_id: The unique identifier of the producer peer.
+         robot_id: The unique identifier for the robot to be created.
+         robot_instance: The identifier for the instance of the robot to connect to.
+         video_format: The type of video the consumer expects to receive.
+         id: The identifier for this connection request.
+         created_at: The UTC timestamp when the request was created.
+     """
+
+     from_id: str
+     to_id: str
+     robot_id: str
+     robot_instance: NonNegativeInt
+     video_format: VideoFormat
+     id: str = Field(default_factory=lambda: uuid4().hex)
+     created_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
+
+
+ class OpenConnectionDetails(BaseModel):
+     """The details describing properties of the new connection.
+
+     Attributes:
+         connection_token: The token used for security to establish the connection.
+         robot_id: The unique identifier for the robot to connect to.
+         robot_instance: The identifier for the instance of the robot to connect to.
+         video_format: The type of video the consumer expects to receive.
+     """
+
+     connection_token: str
+     robot_id: str
+     robot_instance: NonNegativeInt
+     video_format: VideoFormat
+
+
+ class StreamAliveResponse(BaseModel):
+     """Represents the response from asserting a stream is alive.
+
+     This is returned when a client pings a stream to keep it active.
+
+     Attributes:
+         resurrected: A boolean indicating if the stream was considered dead
+             and has been successfully resurrected by this request.
+     """
+
+     resurrected: bool
+
+
+ class RobotInstanceIdentifier(NamedTuple):
+     """A tuple that uniquely identifies a robot instance.
+
+     Attributes:
+         robot_id: The unique identifier of the robot providing the stream.
+         robot_instance: The specific instance number of the robot.
+     """
+
+     robot_id: str
+     robot_instance: int
+
+
+ class TrackKind(str, Enum):
+     """Enumerates the supported track kinds for streaming."""
+
+     JOINTS = "joints"
+     RGB = "rgb"
+     DEPTH = "depth"
+     LANGUAGE = "language"
+     GRIPPER = "gripper"
+     END_EFFECTOR_POSE = "end_effector_pose"
+     PARALLEL_GRIPPER_OPEN_AMOUNT = "parallel_gripper_open_amount"
+     POINT_CLOUD = "point_cloud"
+     POSE = "pose"
+     CUSTOM = "custom"
+
+
+ class RobotStreamTrack(BaseModel):
+     """Metadata for a robot's media stream track.
+
+     This model holds all the necessary information to identify and manage
+     a single media track (e.g., a video or audio feed) from a specific
+     robot instance.
+
+     Attributes:
+         robot_id: The unique identifier of the robot providing the stream.
+         robot_instance: The specific instance number of the robot.
+         stream_id: The identifier for the overall media stream session.
+         kind: The type of media track, as defined by TrackKind (e.g., 'rgb', 'joints').
+         label: A human-readable label for the track (e.g., 'front_camera').
+         mid: The media ID used in SDP, essential for WebRTC negotiation.
+         id: A unique identifier for this track metadata object.
+         created_at: The UTC timestamp when this track metadata was created.
+     """
+
+     robot_id: str
+     robot_instance: NonNegativeInt
+     stream_id: str
+     kind: TrackKind
+     label: str
+     mid: str
+     id: str = Field(default_factory=lambda: uuid4().hex)
+     created_at: datetime = Field(default_factory=lambda: datetime.now(timezone.utc))
+
+
+ class AvailableRobotInstance(BaseModel):
+     """Represents a single, available instance of a robot.
+
+     Attributes:
+         robot_instance: The unique identifier for this robot instance.
+         tracks: A dictionary of available media stream tracks for this instance.
+         connections: The number of current connections to this instance.
+     """
+
+     robot_instance: NonNegativeInt
+     # stream_id to list of tracks
+     tracks: dict[str, list[RobotStreamTrack]]
+     connections: int
+
+
+ class AvailableRobot(BaseModel):
+     """Represents an available robot, including all its running instances.
+
+     Attributes:
+         robot_id: The unique identifier for the robot model/type.
+         instances: A dictionary of all available instances for this robot,
+             keyed by instance ID.
+     """
+
+     robot_id: str
+     instances: dict[int, AvailableRobotInstance]
+
+
+ class AvailableRobotCapacityUpdate(BaseModel):
+     """Represents an update on the available capacity of all robots.
+
+     This model is used to broadcast the current state of all available
+     robots and their instances.
+
+     Attributes:
+         robots: A list of all available robots and their instances.
+     """
+
+     robots: list[AvailableRobot]
+
+
+ class BaseRecodingUpdatePayload(BaseModel):
+     """Base payload for recording update notifications.
+
+     Contains the minimum information needed to identify a recording
+     and the robot instance it belongs to.
+     """
+
+     recording_id: str
+     robot_id: str
+     instance: NonNegativeInt
+
+
+ class RecodingRequestedPayload(BaseRecodingUpdatePayload):
+     """Payload for recording request notifications.
+
+     Contains information about who requested the recording and what
+     data types should be captured.
+     """
+
+     created_by: str
+     dataset_ids: list[str] = Field(default_factory=list)
+     data_types: set[DataType] = Field(default_factory=set)
+
+
+ class RecordingStartPayload(RecodingRequestedPayload):
+     """Payload for recording start notifications.
+
+     Extends the request payload with the actual start timestamp
+     when recording begins.
+     """
+
+     start_time: float
+
+
+ class RecordingNotificationType(str, Enum):
+     """Types of recording lifecycle notifications."""
+
+     INIT = "init"
+     REQUESTED = "requested"
+     START = "start"
+     STOP = "stop"
+     SAVED = "saved"
+     DISCARDED = "discarded"
+     EXPIRED = "expired"
+
+
+ class RecordingNotification(BaseModel):
+     """Notification message for recording lifecycle events.
+
+     Used to communicate recording state changes across the system,
+     including initialization, start/stop events, and final disposition.
+     """
+
+     type: RecordingNotificationType
+     payload: Union[
+         RecordingStartPayload,
+         RecodingRequestedPayload,
+         list[Union[RecordingStartPayload, RecodingRequestedPayload]],
+         BaseRecodingUpdatePayload,
+     ]
+     id: str = Field(default_factory=lambda: uuid4().hex)
@@ -0,0 +1,89 @@
+ Metadata-Version: 2.4
+ Name: neuracore-types
+ Version: 1.0.0
+ Summary: Shared type definitions for Neuracore.
+ Author: Neuracore
+ License: MIT
+ License-File: LICENSE
+ Requires-Python: >=3.10
+ Requires-Dist: numpy>=1.24.0
+ Requires-Dist: pydantic>=2.0.0
+ Provides-Extra: dev
+ Requires-Dist: pre-commit; extra == 'dev'
+ Requires-Dist: pydantic-to-typescript2>=1.0.0; extra == 'dev'
+ Description-Content-Type: text/markdown
+
+ # Neuracore Types
+
+ Shared type definitions for the Neuracore platform. This package maintains a single source of truth for data types in Python (Pydantic models) and automatically generates TypeScript types.
+
+ ## Overview
+
+ - **Python Package**: `neuracore-types` - Pydantic models for the Python backend
+ - **NPM Package**: `@neuracore/types` - TypeScript types for the frontend
+
+ ## Installation
+
+ ### Python
+
+ ```bash
+ pip install neuracore-types
+ ```
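Once installed, the models behave like ordinary Pydantic models. A minimal sketch (field values here are illustrative):

```python
from neuracore_types import JointData, SyncPoint

sync = SyncPoint(
    joint_positions=JointData(values={"joint_2": 1.0, "joint_1": 0.5})
).order()  # deterministic, alphabetical key ordering

print(list(sync.joint_positions.values.keys()))  # ['joint_1', 'joint_2']
```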
+
+ ### TypeScript/JavaScript
+
+ ```bash
+ npm install @neuracore/types
+ # or
+ yarn add @neuracore/types
+ # or
+ pnpm add @neuracore/types
+ ```
+
+ ## Development
+
+ ### Setup
+
+ ```bash
+ # Clone the repository
+ git clone https://github.com/neuracoreai/neuracore_types.git
+ cd neuracore_types
+
+ # Install Python dependencies
+ pip install -e ".[dev]"
+
+ # Install Node dependencies
+ npm install
+ ```
+
+ ### Generate TypeScript Types
+
+ The TypeScript types are automatically generated from the Python Pydantic models:
+
+ ```bash
+ npm install json-schema-to-typescript
+ python scripts/generate_types.py
+ ```
+
+ This will:
+ 1. Read the Pydantic models from `neuracore_types/neuracore_types.py`
+ 2. Generate TypeScript definitions in `typescript/neuracore_types.ts`
+ 3. Create an index file at `typescript/index.ts`
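For reference, a minimal sketch of what such a generation script can look like when built on `pydantic-to-typescript2` (the actual contents of `scripts/generate_types.py` are not shown in this package, so treat this as an assumption about its shape):

```python
from pydantic2ts import generate_typescript_defs

# Converts the Pydantic models to TypeScript via their JSON Schema;
# requires json-schema-to-typescript to be installed through npm.
generate_typescript_defs(
    "neuracore_types.neuracore_types",
    "typescript/neuracore_types.ts",
)
```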
+
+ ### Build TypeScript Package
+
+ ```bash
+ npm run build
+ ```
+
+ This compiles the TypeScript files to JavaScript and generates type declarations in the `dist/` directory.
+
+ ## CI/CD
+
+ The repository includes GitHub Actions workflows that:
+
+ 1. **On every push to `main` or PR**:
+    - Automatically generates TypeScript types from Python models
+    - Builds and validates both packages
+    - Publishes Python package to PyPI
+    - Publishes NPM package to npm registry
@@ -0,0 +1,6 @@
+ neuracore_types/__init__.py,sha256=oxBrxwWgs4DxiD5ITELQGVKnXyN4aFwb3BE-1ANXihE,147
+ neuracore_types/neuracore_types.py,sha256=Nsl0Kg-50rKQCWRDD-8O8WpuoGDdugGdwDFRaPSPQfQ,37546
+ neuracore_types-1.0.0.dist-info/METADATA,sha256=X7QO87UcsFy5VCU2hUlIBliACQ5I4PwyuSRJfuyq8B0,2073
+ neuracore_types-1.0.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+ neuracore_types-1.0.0.dist-info/licenses/LICENSE,sha256=TPLH9MVhc33h8soaIkSnaVcBTspRM8QK4ipd61wQlJk,1066
+ neuracore_types-1.0.0.dist-info/RECORD,,
@@ -0,0 +1,4 @@
+ Wheel-Version: 1.0
+ Generator: hatchling 1.27.0
+ Root-Is-Purelib: true
+ Tag: py3-none-any
@@ -0,0 +1,21 @@
+ MIT License
+
+ Copyright (c) 2025 Neuracore
+
+ Permission is hereby granted, free of charge, to any person obtaining a copy
+ of this software and associated documentation files (the "Software"), to deal
+ in the Software without restriction, including without limitation the rights
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ copies of the Software, and to permit persons to whom the Software is
+ furnished to do so, subject to the following conditions:
+
+ The above copyright notice and this permission notice shall be included in all
+ copies or substantial portions of the Software.
+
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ SOFTWARE.