atdata 0.1.1a2__tar.gz → 0.1.2a1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- atdata-0.1.2a1/.github/workflows/uv-publish-pypi.yml +46 -0
- atdata-0.1.2a1/.github/workflows/uv-test.yml +40 -0
- {atdata-0.1.1a2 → atdata-0.1.2a1}/.gitignore +2 -0
- {atdata-0.1.1a2 → atdata-0.1.2a1}/PKG-INFO +1 -1
- {atdata-0.1.1a2 → atdata-0.1.2a1}/pyproject.toml +3 -3
- atdata-0.1.2a1/src/atdata/__init__.py +14 -0
- atdata-0.1.2a1/src/atdata/_helpers.py +22 -0
- {atdata-0.1.1a2 → atdata-0.1.2a1}/src/atdata/dataset.py +70 -33
- atdata-0.1.2a1/tests/test_dataset.py +301 -0
- atdata-0.1.1a2/.github/workflows/python-package.yml +0 -66
- atdata-0.1.1a2/.github/workflows/python-publish.yml +0 -129
- atdata-0.1.1a2/src/atdata/__init__.py +0 -2
- atdata-0.1.1a2/src/atdata/_helpers.py +0 -30
- atdata-0.1.1a2/tests/test_dataset.py +0 -69
- {atdata-0.1.1a2 → atdata-0.1.2a1}/.python-version +0 -0
- {atdata-0.1.1a2 → atdata-0.1.2a1}/LICENSE +0 -0
- {atdata-0.1.1a2 → atdata-0.1.2a1}/README.md +0 -0
atdata-0.1.2a1/.github/workflows/uv-publish-pypi.yml (new file)
@@ -0,0 +1,46 @@
+#
+
+name: Build and upload package to PyPI
+
+on:
+  release:
+    types:
+      - published
+
+permissions:
+  contents: read
+
+jobs:
+
+  uv-build-release-pypi-publish:
+    name: "Build release distribution and publish to PyPI"
+    runs-on: ubuntu-latest
+    environment:
+      name: pypi
+
+    steps:
+      - uses: actions/checkout@v5
+
+      - name: "Set up Python"
+        uses: actions/setup-python@v5
+        with:
+          python-version-file: "pyproject.toml"
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v6
+
+      - name: Install project
+        run: uv sync --all-extras --dev
+        # TODO Better to use --locked for author control over versions?
+        # run: uv sync --locked --all-extras --dev
+
+      - name: Build release distributions
+        run: uv build
+
+      - name: Publish to PyPI
+        env:
+          UV_PUBLISH_TOKEN: ${{ secrets.UV_PUBLISH_TOKEN }}
+        run: uv publish
+
+
+##
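This workflow supersedes the deleted python-publish.yml further down: it keeps only the active `uv` job from that file (checkout, `uv sync`, `uv build`, then `uv publish` on a published release) and drops the commented-out variants. Publishing still authenticates with the `UV_PUBLISH_TOKEN` repository secret rather than PyPI trusted publishing, which the old file carried only as a commented reference.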
atdata-0.1.2a1/.github/workflows/uv-test.yml (new file)
@@ -0,0 +1,40 @@
+#
+
+name: Run tests with `uv`
+
+on:
+  push:
+    branches:
+      - main
+      - release/*
+  pull_request:
+    branches:
+      - main
+
+jobs:
+  uv-test:
+    name: Run tests
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v5
+
+      - name: "Set up Python"
+        uses: actions/setup-python@v5
+        with:
+          python-version-file: "pyproject.toml"
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v6
+
+      - name: Install the project
+        run: uv sync --all-extras --dev
+        # TODO Better to use --locked for author control over versions?
+        # run: uv sync --locked --all-extras --dev
+
+      - name: Run tests
+        # For example, using `pytest`
+        run: uv run pytest tests
+
+
+#
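Relative to the deleted python-package.yml further down, this is the same `uv sync` plus `uv run pytest tests` job under a clearer filename, with one behavioral change: pushes to `release/*` branches now also trigger the test run, not just `main`.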
{atdata-0.1.1a2 → atdata-0.1.2a1}/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "atdata"
-version = "0.1.1a2"
+version = "0.1.2a1"
 description = "A loose federation of distributed, typed datasets"
 readme = "README.md"
 authors = [
@@ -15,14 +15,14 @@ dependencies = [
 ]
 
 [project.scripts]
-
+atdata = "atdata:main"
 
 [build-system]
 requires = ["hatchling"]
 build-backend = "hatchling.build"
 
 [tool.pytest.ini_options]
-addopts = "--cov=atdata"
+addopts = "--cov=atdata --cov-report=html"
 
 [dependency-groups]
 dev = [
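Three substantive changes here: the version bump, a console-script entry point (`atdata = "atdata:main"`, so an installed environment gains an `atdata` command that invokes `atdata.main`), and the extra `--cov-report=html` flag, which has `pytest-cov` write an HTML coverage report (under `htmlcov/` by default) in addition to its terminal summary.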
atdata-0.1.2a1/src/atdata/_helpers.py (new file)
@@ -0,0 +1,22 @@
+"""Assorted helper methods for `atdata`"""
+
+##
+# Imports
+
+from io import BytesIO
+
+import numpy as np
+
+
+##
+
+def array_to_bytes( x: np.ndarray ) -> bytes:
+    """Convert `numpy` array to a format suitable for packing"""
+    np_bytes = BytesIO()
+    np.save( np_bytes, x, allow_pickle = True )
+    return np_bytes.getvalue()
+
+def bytes_to_array( b: bytes ) -> np.ndarray:
+    """Convert packed bytes back to a `numpy` array"""
+    np_bytes = BytesIO( b )
+    return np.load( np_bytes, allow_pickle = True )
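The two helpers are exact inverses: `np.save` and `np.load` preserve dtype and shape through the byte round trip, so an array can be packed into a msgpack-friendly `bytes` field and recovered intact. A minimal sketch of the intended use (the `atdata._helpers` import path just follows the file layout above):

import numpy as np

from atdata._helpers import array_to_bytes, bytes_to_array

# Serialize an array into plain bytes suitable for a packed sample field ...
x = np.arange( 6, dtype = np.float32 ).reshape( 2, 3 )
packed = array_to_bytes( x )
assert isinstance( packed, bytes )

# ... and recover it unchanged on the other side.
y = bytes_to_array( packed )
assert y.dtype == x.dtype and np.array_equal( x, y )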
{atdata-0.1.1a2 → atdata-0.1.2a1}/src/atdata/dataset.py
@@ -5,6 +5,7 @@
 
 import webdataset as wds
 
+import functools
 from dataclasses import dataclass
 import uuid
 
@@ -57,38 +58,38 @@ DT = TypeVar( 'DT' )
 
 MsgpackRawSample: TypeAlias = Dict[str, Any]
 
-@dataclass
-class ArrayBytes:
-    """Annotates bytes that should be interpreted as the raw contents of a
-    numpy NDArray"""
+# @dataclass
+# class ArrayBytes:
+#     """Annotates bytes that should be interpreted as the raw contents of a
+#     numpy NDArray"""
 
-    raw_bytes: bytes
-    """The raw bytes of the corresponding NDArray"""
+#     raw_bytes: bytes
+#     """The raw bytes of the corresponding NDArray"""
 
-    def __init__( self,
-            array: Optional[ArrayLike] = None,
-            raw: Optional[bytes] = None,
-            ):
-        """TODO"""
+#     def __init__( self,
+#             array: Optional[ArrayLike] = None,
+#             raw: Optional[bytes] = None,
+#             ):
+#         """TODO"""
 
-        if array is not None:
-            array = np.array( array )
-            self.raw_bytes = eh.array_to_bytes( array )
+#         if array is not None:
+#             array = np.array( array )
+#             self.raw_bytes = eh.array_to_bytes( array )
 
-        elif raw is not None:
-            self.raw_bytes = raw
+#         elif raw is not None:
+#             self.raw_bytes = raw
 
-        else:
-            raise ValueError( 'Must provide either `array` or `raw` bytes' )
+#         else:
+#             raise ValueError( 'Must provide either `array` or `raw` bytes' )
 
-    @property
-    def to_numpy( self ) -> NDArray:
-        """Return the `raw_bytes` data as an NDArray"""
-        return eh.bytes_to_array( self.raw_bytes )
+#     @property
+#     def to_numpy( self ) -> NDArray:
+#         """Return the `raw_bytes` data as an NDArray"""
+#         return eh.bytes_to_array( self.raw_bytes )
 
 def _make_packable( x ):
-    if isinstance( x, ArrayBytes ):
-        return x.raw_bytes
+    # if isinstance( x, ArrayBytes ):
+    #     return x.raw_bytes
     if isinstance( x, np.ndarray ):
         return eh.array_to_bytes( x )
     return x
@@ -114,8 +115,8 @@ class PackableSample( ABC ):
                 # we're good!
                 pass
 
-            elif isinstance( var_cur_value, ArrayBytes ):
-                setattr( self, var_name, var_cur_value.to_numpy )
+            # elif isinstance( var_cur_value, ArrayBytes ):
+            #     setattr( self, var_name, var_cur_value.to_numpy )
 
             elif isinstance( var_cur_value, bytes ):
                 setattr( self, var_name, eh.bytes_to_array( var_cur_value ) )
@@ -172,7 +173,7 @@ def _batch_aggregate( xs: Sequence ):
 
     return list( xs )
 
-class
+class SampleBatch( Generic[DT] ):
 
     def __init__( self, samples: Sequence[DT] ):
         """TODO"""
@@ -233,7 +234,7 @@ class Dataset( Generic[ST] ):
     def batch_type( self ) -> Type:
         """The type of a batch built from `sample_class`"""
         # return self.__orig_class__.__args__[1]
-        return
+        return SampleBatch[self.sample_type]
 
 
     # _schema_registry_sample: dict[str, Type]
@@ -396,7 +397,7 @@ class Dataset( Generic[ST] ):
             value = sample,
         )
 
-    def wrap_batch( self, batch: WDSRawBatch ) ->
+    def wrap_batch( self, batch: WDSRawBatch ) -> SampleBatch[ST]:
         """Wrap a `batch` of samples into the appropriate dataset-specific type
 
         This default implementation simply creates a list one sample at a time
@@ -405,7 +406,7 @@ class Dataset( Generic[ST] ):
         assert 'msgpack' in batch
         batch_unpacked = [ self.sample_type.from_bytes( bs )
                            for bs in batch['msgpack'] ]
-        return
+        return SampleBatch[self.sample_type]( batch_unpacked )
 
 
 # # @classmethod
@@ -415,4 +416,40 @@ class Dataset( Generic[ST] ):
 #     This default implementation simply creates a list one sample at a time
 #     """
 #     assert cls.batch_class is not None, 'No batch class specified'
-#     return cls.batch_class( **batch )
+#     return cls.batch_class( **batch )
+
+
+##
+# Shortcut decorators
+
+# def packable( cls ):
+#     """TODO"""
+
+#     def decorator( cls ):
+#         # Create a new class dynamically
+#         # The new class inherits from the new_parent_class first, then the original cls
+#         new_bases = (PackableSample,) + cls.__bases__
+#         new_cls = type(cls.__name__, new_bases, dict(cls.__dict__))
+
+#         # Optionally, update __module__ and __qualname__ for better introspection
+#         new_cls.__module__ = cls.__module__
+#         new_cls.__qualname__ = cls.__qualname__
+
+#         return new_cls
+#     return decorator
+
+def packable( cls ):
+    """TODO"""
+
+    ##
+
+    as_dataclass = dataclass( cls )
+
+    class as_packable( as_dataclass, PackableSample ):
+        pass
+
+    as_packable.__name__ = cls.__name__
+
+    ##
+
+    return as_packable
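The new `packable` decorator replaces the commented-out `type()`-based draft with plain subclassing: it runs the class through `dataclass` and mixes in `PackableSample`. A minimal sketch of the resulting usage, mirroring the new tests (the `ImageSample` name is illustrative, not part of the package):

import numpy as np
from numpy.typing import NDArray

import atdata

@atdata.packable
class ImageSample:          # hypothetical sample type for illustration
    label: int
    image: NDArray

# The decorated class is a dataclass that also inherits the packing machinery,
# so it can be built from semi-structured data like any PackableSample subclass.
sample = ImageSample.from_data( { 'label': 7, 'image': np.zeros( ( 4, 4 ) ) } )
assert isinstance( sample, atdata.PackableSample )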
atdata-0.1.2a1/tests/test_dataset.py (new file)
@@ -0,0 +1,301 @@
+"""Test dataset functionality."""
+
+##
+# Imports
+
+# Tests
+import pytest
+
+# System
+from dataclasses import dataclass
+
+# External
+import numpy as np
+import webdataset as wds
+
+# Local
+import atdata
+import atdata.dataset as atds
+
+# Typing
+from numpy.typing import NDArray
+from typing import (
+    Type,
+    Any,
+)
+
+
+##
+# Sample test cases
+
+@dataclass
+class BasicTestSample( atdata.PackableSample ):
+    name: str
+    position: int
+    value: float
+
+@dataclass
+class NumpyTestSample( atdata.PackableSample ):
+    label: int
+    image: NDArray
+
+test_cases = [
+    {
+        'SampleType': BasicTestSample,
+        'sample_data': {
+            'name': 'Hello, world!',
+            'position': 42,
+            'value': 1024.768,
+        },
+        'sample_wds_stem': 'basic_test',
+    },
+    {
+        'SampleType': NumpyTestSample,
+        'sample_data':
+        {
+            'label': 9_001,
+            'image': np.random.randn( 1024, 1024 ),
+        },
+        'sample_wds_stem': 'numpy_test',
+    },
+]
+
+
+## Tests
+
+@pytest.mark.parametrize(
+    ('SampleType', 'sample_data'),
+    [ (case['SampleType'], case['sample_data'])
+      for case in test_cases ]
+)
+def test_create_sample(
+        SampleType: Type[atdata.PackableSample],
+        sample_data: atds.MsgpackRawSample,
+        ):
+    """Test our ability to create samples from semi-structured data"""
+
+    sample = SampleType.from_data( sample_data )
+    assert isinstance( sample, SampleType ), \
+        f'Did not properly form sample for test type {SampleType}'
+
+    for k, v in sample_data.items():
+        cur_assertion: bool
+        if isinstance( v, np.ndarray ):
+            cur_assertion = np.all( getattr( sample, k ) == v ) == True
+        else:
+            cur_assertion = getattr( sample, k ) == v
+        assert cur_assertion, \
+            f'Did not properly incorporate property {k} of test type {SampleType}'
+
+#
+
+def test_decorator_syntax():
+    """Test use of decorator syntax for sample types"""
+
+    @atdata.packable
+    class BasicTestSampleDecorated:
+        name: str
+        position: int
+        value: float
+
+    @atdata.packable
+    class NumpyTestSampleDecorated:
+        label: int
+        image: NDArray
+
+    ##
+
+    test_create_sample( BasicTestSampleDecorated, {
+        'name': 'Hello, world!',
+        'position': 42,
+        'value': 1024.768,
+    } )
+
+    test_create_sample( NumpyTestSampleDecorated, {
+        'label': 9_001,
+        'image': np.random.randn( 1024, 1024 ),
+    } )
+
+#
+
+@pytest.mark.parametrize(
+    ('SampleType', 'sample_data', 'sample_wds_stem'),
+    [ (case['SampleType'], case['sample_data'], case['sample_wds_stem'])
+      for case in test_cases ]
+)
+def test_wds(
+        SampleType: Type[atdata.PackableSample],
+        sample_data: atds.MsgpackRawSample,
+        sample_wds_stem: str,
+        tmp_path
+        ):
+    """Test our ability to write samples as `WebDatasets` to disk"""
+
+    ## Testing hyperparameters
+
+    n_copies = 100
+    shard_maxcount = 10
+    batch_size = 4
+    n_iterate = 10
+
+
+    ## Write sharded dataset
+
+    file_pattern = (
+        tmp_path
+        / (f'{sample_wds_stem}' + '-{shard_id}.tar')
+    ).as_posix()
+    file_wds_pattern = file_pattern.format( shard_id = '%06d' )
+
+    with wds.ShardWriter(
+            pattern = file_wds_pattern,
+            maxcount = shard_maxcount,
+            ) as sink:
+
+        for i_sample in range( n_copies ):
+            new_sample = SampleType.from_data( sample_data )
+            assert isinstance( new_sample, SampleType ), \
+                f'Did not properly form sample for test type {SampleType}'
+
+            sink.write( new_sample.as_wds )
+
+
+    ## Ordered
+
+    # Read first shard, no batches
+
+    first_filename = file_pattern.format( shard_id = f'{0:06d}' )
+    dataset = atdata.Dataset[SampleType]( first_filename )
+
+    iterations_run = 0
+    for i_iterate, cur_sample in enumerate( dataset.ordered( batch_size = None ) ):
+
+        assert isinstance( cur_sample, SampleType ), \
+            f'Single sample for {SampleType} written to `wds` is of wrong type'
+
+        # Check sample values
+
+        for k, v in sample_data.items():
+            if isinstance( v, np.ndarray ):
+                is_correct = np.all( getattr( cur_sample, k ) == v )
+            else:
+                is_correct = getattr( cur_sample, k ) == v
+            assert is_correct, \
+                f'{SampleType}: Incorrect sample value found for {k}'
+
+        iterations_run += 1
+        if iterations_run >= n_iterate:
+            break
+
+    assert iterations_run == n_iterate, \
+        f"Only found {iterations_run} samples, not {n_iterate}"
+
+    # Read all shards, batches
+
+    start_id = f'{0:06d}'
+    end_id = f'{9:06d}'
+    first_filename = file_pattern.format( shard_id = '{' + start_id + '..' + end_id + '}' )
+    print( first_filename )
+    dataset = atdata.Dataset[SampleType]( first_filename )
+
+    iterations_run = 0
+    for i_iterate, cur_batch in enumerate( dataset.ordered( batch_size = batch_size ) ):
+
+        assert isinstance( cur_batch, atdata.SampleBatch ), \
+            f'{SampleType}: Batch sample is not correctly a batch'
+
+        assert cur_batch.sample_type == SampleType, \
+            f'{SampleType}: Batch `sample_type` is incorrect type'
+
+        if i_iterate == 0:
+            cur_n = len( cur_batch.samples )
+            assert cur_n == batch_size, \
+                f'{SampleType}: Batch has {cur_n} samples, not {batch_size}'
+
+            assert isinstance( cur_batch.samples[0], SampleType ), \
+                f'{SampleType}: Batch sample of wrong type ({type( cur_batch.samples[0])})'
+
+            # Check batch values
+            for k, v in sample_data.items():
+                cur_batch_data = getattr( cur_batch, k )
+
+                if isinstance( v, np.ndarray ):
+                    assert isinstance( cur_batch_data, np.ndarray ), \
+                        f'{SampleType}: `NDArray` not carried through to batch'
+
+                    is_correct = all(
+                        [ np.all( cur_batch_data[i] == v )
+                          for i in range( cur_batch_data.shape[0] ) ]
+                    )
+
+                else:
+                    is_correct = all(
+                        [ cur_batch_data[i] == v
+                          for i in range( len( cur_batch_data ) ) ]
+                    )
+
+                assert is_correct, \
+                    f'{SampleType}: Incorrect sample value found for {k}'
+
+        iterations_run += 1
+        if iterations_run >= n_iterate:
+            break
+
+    assert iterations_run == n_iterate, \
+        f"Only found {iterations_run} samples, not {n_iterate}"
+
+
+    ## Shuffled
+
+    # Read first shard, no batches
+
+    first_filename = file_pattern.format( shard_id = f'{0:06d}' )
+    dataset = atdata.Dataset[SampleType]( first_filename )
+
+    iterations_run = 0
+    for i_iterate, cur_sample in enumerate( dataset.shuffled( batch_size = None ) ):
+
+        assert isinstance( cur_sample, SampleType ), \
+            f'Single sample for {SampleType} written to `wds` is of wrong type'
+
+        iterations_run += 1
+        if iterations_run >= n_iterate:
+            break
+
+    assert iterations_run == n_iterate, \
+        f"Only found {iterations_run} samples, not {n_iterate}"
+
+    # Read all shards, batches
+
+    start_id = f'{0:06d}'
+    end_id = f'{9:06d}'
+    first_filename = file_pattern.format( shard_id = '{' + start_id + '..' + end_id + '}' )
+    print( first_filename )
+    dataset = atdata.Dataset[SampleType]( first_filename )
+
+    iterations_run = 0
+    for i_iterate, cur_sample in enumerate( dataset.shuffled( batch_size = batch_size ) ):
+
+        assert isinstance( cur_sample, atdata.SampleBatch ), \
+            f'{SampleType}: Batch sample is not correctly a batch'
+
+        assert cur_sample.sample_type == SampleType, \
+            f'{SampleType}: Batch `sample_type` is incorrect type'
+
+        if i_iterate == 0:
+            cur_n = len( cur_sample.samples )
+            assert cur_n == batch_size, \
+                f'{SampleType}: Batch has {cur_n} samples, not {batch_size}'
+
+            assert isinstance( cur_sample.samples[0], SampleType ), \
+                f'{SampleType}: Batch sample of wrong type ({type( cur_sample.samples[0])})'
+
+        iterations_run += 1
+        if iterations_run >= n_iterate:
+            break
+
+    assert iterations_run == n_iterate, \
+        f"Only found {iterations_run} samples, not {n_iterate}"
+
+
+##
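Condensed, the shard round trip these tests exercise looks like the sketch below; `DemoSample` and the output path are illustrative, while `ShardWriter`, `as_wds`, `Dataset[...]`, `ordered`, and `SampleBatch` are all taken from the code above. The tests bound their read loops with an explicit break, and the sketch does the same:

import numpy as np
from numpy.typing import NDArray
import webdataset as wds

import atdata

@atdata.packable
class DemoSample:           # hypothetical sample type for illustration
    label: int
    image: NDArray

# Write ten packed samples into a single shard on disk ...
with wds.ShardWriter( pattern = 'demo-%06d.tar', maxcount = 10 ) as sink:
    for i in range( 10 ):
        sample = DemoSample.from_data( { 'label': i, 'image': np.zeros( ( 8, 8 ) ) } )
        sink.write( sample.as_wds )

# ... then stream them back, four samples to a batch.
dataset = atdata.Dataset[DemoSample]( 'demo-000000.tar' )
for batch in dataset.ordered( batch_size = 4 ):
    assert isinstance( batch, atdata.SampleBatch )
    assert batch.sample_type == DemoSample
    break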
atdata-0.1.1a2/.github/workflows/python-package.yml (deleted)
@@ -1,66 +0,0 @@
-# This workflow will install Python dependencies, run tests and lint with a variety of Python versions
-# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python
-
-name: Python package
-
-on:
-  push:
-    branches: [ "main" ]
-  pull_request:
-    branches: [ "main" ]
-
-jobs:
-  uv-test:
-    name: python
-    runs-on: ubuntu-latest
-
-    steps:
-      - uses: actions/checkout@v5
-
-      - name: "Set up Python"
-        uses: actions/setup-python@v5
-        with:
-          python-version-file: "pyproject.toml"
-
-      - name: Install uv
-        uses: astral-sh/setup-uv@v6
-
-      - name: Install the project
-        run: uv sync --all-extras --dev
-        # TODO Better to use --locked for author control over versions?
-        # run: uv sync --locked --all-extras --dev
-
-      - name: Run tests
-        # For example, using `pytest`
-        run: uv run pytest tests
-
-# OLD - kept for legacy
-# jobs:
-#   build:
-
-#     runs-on: ubuntu-latest
-#     strategy:
-#       fail-fast: false
-#       matrix:
-#         python-version: ["3.12", "3.13"]
-
-#     steps:
-#     - uses: actions/checkout@v4
-#     - name: Set up Python ${{ matrix.python-version }}
-#       uses: actions/setup-python@v3
-#       with:
-#         python-version: ${{ matrix.python-version }}
-#     - name: Install dependencies
-#       run: |
-#         python -m pip install --upgrade pip
-#         python -m pip install flake8 pytest
-#         if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
-#     - name: Lint with flake8
-#       run: |
-#         # stop the build if there are Python syntax errors or undefined names
-#         flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
-#         # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
-#         flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
-#     - name: Test with pytest
-#       run: |
-#         pytest
atdata-0.1.1a2/.github/workflows/python-publish.yml (deleted)
@@ -1,129 +0,0 @@
-# This workflow will upload a Python Package to PyPI when a release is created
-# For more information see: https://docs.github.com/en/actions/automating-builds-and-tests/building-and-testing-python#publishing-to-package-registries
-
-# This workflow uses actions that are not certified by GitHub.
-# They are provided by a third-party and are governed by
-# separate terms of service, privacy policy, and support
-# documentation.
-
-name: Build and upload package to PyPI
-
-on:
-  release:
-    types: [published]
-
-permissions:
-  contents: read
-
-
-jobs:
-
-  # uv-release-build-publish:
-  #   # name: python
-  #   runs-on: ubuntu-latest
-
-  #   steps:
-  #     - uses: actions/checkout@v5
-
-  #     - name: "Set up Python"
-  #       uses: actions/setup-python@v5
-  #       with:
-  #         python-version-file: "pyproject.toml"
-
-  #     - name: Install uv
-  #       uses: astral-sh/setup-uv@v6
-
-  #     - name: Install the project
-  #       run: uv sync --all-extras --dev
-  #       # TODO Better to use --locked for author control over versions?
-  #       # run: uv sync --locked --all-extras --dev
-
-  #     - name: Build release distributions
-  #       run: uv build
-
-  uv-build-release-pypi-publish:
-    name: "Build release distribution and publish to PyPI"
-    runs-on: ubuntu-latest
-    # needs:
-    #   - uv-release-build
-    environment:
-      name: pypi
-
-    steps:
-      - uses: actions/checkout@v5
-
-      - name: "Set up Python"
-        uses: actions/setup-python@v5
-        with:
-          python-version-file: "pyproject.toml"
-
-      - name: Install uv
-        uses: astral-sh/setup-uv@v6
-
-      - name: Install the project
-        run: uv sync --all-extras --dev
-        # TODO Better to use --locked for author control over versions?
-        # run: uv sync --locked --all-extras --dev
-
-      - name: Build release distributions
-        run: uv build
-
-      - name: Publish to PyPI
-        env:
-          UV_PUBLISH_TOKEN: ${{ secrets.UV_PUBLISH_TOKEN }}
-        run: uv publish
-
-# TODO Original variant kept for reference
-# jobs:
-#   release-build:
-#     runs-on: ubuntu-latest
-
-#     steps:
-#       - uses: actions/checkout@v4
-
-#       - uses: actions/setup-python@v5
-#         with:
-#           python-version: "3.x"
-
-#       - name: Build release distributions
-#         run: |
-#           # NOTE: put your own distribution build steps here.
-#           python -m pip install build
-#           python -m build
-
-#       - name: Upload distributions
-#         uses: actions/upload-artifact@v4
-#         with:
-#           name: release-dists
-#           path: dist/
-
-#   pypi-publish:
-#     runs-on: ubuntu-latest
-#     needs:
-#       - release-build
-#     permissions:
-#       # IMPORTANT: this permission is mandatory for trusted publishing
-#       id-token: write
-
-#     # Dedicated environments with protections for publishing are strongly recommended.
-#     # For more information, see: https://docs.github.com/en/actions/deployment/targeting-different-environments/using-environments-for-deployment#deployment-protection-rules
-#     environment:
-#       name: pypi
-#       # OPTIONAL: uncomment and update to include your PyPI project URL in the deployment status:
-#       # url: https://pypi.org/p/YOURPROJECT
-#       #
-#       # ALTERNATIVE: if your GitHub Release name is the PyPI project version string
-#       # ALTERNATIVE: exactly, uncomment the following line instead:
-#       # url: https://pypi.org/project/YOURPROJECT/${{ github.event.release.name }}
-
-#     steps:
-#       - name: Retrieve release distributions
-#         uses: actions/download-artifact@v4
-#         with:
-#           name: release-dists
-#           path: dist/
-
-#       - name: Publish release distributions to PyPI
-#         uses: pypa/gh-action-pypi-publish@release/v1
-#         with:
-#           packages-dir: dist/
atdata-0.1.1a2/src/atdata/_helpers.py (deleted)
@@ -1,30 +0,0 @@
-"""Assorted helper methods for `ekumen`"""
-
-##
-# Imports
-
-from io import BytesIO
-import ormsgpack as omp
-
-import numpy as np
-
-
-##
-#
-
-def pack_instance( x ) -> bytes:
-    return omp.packb( x )
-
-def unpack( bs: bytes ):
-    return omp.unpackb( bs )
-
-##
-
-def array_to_bytes(x: np.ndarray) -> bytes:
-    np_bytes = BytesIO()
-    np.save(np_bytes, x, allow_pickle=True)
-    return np_bytes.getvalue()
-
-def bytes_to_array(b: bytes) -> np.ndarray:
-    np_bytes = BytesIO(b)
-    return np.load(np_bytes, allow_pickle=True)
atdata-0.1.1a2/tests/test_dataset.py (deleted)
@@ -1,69 +0,0 @@
-"""Test dataset functionality."""
-
-##
-
-import pytest
-
-from dataclasses import dataclass
-
-import numpy as np
-
-from numpy.typing import NDArray
-from typing import (
-    Type,
-    Any,
-)
-
-import atdata.dataset as ekd
-
-
-## Sample test cases
-
-@dataclass
-class BasicTestSample( ekd.PackableSample ):
-    name: str
-    position: int
-    value: float
-
-@dataclass
-class NumpyTestSample( ekd.PackableSample ):
-    label: int
-    image: NDArray
-
-test_sample_classes = [
-    (
-        BasicTestSample, {
-            'name': 'Hello, world!',
-            'position': 42,
-            'value': 1024.768,
-        }
-    ),
-    (
-        NumpyTestSample, {
-            'label': 9_001,
-            'image': np.random.randn( 1024, 1024 ),
-        }
-    )
-]
-
-
-## Tests
-
-@pytest.mark.parametrize( ('SampleType', 'sample_data'), test_sample_classes )
-def test_create_sample(
-        SampleType: Type[ekd.PackableSample],
-        sample_data: ekd.MsgpackRawSample,
-        ):
-    """
-    Test our ability to create samples from semi-structured data
-    """
-    sample = SampleType.from_data( sample_data )
-    assert isinstance( sample, SampleType ), f'Did not properly form sample for test type {SampleType}'
-
-    for k, v in sample_data.items():
-        cur_assertion: bool
-        if isinstance( v, np.ndarray ):
-            cur_assertion = np.all( getattr( sample, k ) == v ) == True
-        else:
-            cur_assertion = getattr( sample, k ) == v
-        assert cur_assertion, f'Did not properly incorporate property {k} of test type {SampleType}'
{atdata-0.1.1a2 → atdata-0.1.2a1}/.python-version (file without changes)
{atdata-0.1.1a2 → atdata-0.1.2a1}/LICENSE (file without changes)
{atdata-0.1.1a2 → atdata-0.1.2a1}/README.md (file without changes)