PyPI - atdata - Versions diffs - 0.1.1a1__py3-none-any.whl → 0.1.1a3__py3-none-any.whl - Mend

atdata 0.1.1a1__py3-none-any.whl → 0.1.1a3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

atdata/__init__.py +13 -2
atdata/_helpers.py +8 -16
atdata/dataset.py +32 -32
{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/METADATA +2 -2
atdata-0.1.1a3.dist-info/RECORD +8 -0
atdata-0.1.1a3.dist-info/entry_points.txt +2 -0
atdata-0.1.1a1.dist-info/RECORD +0 -8
atdata-0.1.1a1.dist-info/entry_points.txt +0 -2
{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/WHEEL +0 -0
{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/licenses/LICENSE +0 -0

atdata/__init__.py CHANGED Viewed

@@ -1,2 +1,13 @@
-def main() -> None:
-    print("Hello from ekumen!")
+"""A loose federation of distributed, typed datasets"""
+##
+# Expose components
+from .dataset import (
+    PackableSample,
+    SampleBatch,
+    Dataset,
+)
+#

atdata/_helpers.py CHANGED Viewed

@@ -1,30 +1,22 @@
-"""Assorted helper methods for `ekumen`"""
+"""Assorted helper methods for `atdata`"""
 ##
 # Imports
 from io import BytesIO
-import ormsgpack as omp
 import numpy as np
 ##
-#
-def pack_instance( x ) -> bytes:
-    return omp.packb( x )
-def unpack( bs: bytes ):
-    return omp.unpackb( bs )
-##
-def array_to_bytes(x: np.ndarray) -> bytes:
+def array_to_bytes( x: np.ndarray ) -> bytes:
+    """Convert `numpy` array to a format suitable for packing"""
     np_bytes = BytesIO()
-    np.save(np_bytes, x, allow_pickle=True)
+    np.save( np_bytes, x, allow_pickle = True )
     return np_bytes.getvalue()
-def bytes_to_array(b: bytes) -> np.ndarray:
-    np_bytes = BytesIO(b)
-    return np.load(np_bytes, allow_pickle=True)
+def bytes_to_array( b: bytes ) -> np.ndarray:
+    """Convert packed bytes back to a `numpy` array"""
+    np_bytes = BytesIO( b )
+    return np.load( np_bytes, allow_pickle = True )

atdata/dataset.py CHANGED Viewed

@@ -57,38 +57,38 @@ DT = TypeVar( 'DT' )
 MsgpackRawSample: TypeAlias = Dict[str, Any]
-@dataclass
-class ArrayBytes:
-    """Annotates bytes that should be interpreted as the raw contents of a
-    numpy NDArray"""
+# @dataclass
+# class ArrayBytes:
+#     """Annotates bytes that should be interpreted as the raw contents of a
+#     numpy NDArray"""
-    raw_bytes: bytes
-    """The raw bytes of the corresponding NDArray"""
-    def __init__( self,
-            array: Optional[ArrayLike] = None,
-            raw: Optional[bytes] = None,
-        ):
-        """TODO"""
-        if array is not None:
-            array = np.array( array )
-            self.raw_bytes = eh.array_to_bytes( array )
+#     raw_bytes: bytes
+#     """The raw bytes of the corresponding NDArray"""
+#     def __init__( self,
+#             array: Optional[ArrayLike] = None,
+#             raw: Optional[bytes] = None,
+#         ):
+#         """TODO"""
+#         if array is not None:
+#             array = np.array( array )
+#             self.raw_bytes = eh.array_to_bytes( array )
-        elif raw is not None:
-            self.raw_bytes = raw
+#         elif raw is not None:
+#             self.raw_bytes = raw
-        else:
-            raise ValueError( 'Must provide either `array` or `raw` bytes' )
+#         else:
+#             raise ValueError( 'Must provide either `array` or `raw` bytes' )
-    @property
-    def to_numpy( self ) -> NDArray:
-        """Return the `raw_bytes` data as an NDArray"""
-        return eh.bytes_to_array( self.raw_bytes )
+#     @property
+#     def to_numpy( self ) -> NDArray:
+#         """Return the `raw_bytes` data as an NDArray"""
+#         return eh.bytes_to_array( self.raw_bytes )
 def _make_packable( x ):
-    if isinstance( x, ArrayBytes ):
-        return x.raw_bytes
+    # if isinstance( x, ArrayBytes ):
+    #     return x.raw_bytes
     if isinstance( x, np.ndarray ):
         return eh.array_to_bytes( x )
     return x
@@ -114,8 +114,8 @@ class PackableSample( ABC ):
                     # we're good!
                     pass
-                elif isinstance( var_cur_value, ArrayBytes ):
-                    setattr( self, var_name, var_cur_value.to_numpy )
+                # elif isinstance( var_cur_value, ArrayBytes ):
+                #     setattr( self, var_name, var_cur_value.to_numpy )
                 elif isinstance( var_cur_value, bytes ):
                     setattr( self, var_name, eh.bytes_to_array( var_cur_value ) )
@@ -172,7 +172,7 @@ def _batch_aggregate( xs: Sequence ):
     return list( xs )
-class SamlpeBatch( Generic[DT] ):
+class SampleBatch( Generic[DT] ):
     def __init__( self, samples: Sequence[DT] ):
         """TODO"""
@@ -233,7 +233,7 @@ class Dataset( Generic[ST] ):
     def batch_type( self ) -> Type:
         """The type of a batch built from `sample_class`"""
         # return self.__orig_class__.__args__[1]
-        return SamlpeBatch[self.sample_type]
+        return SampleBatch[self.sample_type]
     # _schema_registry_sample: dict[str, Type]
@@ -396,7 +396,7 @@ class Dataset( Generic[ST] ):
                 value = sample,
             )
-    def wrap_batch( self, batch: WDSRawBatch ) -> SamlpeBatch[ST]:
+    def wrap_batch( self, batch: WDSRawBatch ) -> SampleBatch[ST]:
         """Wrap a `batch` of samples into the appropriate dataset-specific type
         This default implementation simply creates a list one sample at a time
@@ -405,7 +405,7 @@ class Dataset( Generic[ST] ):
         assert 'msgpack' in batch
         batch_unpacked = [ self.sample_type.from_bytes( bs )
                            for bs in batch['msgpack'] ]
-        return SamlpeBatch[self.sample_type]( batch_unpacked )
+        return SampleBatch[self.sample_type]( batch_unpacked )
     # # @classmethod

{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: atdata
-Version: 0.1.1a1
+Version: 0.1.1a3
 Summary: A loose federation of distributed, typed datasets
 Author-email: Maxine Levesque <hello@maxine.science>
 License-File: LICENSE
@@ -11,5 +11,5 @@ Requires-Dist: ormsgpack>=1.11.0
 Requires-Dist: webdataset>=1.0.2
 Description-Content-Type: text/markdown
-# ekumen
+# atdata
 A loose federation of distributed, typed datasets

atdata-0.1.1a3.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,8 @@
+atdata/__init__.py,sha256=VwlLoJkqsXf1XWSzsGGIiuxUluIihR2vHOtYao3w0EY,159
+atdata/_helpers.py,sha256=R63JhXewAKZYnZ9Th7R6yZh0IOUPYGBsth3FpRUMD-U,503
+atdata/dataset.py,sha256=tuph87zUZmSLPIXrHvPxSxdrAknLT_4gKAB4kHTqiZ8,12210
+atdata-0.1.1a3.dist-info/METADATA,sha256=gKjbubI4HoLafCG5p4lsE-1_QMPMaHWZ48TLcIiWKO8,434
+atdata-0.1.1a3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+atdata-0.1.1a3.dist-info/entry_points.txt,sha256=6-iQr1veSTq-ac94bLyfcyGHprrZWevPEd12BWX37tQ,39
+atdata-0.1.1a3.dist-info/licenses/LICENSE,sha256=Pz2eACSxkhsGfW9_iN60pgy-enjnbGTj8df8O3ebnQQ,16726
+atdata-0.1.1a3.dist-info/RECORD,,

atdata-0.1.1a3.dist-info/entry_points.txt ADDED Viewed

@@ -0,0 +1,2 @@
+[console_scripts]
+atdata = atdata:main

atdata-0.1.1a1.dist-info/RECORD DELETED Viewed

@@ -1,8 +0,0 @@
-atdata/__init__.py,sha256=yN07kW_3UcMlYZrM_Jrpy6DMCzTp9kvu2ICcU7n1-5w,52
-atdata/_helpers.py,sha256=CjIvLruNOhHRl1Arse5SahGTmI0Et3BoNqsWC9b8noE,515
-atdata/dataset.py,sha256=mvmCYtL6wD9961qq4lprZSkone56ubTKp3vDgEnWdPI,12158
-atdata-0.1.1a1.dist-info/METADATA,sha256=9-r5DmpN26ZNNMCp21wtOrk1RxTiWCsZ8rVSd-uig6E,434
-atdata-0.1.1a1.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-atdata-0.1.1a1.dist-info/entry_points.txt,sha256=KuQtj4ZAwWLSyJUxhpQEHYfwSG-0ZXuj5hcZ1uAgGRQ,39
-atdata-0.1.1a1.dist-info/licenses/LICENSE,sha256=Pz2eACSxkhsGfW9_iN60pgy-enjnbGTj8df8O3ebnQQ,16726
-atdata-0.1.1a1.dist-info/RECORD,,

atdata-0.1.1a1.dist-info/entry_points.txt DELETED Viewed

@@ -1,2 +0,0 @@
-[console_scripts]
-ekumen = atdata:main

{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/WHEEL RENAMED Viewed

File without changes

{atdata-0.1.1a1.dist-info → atdata-0.1.1a3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

atdata 0.1.1a1__py3-none-any.whl → 0.1.1a3__py3-none-any.whl

atdata 0.1.1a1__py3-none-any.whl → 0.1.1a3__py3-none-any.whl