PyPI - xarray_sql - Versions diffs - 0.2.1__tar.gz → 0.2.3__tar.gz - Mend

xarray_sql 0.2.1tar.gz → 0.2.3tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/.gitignore +2 -0
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/Cargo.lock +1 -1
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/Cargo.toml +1 -1
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/PKG-INFO +112 -58
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/README.md +102 -57
xarray_sql-0.2.3/docs/assets/logo.svg +104 -0
xarray_sql-0.2.3/docs/contributing.md +1 -0
xarray_sql-0.2.3/docs/examples.md +93 -0
xarray_sql-0.2.3/docs/index.md +1 -0
xarray_sql-0.2.3/docs/reference/xarray_sql.md +8 -0
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/pyproject.toml +23 -6
xarray_sql-0.2.3/tests/__init__.py +0 -0
xarray_sql-0.2.3/tests/conftest.py +150 -0
xarray_sql-0.2.3/tests/test_cft.py +170 -0
xarray_sql-0.2.3/tests/test_df.py +443 -0
xarray_sql-0.2.3/tests/test_reader.py +1377 -0
xarray_sql-0.2.3/tests/test_sql.py +439 -0
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/xarray_sql/__init__.py +2 -0
xarray_sql-0.2.3/xarray_sql/cftime.py +248 -0
xarray_sql-0.2.3/xarray_sql/core.py +49 -0
xarray_sql-0.2.3/xarray_sql/df.py +447 -0
xarray_sql-0.2.3/xarray_sql/reader.py +305 -0
xarray_sql-0.2.3/xarray_sql/sql.py +129 -0
xarray_sql-0.2.3/zensical.toml +122 -0
xarray_sql-0.2.1/xarray_sql/core.py +0 -49
xarray_sql-0.2.1/xarray_sql/df.py +0 -378
xarray_sql-0.2.1/xarray_sql/df_test.py +0 -489
xarray_sql-0.2.1/xarray_sql/reader.py +0 -298
xarray_sql-0.2.1/xarray_sql/reader_test.py +0 -1372
xarray_sql-0.2.1/xarray_sql/sql.py +0 -18
xarray_sql-0.2.1/xarray_sql/sql_test.py +0 -194
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/LICENSE +0 -0
{xarray_sql-0.2.1 → xarray_sql-0.2.3}/src/lib.rs +0 -0

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/.gitignore RENAMED Viewed

@@ -12,3 +12,5 @@ test_data
 .chainlink
 .claude
 CHANGELOG.md
+*.ipynb
+/site

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/Cargo.lock RENAMED Viewed

@@ -3375,7 +3375,7 @@ checksum = "ea2f10b9bb0928dfb1b42b65e1f9e36f7f54dbdf08457afefb38afcdec4fa2bb"
 [[package]]
 name = "xarray_sql"
-version = "0.2.1"
+version = "0.2.3"
 dependencies = [
  "arrow",
  "async-stream",

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/Cargo.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [package]
 name = "xarray_sql"
-version = "0.2.1"
+version = "0.2.3"
 authors = ["Alex Merose"]
 edition = "2021"
 exclude = [

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: xarray_sql
-Version: 0.2.1
+Version: 0.2.3
 Classifier: Development Status :: 4 - Beta
 Classifier: Intended Audience :: Science/Research
 Classifier: Intended Audience :: Developers
@@ -19,9 +19,18 @@ Classifier: Topic :: Database :: Front-Ends
 Requires-Dist: dask>=2024.8.0
 Requires-Dist: datafusion==52.0.0
 Requires-Dist: xarray>=2024.7.0
+Requires-Dist: xarray-sql[docs] ; extra == 'dev'
+Requires-Dist: pre-commit ; extra == 'dev'
+Requires-Dist: pytest ; extra == 'dev'
+Requires-Dist: watchfiles ; extra == 'dev'
+Requires-Dist: zensical ; extra == 'docs'
+Requires-Dist: mkdocstrings[python] ; extra == 'docs'
+Requires-Dist: cftime ; extra == 'test'
 Requires-Dist: pytest ; extra == 'test'
 Requires-Dist: xarray[io] ; extra == 'test'
 Requires-Dist: gcsfs ; extra == 'test'
+Provides-Extra: dev
+Provides-Extra: docs
 Provides-Extra: test
 License-File: LICENSE
 Summary: Query Xarray with SQL.
@@ -53,52 +62,97 @@ This is an experiment to provide a SQL interface for array datasets.
 import xarray as xr
 import xarray_sql as xql
-ds = xr.tutorial.open_dataset('air_temperature')
-# The same as a dask-sql Context; i.e. an Apache DataFusion Context.
+# Open a year of ARCO-ERA5 — all 273 variables. Selecting a year up front
+# keeps Dask's partition setup cheap before any chunks are read from GCS.
+ds = (
+  xr.open_zarr('gs://gcp-public-data-arco-era5/ar/full_37-1h-0p25deg-chunk-1.zarr-v3',
+               chunks=dict(time=1),
+               storage_options={'token': 'anon'})  # Anonymous read from the public GCS bucket — no auth required.
+  .sel(time='2020')
+)
 ctx = xql.XarrayContext()
-ctx.from_dataset('air', ds, chunks=dict(time=24))  # the dataset needs to be chunked!
-# data is only materialized when we make a query.
-result = ctx.sql('''
-  SELECT
-    "lat", "lon", AVG("air") as air_avg
-  FROM
-    "air"
-  GROUP BY
-   "lat", "lon"
-''')
-# DataFrame()
-# +------+-------+--------------------+
-# | lat  | lon   | air_avg            |
-# +------+-------+--------------------+
-# | 75.0 | 205.0 | 259.88662671232834 |
-# | 75.0 | 207.5 | 259.48268150684896 |
-# | 75.0 | 230.0 | 258.9192123287667  |
-# | 75.0 | 275.0 | 257.07574315068456 |
-# | 75.0 | 322.5 | 250.11792123287654 |
-# | 75.0 | 325.0 | 250.81590068493134 |
-# | 72.5 | 205.0 | 262.74933904109537 |
-# | 72.5 | 207.5 | 262.5384315068488  |
-# | 72.5 | 230.0 | 260.82879452054743 |
-# | 72.5 | 275.0 | 257.3063321917804  |
-# +------+-------+--------------------+
-# Data truncated.
-# The full query is only made when we call `collect()`, or, in this case,
-# `to_pandas()`.
-df = result.to_pandas()
-df.head()
-#     lat    lon     air_avg
-# 0  75.0  232.5  258.836188
-# 1  75.0  247.5  257.716171
-# 2  75.0  262.5  257.347959
-# 3  75.0  277.5  257.671308
-# 4  72.5  232.5  260.654401
+ctx.from_dataset('era5', ds, table_names={
+    ('time', 'latitude', 'longitude'): 'surface',
+    ('time', 'level', 'latitude', 'longitude'): 'atmosphere',
+})
+# Registration: ~0.5s for a full year of hourly ERA5, all variables.
+# Heads up: ARCO-ERA5 has 262 surface + 11 atmospheric variables. The library
+# pushes column projection down to Zarr, so SELECT only fetches what you ask
+# for — but `SELECT * FROM era5.surface` would try to pull every variable
+# across the year (terabytes from GCS).
+#  ---> Always SELECT specific columns. <---
+# Average 2m-temperature over NYC on the morning of 2020-01-01. The library
+# pushes WHERE clauses on dimension columns down to partition pruning.
+ctx.sql('''
+  SELECT AVG("2m_temperature") - 273.15 AS avg_c
+  FROM era5.surface
+  WHERE time BETWEEN TIMESTAMP '2020-01-01'
+                 AND TIMESTAMP '2020-01-01 05:00:00'
+    AND latitude  BETWEEN 39 AND 40
+    AND longitude BETWEEN 286 AND 287  -- ERA5 uses 0-360 longitudes
+''').to_pandas()
+#       avg_c
+# 0  8.640069
+# Average temperature per pressure level, globally.
+ctx.sql('''
+  SELECT level, AVG(temperature) - 273.15 AS avg_c
+  FROM era5.atmosphere
+  WHERE time BETWEEN TIMESTAMP '2020-01-01'
+                 AND TIMESTAMP '2020-01-01 05:00:00'
+  GROUP BY level
+  ORDER BY level DESC
+''').to_pandas()
+#     level      avg_c
+# 0    1000   6.621012   ← surface
+# 1     975   5.185638
+# 2     950   4.028429
+# 3     925   3.082812
+# 4     900   2.210917
+# 5     875   1.395018
+# 6     850   0.634267
+# 7     825  -0.210372
+# 8     800  -1.181075
+# 9     775  -2.306465
+# 10    750  -3.535534
+# 11    700  -6.241685
+# 12    650  -9.236364
+# 13    600 -12.580938
+# 14    550 -16.335386
+# 15    500 -20.643604
+# 16    450 -25.573401
+# 17    400 -31.156920
+# 18    350 -37.400552
+# 19    300 -43.852607
+# 20    250 -49.322132
+# 21    225 -51.569113
+# 22    200 -53.693248
+# 23    175 -55.890484
+# 24    150 -58.382290
+# 25    125 -61.091916
+# 26    100 -63.624885   ← tropopause
+# 27     70 -63.182300
+# 28     50 -60.124845
+# 29     30 -55.986327
+# 30     20 -52.433089
+# 31     10 -44.140750
+# 32      7 -38.707350
+# 33      5 -32.621999
+# 34      3 -21.509175
+# 35      2 -13.355764
+# 36      1  -9.020513   ← top of atmosphere
 ```
-Succinctly, we "pivot" Xarray Datasets (with consistent dimensions) to treat them like tables so we can run
-SQL queries against them.
+_(A runnable version of this example lives at
+[`perf_tests/era5_temp_profile.py`](perf_tests/era5_temp_profile.py).)_
+Succinctly, we "pivot" Xarray Datasets to treat them like tables so we can run
+SQL queries against them.
 ## Why build this?
@@ -128,11 +182,11 @@ That's it!
 _2025 update_: This library now implements a Dask-like `from_map` interface in
 pure DataFusion and PyArrow, but works with the same principle!
-_2026 update_: Instead of `from_map()`, we make factory functions from blocks of
-Xarray datasets that return RecordBatchReaders. These feed into a Rust-based
-DataFusion `TableProvider`. Every chunk is uses the Arrow in memory format to
-translate between Python and Rust. Even still, the core of what makes this idea
-work is the core `pivot()` operation from where this project began!
+_2026 update_: Instead of `from_map()`, we create a way to translate Xarray chunks
+into Arrow RecordBatches. We pass a Python callback into a DataFusion `TableProvider`
+that lets the DB engine translate the underlying Dataset arrays into DataFusion partitions.
+Ultimately, the initial insight of the `pivot()` function -- that any ndarray can be
+translated into a 2D table -- underlies this performant query mechanism.
 ## Why does this work?
@@ -150,11 +204,6 @@ early users – "tire kickers", if you will. We'd love your input to shape the d
 project! Please, give this a try and [file issues](https://github.com/alxmrs/xarray-sql/issues) as
 you see fit. Check out our [contributing guide](CONTRIBUTING.md), too 😉.
-I can say that for now, the library is oriented towards making whole scans of
-Xarray Datasets. Common filter optimizations (even basic ones like an `.sel()` on
-core dimensions, let alone predicate push downs) are not fully implemented yet.
-However, these operations and more are on our roadmap.
 ## What would a deeper integration look like?
 I have a few ideas so far. One approach involves applying operations directly on
@@ -169,18 +218,21 @@ and BigQuery. More thoughts on this
 in [#4](https://github.com/alxmrs/xarray-sql/issues/4).
 _2025 update_: Something like this is being built across a few projects! The ones I know about are:
 - [CartoDB's Raquet](https://github.com/CartoDB/raquet)
 - The DataFusion community's [arrow-zarr](https://github.com/datafusion-contrib/arrow-zarr)
-As of writing, this project is [amid integrating](https://github.com/alxmrs/xarray-sql/pull/69) a
-rust-based DataFusion backend provided by arrow-zarr.
+_2026 update_: A colleague and I are experimenting with native Zarr RDBMS engines. Check out:
+- [Zarr-Datafusion](https://lib.rs/crates/zarr-datafusion)
+- [DuckDB-Zarr](https://github.com/hobbes-bot/duckdb-zarr)
 ## Roadmap
 - [x] ~Lazy evaluation via the pyarrow Dataset interface [#93](https://github.com/alxmrs/xarray-sql/issues/93).~ _Implemented in [#100](https://github.com/alxmrs/xarray-sql/pull/100)_
-- [ ] Support proper parallelism via proper partition handling on the rust/datafusion side. [#106](https://github.com/alxmrs/xarray-sql/issues/106)
-- [ ] Support core datafusion optimizations to scan less data, like [104](https://github.com/alxmrs/xarray-sql/issues/104), ...
-- [ ] Translate a single Zarr to a collection of tables via DataFusion's catalog interface [#85](https://github.com/alxmrs/xarray-sql/issues/85).
+- [x] Support proper parallelism via proper partition handling on the rust/datafusion side. [#106](https://github.com/alxmrs/xarray-sql/issues/106)
+- [x] Support core datafusion optimizations to scan less data, like [#104](https://github.com/alxmrs/xarray-sql/issues/104), ...
+- [ ] Translate a single Zarr to a collection of tables [#85](https://github.com/alxmrs/xarray-sql/issues/85).
 - [ ] Distributed beyond a single node through the DataFusion integration with Ray Datasets [#68](https://github.com/alxmrs/xarray-sql/issues/68) or Apache Ballista [#98](https://github.com/alxmrs/xarray-sql/issues/98).
 - [ ] Demo: calculate Sea Surface Temperature from 1940 - Present in SQL [#36](https://github.com/alxmrs/xarray-sql/issues/36).
 - [ ] Provide an option to integrate DataFusion directly to Zarr via Rust [#4](https://github.com/alxmrs/xarray-sql/issues/4).
@@ -200,6 +252,8 @@ I want to give a special thanks to the following folks and institutions:
   and DataFusion-specific collaboration.
 - The gracious volunteer data science students at [UCSD's DS3](https://www.ds3atucsd.com/) org,
   who are working to make this library better.
+- Andrew Huang for the sense of taste he brings to the project and consummate code
+  changes.
 ## License

{xarray_sql-0.2.1 → xarray_sql-0.2.3}/README.md RENAMED Viewed

@@ -19,52 +19,97 @@ This is an experiment to provide a SQL interface for array datasets.
 import xarray as xr
 import xarray_sql as xql
-ds = xr.tutorial.open_dataset('air_temperature')
-# The same as a dask-sql Context; i.e. an Apache DataFusion Context.
+# Open a year of ARCO-ERA5 — all 273 variables. Selecting a year up front
+# keeps Dask's partition setup cheap before any chunks are read from GCS.
+ds = (
+  xr.open_zarr('gs://gcp-public-data-arco-era5/ar/full_37-1h-0p25deg-chunk-1.zarr-v3',
+               chunks=dict(time=1),
+               storage_options={'token': 'anon'})  # Anonymous read from the public GCS bucket — no auth required.
+  .sel(time='2020')
+)
 ctx = xql.XarrayContext()
-ctx.from_dataset('air', ds, chunks=dict(time=24))  # the dataset needs to be chunked!
-# data is only materialized when we make a query.
-result = ctx.sql('''
-  SELECT
-    "lat", "lon", AVG("air") as air_avg
-  FROM
-    "air"
-  GROUP BY
-   "lat", "lon"
-''')
-# DataFrame()
-# +------+-------+--------------------+
-# | lat  | lon   | air_avg            |
-# +------+-------+--------------------+
-# | 75.0 | 205.0 | 259.88662671232834 |
-# | 75.0 | 207.5 | 259.48268150684896 |
-# | 75.0 | 230.0 | 258.9192123287667  |
-# | 75.0 | 275.0 | 257.07574315068456 |
-# | 75.0 | 322.5 | 250.11792123287654 |
-# | 75.0 | 325.0 | 250.81590068493134 |
-# | 72.5 | 205.0 | 262.74933904109537 |
-# | 72.5 | 207.5 | 262.5384315068488  |
-# | 72.5 | 230.0 | 260.82879452054743 |
-# | 72.5 | 275.0 | 257.3063321917804  |
-# +------+-------+--------------------+
-# Data truncated.
-# The full query is only made when we call `collect()`, or, in this case,
-# `to_pandas()`.
-df = result.to_pandas()
-df.head()
-#     lat    lon     air_avg
-# 0  75.0  232.5  258.836188
-# 1  75.0  247.5  257.716171
-# 2  75.0  262.5  257.347959
-# 3  75.0  277.5  257.671308
-# 4  72.5  232.5  260.654401
+ctx.from_dataset('era5', ds, table_names={
+    ('time', 'latitude', 'longitude'): 'surface',
+    ('time', 'level', 'latitude', 'longitude'): 'atmosphere',
+})
+# Registration: ~0.5s for a full year of hourly ERA5, all variables.
+# Heads up: ARCO-ERA5 has 262 surface + 11 atmospheric variables. The library
+# pushes column projection down to Zarr, so SELECT only fetches what you ask
+# for — but `SELECT * FROM era5.surface` would try to pull every variable
+# across the year (terabytes from GCS).
+#  ---> Always SELECT specific columns. <---
+# Average 2m-temperature over NYC on the morning of 2020-01-01. The library
+# pushes WHERE clauses on dimension columns down to partition pruning.
+ctx.sql('''
+  SELECT AVG("2m_temperature") - 273.15 AS avg_c
+  FROM era5.surface
+  WHERE time BETWEEN TIMESTAMP '2020-01-01'
+                 AND TIMESTAMP '2020-01-01 05:00:00'
+    AND latitude  BETWEEN 39 AND 40
+    AND longitude BETWEEN 286 AND 287  -- ERA5 uses 0-360 longitudes
+''').to_pandas()
+#       avg_c
+# 0  8.640069
+# Average temperature per pressure level, globally.
+ctx.sql('''
+  SELECT level, AVG(temperature) - 273.15 AS avg_c
+  FROM era5.atmosphere
+  WHERE time BETWEEN TIMESTAMP '2020-01-01'
+                 AND TIMESTAMP '2020-01-01 05:00:00'
+  GROUP BY level
+  ORDER BY level DESC
+''').to_pandas()
+#     level      avg_c
+# 0    1000   6.621012   ← surface
+# 1     975   5.185638
+# 2     950   4.028429
+# 3     925   3.082812
+# 4     900   2.210917
+# 5     875   1.395018
+# 6     850   0.634267
+# 7     825  -0.210372
+# 8     800  -1.181075
+# 9     775  -2.306465
+# 10    750  -3.535534
+# 11    700  -6.241685
+# 12    650  -9.236364
+# 13    600 -12.580938
+# 14    550 -16.335386
+# 15    500 -20.643604
+# 16    450 -25.573401
+# 17    400 -31.156920
+# 18    350 -37.400552
+# 19    300 -43.852607
+# 20    250 -49.322132
+# 21    225 -51.569113
+# 22    200 -53.693248
+# 23    175 -55.890484
+# 24    150 -58.382290
+# 25    125 -61.091916
+# 26    100 -63.624885   ← tropopause
+# 27     70 -63.182300
+# 28     50 -60.124845
+# 29     30 -55.986327
+# 30     20 -52.433089
+# 31     10 -44.140750
+# 32      7 -38.707350
+# 33      5 -32.621999
+# 34      3 -21.509175
+# 35      2 -13.355764
+# 36      1  -9.020513   ← top of atmosphere
 ```
-Succinctly, we "pivot" Xarray Datasets (with consistent dimensions) to treat them like tables so we can run
-SQL queries against them.
+_(A runnable version of this example lives at
+[`perf_tests/era5_temp_profile.py`](perf_tests/era5_temp_profile.py).)_
+Succinctly, we "pivot" Xarray Datasets to treat them like tables so we can run
+SQL queries against them.
 ## Why build this?
@@ -94,11 +139,11 @@ That's it!
 _2025 update_: This library now implements a Dask-like `from_map` interface in
 pure DataFusion and PyArrow, but works with the same principle!
-_2026 update_: Instead of `from_map()`, we make factory functions from blocks of
-Xarray datasets that return RecordBatchReaders. These feed into a Rust-based
-DataFusion `TableProvider`. Every chunk is uses the Arrow in memory format to
-translate between Python and Rust. Even still, the core of what makes this idea
-work is the core `pivot()` operation from where this project began!
+_2026 update_: Instead of `from_map()`, we create a way to translate Xarray chunks
+into Arrow RecordBatches. We pass a Python callback into a DataFusion `TableProvider`
+that lets the DB engine translate the underlying Dataset arrays into DataFusion partitions.
+Ultimately, the initial insight of the `pivot()` function -- that any ndarray can be
+translated into a 2D table -- underlies this performant query mechanism.
 ## Why does this work?
@@ -116,11 +161,6 @@ early users – "tire kickers", if you will. We'd love your input to shape the d
 project! Please, give this a try and [file issues](https://github.com/alxmrs/xarray-sql/issues) as
 you see fit. Check out our [contributing guide](CONTRIBUTING.md), too 😉.
-I can say that for now, the library is oriented towards making whole scans of
-Xarray Datasets. Common filter optimizations (even basic ones like an `.sel()` on
-core dimensions, let alone predicate push downs) are not fully implemented yet.
-However, these operations and more are on our roadmap.
 ## What would a deeper integration look like?
 I have a few ideas so far. One approach involves applying operations directly on
@@ -135,18 +175,21 @@ and BigQuery. More thoughts on this
 in [#4](https://github.com/alxmrs/xarray-sql/issues/4).
 _2025 update_: Something like this is being built across a few projects! The ones I know about are:
 - [CartoDB's Raquet](https://github.com/CartoDB/raquet)
 - The DataFusion community's [arrow-zarr](https://github.com/datafusion-contrib/arrow-zarr)
-As of writing, this project is [amid integrating](https://github.com/alxmrs/xarray-sql/pull/69) a
-rust-based DataFusion backend provided by arrow-zarr.
+_2026 update_: A colleague and I are experimenting with native Zarr RDBMS engines. Check out:
+- [Zarr-Datafusion](https://lib.rs/crates/zarr-datafusion)
+- [DuckDB-Zarr](https://github.com/hobbes-bot/duckdb-zarr)
 ## Roadmap
 - [x] ~Lazy evaluation via the pyarrow Dataset interface [#93](https://github.com/alxmrs/xarray-sql/issues/93).~ _Implemented in [#100](https://github.com/alxmrs/xarray-sql/pull/100)_
-- [ ] Support proper parallelism via proper partition handling on the rust/datafusion side. [#106](https://github.com/alxmrs/xarray-sql/issues/106)
-- [ ] Support core datafusion optimizations to scan less data, like [104](https://github.com/alxmrs/xarray-sql/issues/104), ...
-- [ ] Translate a single Zarr to a collection of tables via DataFusion's catalog interface [#85](https://github.com/alxmrs/xarray-sql/issues/85).
+- [x] Support proper parallelism via proper partition handling on the rust/datafusion side. [#106](https://github.com/alxmrs/xarray-sql/issues/106)
+- [x] Support core datafusion optimizations to scan less data, like [#104](https://github.com/alxmrs/xarray-sql/issues/104), ...
+- [ ] Translate a single Zarr to a collection of tables [#85](https://github.com/alxmrs/xarray-sql/issues/85).
 - [ ] Distributed beyond a single node through the DataFusion integration with Ray Datasets [#68](https://github.com/alxmrs/xarray-sql/issues/68) or Apache Ballista [#98](https://github.com/alxmrs/xarray-sql/issues/98).
 - [ ] Demo: calculate Sea Surface Temperature from 1940 - Present in SQL [#36](https://github.com/alxmrs/xarray-sql/issues/36).
 - [ ] Provide an option to integrate DataFusion directly to Zarr via Rust [#4](https://github.com/alxmrs/xarray-sql/issues/4).
@@ -166,6 +209,8 @@ I want to give a special thanks to the following folks and institutions:
   and DataFusion-specific collaboration.
 - The gracious volunteer data science students at [UCSD's DS3](https://www.ds3atucsd.com/) org,
   who are working to make this library better.
+- Andrew Huang for the sense of taste he brings to the project and consummate code
+  changes.
 ## License

xarray_sql-0.2.3/docs/assets/logo.svg ADDED Viewed

@@ -0,0 +1,104 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<svg
+   version="1.1"
+   x="0px"
+   y="0px"
+   viewBox="50 115 420 395"
+   xml:space="preserve"
+   id="svg6"
+   sodipodi:docname="logo.svg"
+   inkscape:version="1.3.2 (091e20e, 2023-11-25)"
+   xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
+   xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
+   xmlns="http://www.w3.org/2000/svg"
+   xmlns:svg="http://www.w3.org/2000/svg"><defs
+   id="defs6" /><sodipodi:namedview
+   id="namedview6"
+   pagecolor="#ffffff"
+   bordercolor="#000000"
+   borderopacity="0.25"
+   inkscape:showpageshadow="2"
+   inkscape:pageopacity="0.0"
+   inkscape:pagecheckerboard="0"
+   inkscape:deskcolor="#d1d1d1"
+   showguides="false"
+   inkscape:zoom="0.59746835"
+   inkscape:cx="76.154661"
+   inkscape:cy="63.601695"
+   inkscape:window-width="1320"
+   inkscape:window-height="905"
+   inkscape:window-x="181"
+   inkscape:window-y="34"
+   inkscape:window-maximized="0"
+   inkscape:current-layer="g6" />
+<style
+   type="text/css"
+   id="style1">
+	.st0{fill:#216C89;}
+	.st1{fill:#4993AA;}
+	.st2{fill:#0F4565;}
+	.st3{fill:#6BE8E8;}
+	.st4{fill:#9DEEF4;}
+	.st5{fill:#4ACFDD;}
+	.st6{fill:#E38017;}
+	.st7{fill:#16AFB5;}
+</style>
+<g
+   id="g6">
+	<!-- BOTTOM DATABASE (dark) -->
+	<path
+   class="st2"
+   d="m 65,362.92813 c 0,0 0,96.42499 0,96.42499 0,17.9075 70,27.55 112,27.55 42,0 112,-9.6425 112,-27.55 v -96.42499 c 0,17.90749 -70,27.54999 -112,27.54999 -42,0 -112,-9.6425 -112,-27.54999 z"
+   id="path1"
+   style="stroke-width:0.82991" />
+	<path
+   class="st0"
+   d="m 177,390.47812 c 42,0 112,-9.6425 112,-27.54999 v 96.42499 c 0,17.9075 -70,27.55 -112,27.55 z"
+   opacity="0.4"
+   id="path2"
+   style="stroke-width:0.82991" />
+	<!-- TOP DATABASE (teal) -->
+	<path
+   class="st5"
+   d="m 65,276.83438 c 0,0 0,75.76249 0,75.76249 0,17.90751 70,27.55001 112,27.55001 42,0 112,-9.6425 112,-27.55001 v -75.76249 c 0,17.90749 -70,27.54999 -112,27.54999 -42,0 -112,-9.6425 -112,-27.54999 z"
+   id="path3"
+   style="stroke-width:0.82991" />
+	<path
+   class="st3"
+   d="m 177,304.38437 c 42,0 112,-9.6425 112,-27.54999 v 75.76249 c 0,17.90751 -70,27.55001 -112,27.55001 z"
+   opacity="0.4"
+   id="path4"
+   style="stroke-width:0.82991" />
+	<path
+   class="st5"
+   d="m 66.576,190.40937 c 0,0 0,75.7625 0,75.7625 0,17.90751 70,27.55 112,27.55 42,0 112,-9.64249 112,-27.55 v -75.7625 c 0,17.9075 -70,27.55 -112,27.55 -42,0 -112,-9.6425 -112,-27.55 z"
+   id="path3-5"
+   style="fill:#4acfdd;stroke-width:0.82991" /><path
+   class="st3"
+   d="m 178.576,217.95937 c 42,0 112,-9.6425 112,-27.55 v 75.7625 c 0,17.90751 -70,27.55 -112,27.55 z"
+   opacity="0.4"
+   id="path4-7"
+   style="fill:#6be8e8;stroke-width:0.82991" /><ellipse
+   class="st4"
+   cx="178.576"
+   cy="183.52188"
+   rx="112"
+   ry="27.549999"
+   id="ellipse4-5"
+   style="fill:#9deef4;stroke-width:0.82991" />
+	<!-- DIAGONAL BARS -->
+	<polygon
+   class="st6"
+   points="377.48,412.74 308.66,482.2 308.66,346.56 377.48,277.09"
+   id="polygon5" />
+	<polygon
+   class="st7"
+   points="457.07,412.74 388.25,482.2 388.25,346.56 457.07,277.09"
+   id="polygon6" />
+</g>
+</svg>

xarray_sql-0.2.3/docs/contributing.md ADDED Viewed

@@ -0,0 +1 @@
+--8<-- "CONTRIBUTING.md"

xarray_sql 0.2.1__tar.gz → 0.2.3__tar.gz

xarray_sql 0.2.1tar.gz → 0.2.3tar.gz