PyPI - kindling-rec - Versions diffs - 1.0.1__tar.gz - Mend

kindling-rec 1.0.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68) hide show

kindling_rec-1.0.1/LICENSE +17 -0
kindling_rec-1.0.1/PKG-INFO +179 -0
kindling_rec-1.0.1/README.md +136 -0
kindling_rec-1.0.1/native/Cargo.lock +1161 -0
kindling_rec-1.0.1/native/Cargo.toml +34 -0
kindling_rec-1.0.1/native/kindling_core/Cargo.toml +36 -0
kindling_rec-1.0.1/native/kindling_core/src/engine/channels.rs +107 -0
kindling_rec-1.0.1/native/kindling_core/src/engine/mod.rs +20 -0
kindling_rec-1.0.1/native/kindling_core/src/engine/native_state.rs +711 -0
kindling_rec-1.0.1/native/kindling_core/src/engine/recommend.rs +155 -0
kindling_rec-1.0.1/native/kindling_core/src/lib.rs +33 -0
kindling_rec-1.0.1/native/kindling_core/src/loaders/mod.rs +32 -0
kindling_rec-1.0.1/native/kindling_core/src/repeat/mod.rs +23 -0
kindling_rec-1.0.1/native/kindling_core/src/repeat/multiplier.rs +271 -0
kindling_rec-1.0.1/native/kindling_core/src/repeat/period.rs +173 -0
kindling_rec-1.0.1/native/kindling_core/src/repeat/profile.rs +97 -0
kindling_rec-1.0.1/native/kindling_core/src/score/calibrator.rs +375 -0
kindling_rec-1.0.1/native/kindling_core/src/score/layered.rs +251 -0
kindling_rec-1.0.1/native/kindling_core/src/score/mod.rs +23 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/cooc_transform.rs +66 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/cooccurrence.rs +341 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/directional_cooc.rs +272 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/ease.rs +249 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/metadata_knn.rs +137 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/mod.rs +29 -0
kindling_rec-1.0.1/native/kindling_core/src/signals/session_cooccurrence.rs +193 -0
kindling_rec-1.0.1/pyproject.toml +159 -0
kindling_rec-1.0.1/src/kindling/__init__.py +25 -0
kindling_rec-1.0.1/src/kindling/_native.py +34 -0
kindling_rec-1.0.1/src/kindling/_native_engine.py +155 -0
kindling_rec-1.0.1/src/kindling/activation.py +151 -0
kindling_rec-1.0.1/src/kindling/benchmarks/__init__.py +6 -0
kindling_rec-1.0.1/src/kindling/benchmarks/baselines.py +199 -0
kindling_rec-1.0.1/src/kindling/benchmarks/comparison.py +209 -0
kindling_rec-1.0.1/src/kindling/benchmarks/metrics.py +42 -0
kindling_rec-1.0.1/src/kindling/benchmarks/parity.py +51 -0
kindling_rec-1.0.1/src/kindling/blend/__init__.py +7 -0
kindling_rec-1.0.1/src/kindling/blend/layer_scoring.py +166 -0
kindling_rec-1.0.1/src/kindling/engine.py +1865 -0
kindling_rec-1.0.1/src/kindling/explain/__init__.py +5 -0
kindling_rec-1.0.1/src/kindling/explain/templates.py +53 -0
kindling_rec-1.0.1/src/kindling/graph/__init__.py +5 -0
kindling_rec-1.0.1/src/kindling/graph/cooc_transform.py +81 -0
kindling_rec-1.0.1/src/kindling/graph/item_graph.py +155 -0
kindling_rec-1.0.1/src/kindling/graph/metadata_smoothing.py +223 -0
kindling_rec-1.0.1/src/kindling/ingest/__init__.py +16 -0
kindling_rec-1.0.1/src/kindling/ingest/contract.py +140 -0
kindling_rec-1.0.1/src/kindling/ingest/sessions.py +216 -0
kindling_rec-1.0.1/src/kindling/item_features.py +324 -0
kindling_rec-1.0.1/src/kindling/lifecycle/__init__.py +17 -0
kindling_rec-1.0.1/src/kindling/lifecycle/decay.py +96 -0
kindling_rec-1.0.1/src/kindling/loaders/__init__.py +33 -0
kindling_rec-1.0.1/src/kindling/loaders/_base.py +48 -0
kindling_rec-1.0.1/src/kindling/loaders/amazon.py +142 -0
kindling_rec-1.0.1/src/kindling/loaders/amazon_chrono.py +106 -0
kindling_rec-1.0.1/src/kindling/loaders/dunnhumby.py +114 -0
kindling_rec-1.0.1/src/kindling/loaders/gowalla.py +144 -0
kindling_rec-1.0.1/src/kindling/loaders/instacart.py +141 -0
kindling_rec-1.0.1/src/kindling/loaders/movielens.py +172 -0
kindling_rec-1.0.1/src/kindling/loaders/retailrocket.py +151 -0
kindling_rec-1.0.1/src/kindling/loaders/steam.py +103 -0
kindling_rec-1.0.1/src/kindling/loaders/synthetic.py +163 -0
kindling_rec-1.0.1/src/kindling/loaders/tafeng.py +117 -0
kindling_rec-1.0.1/src/kindling/loaders/yelp.py +136 -0
kindling_rec-1.0.1/src/kindling/persist.py +76 -0
kindling_rec-1.0.1/src/kindling/preprocess.py +134 -0
kindling_rec-1.0.1/src/kindling/serving.py +191 -0
kindling_rec-1.0.1/src/kindling/serving_app.py +79 -0

kindling_rec-1.0.1/LICENSE ADDED Viewed

@@ -0,0 +1,17 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+Copyright 2026 Robert Hoekstra (Awry Labs)
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.

kindling_rec-1.0.1/PKG-INFO ADDED Viewed

@@ -0,0 +1,179 @@
+Metadata-Version: 2.4
+Name: kindling-rec
+Version: 1.0.1
+Classifier: Development Status :: 5 - Production/Stable
+Classifier: License :: OSI Approved :: Apache Software License
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Dist: numpy>=1.26
+Requires-Dist: pandas>=2.1
+Requires-Dist: scipy>=1.11
+Requires-Dist: implicit>=0.7 ; extra == 'baselines'
+Requires-Dist: requests>=2.31 ; extra == 'bench'
+Requires-Dist: tqdm>=4.66 ; extra == 'bench'
+Requires-Dist: matplotlib>=3.8 ; extra == 'bench'
+Requires-Dist: pytest>=8.0 ; extra == 'dev'
+Requires-Dist: pytest-cov>=5.0 ; extra == 'dev'
+Requires-Dist: hypothesis>=6.100 ; extra == 'dev'
+Requires-Dist: ruff>=0.5 ; extra == 'dev'
+Requires-Dist: mypy>=1.11 ; extra == 'dev'
+Requires-Dist: pandas-stubs ; extra == 'dev'
+Requires-Dist: types-toml ; extra == 'dev'
+Requires-Dist: umap-learn>=0.5 ; extra == 'personas'
+Requires-Dist: hdbscan>=0.8 ; extra == 'personas'
+Requires-Dist: scikit-learn>=1.3 ; extra == 'personas'
+Requires-Dist: fastapi>=0.110 ; extra == 'serve'
+Requires-Dist: uvicorn>=0.29 ; extra == 'serve'
+Provides-Extra: baselines
+Provides-Extra: bench
+Provides-Extra: dev
+Provides-Extra: personas
+Provides-Extra: serve
+License-File: LICENSE
+Summary: A hybrid recommender system that grows with your data
+Author-email: Robert Hoekstra <rhoekstr@gmail.com>
+License-Expression: Apache-2.0
+Requires-Python: >=3.11
+Description-Content-Type: text/markdown; charset=UTF-8; variant=GFM
+Project-URL: Homepage, https://github.com/rhoekstr/kindling
+Project-URL: Issues, https://github.com/rhoekstr/kindling/issues
+# kindling
+A hybrid recommender that grows with your data — closed-form, no training
+loop, no GPU. One fused base score per (user, item) built from EASE /
+wilson-cooccurrence plus auto-gated z-normalized channels (trend,
+last-item, transitions, user-CF), with a Rust core for the numerics.
+**Design goals (learned the hard way — see [`docs/EXPERIMENTS.md`](docs/EXPERIMENTS.md)):**
+1. **A wheel that imports is a wheel that works.** numpy / pandas / scipy
+   only; the linear algebra that matters (the EASE inversion) runs on a
+   pure-Rust core (`kindling_core`). No PyTorch, no BLAS system deps.
+2. **Closed-form shallow models, gated per dataset, beat speculative
+   complexity.** Every channel is closed-form or a counting statistic;
+   every channel is activated by a measurable property of the data; every
+   gate exists because the ungated version measurably hurt somewhere.
+## Install
+```bash
+pip install kindling-rec           # from PyPI
+pip install -e ".[dev]"            # dev / from source
+pip install -e ".[dev,bench]"      # + benchmark harness
+```
+## Quickstart
+```python
+from kindling import Engine
+from kindling.loaders import movielens
+interactions = movielens.load_1m()       # entity_id, item_id, timestamp[, rating]
+engine = Engine()
+engine.fit(interactions)
+for rec in engine.recommend(entity_id=42, n=10):
+    print(rec.item_id, rec.score, rec.base_kind)
+# Many users at once — runs in parallel in the Rust core (GIL released).
+batches = engine.recommend_batch([42, 99, 7], n=10)
+```
+Recommendation is served end-to-end by the Rust core (`kindling_core`): the
+EASE/cooc base, the channel blend, the boost layer, and cold-slots all run
+natively. Single recommend p50 is 0.17–5.81 ms by dataset; batch is the parallel path.
+**New / anonymous users** (absent from training) are served from ad-hoc
+seed items with no per-user training — and a zero/all-unknown seed set
+falls back to popularity:
+```python
+engine.recommend_for_items(item_ids=[101, 205], n=10)   # personalized from seeds
+engine.recommend_for_items(item_ids=[], n=10)           # → popularity fallback
+```
+## Intelligent activation
+Channels turn on by *regime*, not configuration. The base is EASE for
+catalogs ≤ 20k items and wilson-normalized cooccurrence above that;
+the trend channel needs timestamps; transitions additionally need the
+data not to be a rating-burst; user-CF activates only on sparse-history
+data; rating-weighting engages only when true ratings are present. Each
+decision is made from the data at `fit()` time. See
+[`docs/REFERENCE.md`](docs/REFERENCE.md) §2 for the gate table.
+## Where it stands (full-ranking NDCG@10, engine defaults)
+> Full results — discovery growth **and** the repeat-regime dominance — in [`docs/RESULTS.md`](docs/RESULTS.md).
+| dataset | NDCG@10 | notes |
+|---|---:|---|
+| movielens-1m | 0.293 | rating-weighted EASE |
+| amazon-beauty | 0.033 | + user-CF channel |
+| steam (realistic tier) | 0.066 | open-catalog + cold slots |
+| amazon-book-chrono | 0.032 | timestamps activate trend/transitions |
+Strongest personalized model on all four; beats implicit ALS everywhere;
+wins cold-*user* buckets on cold-heavy catalogs. The full benchmark
+record — including the negative results, which are half the value — is in
+[`docs/EXPERIMENTS.md`](docs/EXPERIMENTS.md).
+On **repeat-regime** datasets (grocery/retail), a held-out gate turns on reorder
+recommendation; under repeat-aware eval kindling separates from the field —
+e.g. Dunnhumby 0.48 NDCG@10 vs ~0.05 for every baseline — while correctly
+*declining* on fake-repeat data like Steam (re-logs aren't repurchase). See
+[`docs/REPEAT-GATE.md`](docs/REPEAT-GATE.md). An opt-in EASE+ (EDLAE) base is
+available but off by default ([`docs/EASE-VARIANTS-ASSESSMENT.md`](docs/EASE-VARIANTS-ASSESSMENT.md)).
+### Growth curves
+How accuracy grows from cold to hot, against the standard baselines
+(`bench/plot_growth_curves.py`):
+![growth curves](bench/reports/growth_curves_grid.png)
+### Serving performance (native engine, `bench/final_state_perf.py`)
+| dataset | fit | single recommend p50 | batch throughput | NDCG@10 |
+|---|---:|---:|---:|---:|
+| movielens-1m | 4.2 s | 0.17 ms | 15.4k recs/s | 0.2928 |
+| amazon-beauty | 13.1 s | 1.21 ms | 3.0k recs/s | 0.0328 |
+| steam | 110 s | 5.81 ms | 0.8k recs/s | 0.0659 |
+The recommend path is pure Rust with the GIL released for the batch path —
+single recommend dropped from ~200 ms (the earlier Python path) to
+sub-millisecond at best (0.17 ms p50 on movielens-1m; up to 5.81 ms on steam), with byte-identical rankings.
+### Serving
+Persist a fit as a self-contained artifact and serve it with no re-fit:
+```python
+from kindling.serving import KindlingServer
+KindlingServer.from_engine(engine).save("artifact/")
+# ── in the serving process ──
+server = KindlingServer.load("artifact/")
+server.recommend("user-42", n=10)
+```
+A FastAPI example (`kindling.serving_app`) ships behind the optional
+`serve` extra: `pip install 'kindling-rec[serve]'`.
+## Project layout
+```
+src/kindling/      library source (engine, serving, Rust bindings, loaders)
+native/kindling_core/  Rust core (EASE, cooccurrence, channel blend, recommend)
+bench/             regression gate (bench/verify.py) + frozen reports + plots
+docs/              RESULTS.md (what it brings) · REFERENCE.md (architecture) ·
+                   EXPERIMENTS.md (record) · LESSONS.md (what the build taught)
+tests/             unit, property, integration
+```
+## License
+Apache 2.0.

kindling_rec-1.0.1/README.md ADDED Viewed

@@ -0,0 +1,136 @@
+# kindling
+A hybrid recommender that grows with your data — closed-form, no training
+loop, no GPU. One fused base score per (user, item) built from EASE /
+wilson-cooccurrence plus auto-gated z-normalized channels (trend,
+last-item, transitions, user-CF), with a Rust core for the numerics.
+**Design goals (learned the hard way — see [`docs/EXPERIMENTS.md`](docs/EXPERIMENTS.md)):**
+1. **A wheel that imports is a wheel that works.** numpy / pandas / scipy
+   only; the linear algebra that matters (the EASE inversion) runs on a
+   pure-Rust core (`kindling_core`). No PyTorch, no BLAS system deps.
+2. **Closed-form shallow models, gated per dataset, beat speculative
+   complexity.** Every channel is closed-form or a counting statistic;
+   every channel is activated by a measurable property of the data; every
+   gate exists because the ungated version measurably hurt somewhere.
+## Install
+```bash
+pip install kindling-rec           # from PyPI
+pip install -e ".[dev]"            # dev / from source
+pip install -e ".[dev,bench]"      # + benchmark harness
+```
+## Quickstart
+```python
+from kindling import Engine
+from kindling.loaders import movielens
+interactions = movielens.load_1m()       # entity_id, item_id, timestamp[, rating]
+engine = Engine()
+engine.fit(interactions)
+for rec in engine.recommend(entity_id=42, n=10):
+    print(rec.item_id, rec.score, rec.base_kind)
+# Many users at once — runs in parallel in the Rust core (GIL released).
+batches = engine.recommend_batch([42, 99, 7], n=10)
+```
+Recommendation is served end-to-end by the Rust core (`kindling_core`): the
+EASE/cooc base, the channel blend, the boost layer, and cold-slots all run
+natively. Single recommend p50 is 0.17–5.81 ms by dataset; batch is the parallel path.
+**New / anonymous users** (absent from training) are served from ad-hoc
+seed items with no per-user training — and a zero/all-unknown seed set
+falls back to popularity:
+```python
+engine.recommend_for_items(item_ids=[101, 205], n=10)   # personalized from seeds
+engine.recommend_for_items(item_ids=[], n=10)           # → popularity fallback
+```
+## Intelligent activation
+Channels turn on by *regime*, not configuration. The base is EASE for
+catalogs ≤ 20k items and wilson-normalized cooccurrence above that;
+the trend channel needs timestamps; transitions additionally need the
+data not to be a rating-burst; user-CF activates only on sparse-history
+data; rating-weighting engages only when true ratings are present. Each
+decision is made from the data at `fit()` time. See
+[`docs/REFERENCE.md`](docs/REFERENCE.md) §2 for the gate table.
+## Where it stands (full-ranking NDCG@10, engine defaults)
+> Full results — discovery growth **and** the repeat-regime dominance — in [`docs/RESULTS.md`](docs/RESULTS.md).
+| dataset | NDCG@10 | notes |
+|---|---:|---|
+| movielens-1m | 0.293 | rating-weighted EASE |
+| amazon-beauty | 0.033 | + user-CF channel |
+| steam (realistic tier) | 0.066 | open-catalog + cold slots |
+| amazon-book-chrono | 0.032 | timestamps activate trend/transitions |
+Strongest personalized model on all four; beats implicit ALS everywhere;
+wins cold-*user* buckets on cold-heavy catalogs. The full benchmark
+record — including the negative results, which are half the value — is in
+[`docs/EXPERIMENTS.md`](docs/EXPERIMENTS.md).
+On **repeat-regime** datasets (grocery/retail), a held-out gate turns on reorder
+recommendation; under repeat-aware eval kindling separates from the field —
+e.g. Dunnhumby 0.48 NDCG@10 vs ~0.05 for every baseline — while correctly
+*declining* on fake-repeat data like Steam (re-logs aren't repurchase). See
+[`docs/REPEAT-GATE.md`](docs/REPEAT-GATE.md). An opt-in EASE+ (EDLAE) base is
+available but off by default ([`docs/EASE-VARIANTS-ASSESSMENT.md`](docs/EASE-VARIANTS-ASSESSMENT.md)).
+### Growth curves
+How accuracy grows from cold to hot, against the standard baselines
+(`bench/plot_growth_curves.py`):
+![growth curves](bench/reports/growth_curves_grid.png)
+### Serving performance (native engine, `bench/final_state_perf.py`)
+| dataset | fit | single recommend p50 | batch throughput | NDCG@10 |
+|---|---:|---:|---:|---:|
+| movielens-1m | 4.2 s | 0.17 ms | 15.4k recs/s | 0.2928 |
+| amazon-beauty | 13.1 s | 1.21 ms | 3.0k recs/s | 0.0328 |
+| steam | 110 s | 5.81 ms | 0.8k recs/s | 0.0659 |
+The recommend path is pure Rust with the GIL released for the batch path —
+single recommend dropped from ~200 ms (the earlier Python path) to
+sub-millisecond at best (0.17 ms p50 on movielens-1m; up to 5.81 ms on steam), with byte-identical rankings.
+### Serving
+Persist a fit as a self-contained artifact and serve it with no re-fit:
+```python
+from kindling.serving import KindlingServer
+KindlingServer.from_engine(engine).save("artifact/")
+# ── in the serving process ──
+server = KindlingServer.load("artifact/")
+server.recommend("user-42", n=10)
+```
+A FastAPI example (`kindling.serving_app`) ships behind the optional
+`serve` extra: `pip install 'kindling-rec[serve]'`.
+## Project layout
+```
+src/kindling/      library source (engine, serving, Rust bindings, loaders)
+native/kindling_core/  Rust core (EASE, cooccurrence, channel blend, recommend)
+bench/             regression gate (bench/verify.py) + frozen reports + plots
+docs/              RESULTS.md (what it brings) · REFERENCE.md (architecture) ·
+                   EXPERIMENTS.md (record) · LESSONS.md (what the build taught)
+tests/             unit, property, integration
+```
+## License
+Apache 2.0.