PyPI - patentml - Versions diffs - 0.1.0__tar.gz - Mend

patentml 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48) hide show

patentml-0.1.0/LICENSE +28 -0
patentml-0.1.0/PKG-INFO +103 -0
patentml-0.1.0/README.md +75 -0
patentml-0.1.0/patentml/__init__.py +169 -0
patentml-0.1.0/patentml/actor_critic.py +304 -0
patentml-0.1.0/patentml/adaboost.py +168 -0
patentml-0.1.0/patentml/bayesian_network.py +300 -0
patentml-0.1.0/patentml/bayesian_optimiser.py +264 -0
patentml-0.1.0/patentml/collaborative_filter.py +254 -0
patentml-0.1.0/patentml/dbscan.py +230 -0
patentml-0.1.0/patentml/decision_tree.py +289 -0
patentml-0.1.0/patentml/deep_networks.py +426 -0
patentml-0.1.0/patentml/em_clustering.py +198 -0
patentml-0.1.0/patentml/ensemble.py +299 -0
patentml-0.1.0/patentml/feature_engineering.py +334 -0
patentml-0.1.0/patentml/gaussian_process.py +256 -0
patentml-0.1.0/patentml/genetic_algorithm.py +271 -0
patentml-0.1.0/patentml/genetic_programming.py +289 -0
patentml-0.1.0/patentml/gradient_boosting.py +227 -0
patentml-0.1.0/patentml/grammar_gp.py +546 -0
patentml-0.1.0/patentml/hidden_markov.py +312 -0
patentml-0.1.0/patentml/isolation_forest.py +223 -0
patentml-0.1.0/patentml/kalman_filter.py +258 -0
patentml-0.1.0/patentml/knn.py +255 -0
patentml-0.1.0/patentml/linear_gp.py +405 -0
patentml-0.1.0/patentml/mean_shift.py +198 -0
patentml-0.1.0/patentml/mini_neural_net.py +146 -0
patentml-0.1.0/patentml/multi_armed_bandit.py +255 -0
patentml-0.1.0/patentml/neuroevolution.py +260 -0
patentml-0.1.0/patentml/online_classifier.py +141 -0
patentml-0.1.0/patentml/optimisers.py +208 -0
patentml-0.1.0/patentml/particle_swarm.py +319 -0
patentml-0.1.0/patentml/q_learning.py +229 -0
patentml-0.1.0/patentml/scalable_kmeans.py +161 -0
patentml-0.1.0/patentml/simulated_annealing.py +205 -0
patentml-0.1.0/patentml/spectral_clustering.py +234 -0
patentml-0.1.0/patentml/svd_reducer.py +248 -0
patentml-0.1.0/patentml/svm_smo.py +181 -0
patentml-0.1.0/patentml/text_classifier.py +202 -0
patentml-0.1.0/patentml/vector_quantisation.py +254 -0
patentml-0.1.0/patentml/word_embeddings.py +325 -0
patentml-0.1.0/patentml.egg-info/PKG-INFO +103 -0
patentml-0.1.0/patentml.egg-info/SOURCES.txt +46 -0
patentml-0.1.0/patentml.egg-info/dependency_links.txt +1 -0
patentml-0.1.0/patentml.egg-info/top_level.txt +1 -0
patentml-0.1.0/pyproject.toml +41 -0
patentml-0.1.0/setup.cfg +4 -0
patentml-0.1.0/tests/test_smoke.py +136 -0

patentml-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,28 @@
+MIT License
+Copyright (c) 2026 Martin Carr
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+---
+The algorithms implemented in this library are derived from United States
+patents that have expired and entered the public domain. The implementations
+themselves are original code, copyright as above. Source patents are
+documented per-module and in the package docstring.

patentml-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,103 @@
+Metadata-Version: 2.4
+Name: patentml
+Version: 0.1.0
+Summary: 37 machine learning algorithms reconstructed from expired US patents. Zero dependencies, pure Python stdlib.
+Author-email: Martin Carr <martincarrsy23@gmail.com>
+License: MIT
+Project-URL: Homepage, https://getoptimal8.com
+Keywords: machine-learning,zero-dependency,stdlib,patents,genetic-algorithm,genetic-programming,neural-network,reinforcement-learning,clustering,kalman-filter,gaussian-process,embedded,micropython
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: Intended Audience :: Science/Research
+Classifier: Intended Audience :: Education
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.8
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Classifier: Topic :: Software Development :: Libraries :: Python Modules
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Dynamic: license-file
+# patentml
+**Machine learning from expired patents. Zero dependencies. Pure Python stdlib.**
+37 modules, 131 classes and functions — every algorithm reconstructed from a United States patent that has expired into the public domain. The patents that built modern ML were filed by IBM, Bell Labs, Microsoft Research, Lockheed, AT&T and Lucent between 1995 and 2006. They have all expired. This library is what they describe, as clean modern Python, with no imports beyond the standard library.
+```
+pip install patentml
+```
+No numpy. No scipy. No compiled extensions. If it runs Python 3.8+, it runs `patentml` — locked-down corporate machines, serverless functions, air-gapped environments, Pyodide in the browser, and (with light trimming) MicroPython boards.
+## Quick start
+```python
+from patentml import RandomForest, ScalableKMeans, ThompsonSampling, KalmanFilter
+# Classification — US6816847 (Microsoft, 1999)
+forest = RandomForest(n_trees=25)
+forest.fit(X_train, y_train)
+labels = [forest.predict(x) for x in X_test]
+# Clustering — US6012058 (Microsoft, 1998)
+km = ScalableKMeans(k=3)
+km.fit(points)
+# Bandits — US6981040 (Utopy, 2000) [919 forward citations]
+bandit = ThompsonSampling(n_arms=4)
+arm = bandit.select()
+bandit.update(arm, reward=1.0)
+# State estimation — US6795794 (Univ. Illinois, 2002)
+kf = KalmanFilter(dim_state=2, dim_obs=1)
+```
+## What's inside
+| Family | Modules |
+|---|---|
+| Evolutionary & global optimisation | genetic algorithm, genetic programming, grammar GP / grammatical evolution, linear GP, particle swarm, differential evolution, CMA-ES, simulated annealing, ant colony, Bayesian optimiser / EDA, neuroevolution |
+| Neural networks | mini neural net (mini-batch backprop), Conv1D, SimpleRNN, GRU cell, SGD/RMSProp/Adam/AdamW optimisers |
+| Classifiers | decision tree, random forest, AdaBoost, SVM (SMO), online Bayes, naive Bayes, KNN (+ BallTree), gradient boosting |
+| Ensembles | voting, stacking, bagging, weighted |
+| Clustering | scalable & hierarchical k-means, DBSCAN, OPTICS, EM / Gaussian mixture, spectral, mean shift |
+| Reinforcement learning | Q-learning, SARSA, function-approximation Q, actor-critic A2C, PPO-lite, ε-greedy / UCB1 / Thompson / EXP3 / LinUCB bandits |
+| Probabilistic | Bayesian network, hidden Markov model, Gaussian process regression & classification, kernel density estimation |
+| Anomaly detection | isolation forest, one-class SVM |
+| NLP | TF-IDF + naive Bayes text pipeline, word2vec SGNS, PMI embeddings |
+| Recommenders | memory-based & Bayesian collaborative filtering |
+| Dimensionality & features | PCA, randomised SVD, vector quantisation (LBG, product quantiser), scalers, mutual-information ranking, forward selection |
+| State estimation | Kalman filter, extended Kalman filter |
+## Provenance
+Every module documents its source patent: number, assignee, filing year, and forward-citation count. Highlights:
+| Patent | Assignee | Algorithm | Citations |
+|---|---|---|---|
+| US5613012 | SmartTouch (1995) | Voting ensemble | 1,182 |
+| US6981040 | Utopy (2000) | Bandit selection | 919 |
+| US6161130 | Microsoft (1998) | Online classifier | 896 |
+| US6556983 | Microsoft (2000) | Word embeddings (PMI + SGNS) | 645 |
+| US6192360 | Microsoft (1998) | TF-IDF + naive Bayes | 364 |
+| US6317707 | AT&T (1998) | Mean shift + KDE | 269 |
+| US6931384 | Microsoft (2001) | Gaussian process regression | 258 |
+The full list of ~40 source patents is in the package docstring: `python -c "import patentml; print(patentml.__doc__)"`.
+All source patents are expired. The implementations are original code, MIT licensed.
+## Why
+Modern ML stacks are heavy, opaque, and supply-chain risky. Sometimes you need *one* algorithm — a Kalman filter on a microcontroller, a bandit in a serverless function, k-means in a browser — without 200 MB of compiled wheels. And sometimes you want code you can actually read: every module here is a single self-contained file you can audit in one sitting.
+These algorithms earned their citations the hard way. They still work.

patentml-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,75 @@
+# patentml
+**Machine learning from expired patents. Zero dependencies. Pure Python stdlib.**
+37 modules, 131 classes and functions — every algorithm reconstructed from a United States patent that has expired into the public domain. The patents that built modern ML were filed by IBM, Bell Labs, Microsoft Research, Lockheed, AT&T and Lucent between 1995 and 2006. They have all expired. This library is what they describe, as clean modern Python, with no imports beyond the standard library.
+```
+pip install patentml
+```
+No numpy. No scipy. No compiled extensions. If it runs Python 3.8+, it runs `patentml` — locked-down corporate machines, serverless functions, air-gapped environments, Pyodide in the browser, and (with light trimming) MicroPython boards.
+## Quick start
+```python
+from patentml import RandomForest, ScalableKMeans, ThompsonSampling, KalmanFilter
+# Classification — US6816847 (Microsoft, 1999)
+forest = RandomForest(n_trees=25)
+forest.fit(X_train, y_train)
+labels = [forest.predict(x) for x in X_test]
+# Clustering — US6012058 (Microsoft, 1998)
+km = ScalableKMeans(k=3)
+km.fit(points)
+# Bandits — US6981040 (Utopy, 2000) [919 forward citations]
+bandit = ThompsonSampling(n_arms=4)
+arm = bandit.select()
+bandit.update(arm, reward=1.0)
+# State estimation — US6795794 (Univ. Illinois, 2002)
+kf = KalmanFilter(dim_state=2, dim_obs=1)
+```
+## What's inside
+| Family | Modules |
+|---|---|
+| Evolutionary & global optimisation | genetic algorithm, genetic programming, grammar GP / grammatical evolution, linear GP, particle swarm, differential evolution, CMA-ES, simulated annealing, ant colony, Bayesian optimiser / EDA, neuroevolution |
+| Neural networks | mini neural net (mini-batch backprop), Conv1D, SimpleRNN, GRU cell, SGD/RMSProp/Adam/AdamW optimisers |
+| Classifiers | decision tree, random forest, AdaBoost, SVM (SMO), online Bayes, naive Bayes, KNN (+ BallTree), gradient boosting |
+| Ensembles | voting, stacking, bagging, weighted |
+| Clustering | scalable & hierarchical k-means, DBSCAN, OPTICS, EM / Gaussian mixture, spectral, mean shift |
+| Reinforcement learning | Q-learning, SARSA, function-approximation Q, actor-critic A2C, PPO-lite, ε-greedy / UCB1 / Thompson / EXP3 / LinUCB bandits |
+| Probabilistic | Bayesian network, hidden Markov model, Gaussian process regression & classification, kernel density estimation |
+| Anomaly detection | isolation forest, one-class SVM |
+| NLP | TF-IDF + naive Bayes text pipeline, word2vec SGNS, PMI embeddings |
+| Recommenders | memory-based & Bayesian collaborative filtering |
+| Dimensionality & features | PCA, randomised SVD, vector quantisation (LBG, product quantiser), scalers, mutual-information ranking, forward selection |
+| State estimation | Kalman filter, extended Kalman filter |
+## Provenance
+Every module documents its source patent: number, assignee, filing year, and forward-citation count. Highlights:
+| Patent | Assignee | Algorithm | Citations |
+|---|---|---|---|
+| US5613012 | SmartTouch (1995) | Voting ensemble | 1,182 |
+| US6981040 | Utopy (2000) | Bandit selection | 919 |
+| US6161130 | Microsoft (1998) | Online classifier | 896 |
+| US6556983 | Microsoft (2000) | Word embeddings (PMI + SGNS) | 645 |
+| US6192360 | Microsoft (1998) | TF-IDF + naive Bayes | 364 |
+| US6317707 | AT&T (1998) | Mean shift + KDE | 269 |
+| US6931384 | Microsoft (2001) | Gaussian process regression | 258 |
+The full list of ~40 source patents is in the package docstring: `python -c "import patentml; print(patentml.__doc__)"`.
+All source patents are expired. The implementations are original code, MIT licensed.
+## Why
+Modern ML stacks are heavy, opaque, and supply-chain risky. Sometimes you need *one* algorithm — a Kalman filter on a microcontroller, a bandit in a serverless function, k-means in a browser — without 200 MB of compiled wheels. And sometimes you want code you can actually read: every module here is a single self-contained file you can audit in one sitting.
+These algorithms earned their citations the hard way. They still work.

patentml-0.1.0/patentml/__init__.py ADDED Viewed

@@ -0,0 +1,169 @@
+"""
+patentml — Machine Learning from Expired Patents
+All algorithms derived from expired US patents. Zero dependencies. Pure Python stdlib.
+EXPIRED PATENT SOURCES (selected key ones):
+  US5970487  Mitsubishi (1997)  GA hardware machine
+  US6912587  AT&T       (2001)  Constraint-weighted GA fitness
+  US6477444  Fuji Xerox (2000)  Genetic programming tree evolution
+  US6212427  Kennedy    (1999)  Particle swarm optimisation
+  US6484115  Storn      (1999)  Differential evolution
+  US7047169  Univ. IL   (2002)  EDA / Bayesian optimisation
+  US7219040  GE         (2002)  Simulated annealing + constraints
+  US5835901  Lockheed   (1997)  Neuroevolution [142 cites]
+  US7162461  SAS        (2005)  Hybrid NN activation search
+  US6128606  AT&T       (1997)  Modular NN + backprop [53 cites]
+  US7747070  Microsoft  (2005)  CNN on GPU [91 cites]
+  US6963862  Texas A&M  (2001)  Recurrent network training
+  US7447669  Nanyang    (2004)  Ant Colony Optimisation
+  US6161130  Microsoft  (1998)  Online classifier [896 cites]
+  US6327581  Microsoft  (1998)  SVM-SMO [173 cites]
+  US7421415  Siemens    (2005)  AdaBoost + feature selection
+  US6816847  Microsoft  (1999)  Decision tree + ensembles [72 cites]
+  US5613012  SmartTouch (1995)  Voting ensemble [1182 cites]
+  US6012058  Microsoft  (1998)  Scalable K-means
+  US6985172  SW Research(2002)  Q-learning / TD + Actor-Critic A2C / PPO-lite [145 cites]
+  US6981040  Utopy      (2000)  Bandit selection [919 cites]
+  US7076102  Philips    (2002)  HMM event learning [116 cites]
+  US6529891  Microsoft  (1998)  PCA / Bayesian model selection [124 cites]
+  US6807536  Microsoft  (2001)  Randomised SVD / low-rank approximation [170 cites]
+  US6263337  Microsoft  (1998)  Scalable EM / Gaussian mixture clustering [142 cites]
+  US6192360  Microsoft  (1998)  Text classifier TF-IDF + Naive Bayes [364 cites]
+  US6496816  Microsoft  (1998)  Collaborative filtering + Bayesian mixture [128 cites]
+  US6374251  Microsoft  (1998)  KNN + BallTree scalable search [187 cites]
+  US6049797  Lucent     (1998)  DBSCAN + OPTICS density clustering [154 cites]
+  US7031530  Lockheed   (2001)  Gradient Boosting Machine (GBM) [188 cites]
+  US6795794  U.Illinois (2002)  Kalman Filter + Extended KF [127 cites]
+  US6931384  Microsoft  (2001)  Gaussian Process regression + classification [258 cites]
+  US6216066  GE         (1998)  Spectral clustering via Laplacian eigenmap [148 cites]
+  US6317707  AT&T       (1998)  Mean Shift + Kernel Density Estimation [269 cites]
+  US7225343  Columbia U (2003)  Isolation Forest + One-Class SVM [159 cites]
+  US6490698  Microsoft  (1999)  Bayesian Network + Naive Bayes [102 cites]
+  US6421467  Texas Tech (1999)  Vector Quantisation LBG + Product Quantiser [101 cites]
+  US6556983  Microsoft  (2000)  Word Embeddings PMI + Word2Vec SGNS [645 cites]
+"""
+__version__ = "0.1.0"
+from .genetic_algorithm   import GeneticAlgorithm, Chromosome, make_population
+from .genetic_programming import GeneticProgramming, rand_tree, Var, Const, BinOp, UnaryOp
+from .grammar_gp import (GrammarGP, GrammaticalEvolution, GNode,
+                          rand_grammar_tree, make_math_grammar, MATH_GRAMMAR,
+                          subtree_crossover, subtree_mutation, point_mutation)
+from .linear_gp import (LinearGP, Instruction, Program,
+                         rand_program, effective_program, effective_instructions,
+                         linear_crossover, micro_mutation, macro_mutation,
+                         to_expr_string, execute, OPERATIONS, FAST_OPS)
+from .particle_swarm      import ParticleSwarmOptimiser, DifferentialEvolution, CMAES
+from .online_classifier   import OnlineBayesClassifier
+from .scalable_kmeans     import ScalableKMeans, HierarchicalKMeans
+from .mini_neural_net     import MiniNeuralNet
+from .deep_networks       import Conv1D, SimpleRNN, GRUCell, AntColonyOptimiser
+from .svm_smo             import SVM, linear_kernel, rbf_kernel, poly_kernel
+from .adaboost            import AdaBoost, DecisionStump
+from .q_learning          import QLearner, SARSALearner, FunctionApproxQLearner
+from .multi_armed_bandit  import EpsilonGreedy, UCB1, ThompsonSampling, EXP3, LinUCB
+from .bayesian_optimiser  import GaussianEDA, BayesianOptimiser
+from .simulated_annealing import SimulatedAnnealing, MultiObjectiveSA
+from .decision_tree       import DecisionTree, RandomForest
+from .optimisers          import SGD, RMSProp, Adam, AdamW, LRScheduler, numerical_gradient
+from .hidden_markov       import HiddenMarkovModel
+from .neuroevolution      import EvoNet, WeightEvolution, HybridNNEvolver, ACTIVATIONS
+from .ensemble            import VotingEnsemble, StackingEnsemble, BaggingEnsemble, WeightedEnsemble
+from .knn                 import KNNClassifier, KNNRegressor, FastKNN, BallTree
+from .dbscan              import DBSCAN, OPTICS
+from .gradient_boosting   import GBMRegressor, GBMClassifier
+from .kalman_filter       import KalmanFilter, ExtendedKalmanFilter
+from .gaussian_process    import GaussianProcessRegressor, GaussianProcessClassifier, rbf_kernel as gp_rbf, matern32_kernel, periodic_kernel
+from .spectral_clustering import SpectralClustering, rbf_affinity, knn_affinity
+from .mean_shift          import MeanShift, KernelDensityEstimator, estimate_bandwidth
+from .isolation_forest    import IsolationForest, OneClassSVM
+from .bayesian_network    import BayesianNetwork, NaiveBayes, CPT
+from .vector_quantisation import LBG, AdaptiveVQ, ProductQuantiser
+from .actor_critic        import A2C, PPOLite, LinearActor, LinearCritic
+from .word_embeddings     import Word2Vec, PMIEmbeddings, build_cooccurrence, tokenise
+from .svd_reducer         import randomised_svd, pca as randomised_pca, transform as svd_transform
+from .em_clustering       import EMClustering, GaussianComponent
+from .text_classifier     import TextPipeline, TFIDFVectoriser, NaiveBayesClassifier
+from .collaborative_filter import MemoryCF, BayesianCF
+from .feature_engineering import (
+    PCA, StandardScaler, MinMaxScaler,
+    variance_threshold, correlation_filter,
+    mi_feature_ranking, forward_feature_selection,
+)
+# Public names exported by ``from patentml import *``, grouped by algorithm family.
+__all__ = [
+    # Evolutionary / Global Optimisation
+    "GeneticAlgorithm", "Chromosome", "make_population",
+    "GeneticProgramming", "rand_tree", "Var", "Const", "BinOp", "UnaryOp",
+    # Grammar-Guided GP / Grammatical Evolution
+    "GrammarGP", "GrammaticalEvolution", "GNode",
+    "rand_grammar_tree", "make_math_grammar", "MATH_GRAMMAR",
+    "subtree_crossover", "subtree_mutation", "point_mutation",
+    # Linear GP
+    "LinearGP", "Instruction", "Program",
+    "rand_program", "effective_program", "effective_instructions",
+    "linear_crossover", "micro_mutation", "macro_mutation",
+    "to_expr_string", "execute", "OPERATIONS", "FAST_OPS",
+    # Other global optimisers (particle swarm, DE, CMA-ES, EDA, annealing, ant colony)
+    "ParticleSwarmOptimiser", "DifferentialEvolution", "CMAES",
+    "GaussianEDA", "BayesianOptimiser",
+    "SimulatedAnnealing", "MultiObjectiveSA",
+    "AntColonyOptimiser",
+    # Neural Networks
+    "MiniNeuralNet",
+    "Conv1D", "SimpleRNN", "GRUCell",
+    "EvoNet", "WeightEvolution", "HybridNNEvolver", "ACTIVATIONS",
+    # Gradient Optimisers
+    "SGD", "RMSProp", "Adam", "AdamW", "LRScheduler", "numerical_gradient",
+    # Classifiers
+    "OnlineBayesClassifier",
+    # "rbf_kernel" here is the one imported from .svm_smo; the Gaussian-process
+    # RBF kernel is exported separately under the alias "gp_rbf" (see below).
+    "SVM", "linear_kernel", "rbf_kernel", "poly_kernel",
+    "AdaBoost", "DecisionStump",
+    "DecisionTree", "RandomForest",
+    # Ensembles
+    "VotingEnsemble", "StackingEnsemble", "BaggingEnsemble", "WeightedEnsemble",
+    # Clustering
+    "ScalableKMeans", "HierarchicalKMeans",
+    # Reinforcement Learning / Bandits
+    "QLearner", "SARSALearner", "FunctionApproxQLearner",
+    "EpsilonGreedy", "UCB1", "ThompsonSampling", "EXP3", "LinUCB",
+    # Sequential Models
+    "HiddenMarkovModel",
+    # Nearest Neighbours
+    "KNNClassifier", "KNNRegressor", "FastKNN", "BallTree",
+    # Density Clustering
+    "DBSCAN", "OPTICS",
+    # Gradient Boosting
+    "GBMRegressor", "GBMClassifier",
+    # Sequential / State Estimation
+    "KalmanFilter", "ExtendedKalmanFilter",
+    # Gaussian Processes
+    "GaussianProcessRegressor", "GaussianProcessClassifier",
+    # "gp_rbf" is gaussian_process.rbf_kernel, aliased on import to avoid
+    # clashing with the svm_smo "rbf_kernel" exported above.
+    "gp_rbf", "matern32_kernel", "periodic_kernel",
+    # Graph / Spectral Clustering
+    "SpectralClustering", "rbf_affinity", "knn_affinity",
+    # Density Estimation / Mode Finding
+    "MeanShift", "KernelDensityEstimator", "estimate_bandwidth",
+    # Anomaly Detection
+    "IsolationForest", "OneClassSVM",
+    # Probabilistic Graphical Models
+    "BayesianNetwork", "NaiveBayes", "CPT",
+    # Vector Quantisation
+    "LBG", "AdaptiveVQ", "ProductQuantiser",
+    # Policy Gradient RL
+    "A2C", "PPOLite", "LinearActor", "LinearCritic",
+    # Word Embeddings / NLP
+    "Word2Vec", "PMIEmbeddings", "build_cooccurrence", "tokenise",
+    # Dimensionality Reduction ("randomised_pca" and "svd_transform" are
+    # import aliases for svd_reducer.pca and svd_reducer.transform)
+    "randomised_svd", "randomised_pca", "svd_transform",
+    # Clustering (additional)
+    "EMClustering", "GaussianComponent",
+    # Text / NLP
+    "TextPipeline", "TFIDFVectoriser", "NaiveBayesClassifier",
+    # Recommender Systems
+    "MemoryCF", "BayesianCF",
+    # Feature Engineering
+    "PCA", "StandardScaler", "MinMaxScaler",
+    "variance_threshold", "correlation_filter",
+    "mi_feature_ranking", "forward_feature_selection",
+]

patentml-0.1.0/patentml/actor_critic.py ADDED Viewed

@@ -0,0 +1,304 @@
+"""
+Actor-Critic and Advantage Actor-Critic (A2C) reinforcement learning.
+Patent basis: US6985172 (Southwest Research Institute, filed 2002, expired 2022)
+  "Q-learning with linear reward shaping" — 145 forward citations.
+  Covers concurrent value-function and policy optimisation where a critic
+  baseline reduces variance in policy gradient estimates.
+"""
+import math
+import random
+from typing import List, Tuple, Optional, Callable, Dict
+def _softmax(logits: List[float]) -> List[float]:
+    """
+    Return softmax(logits) as a list of probabilities that sum to 1.
+    The maximum logit is subtracted before exponentiating, so the largest
+    exponent is 0 and math.exp cannot overflow; the result is unchanged
+    because softmax is invariant to adding a constant to every logit.
+    Raises ValueError (from max) if ``logits`` is empty.
+    """
+    m = max(logits)
+    exps = [math.exp(x - m) for x in logits]
+    total = sum(exps)
+    return [e / total for e in exps]
+def _log_softmax(logits: List[float]) -> List[float]:
+    """
+    Return the natural log of each softmax probability of ``logits``.
+    Probabilities are floored at 1e-300 before the log so that a value that
+    underflowed to 0.0 yields a large negative number instead of raising.
+    NOTE(review): not referenced by the classes shown in this module.
+    """
+    probs = _softmax(logits)
+    return [math.log(max(p, 1e-300)) for p in probs]
+def _relu(x: float) -> float:
+    """
+    Rectified linear unit: return x when x > 0, otherwise 0.0.
+    NOTE(review): not referenced by the classes shown in this module.
+    """
+    return max(0.0, x)
+def _drelu(x: float) -> float:
+    """
+    Derivative of ReLU: 1.0 for x > 0, otherwise 0.0 (including at x == 0).
+    NOTE(review): not referenced by the classes shown in this module.
+    """
+    return 1.0 if x > 0 else 0.0
+# ── Simple linear actor/critic ─────────────────────────────────────────────────
+class LinearActor:
+    """
+    Linear policy: pi(a|s) = softmax(W_a @ s + b_a).
+    ``W`` holds one weight row per action (n_actions rows of n_states
+    weights) and ``b`` one bias per action. States are plain lists of
+    floats; only the first n_states entries are read.
+    """
+    def __init__(self, n_states: int, n_actions: int, seed: int = 42):
+        """
+        Create a policy with small random weights and zero biases.
+        Args:
+            n_states:  length of the state feature vector.
+            n_actions: number of discrete actions.
+            seed:      seed of the private RNG used only for weight init.
+        """
+        rng = random.Random(seed)
+        # Weights are drawn from a zero-mean Gaussian with std-dev ``scale``.
+        scale = 0.1
+        self.W = [[rng.gauss(0, scale) for _ in range(n_states)] for _ in range(n_actions)]
+        self.b = [0.0] * n_actions
+        self.n_states  = n_states
+        self.n_actions = n_actions
+    def logits(self, state: List[float]) -> List[float]:
+        """Return the unnormalised action scores W_a . state + b_a, one per action."""
+        return [sum(self.W[a][s] * state[s] for s in range(self.n_states)) + self.b[a]
+                for a in range(self.n_actions)]
+    def probs(self, state: List[float]) -> List[float]:
+        """Return the action probabilities pi(.|state) (softmax of the logits)."""
+        return _softmax(self.logits(state))
+    def select_action(self, state: List[float], rng: random.Random) -> int:
+        """
+        Sample an action index from pi(.|state) using the caller's ``rng``.
+        Draws one uniform number and walks the cumulative distribution until
+        it is reached.
+        """
+        probs = self.probs(state)
+        r = rng.random()
+        cumulative = 0.0
+        for a, p in enumerate(probs):
+            cumulative += p
+            if r <= cumulative:
+                return a
+        # Reached only if floating-point rounding left the cumulative sum
+        # below r; fall back to the last action.
+        return len(probs) - 1
+    def update(self, state: List[float], action: int, advantage: float, lr: float) -> None:
+        """Policy gradient update: theta += lr * advantage * grad log pi(a|s)."""
+        # Probabilities are computed once, before any weight is changed.
+        probs = self.probs(state)
+        for a in range(self.n_actions):
+            # d log pi(action|s) / d logit_a for a softmax policy:
+            # (1 - p_a) for the taken action, -p_a for every other action.
+            grad = (1.0 - probs[a]) if a == action else -probs[a]
+            for s in range(self.n_states):
+                self.W[a][s] += lr * advantage * grad * state[s]
+            self.b[a] += lr * advantage * grad
+class LinearCritic:
+    """
+    Linear value function: V(s) = w_v @ s + b_v.
+    Trained by TD(0): V(s) ≈ r + gamma * V(s').
+    The class itself only regresses V(state) toward whatever ``target`` the
+    caller supplies; the caller is responsible for building the TD target.
+    """
+    def __init__(self, n_states: int, seed: int = 42):
+        """
+        Create a critic with small Gaussian weights (std-dev 0.1) and zero bias.
+        Args:
+            n_states: length of the state feature vector.
+            seed:     seed of the private RNG used only for weight init.
+        """
+        rng = random.Random(seed)
+        self.w = [rng.gauss(0, 0.1) for _ in range(n_states)]
+        self.b = 0.0
+        self.n_states = n_states
+    def value(self, state: List[float]) -> float:
+        """Return the current estimate V(state)."""
+        return sum(self.w[i] * state[i] for i in range(self.n_states)) + self.b
+    def update(self, state: List[float], target: float, lr: float) -> float:
+        """MSE gradient step. Returns TD error."""
+        v    = self.value(state)
+        # Error measured BEFORE the weights move; this is the value returned.
+        td   = target - v
+        # Gradient descent on 0.5 * (target - V(s))^2 with step size lr.
+        for i in range(self.n_states):
+            self.w[i] += lr * td * state[i]
+        self.b += lr * td
+        return td
+# ── Advantage Actor-Critic (A2C) ───────────────────────────────────────────────
+class A2C:
+    """
+    Advantage Actor-Critic (A2C).
+    Critic estimates V(s).  Advantage A(s,a) = r + gamma*V(s') - V(s).
+    Actor is updated with policy gradient weighted by advantage.
+    Advantage reduces variance compared to pure REINFORCE.
+    Can work with any environment exposing reset() -> state and
+    step(action) -> (next_state, reward, done); see train().
+    """
+    def __init__(
+        self,
+        n_states:      int,
+        n_actions:     int,
+        lr_actor:      float = 0.01,
+        lr_critic:     float = 0.05,
+        gamma:         float = 0.99,
+        entropy_coef:  float = 0.01,
+        seed:          int   = 42,
+    ):
+        """
+        Args:
+            n_states:     length of the state feature vector.
+            n_actions:    number of discrete actions.
+            lr_actor:     step size for the policy (and entropy) updates.
+            lr_critic:    step size for the value-function update.
+            gamma:        discount factor applied to V(next_state).
+            entropy_coef: weight of the entropy bonus applied in update().
+            seed:         seeds the actor init and action sampling; the
+                          critic is initialised with seed + 1.
+        """
+        self.actor     = LinearActor(n_states, n_actions, seed=seed)
+        self.critic    = LinearCritic(n_states, seed=seed + 1)
+        self.lr_actor  = lr_actor
+        self.lr_critic = lr_critic
+        self.gamma     = gamma
+        self.entropy   = entropy_coef
+        # RNG used for sampling actions in select_action().
+        self._rng      = random.Random(seed)
+        # Total (undiscounted) reward of each episode from the last train() call.
+        self.episode_rewards: List[float] = []
+    def select_action(self, state: List[float]) -> int:
+        """Sample an action from the current policy for ``state``."""
+        return self.actor.select_action(state, self._rng)
+    def update(
+        self,
+        state:      List[float],
+        action:     int,
+        reward:     float,
+        next_state: List[float],
+        done:       bool,
+    ) -> float:
+        """Single-step TD update. Returns advantage."""
+        # No bootstrapping from the next state once the episode has ended.
+        v_next    = 0.0 if done else self.critic.value(next_state)
+        td_target = reward + self.gamma * v_next
+        # critic.update returns the TD error measured before its weights move,
+        # which is used as the one-step advantage estimate. The critic is
+        # therefore updated before the actor.
+        advantage = self.critic.update(state, td_target, self.lr_critic)
+        # Entropy regularisation: add small gradient toward uniform policy
+        # Only the action biases are adjusted here, not the weight matrix W.
+        # NOTE(review): -log(p_a) - 1 is the derivative of the entropy with
+        # respect to the probability p_a, not with respect to the bias/logit;
+        # confirm this approximation is intended.
+        probs = self.actor.probs(state)
+        for a in range(self.actor.n_actions):
+            entropy_grad = -math.log(max(probs[a], 1e-9)) - 1
+            self.actor.b[a] += self.lr_actor * self.entropy * entropy_grad
+        # Policy gradient
+        self.actor.update(state, action, advantage, self.lr_actor)
+        return advantage
+    def train(
+        self,
+        env_fn: Callable,
+        n_episodes: int = 500,
+        max_steps:  int = 200,
+    ) -> List[float]:
+        """
+        Train for n_episodes.
+        env_fn() must return an object with:
+          .reset() -> state (list of floats)
+          .step(action) -> (next_state, reward, done)
+        env_fn is called once per episode, so every episode gets a fresh
+        environment. An episode stops at ``done`` or after max_steps steps.
+        Returns the list of per-episode total (undiscounted) rewards, which
+        is also stored on self.episode_rewards (reset at the start of each
+        call).
+        """
+        self.episode_rewards = []
+        for ep in range(n_episodes):
+            env   = env_fn()
+            state = env.reset()
+            total = 0.0
+            for _ in range(max_steps):
+                action = self.select_action(state)
+                next_state, reward, done = env.step(action)
+                # Online learning: one actor/critic update per transition.
+                self.update(state, action, reward, next_state, done)
+                total += reward
+                state  = next_state
+                if done: break
+            self.episode_rewards.append(total)
+        return self.episode_rewards
+# ── PPO-lite (clip-based policy optimisation) ──────────────────────────────────
+class PPOLite:
+    """
+    Proximal Policy Optimisation (lite version) — clipped surrogate objective.
+    Collects a batch of transitions, computes advantages, then does k_epochs
+    of gradient updates with clipping to prevent too-large policy updates.
+    Typical use: call select_action() to act, store() after each environment
+    step, and update() once enough transitions have been collected.
+    """
+    def __init__(
+        self,
+        n_states:  int,
+        n_actions: int,
+        lr:        float = 0.003,
+        gamma:     float = 0.99,
+        clip_eps:  float = 0.2,
+        k_epochs:  int   = 4,
+        seed:      int   = 42,
+    ):
+        """
+        Args:
+            n_states:  length of the state feature vector.
+            n_actions: number of discrete actions.
+            lr:        step size shared by the actor and the critic.
+            gamma:     discount factor used for the Monte-Carlo returns.
+            clip_eps:  half-width of the probability-ratio clip range.
+            k_epochs:  number of passes over the buffer per update() call.
+            seed:      seeds the actor init and action sampling; the critic
+                       is initialised with seed + 1.
+        """
+        self.actor  = LinearActor(n_states, n_actions, seed=seed)
+        self.critic = LinearCritic(n_states, seed=seed + 1)
+        self.lr       = lr
+        self.gamma    = gamma
+        self.clip_eps = clip_eps
+        self.k_epochs = k_epochs
+        self._rng     = random.Random(seed)
+        # Rollout buffer: parallel lists filled by store() and emptied at the
+        # end of every update() call.
+        self._states:      List[List[float]] = []
+        self._actions:     List[int]         = []
+        self._rewards:     List[float]       = []
+        self._dones:       List[bool]        = []
+        self._old_logprobs: List[float]      = []
+    def select_action(self, state: List[float]) -> Tuple[int, float]:
+        """
+        Sample an action and return (action, log pi(action|state)).
+        The log-probability should be passed to store() so update() can form
+        the new/old probability ratio. It is floored at log(1e-300).
+        """
+        probs    = self.actor.probs(state)
+        action   = self.actor.select_action(state, self._rng)
+        log_prob = math.log(max(probs[action], 1e-300))
+        return action, log_prob
+    def store(self, state, action, reward, done, log_prob):
+        """Append one transition (and its behaviour-policy log-prob) to the buffer."""
+        self._states.append(state)
+        self._actions.append(action)
+        self._rewards.append(reward)
+        self._dones.append(done)
+        self._old_logprobs.append(log_prob)
+    def update(self) -> None:
+        """Compute returns, advantages, then run k_epochs of PPO clip update."""
+        n = len(self._rewards)
+        if n == 0: return
+        # Compute discounted returns
+        # Walk the buffer backwards, restarting the running sum at every
+        # transition flagged done.
+        # NOTE(review): an episode that was cut off without done=True is not
+        # treated as a boundary, so rewards of the next stored episode are
+        # discounted into it — confirm callers are expected to handle this.
+        returns = [0.0] * n
+        running = 0.0
+        for i in reversed(range(n)):
+            if self._dones[i]: running = 0.0
+            running = self._rewards[i] + self.gamma * running
+            returns[i] = running
+        for _ in range(self.k_epochs):
+            for i in range(n):
+                state  = self._states[i]
+                action = self._actions[i]
+                ret    = returns[i]
+                # Advantage uses the critic value from before this sample's
+                # critic update.
+                v      = self.critic.value(state)
+                adv    = ret - v
+                # Normalise advantage
+                # (per-sample squashing into (-1, 1), not batch normalisation)
+                adv /= (abs(adv) + 1.0)
+                # Critic update
+                self.critic.update(state, ret, self.lr)
+                # Actor: clipped surrogate
+                new_probs   = self.actor.probs(state)
+                new_logprob = math.log(max(new_probs[action], 1e-300))
+                old_logprob = self._old_logprobs[i]
+                ratio       = math.exp(new_logprob - old_logprob)
+                # NOTE(review): ratio_clip is computed but never read below.
+                ratio_clip  = max(1 - self.clip_eps, min(1 + self.clip_eps, ratio))
+                # Gradient from min(ratio*adv, clipped*adv)
+                if adv >= 0:
+                    effective_ratio = min(ratio, 1 + self.clip_eps)
+                else:
+                    effective_ratio = max(ratio, 1 - self.clip_eps)
+                # The weight passed to the actor is ~adv while the ratio is on
+                # the unclipped side; beyond the clip bound it is rescaled by
+                # bound / ratio (shrinks for adv >= 0, grows for adv < 0).
+                # NOTE(review): the standard clipped surrogate has zero
+                # gradient in the clipped region — confirm this softer
+                # heuristic is intended.
+                self.actor.update(state, action, adv * effective_ratio / (ratio + 1e-9), self.lr)
+        # Clear buffer
+        self._states.clear(); self._actions.clear(); self._rewards.clear()
+        self._dones.clear(); self._old_logprobs.clear()
+if __name__ == "__main__":
+    # Smoke test: train A2C and PPOLite on a tiny 1-D grid-walk environment
+    # and print the mean reward over the last 50 episodes.
+    class GridWalk:
+        """
+        1D grid walk. State is [pos / 10.0]; action 1 moves right, any other
+        action moves left. Starts at pos=2, positions are clamped to 0..9,
+        and the episode ends (reward 1.0) on reaching pos=5; every other
+        step costs -0.01.
+        """
+        def __init__(self): self.pos = 2
+        def reset(self): self.pos = 2; return [self.pos / 10.0]
+        def step(self, action):
+            self.pos += 1 if action == 1 else -1
+            self.pos = max(0, min(9, self.pos))
+            done = self.pos == 5
+            reward = 1.0 if done else -0.01
+            return [self.pos / 10.0], reward, done
+    # A2C: the class (not an instance) is passed as env_fn, so train()
+    # constructs a fresh GridWalk for every episode.
+    a2c = A2C(n_states=1, n_actions=2, lr_actor=0.05, lr_critic=0.1, gamma=0.99, seed=0)
+    rewards = a2c.train(GridWalk, n_episodes=300, max_steps=50)
+    last50 = sum(rewards[-50:]) / 50
+    print(f"A2C GridWalk: last-50 mean reward = {last50:.3f} (expect > 0.8)")
+    # PPO-lite: manual rollout loop, at most 30 steps per episode, with a
+    # policy update after every 10 episodes.
+    ppo = PPOLite(n_states=1, n_actions=2, lr=0.05, gamma=0.99, seed=1)
+    # NOTE(review): rng is created but not used in the loop below.
+    rng = random.Random(42)
+    ep_rewards = []
+    for ep in range(200):
+        env = GridWalk(); state = env.reset(); total = 0.0
+        for _ in range(30):
+            action, lp = ppo.select_action(state)
+            ns, r, done = env.step(action)
+            ppo.store(state, action, r, done, lp)
+            total += r; state = ns
+            if done: break
+        ep_rewards.append(total)
+        if (ep + 1) % 10 == 0: ppo.update()
+    last50_ppo = sum(ep_rewards[-50:]) / 50
+    print(f"PPO-lite GridWalk: last-50 mean reward = {last50_ppo:.3f} (expect > 0.8)")