a-machine 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63) hide show
  1. a_machine-0.1.0/.gitignore +14 -0
  2. a_machine-0.1.0/CMakeLists.txt +15 -0
  3. a_machine-0.1.0/LICENCSE.txt +7 -0
  4. a_machine-0.1.0/PKG-INFO +97 -0
  5. a_machine-0.1.0/README.md +68 -0
  6. a_machine-0.1.0/amachine/__init__.py +0 -0
  7. a_machine-0.1.0/amachine/am_causal_state.py +13 -0
  8. a_machine-0.1.0/amachine/am_cohesion.py +52 -0
  9. a_machine-0.1.0/amachine/am_create.py +294 -0
  10. a_machine-0.1.0/amachine/am_fast/__init__.py +196 -0
  11. a_machine-0.1.0/amachine/am_fast/am_fast.cpp +791 -0
  12. a_machine-0.1.0/amachine/am_fast/distance.py +137 -0
  13. a_machine-0.1.0/amachine/am_fast/json_utils.py +34 -0
  14. a_machine-0.1.0/amachine/am_generator.py +168 -0
  15. a_machine-0.1.0/amachine/am_hmm.py +1559 -0
  16. a_machine-0.1.0/amachine/am_machine.py +19 -0
  17. a_machine-0.1.0/amachine/am_msp.py +857 -0
  18. a_machine-0.1.0/amachine/am_pattern.py +21 -0
  19. a_machine-0.1.0/amachine/am_random.py +20 -0
  20. a_machine-0.1.0/amachine/am_solve.py +95 -0
  21. a_machine-0.1.0/amachine/am_substitution_algebra.py +13 -0
  22. a_machine-0.1.0/amachine/am_symbol.py +4 -0
  23. a_machine-0.1.0/amachine/am_syntagmatics.py +55 -0
  24. a_machine-0.1.0/amachine/am_transition.py +10 -0
  25. a_machine-0.1.0/amachine/am_vis.py +127 -0
  26. a_machine-0.1.0/amachine/am_vocabulary.py +69 -0
  27. a_machine-0.1.0/amachine/cli.py +6 -0
  28. a_machine-0.1.0/data/.gitkeep +0 -0
  29. a_machine-0.1.0/docs/amachine/am_causal_state.html +391 -0
  30. a_machine-0.1.0/docs/amachine/am_cohesion.html +677 -0
  31. a_machine-0.1.0/docs/amachine/am_create.html +895 -0
  32. a_machine-0.1.0/docs/amachine/am_fast/_am_fast.html +604 -0
  33. a_machine-0.1.0/docs/amachine/am_fast/distance.html +552 -0
  34. a_machine-0.1.0/docs/amachine/am_fast/json_utils.html +363 -0
  35. a_machine-0.1.0/docs/amachine/am_fast/logo.png +0 -0
  36. a_machine-0.1.0/docs/amachine/am_fast.html +693 -0
  37. a_machine-0.1.0/docs/amachine/am_generator.html +673 -0
  38. a_machine-0.1.0/docs/amachine/am_hmm.html +6245 -0
  39. a_machine-0.1.0/docs/amachine/am_machine.html +363 -0
  40. a_machine-0.1.0/docs/amachine/am_msp.html +2242 -0
  41. a_machine-0.1.0/docs/amachine/am_pattern.html +331 -0
  42. a_machine-0.1.0/docs/amachine/am_random.html +355 -0
  43. a_machine-0.1.0/docs/amachine/am_semantics.html +372 -0
  44. a_machine-0.1.0/docs/amachine/am_solve.html +466 -0
  45. a_machine-0.1.0/docs/amachine/am_substitution_algebra.html +333 -0
  46. a_machine-0.1.0/docs/amachine/am_symbol.html +285 -0
  47. a_machine-0.1.0/docs/amachine/am_syntagmatics.html +718 -0
  48. a_machine-0.1.0/docs/amachine/am_transition.html +369 -0
  49. a_machine-0.1.0/docs/amachine/am_vis.html +527 -0
  50. a_machine-0.1.0/docs/amachine/am_vocabulary.html +923 -0
  51. a_machine-0.1.0/docs/amachine/cli.html +271 -0
  52. a_machine-0.1.0/docs/amachine/logo.png +0 -0
  53. a_machine-0.1.0/docs/amachine.html +250 -0
  54. a_machine-0.1.0/docs/index.html +7 -0
  55. a_machine-0.1.0/docs/logo.png +0 -0
  56. a_machine-0.1.0/docs/search.js +46 -0
  57. a_machine-0.1.0/examples/__init__.py +0 -0
  58. a_machine-0.1.0/examples/complexity.py +44 -0
  59. a_machine-0.1.0/examples/isomorphic.py +50 -0
  60. a_machine-0.1.0/examples/random_machine.py +25 -0
  61. a_machine-0.1.0/gen_docs.py +17 -0
  62. a_machine-0.1.0/pyproject.toml +75 -0
  63. a_machine-0.1.0/uv.lock +1119 -0
@@ -0,0 +1,14 @@
1
+ .venv/
2
+ __pycache__/
3
+ .vscode/
4
+ build/
5
+ *.egg-info/
6
+ .cache/
7
+ *.so
8
+ dist/
9
+ data/*/
10
+ !data/.gitkeep
11
+ *.pdf
12
+ .ninja*
13
+ .skbuild*
14
+ .cmake/
@@ -0,0 +1,15 @@
1
+ cmake_minimum_required(VERSION 3.15...4.0)
2
+ project(amachine LANGUAGES CXX)
3
+
4
+ find_package(Python COMPONENTS Interpreter Development.Module REQUIRED)
5
+ find_package(nanobind CONFIG REQUIRED)
6
+
7
+ nanobind_add_module(
8
+ _am_fast
9
+ NB_STATIC
10
+ amachine/am_fast/am_fast.cpp
11
+ )
12
+
13
+ install(TARGETS _am_fast
14
+ LIBRARY DESTINATION amachine/am_fast
15
+ )
@@ -0,0 +1,7 @@
1
+ Copyright 2026 Tyson A. Neuroth
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
4
+
5
+ The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
6
+
7
+ THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
@@ -0,0 +1,97 @@
1
+ Metadata-Version: 2.4
2
+ Name: a-machine
3
+ Version: 0.1.0
4
+ Summary: Construct epsilon-machines to generate symbol sequences with ground truth causal structure and information-theoretic complexity for studying neural network learning dynamics.
5
+ Author-Email: "Tyson A. Neuroth" <tyneuroth@gmail.com>
6
+ License-Expression: MIT
7
+ License-File: LICENCSE.txt
8
+ Classifier: Programming Language :: Python :: 3
9
+ Classifier: Operating System :: OS Independent
10
+ Requires-Python: >=3.12
11
+ Requires-Dist: hnswlib
12
+ Requires-Dist: matplotlib
13
+ Requires-Dist: networkx
14
+ Requires-Dist: numpy
15
+ Requires-Dist: orjson
16
+ Requires-Dist: pyarrow
17
+ Requires-Dist: pygraphviz
18
+ Requires-Dist: scikit-umfpack
19
+ Requires-Dist: scipy
20
+ Requires-Dist: graphviz>=0.21
21
+ Requires-Dist: automata-lib>=9.2.0
22
+ Requires-Dist: sympy>=1.14.0
23
+ Requires-Dist: pdoc>=16.0.0
24
+ Requires-Dist: nanobind>=2.12.0
25
+ Provides-Extra: cuda
26
+ Requires-Dist: cupy-cuda13x>=14.0.1; extra == "cuda"
27
+ Requires-Dist: cuvs-cu13==26.4.*; extra == "cuda"
28
+ Description-Content-Type: text/markdown
29
+
30
+ # A-Machine
31
+
32
+ A-Machine is a library for constructing epsilon-machines[^1] and other stochastic models for generating structured symbol sequences. It was created with the goal of generating data with ground truth causal structure and information-theoretic complexity for studying neural network learning dynamics and internal representations.
33
+
34
+ This is an early work in progress. Much more to come.
35
+
36
+ ## Installation
37
+
38
+ ```bash
39
+ # CPU only
40
+ pip install a-machine
41
+
42
+ # With GPU support (requires CUDA 13)
43
+ pip install "a-machine[cuda]" --extra-index-url https://pypi.nvidia.com
+ ```
44
+
45
+ ## Quick Start
46
+
47
+ ```python
48
+ from amachine.am_create import random_machine
49
+
50
+ # May have multiple recurrent subgraphs, terminal states, or transitory states
51
+ m = random_machine(
52
+ n_states=11,
53
+ symbols=[ '0', '1', '2' ],
54
+ connectedness=0.75,
55
+ randomness=0.35 )
56
+
57
+ # Collapse to the largest recurrent subgraph
58
+ m.collapse_to_largest_strongly_connected_subgraph()
59
+
60
+ # Minimize the machine -> epsilon-machine.
61
+ m.minimize()
62
+
63
+ # Entropy rate, statistical complexity, excess entropy, crypticity
64
+ print( f"h_mu : {m.h_mu()}" )
65
+ print( f"C_mu : {m.C_mu()}" )
66
+ print( f"Chi : {m.Chi()}" )
67
+
68
+ # Draw the graph
69
+ m.draw_graph( output_dir=".", show=True )
70
+ ```
71
+
72
+ ## Author
73
+
74
+ Tyson A. Neuroth
75
+
76
+ [tneuroth.gitlab.io](https://tneuroth.gitlab.io)
77
+
78
+ ## Citation
79
+
80
+ If you use this package in your research, please cite:
81
+
82
+ ```
83
+ @software{a-machine,
84
+ author = {Tyson A. Neuroth},
85
+ title = {A-Machine},
86
+ year = {2016},
87
+ url = {https://gitlab.com/tneuroth/a-machine}
88
+ }
89
+ ```
90
+
91
+ ## License
92
+
93
+ MIT
94
+
95
+ ## References
96
+
97
+ [^1]: Crutchfield, James P., and Karl Young. "Inferring statistical complexity." Physical review letters 63.2 (1989): 105.
@@ -0,0 +1,68 @@
1
+ # A-Machine
2
+
3
+ A-Machine is a library for constructing epsilon-machines[^1] and other stochastic models for generating structured symbol sequences. It was created with the goal of generating data with ground truth causal structure and information-theoretic complexity for studying neural network learning dynamics and internal representations.
4
+
5
+ This is an early work in progress. Much more to come.
6
+
7
+ ## Installation
8
+
9
+ ```bash
10
+ # CPU only
11
+ pip install a-machine
12
+
13
+ # With GPU support (requires CUDA 13)
14
+ pip install "a-machine[cuda]" --extra-index-url https://pypi.nvidia.com
+ ```
15
+
16
+ ## Quick Start
17
+
18
+ ```python
19
+ from amachine.am_create import random_machine
20
+
21
+ # May have multiple recurrent subgraphs, terminal states, or transitory states
22
+ m = random_machine(
23
+ n_states=11,
24
+ symbols=[ '0', '1', '2' ],
25
+ connectedness=0.75,
26
+ randomness=0.35 )
27
+
28
+ # Collapse to the largest recurrent subgraph
29
+ m.collapse_to_largest_strongly_connected_subgraph()
30
+
31
+ # Minimize the machine -> epsilon-machine.
32
+ m.minimize()
33
+
34
+ # Entropy rate, statistical complexity, excess entropy, crypticity
35
+ print( f"h_mu : {m.h_mu()}" )
36
+ print( f"C_mu : {m.C_mu()}" )
37
+ print( f"Chi : {m.Chi()}" )
38
+
39
+ # Draw the graph
40
+ m.draw_graph( output_dir=".", show=True )
41
+ ```
42
+
43
+ ## Author
44
+
45
+ Tyson A. Neuroth
46
+
47
+ [tneuroth.gitlab.io](https://tneuroth.gitlab.io)
48
+
49
+ ## Citation
50
+
51
+ If you use this package in your research, please cite:
52
+
53
+ ```
54
+ @software{a-machine,
55
+ author = {Tyson A. Neuroth},
56
+ title = {A-Machine},
57
+ year = {2016},
58
+ url = {https://gitlab.com/tneuroth/a-machine}
59
+ }
60
+ ```
61
+
62
+ ## License
63
+
64
+ MIT
65
+
66
+ ## References
67
+
68
+ [^1]: Crutchfield, James P., and Karl Young. "Inferring statistical complexity." Physical review letters 63.2 (1989): 105.
File without changes
@@ -0,0 +1,13 @@
1
+ from dataclasses import dataclass, field
2
+
3
+ @dataclass
4
+ class CausalState :
5
+ name : str
6
+ classes : set[str] = field(default_factory=set)
7
+ isomorphs : set[str] = field(default_factory=set)
8
+
9
+ def add_class( self, class_name ) :
10
+ self.classes.add( class_name )
11
+
12
+ def add_isomorph( self, state_name ) :
13
+ self.isomorphs.add( state_name )
@@ -0,0 +1,52 @@
1
+ from abc import ABC, abstractmethod
2
+ import warnings
3
+ from dataclasses import dataclass
4
+
5
+ class CohesionKernel(ABC):
6
+ """
7
+ Defines the substitution weight distributions over target symbols
8
+ given a source symbol.
9
+ """
10
+
11
+ def _normalize(self, source : str, dist: dict[str, float]) -> dict[str, float]:
12
+ wsum = sum(w for w in dist.values())
13
+ if wsum <= 1e-15:
14
+ warnings.warn( "Weight function sums to 0, implicitly mapping source with probability 1" )
15
+ res = dist.copy()
16
+ res[ source ] = 1.0
17
+ return res
18
+ return {s: w / wsum for s, w in dist.items()}
19
+
20
+ @abstractmethod
21
+ def cohesion_scores( self, source: str, symbols: set[str] ) -> dict[str, float]:
22
+ """
23
+ Maps a source symbol to a distribution of cohesion scores over other symbols.
24
+ """
25
+
26
+ @dataclass
27
+ class Uniform(CohesionKernel):
28
+ def cohesion_scores(self, source: str, symbols: set[str]) -> dict[str, float]:
29
+ return { s: 1.0 for s in symbols }
30
+
31
+ @dataclass
32
+ class Marginal(CohesionKernel):
33
+ """Per-symbol weight distribution."""
34
+ scores : dict[str, float]
35
+
36
+ def cohesion_scores(self, source: str, symbols: set[str]) -> dict[str, float]:
37
+ return {s: self.scores[s] for s in symbols }
38
+
39
+ @dataclass
40
+ class Symmetric(CohesionKernel):
41
+ """w(a->b) == w(b->a)"""
42
+ scores : dict[frozenset, float]
43
+ def cohesion_scores(self, source: str, symbols: set[str]) -> dict[str, float]:
44
+ return {s: self.scores[frozenset({source, s})] for s in symbols }
45
+
46
+ @dataclass
47
+ class Asymmetric(CohesionKernel):
48
+ """Directed pairwise scores."""
49
+ scores : dict[tuple[str,str], float]
50
+
51
+ def cohesion_scores(self, source: str, symbols: set[str]) -> dict[str, float]:
52
+ return {s: self.scores[(source, s)] for s in symbols }
@@ -0,0 +1,294 @@
1
+ from collections import defaultdict
2
+ import copy
3
+ import random
4
+
5
+ from .am_hmm import HMM
6
+ from .am_causal_state import CausalState
7
+ from .am_transition import Transition
8
+
9
+ from .am_random import uniform_dist, exp_uniform_blend
10
+
11
+ def star_join(
12
+ exit_symbol : str,
13
+ enter_symbols : list[str],
14
+ machines : list[HMM],
15
+ mode_residency_factor : float ) -> HMM :
16
+
17
+ machine = HMM()
18
+
19
+ isomorphic_groups = defaultdict(list)
20
+ for i, m in enumerate( machines ) :
21
+ if m.isoclass :
22
+ isomorphic_groups[ m.isoclass ].append( i )
23
+
24
+ # since we are merging multuple machines which might have name collision
25
+ # we need to rename the states to ensure uniqueness
26
+ def rename_state( base_name : str, g : int ) :
27
+ return f"{g}/{base_name}"
28
+
29
+ def get_gid( idx : int, isoclass : int | None ) :
30
+ return idx if isoclass is None else isoclass
31
+
32
+ machine.set_alphabet( [ exit_symbol ] )
33
+
34
+ for m in machines :
35
+ machine.extend_alphabet( alphabet=m.alphabet )
36
+
37
+ # create a connector state and connector state class
38
+
39
+ connector_state = CausalState(
40
+ name=f"/c",
41
+ classes=set({"connector"})
42
+ )
43
+
44
+ # initial states before adding each machines states
45
+ machine.set_states( [ connector_state ] )
46
+ machine.start_state = 0
47
+
48
+ # number of machines (groups of states)
49
+ n_groups = len( machines )
50
+
51
+ # make sure we have enough symbols (otherwise connector can't be unifilar)
52
+ if n_groups > len(enter_symbols) :
53
+ raise Exception(
54
+ f"Too few enter symbols given number of machines"
55
+ )
56
+
57
+ # for each given machine
58
+ for m_idx, m in enumerate( machines ) :
59
+
60
+ # default to the index of the machine in the list
61
+ m_gid = get_gid( m_idx, m.isoclass )
62
+
63
+ # give the states from this machine a class name
64
+ m_classes = {
65
+ f"m_{m_idx}",
66
+ f"isoclass_{m.isoclass}"
67
+ }
68
+
69
+ added_states = []
70
+
71
+ # create a state and extend our existing machine to include it
72
+ for s_idx, state in enumerate( m.states ) :
73
+
74
+ isomorphs=set()
75
+ if m.isoclass is not None and m.isoclass in isomorphic_groups :
76
+ for other_idx in isomorphic_groups[ m.isoclass ] :
77
+
78
+ if other_idx == m_idx :
79
+ continue
80
+
81
+ other_m = machines[ other_idx ]
82
+ isomorphs.add(
83
+ rename_state(
84
+ other_m.states[ s_idx ].name,
85
+ get_gid( other_idx, other_m.isoclass ) )
86
+ )
87
+
88
+ added_states.append(
89
+ CausalState(
90
+ name=rename_state(state.name, m_gid),
91
+ classes=( m_classes | state.classes ),
92
+ isomorphs=isomorphs
93
+ )
94
+ )
95
+
96
+ machine.extend_states( added_states )
97
+
98
+ added_transitions = []
99
+
100
+ # add all of the transitions from the machine
101
+ for tr in m.transitions :
102
+
103
+ # get the names of the states for the transition
104
+ origin_state_name = rename_state( m.states[ tr.origin_state_idx ].name, m_gid )
105
+ target_state_name = rename_state( m.states[ tr.target_state_idx ].name, m_gid )
106
+
107
+ # idx of the symbol remaped to this machines alphabet list
108
+ new_symbol_idx = machine.symbol_idx_map[ m.alphabet[ tr.symbol_idx ] ]
109
+
110
+ # create and add the new transition
111
+ added_transitions.append( Transition(
112
+ origin_state_idx=machine.state_idx_map[ origin_state_name ],
113
+ target_state_idx=machine.state_idx_map[ target_state_name ],
114
+ prob=tr.prob,
115
+ symbol_idx=new_symbol_idx
116
+ ) )
117
+
118
+ machine.extend_transitions( added_transitions )
119
+
120
+ # Add connector transitions, and adjust transition probabilities to sum to 1
121
+
122
+ # the name of the state that is the entry point to this group from the connector
123
+ m_entry_state_name = rename_state( m.states[ m.start_state ].name, m_gid )
124
+
125
+ # get the index of the entry state for this machine
126
+ m_entry_state_idx = machine.state_idx_map[ m_entry_state_name ]
127
+
128
+
129
+ # Get the within group transitions from m's entry state
130
+ # ( the probabilities will need to be adjusted )
131
+ transition_ids_from_m_entry = set()
132
+ for i, tr in enumerate( machine.transitions ) :
133
+ if tr.origin_state_idx == m_entry_state_idx :
134
+ transition_ids_from_m_entry.add( i )
135
+
136
+ n_from_entry = len( transition_ids_from_m_entry )
137
+
138
+ # Pr of staying in this group is distributed over the within group outgoing edges from the entry state
139
+ for i in transition_ids_from_m_entry :
140
+
141
+ machine.transitions[ i ] = Transition(
142
+ origin_state_idx=machine.transitions[ i ].origin_state_idx,
143
+ target_state_idx=machine.transitions[ i ].target_state_idx,
144
+ prob=mode_residency_factor / n_from_entry,
145
+ symbol_idx=machine.transitions[ i ].symbol_idx
146
+ )
147
+
148
+ # from m's entry state back to connector
149
+ escape_pr = 1.0 - mode_residency_factor
150
+
151
+ machine.extend_transitions( transitions=[
152
+ Transition(
153
+ origin_state_idx=m_entry_state_idx,
154
+ target_state_idx=machine.start_state,
155
+ prob=escape_pr,
156
+ symbol_idx=machine.symbol_idx_map[ exit_symbol ]
157
+ )
158
+ ] )
159
+
160
+ # from the connector to m's entry state
161
+ machine.extend_alphabet( alphabet=[ enter_symbols[ m_idx ] ] )
162
+
163
+ machine.extend_transitions( transitions=[
164
+ Transition(
165
+ origin_state_idx=machine.start_state,
166
+ target_state_idx=m_entry_state_idx,
167
+ prob=( 1.0 / n_groups ),
168
+ symbol_idx=machine.symbol_idx_map[ enter_symbols[ m_idx ] ]
169
+ )
170
+ ] )
171
+
172
+ return machine
173
+
174
+
175
+ def star(
176
+ exit_symbol : str,
177
+ enter_symbols : list[str],
178
+ normal_symbols : list[str],
179
+ n_modes : int = 7,
180
+ n_isomorphic : int = 2,
181
+ randomness : float = 0.3,
182
+ connectedness : float = 0.5,
183
+ residency_factor : float = 0.5,
184
+ n_normal_symbols : int = 4,
185
+ t_states_per_machine : int = 17 ) -> HMM :
186
+
187
+ if len( normal_symbols ) < n_normal_symbols*n_isomorphic :
188
+ raise ValueError( "Must have at least n_normal_symbols*n_isomorphic normal symbols" )
189
+
190
+ if len( enter_symbols ) < n_modes*n_isomorphic :
191
+ raise ValueError( "Must have at least n_modes*n_isomorphic enter symbols" )
192
+
193
+ alphabet = [ f"{normal_symbols[i]}" for i in range( 0, n_normal_symbols ) ]
194
+ iso_alphabet = [ f"{normal_symbols[i]}" for i in range( n_normal_symbols, n_normal_symbols*2 ) ]
195
+
196
+ random_machines = []
197
+
198
+ for i in range( n_modes ) :
199
+
200
+ m = random_machine(
201
+ n_states=t_states_per_machine,
202
+ symbols=alphabet,
203
+ randomness=randomness,
204
+ connectedness=connectedness )
205
+
206
+ m.collapse_to_largest_strongly_connected_subgraph()
207
+ m_iso = isomorphic_to( m, alphabet=iso_alphabet )
208
+
209
+ m.isoclass = f"{i}"
210
+ m_iso.isoclass = f"{i}"
211
+
212
+ for j, state in enumerate( m.states ) :
213
+
214
+ m.states[ j ].add_isomorph( m_iso.states[ j ].name )
215
+ m_iso.states[ j ].add_isomorph( m.states[ j ].name )
216
+
217
+ random_machines.append( m )
218
+ random_machines.append( m_iso )
219
+
220
+ mode_machine = star_join(
221
+ exit_symbol=exit_symbol,
222
+ enter_symbols=enter_symbols,
223
+ machines=random_machines,
224
+ mode_residency_factor=residency_factor
225
+ )
226
+
227
+ return mode_machine
228
+
229
+
230
+ def isomorphic_to(
231
+ m : HMM,
232
+ alphabet : list[str],
233
+ decorator : str = '@' ) -> HMM :
234
+
235
+ # make sure there are enough symbols
236
+ if len( alphabet ) < len( m.alphabet ) :
237
+ raise ValueError( "Not enough symbols in the alphabet" )
238
+
239
+ # take the as much of them as needed
240
+ alphabet_used = alphabet[ 0 : len( m.alphabet ) ]
241
+
242
+ states = [
243
+ CausalState(
244
+ name=f"{s.name}{decorator}",
245
+ classes=copy.deepcopy( s.classes )
246
+ )
247
+ for s in m.states
248
+ ]
249
+
250
+ return HMM(
251
+ states=states,
252
+ transitions=copy.deepcopy( m.transitions ),
253
+ start_state=0,
254
+ alphabet=alphabet_used
255
+ )
256
+
257
+ def random_machine(
258
+ n_states : int,
259
+ symbols : list[str],
260
+ connectedness,
261
+ randomness ) -> HMM :
262
+
263
+ states=[
264
+ CausalState( name=f"{i}" )
265
+ for i in range( n_states )
266
+ ]
267
+
268
+ n_symbols = len( symbols )
269
+ transitions = []
270
+
271
+ for state_idx, state in enumerate( states ) :
272
+
273
+ n_transitions = sum( random.random() < connectedness for _ in range( n_symbols - 1 ) ) + 1
274
+ transition_to = random.sample( range( n_states ), n_transitions )
275
+
276
+ transition_probabilities = exp_uniform_blend( n=n_transitions, alpha=randomness )
277
+ transition_symbols_indices = random.sample( range( n_symbols ), n_transitions )
278
+
279
+ for i, p in enumerate( transition_probabilities ) :
280
+ transitions.append(
281
+ Transition(
282
+ origin_state_idx=state_idx,
283
+ target_state_idx=transition_to[ i ],
284
+ prob=p,
285
+ symbol_idx=transition_symbols_indices[ i ]
286
+ )
287
+ )
288
+
289
+ return HMM(
290
+ states=states,
291
+ transitions=transitions,
292
+ start_state=0,
293
+ alphabet=symbols.copy()
294
+ )