PyPI - synth-ai - Versions diffs - 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl - Mend

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (256) hide show

synth_ai/__init__.py +18 -9
synth_ai/cli/__init__.py +10 -5
synth_ai/cli/balance.py +25 -32
synth_ai/cli/calc.py +2 -3
synth_ai/cli/demo.py +3 -5
synth_ai/cli/legacy_root_backup.py +58 -32
synth_ai/cli/man.py +22 -19
synth_ai/cli/recent.py +9 -8
synth_ai/cli/root.py +58 -13
synth_ai/cli/status.py +13 -6
synth_ai/cli/traces.py +45 -21
synth_ai/cli/watch.py +40 -37
synth_ai/config/base_url.py +47 -2
synth_ai/core/experiment.py +1 -2
synth_ai/environments/__init__.py +2 -6
synth_ai/environments/environment/artifacts/base.py +3 -1
synth_ai/environments/environment/db/sqlite.py +1 -1
synth_ai/environments/environment/registry.py +19 -20
synth_ai/environments/environment/resources/sqlite.py +2 -3
synth_ai/environments/environment/rewards/core.py +3 -2
synth_ai/environments/environment/tools/__init__.py +6 -4
synth_ai/environments/examples/crafter_classic/__init__.py +1 -1
synth_ai/environments/examples/crafter_classic/engine.py +13 -13
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +1 -0
synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +3 -2
synth_ai/environments/examples/crafter_classic/environment.py +16 -15
synth_ai/environments/examples/crafter_classic/taskset.py +2 -2
synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +2 -3
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +2 -1
synth_ai/environments/examples/crafter_custom/crafter/__init__.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/config.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/env.py +1 -5
synth_ai/environments/examples/crafter_custom/crafter/objects.py +1 -2
synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +1 -2
synth_ai/environments/examples/crafter_custom/dataset_builder.py +5 -5
synth_ai/environments/examples/crafter_custom/environment.py +13 -13
synth_ai/environments/examples/crafter_custom/run_dataset.py +5 -5
synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +2 -2
synth_ai/environments/examples/enron/art_helpers/local_email_db.py +5 -4
synth_ai/environments/examples/enron/art_helpers/types_enron.py +2 -1
synth_ai/environments/examples/enron/engine.py +18 -14
synth_ai/environments/examples/enron/environment.py +12 -11
synth_ai/environments/examples/enron/taskset.py +7 -7
synth_ai/environments/examples/minigrid/__init__.py +6 -6
synth_ai/environments/examples/minigrid/engine.py +6 -6
synth_ai/environments/examples/minigrid/environment.py +6 -6
synth_ai/environments/examples/minigrid/puzzle_loader.py +3 -2
synth_ai/environments/examples/minigrid/taskset.py +13 -13
synth_ai/environments/examples/nethack/achievements.py +1 -1
synth_ai/environments/examples/nethack/engine.py +8 -7
synth_ai/environments/examples/nethack/environment.py +10 -9
synth_ai/environments/examples/nethack/helpers/__init__.py +8 -9
synth_ai/environments/examples/nethack/helpers/action_mapping.py +1 -1
synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +2 -1
synth_ai/environments/examples/nethack/helpers/observation_utils.py +1 -1
synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +3 -4
synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +6 -5
synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +5 -5
synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +7 -6
synth_ai/environments/examples/nethack/taskset.py +5 -5
synth_ai/environments/examples/red/engine.py +9 -8
synth_ai/environments/examples/red/engine_helpers/reward_components.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +7 -7
synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +3 -2
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +2 -1
synth_ai/environments/examples/red/environment.py +18 -15
synth_ai/environments/examples/red/taskset.py +5 -3
synth_ai/environments/examples/sokoban/engine.py +16 -13
synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +7 -5
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +1 -1
synth_ai/environments/examples/sokoban/environment.py +15 -14
synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +5 -3
synth_ai/environments/examples/sokoban/puzzle_loader.py +3 -2
synth_ai/environments/examples/sokoban/taskset.py +13 -10
synth_ai/environments/examples/tictactoe/engine.py +6 -6
synth_ai/environments/examples/tictactoe/environment.py +8 -7
synth_ai/environments/examples/tictactoe/taskset.py +6 -5
synth_ai/environments/examples/verilog/engine.py +4 -3
synth_ai/environments/examples/verilog/environment.py +11 -10
synth_ai/environments/examples/verilog/taskset.py +14 -12
synth_ai/environments/examples/wordle/__init__.py +5 -5
synth_ai/environments/examples/wordle/engine.py +32 -25
synth_ai/environments/examples/wordle/environment.py +21 -16
synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +6 -6
synth_ai/environments/examples/wordle/taskset.py +20 -12
synth_ai/environments/reproducibility/core.py +1 -1
synth_ai/environments/reproducibility/tree.py +21 -21
synth_ai/environments/service/app.py +3 -2
synth_ai/environments/service/core_routes.py +104 -110
synth_ai/environments/service/external_registry.py +1 -2
synth_ai/environments/service/registry.py +1 -1
synth_ai/environments/stateful/core.py +1 -2
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/api.py +4 -4
synth_ai/environments/tasks/core.py +14 -12
synth_ai/environments/tasks/filters.py +6 -4
synth_ai/environments/tasks/utils.py +13 -11
synth_ai/evals/base.py +2 -3
synth_ai/experimental/synth_oss.py +4 -4
synth_ai/http.py +102 -0
synth_ai/inference/__init__.py +7 -0
synth_ai/inference/client.py +20 -0
synth_ai/jobs/client.py +246 -0
synth_ai/learning/__init__.py +24 -0
synth_ai/learning/client.py +149 -0
synth_ai/learning/config.py +43 -0
synth_ai/learning/constants.py +29 -0
synth_ai/learning/ft_client.py +59 -0
synth_ai/learning/gateway.py +1 -3
synth_ai/learning/health.py +43 -0
synth_ai/learning/jobs.py +205 -0
synth_ai/learning/prompts/banking77_injection_eval.py +15 -10
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +26 -14
synth_ai/learning/prompts/mipro.py +61 -52
synth_ai/learning/prompts/random_search.py +42 -43
synth_ai/learning/prompts/run_mipro_banking77.py +32 -20
synth_ai/learning/prompts/run_random_search_banking77.py +71 -52
synth_ai/learning/rl_client.py +256 -0
synth_ai/learning/sse.py +58 -0
synth_ai/learning/validators.py +48 -0
synth_ai/lm/__init__.py +5 -5
synth_ai/lm/caching/ephemeral.py +9 -9
synth_ai/lm/caching/handler.py +20 -20
synth_ai/lm/caching/persistent.py +10 -10
synth_ai/lm/config.py +3 -3
synth_ai/lm/constants.py +7 -7
synth_ai/lm/core/all.py +17 -3
synth_ai/lm/core/exceptions.py +0 -2
synth_ai/lm/core/main.py +26 -41
synth_ai/lm/core/main_v3.py +33 -10
synth_ai/lm/core/synth_models.py +48 -0
synth_ai/lm/core/vendor_clients.py +26 -22
synth_ai/lm/injection.py +7 -8
synth_ai/lm/overrides.py +21 -19
synth_ai/lm/provider_support/__init__.py +1 -1
synth_ai/lm/provider_support/anthropic.py +15 -15
synth_ai/lm/provider_support/openai.py +23 -21
synth_ai/lm/structured_outputs/handler.py +34 -32
synth_ai/lm/structured_outputs/inject.py +24 -27
synth_ai/lm/structured_outputs/rehabilitate.py +19 -15
synth_ai/lm/tools/base.py +17 -16
synth_ai/lm/unified_interface.py +17 -18
synth_ai/lm/vendors/base.py +20 -18
synth_ai/lm/vendors/core/anthropic_api.py +36 -27
synth_ai/lm/vendors/core/gemini_api.py +31 -36
synth_ai/lm/vendors/core/mistral_api.py +19 -19
synth_ai/lm/vendors/core/openai_api.py +42 -13
synth_ai/lm/vendors/openai_standard.py +158 -101
synth_ai/lm/vendors/openai_standard_responses.py +74 -61
synth_ai/lm/vendors/retries.py +9 -1
synth_ai/lm/vendors/supported/custom_endpoint.py +38 -28
synth_ai/lm/vendors/supported/deepseek.py +10 -10
synth_ai/lm/vendors/supported/grok.py +8 -8
synth_ai/lm/vendors/supported/ollama.py +2 -1
synth_ai/lm/vendors/supported/openrouter.py +11 -9
synth_ai/lm/vendors/synth_client.py +425 -75
synth_ai/lm/warmup.py +8 -7
synth_ai/rl/__init__.py +30 -0
synth_ai/rl/contracts.py +32 -0
synth_ai/rl/env_keys.py +137 -0
synth_ai/rl/secrets.py +19 -0
synth_ai/scripts/verify_rewards.py +100 -0
synth_ai/task/__init__.py +10 -0
synth_ai/task/contracts.py +120 -0
synth_ai/task/health.py +28 -0
synth_ai/task/validators.py +12 -0
synth_ai/tracing/__init__.py +22 -10
synth_ai/tracing_v1/__init__.py +22 -20
synth_ai/tracing_v3/__init__.py +7 -7
synth_ai/tracing_v3/abstractions.py +56 -52
synth_ai/tracing_v3/config.py +4 -2
synth_ai/tracing_v3/db_config.py +6 -8
synth_ai/tracing_v3/decorators.py +29 -30
synth_ai/tracing_v3/examples/basic_usage.py +12 -12
synth_ai/tracing_v3/hooks.py +24 -22
synth_ai/tracing_v3/llm_call_record_helpers.py +85 -98
synth_ai/tracing_v3/lm_call_record_abstractions.py +2 -4
synth_ai/tracing_v3/migration_helper.py +3 -5
synth_ai/tracing_v3/replica_sync.py +30 -32
synth_ai/tracing_v3/session_tracer.py +158 -31
synth_ai/tracing_v3/storage/__init__.py +1 -1
synth_ai/tracing_v3/storage/base.py +8 -7
synth_ai/tracing_v3/storage/config.py +4 -4
synth_ai/tracing_v3/storage/factory.py +4 -4
synth_ai/tracing_v3/storage/utils.py +9 -9
synth_ai/tracing_v3/turso/__init__.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +9 -9
synth_ai/tracing_v3/turso/manager.py +278 -48
synth_ai/tracing_v3/turso/models.py +77 -19
synth_ai/tracing_v3/utils.py +5 -5
synth_ai/v0/tracing/abstractions.py +28 -28
synth_ai/v0/tracing/base_client.py +9 -9
synth_ai/v0/tracing/client_manager.py +7 -7
synth_ai/v0/tracing/config.py +7 -7
synth_ai/v0/tracing/context.py +6 -6
synth_ai/v0/tracing/decorators.py +6 -5
synth_ai/v0/tracing/events/manage.py +1 -1
synth_ai/v0/tracing/events/store.py +5 -4
synth_ai/v0/tracing/immediate_client.py +4 -5
synth_ai/v0/tracing/local.py +3 -3
synth_ai/v0/tracing/log_client_base.py +4 -5
synth_ai/v0/tracing/retry_queue.py +5 -6
synth_ai/v0/tracing/trackers.py +25 -25
synth_ai/v0/tracing/upload.py +6 -0
synth_ai/v0/tracing_v1/__init__.py +1 -1
synth_ai/v0/tracing_v1/abstractions.py +28 -28
synth_ai/v0/tracing_v1/base_client.py +9 -9
synth_ai/v0/tracing_v1/client_manager.py +7 -7
synth_ai/v0/tracing_v1/config.py +7 -7
synth_ai/v0/tracing_v1/context.py +6 -6
synth_ai/v0/tracing_v1/decorators.py +7 -6
synth_ai/v0/tracing_v1/events/manage.py +1 -1
synth_ai/v0/tracing_v1/events/store.py +5 -4
synth_ai/v0/tracing_v1/immediate_client.py +4 -5
synth_ai/v0/tracing_v1/local.py +3 -3
synth_ai/v0/tracing_v1/log_client_base.py +4 -5
synth_ai/v0/tracing_v1/retry_queue.py +5 -6
synth_ai/v0/tracing_v1/trackers.py +25 -25
synth_ai/v0/tracing_v1/upload.py +25 -24
synth_ai/zyk/__init__.py +1 -0
synth_ai-0.2.4.dev8.dist-info/METADATA +635 -0
synth_ai-0.2.4.dev8.dist-info/RECORD +317 -0
synth_ai/tui/__init__.py +0 -1
synth_ai/tui/__main__.py +0 -13
synth_ai/tui/cli/__init__.py +0 -1
synth_ai/tui/cli/query_experiments.py +0 -165
synth_ai/tui/cli/query_experiments_v3.py +0 -165
synth_ai/tui/dashboard.py +0 -329
synth_ai-0.2.4.dev6.dist-info/METADATA +0 -203
synth_ai-0.2.4.dev6.dist-info/RECORD +0 -299
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/WHEEL +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/top_level.txt +0 -0

synth_ai/learning/prompts/mipro.py CHANGED Viewed

@@ -20,9 +20,9 @@ Notes
 from __future__ import annotations
 import random
+from collections.abc import Callable, Sequence
 from dataclasses import dataclass, replace
-from typing import Any, Callable, Dict, Iterable, List, Optional, Protocol, Sequence, Tuple
+from typing import Any, Protocol
 # ---------------------------
 # Program adapter and protocols
@@ -36,16 +36,16 @@ class PredictProgram(Protocol):
     by wrapping it with `ProgramAdapter` below.
     """
-    def deepcopy(self) -> "PredictProgram": ...
+    def deepcopy(self) -> PredictProgram: ...
-    def run(self, x: Any, *, model: Optional[Any] = None) -> Any: ...
+    def run(self, x: Any, *, model: Any | None = None) -> Any: ...
-    def with_instructions(self, instructions: Dict[str, str]) -> "PredictProgram": ...
+    def with_instructions(self, instructions: dict[str, str]) -> PredictProgram: ...
-    def with_demos(self, demos: List[Tuple[Any, Any]]) -> "PredictProgram": ...
+    def with_demos(self, demos: list[tuple[Any, Any]]) -> PredictProgram: ...
     @property
-    def predictors(self) -> List[str]: ...
+    def predictors(self) -> list[str]: ...
 @dataclass
@@ -59,28 +59,28 @@ class ProgramAdapter:
     - set_demos: Callable to update demos (global or per predictor)
     """
-    run_fn: Callable[[Any, Optional[Any]], Any]
-    state: Dict[str, Any]
-    _predictors: List[str]
-    set_instructions: Callable[[Dict[str, str], Dict[str, Any]], Dict[str, Any]]
-    set_demos: Callable[[List[Tuple[Any, Any]], Dict[str, Any]], Dict[str, Any]]
+    run_fn: Callable[[Any, Any | None], Any]
+    state: dict[str, Any]
+    _predictors: list[str]
+    set_instructions: Callable[[dict[str, str], dict[str, Any]], dict[str, Any]]
+    set_demos: Callable[[list[tuple[Any, Any]], dict[str, Any]], dict[str, Any]]
-    def deepcopy(self) -> "ProgramAdapter":
+    def deepcopy(self) -> ProgramAdapter:
         return replace(self, state={**self.state})
-    def run(self, x: Any, *, model: Optional[Any] = None) -> Any:
+    def run(self, x: Any, *, model: Any | None = None) -> Any:
         return self.run_fn(x, model)
-    def with_instructions(self, instructions: Dict[str, str]) -> "ProgramAdapter":
+    def with_instructions(self, instructions: dict[str, str]) -> ProgramAdapter:
         new_state = self.set_instructions(instructions, {**self.state})
         return replace(self, state=new_state)
-    def with_demos(self, demos: List[Tuple[Any, Any]]) -> "ProgramAdapter":
+    def with_demos(self, demos: list[tuple[Any, Any]]) -> ProgramAdapter:
         new_state = self.set_demos(demos, {**self.state})
         return replace(self, state=new_state)
     @property
-    def predictors(self) -> List[str]:
+    def predictors(self) -> list[str]:
         return list(self._predictors)
@@ -89,9 +89,11 @@ class ProgramAdapter:
 # ---------------------------
-def summarize_dataset(trainset: Sequence[Tuple[Any, Any]], max_items: int = 50) -> str:
+def summarize_dataset(trainset: Sequence[tuple[Any, Any]], max_items: int = 50) -> str:
     n = len(trainset)
-    ex = ", ".join(repr(trainset[i][0])[:40] for i in range(0, min(max_items, n), max(1, n // max_items or 1)))
+    ex = ", ".join(
+        repr(trainset[i][0])[:40] for i in range(0, min(max_items, n), max(1, n // max_items or 1))
+    )
     return f"Dataset size: {n}. Example inputs: {ex}"
@@ -109,7 +111,7 @@ def random_tip(rng: random.Random) -> str:
     return rng.choice(tips)
-def choose(items: Sequence[Any], rng: Optional[random.Random] = None) -> Any:
+def choose(items: Sequence[Any], rng: random.Random | None = None) -> Any:
     r = rng or random
     return r.choice(items)
@@ -122,10 +124,12 @@ def choose(items: Sequence[Any], rng: Optional[random.Random] = None) -> Any:
 @dataclass
 class EvalResult:
     score: float
-    subscores: List[float]
+    subscores: list[float]
-def evaluate_program(program: PredictProgram, dataset: Sequence[Tuple[Any, Any]], metric: Callable[[Any, Any], float]) -> EvalResult:
+def evaluate_program(
+    program: PredictProgram, dataset: Sequence[tuple[Any, Any]], metric: Callable[[Any, Any], float]
+) -> EvalResult:
     subs = []
     for x, y in dataset:
         yhat = program.run(x)
@@ -140,8 +144,8 @@ def evaluate_program(program: PredictProgram, dataset: Sequence[Tuple[Any, Any]]
 def mipro_v2_compile(
     student: PredictProgram,
-    trainset: Sequence[Tuple[Any, Any]],
-    valset: Sequence[Tuple[Any, Any]],
+    trainset: Sequence[tuple[Any, Any]],
+    valset: Sequence[tuple[Any, Any]],
     metric: Callable[[Any, Any], float],
     *,
     prompt_model: Any,
@@ -159,7 +163,7 @@ def mipro_v2_compile(
     data_aware: bool = True,
     tip_aware: bool = True,
     fewshot_aware: bool = True,
-) -> Tuple[PredictProgram, List[Dict[str, Any]]]:
+) -> tuple[PredictProgram, list[dict[str, Any]]]:
     """MIPROv2-style optimizer.
     Arguments mirror the DSPy pseudocode but remain provider-agnostic. The
@@ -171,9 +175,9 @@ def mipro_v2_compile(
     program = student.deepcopy()
     # Step 1: bootstrap few-shot example candidates
-    demo_candidates: List[Dict[str, Any]] = []
+    demo_candidates: list[dict[str, Any]] = []
     for _ in range(num_candidates):
-        boot: List[Tuple[Any, Any]] = []
+        boot: list[tuple[Any, Any]] = []
         # collect bootstrapped, self-consistent demos
         while len(boot) < max_bootstrapped_demos:
             x, y = rng.choice(trainset)
@@ -184,9 +188,9 @@ def mipro_v2_compile(
         demo_candidates.append({"boot": boot, "labeled": labeled})
     # Step 2: propose instruction candidates per predictor
-    instr_candidates: Dict[str, List[str]] = {}
-    for pred in (program.predictors or ["predictor"]):
-        ctx: Dict[str, Any] = {}
+    instr_candidates: dict[str, list[str]] = {}
+    for pred in program.predictors or ["predictor"]:
+        ctx: dict[str, Any] = {}
         if data_aware:
             ctx["dataset_summary"] = summarize_dataset(trainset)
         if program_aware:
@@ -199,12 +203,12 @@ def mipro_v2_compile(
         instr_candidates[pred] = list(cand)
     # Step 3: Bayesian-optimization-like search (random proposer placeholder)
-    history: List[Tuple[Dict[str, Any], float]] = []
-    records: List[Dict[str, Any]] = []
+    history: list[tuple[dict[str, Any], float]] = []
+    records: list[dict[str, Any]] = []
     best_score = -1.0
-    best_cfg: Optional[Dict[str, Any]] = None
+    best_cfg: dict[str, Any] | None = None
-    def propose(history_: List[Tuple[Dict[str, Any], float]]) -> Dict[str, Any]:
+    def propose(history_: list[tuple[dict[str, Any], float]]) -> dict[str, Any]:
         # Placeholder: randomly sample from the cartesian product
         instructions = {pred: choose(instr_candidates[pred], rng) for pred in instr_candidates}
         demos = choose(demo_candidates, rng) if demo_candidates else None
@@ -227,15 +231,17 @@ def mipro_v2_compile(
         batch_res = evaluate_program(program_t, batch, metric)
         s_t = batch_res.score
         history.append((theta, s_t))
-        records.append({
-            "trial": t,
-            "evaluation": "batch" if minibatch else "full",
-            "score": s_t,
-            "intervention": {
-                "instructions": theta.get("instructions"),
-                "demo_set": theta.get("demo_set"),
-            },
-        })
+        records.append(
+            {
+                "trial": t,
+                "evaluation": "batch" if minibatch else "full",
+                "score": s_t,
+                "intervention": {
+                    "instructions": theta.get("instructions"),
+                    "demo_set": theta.get("demo_set"),
+                },
+            }
+        )
         if (not minibatch) or (t % max(1, minibatch_full_eval_steps) == 0):
             full_res = evaluate_program(program_t, valset, metric)
@@ -243,15 +249,17 @@ def mipro_v2_compile(
             if s_full > best_score:
                 best_score = s_full
                 best_cfg = theta
-            records.append({
-                "trial": t,
-                "evaluation": "full",
-                "score": s_full,
-                "intervention": {
-                    "instructions": theta.get("instructions"),
-                    "demo_set": theta.get("demo_set"),
-                },
-            })
+            records.append(
+                {
+                    "trial": t,
+                    "evaluation": "full",
+                    "score": s_full,
+                    "intervention": {
+                        "instructions": theta.get("instructions"),
+                        "demo_set": theta.get("demo_set"),
+                    },
+                }
+            )
     if best_cfg is None:
         return program, records
@@ -275,6 +283,7 @@ __all__ = [
 class ExampleTwoStepDag:
     pass
 """
 A -> B
 """

synth_ai/learning/prompts/random_search.py CHANGED Viewed

@@ -8,10 +8,11 @@ metric, and this module will explore baselines and bootstrapped few-shot variant
 from __future__ import annotations
+import contextlib
 import random
+from collections.abc import Callable, Sequence
 from dataclasses import dataclass
-from typing import Any, Callable, Dict, List, Optional, Sequence, Tuple
+from typing import Any
 # ---------------------------
 # Protocol-like expectations (duck-typed)
@@ -25,7 +26,7 @@ class _ProgramLike:
     def deepcopy(self):  # deep copy
         return self
-    def with_demos(self, demos: List[Tuple[Any, Any]]):
+    def with_demos(self, demos: list[tuple[Any, Any]]):
         return self
     def run(self, x: Any) -> Any:
@@ -40,10 +41,12 @@ class _ProgramLike:
 @dataclass
 class EvalResult:
     score: float
-    subscores: List[float]
+    subscores: list[float]
-def evaluate(program: _ProgramLike, dataset: Sequence[Tuple[Any, Any]], metric: Callable[[Any, Any], float]) -> EvalResult:
+def evaluate(
+    program: _ProgramLike, dataset: Sequence[tuple[Any, Any]], metric: Callable[[Any, Any], float]
+) -> EvalResult:
     subs = []
     for x, y in dataset:
         subs.append(metric(program.run(x), y))
@@ -54,7 +57,9 @@ class LabeledFewShot:
     def __init__(self, k: int):
         self.k = k
-    def compile(self, student: _ProgramLike, trainset: Sequence[Tuple[Any, Any]], sample: bool = True) -> _ProgramLike:
+    def compile(
+        self, student: _ProgramLike, trainset: Sequence[tuple[Any, Any]], sample: bool = True
+    ) -> _ProgramLike:
         p = getattr(student, "deepcopy", student.reset_copy)()
         demos = list(trainset)
         if sample:
@@ -68,10 +73,10 @@ class BootstrapFewShot:
         self,
         *,
         metric: Callable[[Any, Any], float],
-        metric_threshold: Optional[float] = None,
+        metric_threshold: float | None = None,
         max_bootstrapped_demos: int = 8,
         max_labeled_demos: int = 0,
-        teacher_settings: Optional[Dict[str, Any]] = None,
+        teacher_settings: dict[str, Any] | None = None,
         max_rounds: int = 1,
     ):
         self.metric = metric
@@ -84,18 +89,18 @@ class BootstrapFewShot:
     def compile(
         self,
         student: _ProgramLike,
-        teacher: Optional[_ProgramLike],
-        trainset: Sequence[Tuple[Any, Any]],
+        teacher: _ProgramLike | None,
+        trainset: Sequence[tuple[Any, Any]],
     ) -> _ProgramLike:
         p = getattr(student, "deepcopy", student.reset_copy)()
         rng = random.Random()
         # If bootstrapped demos disabled, return labeled-only few-shot quickly
         if self.max_bootstrapped_demos <= 0:
-            demos: List[Tuple[Any, Any]] = []
+            demos: list[tuple[Any, Any]] = []
             if self.max_labeled_demos > 0:
                 demos += rng.sample(list(trainset), k=min(self.max_labeled_demos, len(trainset)))
             return p.with_demos(demos)
-        boot: List[Tuple[Any, Any]] = []
+        boot: list[tuple[Any, Any]] = []
         # Bootstrap demos by self consistency
         for _ in range(self.max_rounds):
             rng.shuffle(trainset := list(trainset))
@@ -127,33 +132,29 @@ class BootstrapFewShot:
 @dataclass
 class Candidate:
     score: float
-    subscores: List[float]
+    subscores: list[float]
     seed: int
     program: _ProgramLike
 def random_search_compile(
     student: _ProgramLike,
-    trainset: Sequence[Tuple[Any, Any]],
-    valset: Sequence[Tuple[Any, Any]],
+    trainset: Sequence[tuple[Any, Any]],
+    valset: Sequence[tuple[Any, Any]],
     metric: Callable[[Any, Any], float],
     *,
     max_bootstrapped_demos: int = 8,
     max_labeled_demos: int = 4,
     max_rounds: int = 2,
     num_candidate_programs: int = 16,
-    stop_at_score: Optional[float] = None,
-    evaluate_fn: Optional[Callable[[
-        _ProgramLike,
-        Sequence[Tuple[Any, Any]],
-        Callable[[Any, Any], float]
-    ], EvalResult]] = None,
-    on_candidate_evaluated: Optional[Callable[[int, float, EvalResult, Dict[str, Any]], None]] = None,
-) -> Tuple[_ProgramLike, List[Dict[str, Any]]]:
-    best_program: Optional[_ProgramLike] = None
+    stop_at_score: float | None = None,
+    evaluate_fn: Callable[[_ProgramLike, Sequence[tuple[Any, Any]], Callable[[Any, Any], float]], EvalResult] | None = None,
+    on_candidate_evaluated: Callable[[int, float, EvalResult, dict[str, Any]], None] | None = None,
+) -> tuple[_ProgramLike, list[dict[str, Any]]]:
+    best_program: _ProgramLike | None = None
     best_score = float("-inf")
-    candidates: List[Candidate] = []
-    records: List[Dict[str, Any]] = []
+    candidates: list[Candidate] = []
+    records: list[dict[str, Any]] = []
     seeds = list(range(num_candidate_programs))
     seeds = [-3, -2, -1] + seeds  # zero-shot, labeled few-shot, bootstrapped few-shot
@@ -174,7 +175,9 @@ def random_search_compile(
             if max_bootstrapped_demos <= 0:
                 size = 0
             else:
-                size = max_bootstrapped_demos if seed == -1 else rng.randint(1, max_bootstrapped_demos)
+                size = (
+                    max_bootstrapped_demos if seed == -1 else rng.randint(1, max_bootstrapped_demos)
+                )
             program = BootstrapFewShot(
                 metric=metric,
                 metric_threshold=None,
@@ -184,14 +187,18 @@ def random_search_compile(
                 max_rounds=max_rounds,
             ).compile(student, teacher=None, trainset=train_copy)
-        res = (evaluate_fn(program, valset, metric) if evaluate_fn else evaluate(program, valset, metric))
+        res = (
+            evaluate_fn(program, valset, metric)
+            if evaluate_fn
+            else evaluate(program, valset, metric)
+        )
         cand = Candidate(score=res.score, subscores=res.subscores, seed=seed, program=program)
         candidates.append(cand)
         # Record an intervention summary for reproducibility
-        intervention: Dict[str, Any] = {"seed": seed}
+        intervention: dict[str, Any] = {"seed": seed}
         if hasattr(program, "demos"):
             try:
-                intervention["demos"] = getattr(program, "demos")  # type: ignore
+                intervention["demos"] = program.demos  # type: ignore
             except Exception:
                 intervention["demos"] = None
         # Type of candidate
@@ -203,12 +210,6 @@ def random_search_compile(
             intervention["label"] = f"labeled-{max_labeled_demos}"
         else:
             intervention["kind"] = "bootstrapped_few_shot"
-            bs = 0
-            try:
-                # try to infer from program demos length if present
-                bs = len(intervention.get("demos") or [])
-            except Exception:
-                bs = 0
             intervention["label"] = f"boot-b{max_bootstrapped_demos}-l{max_labeled_demos}"
         record_obj = {
             "score": cand.score,
@@ -224,18 +225,16 @@ def random_search_compile(
             break
         if on_candidate_evaluated is not None:
-            try:
+            with contextlib.suppress(Exception):
                 on_candidate_evaluated(idx + 1, res.score, res, intervention)
-            except Exception:
-                pass
     # Attach candidates for inspection
     if hasattr(best_program, "candidate_programs"):
         # If user object supports attribute assignment
-        try:
-            best_program.candidate_programs = sorted(candidates, key=lambda c: c.score, reverse=True)  # type: ignore[attr-defined]
-        except Exception:
-            pass
+        with contextlib.suppress(Exception):
+            best_program.candidate_programs = sorted(
+                candidates, key=lambda c: c.score, reverse=True
+            )  # type: ignore[attr-defined]
     return (best_program or getattr(student, "deepcopy", student)(), records)

synth_ai/learning/prompts/run_mipro_banking77.py CHANGED Viewed

@@ -12,39 +12,41 @@ Run:
 from __future__ import annotations
 import asyncio
+import json
 import os
 import random
-from dataclasses import dataclass, replace
-from typing import Any, Dict, List, Sequence, Tuple
+import time
+from collections.abc import Sequence
+from pathlib import Path
+from typing import Any
-from dotenv import load_dotenv
 from datasets import load_dataset
+from dotenv import load_dotenv
+from synth_ai.learning.prompts.mipro import ProgramAdapter, evaluate_program, mipro_v2_compile
 from synth_ai.lm.core.main_v3 import LM, build_messages
-import json
-import time
-from pathlib import Path
-from synth_ai.learning.prompts.mipro import ProgramAdapter, mipro_v2_compile, evaluate_program
-def choose_label(pred: str, label_names: List[str]) -> str:
+def choose_label(pred: str, label_names: list[str]) -> str:
     norm = (pred or "").strip().lower()
     d = {ln.lower(): ln for ln in label_names}
     if norm in d:
         return d[norm]
     def score(cand: str) -> int:
         c = cand.lower()
         return sum(1 for w in c.split() if w in norm)
     return max(label_names, key=score)
-def accuracy(pred: str, gold: str, labels: List[str]) -> float:
+def accuracy(pred: str, gold: str, labels: list[str]) -> float:
     return 1.0 if choose_label(pred, labels) == gold else 0.0
 class NaivePromptModel:
     """Toy prompt model that returns simple instruction variants."""
-    def generate_instructions(self, ctx: Dict[str, Any], k: int = 8) -> List[str]:
+    def generate_instructions(self, ctx: dict[str, Any], k: int = 8) -> list[str]:
         base = "Classify the Banking77 intent and return exactly one label."
         variants = [
             base,
@@ -60,28 +62,33 @@ class NaivePromptModel:
         return variants[:k]
-def build_run_fn(lm: LM, label_names: List[str]):
+def build_run_fn(lm: LM, label_names: list[str]):
     def run_fn(x: str, _model: Any | None = None) -> str:
         # Use instructions and demos from adapter state (set by set_instructions/set_demos)
         # The adapter passes state via closure; we rebuild messages here
-        instructions = state_ref.get("instructions", {}).get("main", "You are an intent classifier for Banking77.")
+        instructions = state_ref.get("instructions", {}).get(
+            "main", "You are an intent classifier for Banking77."
+        )
         examples = "\n".join(f"Input: {a}\nLabel: {b}" for a, b in state_ref.get("demos", []))
         sys = instructions
         user = (f"Examples:\n{examples}\n\n" if examples else "") + f"Message: {x}\nLabel:"
         messages = build_messages(sys, user, images_bytes=None, model_name=lm.model)
         async def _call():
             resp = await lm.respond_async(messages=messages)
             return (resp.raw_response or "").strip()
         return asyncio.run(_call())
     return run_fn
-def set_instructions(new_instr: Dict[str, str], state: Dict[str, Any]) -> Dict[str, Any]:
+def set_instructions(new_instr: dict[str, str], state: dict[str, Any]) -> dict[str, Any]:
     state["instructions"] = {**state.get("instructions", {}), **new_instr}
     return state
-def set_demos(demos: List[Tuple[str, str]], state: Dict[str, Any]) -> Dict[str, Any]:
+def set_demos(demos: list[tuple[str, str]], state: dict[str, Any]) -> dict[str, Any]:
     state["demos"] = list(demos)
     return state
@@ -96,15 +103,18 @@ def main():
     print("Loading Banking77 dataset (train/dev split of test for demo)...")
     ds = load_dataset("banking77")
-    label_names: List[str] = ds["test"].features["label"].names  # type: ignore
+    label_names: list[str] = ds["test"].features["label"].names  # type: ignore
     all_items = [(r["text"], label_names[int(r["label"])]) for r in ds["test"]]
     random.shuffle(all_items)
-    trainset: Sequence[Tuple[str, str]] = all_items[:80]
-    valset: Sequence[Tuple[str, str]] = all_items[80:160]
+    trainset: Sequence[tuple[str, str]] = all_items[:80]
+    valset: Sequence[tuple[str, str]] = all_items[80:160]
     global state_ref
-    state_ref = {"instructions": {"main": "You are an intent classifier for Banking77."}, "demos": []}
+    state_ref = {
+        "instructions": {"main": "You are an intent classifier for Banking77."},
+        "demos": [],
+    }
     adapter = ProgramAdapter(
         run_fn=build_run_fn(lm, label_names),
         state=state_ref,
@@ -138,7 +148,9 @@ def main():
     )
     res = evaluate_program(best, valset, metric)
-    print(f"Best program accuracy on val: {res.score:.2%} ({sum(res.subscores)}/{len(res.subscores)})")
+    print(
+        f"Best program accuracy on val: {res.score:.2%} ({sum(res.subscores)}/{len(res.subscores)})"
+    )
     out = {
         "context": {

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl