PyPI - synth-ai - Versions diffs - 0.2.4.dev8__py3-none-any.whl → 0.2.4.dev9__py3-none-any.whl - Mend - Supply Chain Defender

synth-ai 0.2.4.dev8__py3-none-any.whl → 0.2.4.dev9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (111) hide show

synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/crafter_synth_config.toml ADDED Viewed

@@ -0,0 +1,56 @@
+# Crafter Synth Agent Configuration
+[eval]
+# Evaluation run settings for the Crafter Synth agent.
+# Model name (required) - Synth/Modal models.
+# Only one model_name line may be active at a time (TOML rejects a key
+# defined twice in the same table); alternatives are kept commented out.
+# model_name = "Qwen/Qwen2.5-0.5B-Instruct"
+# model_name = "Qwen/Qwen2.5-7B-Instruct"
+model_name = "Qwen/Qwen2.5-14B-Instruct"
+# Number of episodes to run
+episodes = 5
+# Maximum steps per episode
+max_steps = 50
+# Difficulty; listed values: "easy", "normal", "hard"
+difficulty = "easy"
+# Random seed for reproducibility
+seed = 42
+[service]
+# Base URL of the Crafter service (this value points at a local instance on port 8901)
+base_url = "http://localhost:8901"
+# Request timeout, in seconds
+timeout = 30.0
+[output]
+# Save trace files
+# NOTE(review): [tracing_v2].duckdb_only is true in this file; how that interacts
+# with save_traces is not visible here - confirm against the consumer.
+save_traces = true
+# Save detailed JSON results
+save_detailed_results = true
+[tracing_v2]
+# Enable v2 tracing
+enabled = true
+# Directory for trace files, given as a relative path (will be created automatically)
+trace_dir = "./traces_v2_synth"
+# Store traces in DuckDB only (no individual JSON files are written)
+duckdb_only = true
+# Clean up old files automatically
+# NOTE(review): which files count as "old" and where they are removed from is
+# not stated here - confirm against the consumer.
+auto_cleanup = true
+[synth]
+# Warm up model before starting
+warmup_model = true
+# Max attempts for warmup
+warmup_max_attempts = 30
+# Warmup timeout in seconds, sized for large models (32B, 72B).
+# NOTE(review): [eval].model_name in this file is a 14B model - confirm this
+# value is still the intended one.
+warmup_timeout = 3600  # 3600 s = 60 minutes (chosen for a 32B model)

synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_config_modal.toml ADDED Viewed

@@ -0,0 +1,32 @@
+# Modal/Synth Fine-Tuning Filter Configuration
+# Filtering mode: "trajectory" or "window".
+# The [window] table below is only relevant when mode = "window".
+mode = "trajectory"
+[filters]
+# Minimum total reward for a trajectory
+min_total_reward = 5.0
+# Minimum number of achievements unlocked
+min_achievements = 2
+# Maximum cost (in dollars) for the trajectory
+max_cost = 1.0
+# Maximum tokens used in the trajectory
+max_tokens = 50000
+# Filter by specific models (empty list means all models).
+# Uncomment the line below to keep only traces from the listed Qwen models.
+# NOTE(review): with the key left commented out, presumably no model filter is
+# applied - confirm that an absent key behaves like an empty list.
+# models = ["Qwen/Qwen2.5-7B-Instruct", "Qwen/Qwen2.5-32B-Instruct"]
+[window]
+# Window-based filtering parameters (if mode = "window")
+# Window size - presumably counted in steps; TODO confirm the unit
+window_size = 10
+# Stride - presumably the offset between consecutive window starts; TODO confirm
+stride = 5
+# Minimum reward for a window - presumably the per-window counterpart of
+# [filters].min_total_reward; TODO confirm
+min_window_reward = 2.0
+[output]
+# Output format settings
+# Include metadata in the output
+include_metadata = true
+# Maximum context length
+# NOTE(review): the unit (tokens vs. characters) is not stated here - confirm.
+max_context_length = 4096