@fastino-ai/pioneer-cli 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,371 @@
+ /**
+  * ModelTrainer - Fine-tune or train models based on feedback
+  */
+
+ import * as fs from "fs";
+ import * as path from "path";
+ import * as os from "os";
+ import { spawn } from "child_process";
+ import type { TrainingData } from "./types.js";
+
+ export interface ModelTrainerConfig {
+   provider: "openai" | "anthropic" | "modal" | "local";
+   baseModel: string;
+   outputDir?: string;
+   openaiApiKey?: string;
+   anthropicApiKey?: string;
+   modalTokenId?: string;
+   modalTokenSecret?: string;
+ }
+
+ export interface TrainingResult {
+   success: boolean;
+   modelId?: string;
+   modelPath?: string;
+   metrics?: {
+     loss?: number;
+     accuracy?: number;
+     epochs?: number;
+   };
+   error?: string;
+ }
+
+ export class ModelTrainer {
+   private config: ModelTrainerConfig;
+   private outputDir: string;
+
+   constructor(config: ModelTrainerConfig) {
+     this.config = config;
+     this.outputDir =
+       config.outputDir || path.join(os.homedir(), ".pioneer", "models");
+     this.ensureOutputDir();
+   }
+
+   private ensureOutputDir(): void {
+     if (!fs.existsSync(this.outputDir)) {
+       fs.mkdirSync(this.outputDir, { recursive: true });
+     }
+   }
+
+   async train(trainingData: TrainingData[]): Promise<TrainingResult> {
+     if (trainingData.length < 10) {
+       return {
+         success: false,
+         error: "Insufficient training data. Need at least 10 examples.",
+       };
+     }
+
+     switch (this.config.provider) {
+       case "openai":
+         return this.trainOpenAI(trainingData);
+       case "modal":
+         return this.trainModal(trainingData);
+       case "local":
+         return this.trainLocal(trainingData);
+       default:
+         return {
+           success: false,
+           error: `Unsupported provider: ${this.config.provider}`,
+         };
+     }
+   }
+
+   private async trainOpenAI(trainingData: TrainingData[]): Promise<TrainingResult> {
+     const apiKey = this.config.openaiApiKey || process.env.OPENAI_API_KEY;
+     if (!apiKey) {
+       return { success: false, error: "OpenAI API key not provided" };
+     }
+
+     // Prepare training file
+     const tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "openai-train-"));
+     const trainingFile = path.join(tempDir, "training.jsonl");
+
+     const formattedData = trainingData.map((d) => ({
+       messages: d.messages,
+     }));
+
+     fs.writeFileSync(
+       trainingFile,
+       formattedData.map((d) => JSON.stringify(d)).join("\n")
+     );
+
+     try {
+       // Upload file
+       const uploadResponse = await fetch(
+         "https://api.openai.com/v1/files",
+         {
+           method: "POST",
+           headers: {
+             Authorization: `Bearer ${apiKey}`,
+           },
+           body: (() => {
+             const formData = new FormData();
+             formData.append("purpose", "fine-tune");
+             formData.append(
+               "file",
+               new Blob([fs.readFileSync(trainingFile)]),
+               "training.jsonl"
+             );
+             return formData;
+           })(),
+         }
+       );
+
+       if (!uploadResponse.ok) {
+         const error = await uploadResponse.text();
+         return { success: false, error: `File upload failed: ${error}` };
+       }
+
+       const uploadResult = await uploadResponse.json() as { id: string };
+
+       // Create fine-tuning job
+       const ftResponse = await fetch(
+         "https://api.openai.com/v1/fine_tuning/jobs",
+         {
+           method: "POST",
+           headers: {
+             Authorization: `Bearer ${apiKey}`,
+             "Content-Type": "application/json",
+           },
+           body: JSON.stringify({
+             training_file: uploadResult.id,
+             model: this.config.baseModel || "gpt-4o-mini-2024-07-18",
+           }),
+         }
+       );
+
+       if (!ftResponse.ok) {
+         const error = await ftResponse.text();
+         return { success: false, error: `Fine-tuning failed: ${error}` };
+       }
+
+       const ftResult = await ftResponse.json() as { id: string; fine_tuned_model?: string };
+
+       return {
+         success: true,
+         modelId: ftResult.id,
+         modelPath: ftResult.fine_tuned_model,
+       };
+     } finally {
+       fs.rmSync(tempDir, { recursive: true, force: true });
+     }
+   }
+
+   private async trainModal(trainingData: TrainingData[]): Promise<TrainingResult> {
+     const tempDir = fs.mkdtempSync(path.join(os.tmpdir(), "modal-train-"));
+     const dataFile = path.join(tempDir, "training_data.jsonl");
+     const appFile = path.join(tempDir, "train_app.py");
+
+     // Save training data
+     fs.writeFileSync(
+       dataFile,
+       trainingData.map((d) => JSON.stringify(d)).join("\n")
+     );
+
+     // Create Modal training app
+     const modalCode = `
+ import modal
+ import json
+
+ app = modal.App("pioneer-finetune")
+
+ volume = modal.Volume.from_name("pioneer-models", create_if_missing=True)
+
+ image = modal.Image.debian_slim(python_version="3.11").pip_install([
+     "torch",
+     "transformers",
+     "datasets",
+     "accelerate",
+     "peft",
+     "bitsandbytes",
+ ])
+
+ @app.function(
+     image=image,
+     gpu="A10G",
+     timeout=7200,
+     volumes={"/models": volume},
+ )
+ def finetune(data_json: str, base_model: str, output_name: str):
+     import torch
+     from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments, Trainer
+     from datasets import Dataset
+     from peft import LoraConfig, get_peft_model
+
+     # Parse data
+     data = [json.loads(line) for line in data_json.strip().split("\\n")]
+
+     # Convert to dataset
+     texts = []
+     for item in data:
+         text = ""
+         for msg in item.get("messages", []):
+             text += f"{msg['role']}: {msg['content']}\\n"
+         texts.append(text)
+
+     dataset = Dataset.from_dict({"text": texts})
+
+     # Load model
+     model = AutoModelForCausalLM.from_pretrained(
+         base_model,
+         torch_dtype=torch.float16,
+         device_map="auto",
+     )
+     tokenizer = AutoTokenizer.from_pretrained(base_model)
+     tokenizer.pad_token = tokenizer.eos_token
+
+     # Apply LoRA
+     lora_config = LoraConfig(r=16, lora_alpha=32, target_modules=["q_proj", "v_proj"])
+     model = get_peft_model(model, lora_config)
+
+     # Tokenize
+     def tokenize(examples):
+         return tokenizer(examples["text"], truncation=True, max_length=512, padding="max_length")
+
+     tokenized = dataset.map(tokenize, batched=True)
+
+     # Train
+     training_args = TrainingArguments(
+         output_dir=f"/models/{output_name}",
+         num_train_epochs=3,
+         per_device_train_batch_size=4,
+         learning_rate=2e-5,
+         save_steps=500,
+         logging_steps=10,
+     )
+
+     trainer = Trainer(
+         model=model,
+         args=training_args,
+         train_dataset=tokenized,
+     )
+     trainer.train()
+
+     # Save
+     trainer.save_model(f"/models/{output_name}")
+     volume.commit()
+
+     return {"success": True, "model_path": f"/models/{output_name}"}
+
+ @app.local_entrypoint()
+ def main():
+     import sys
+     data_file = sys.argv[1] if len(sys.argv) > 1 else "training_data.jsonl"
+     base_model = "${this.config.baseModel || "meta-llama/Llama-2-7b-hf"}"
+     output_name = "pioneer-ft-" + str(int(__import__("time").time()))
+
+     with open(data_file) as f:
+         data_json = f.read()
+
+     result = finetune.remote(data_json, base_model, output_name)
+     print(json.dumps(result))
+ `;
+
+     fs.writeFileSync(appFile, modalCode);
+
+     try {
+       return new Promise((resolve) => {
+         let stdout = "";
+         let stderr = "";
+
+         const env: NodeJS.ProcessEnv = { ...process.env };
+         if (this.config.modalTokenId) {
+           env.MODAL_TOKEN_ID = this.config.modalTokenId;
+         }
+         if (this.config.modalTokenSecret) {
+           env.MODAL_TOKEN_SECRET = this.config.modalTokenSecret;
+         }
+
+         const proc = spawn("modal", ["run", appFile, "--", dataFile], {
+           stdio: ["pipe", "pipe", "pipe"],
+           env,
+         });
+
+         proc.stdout.on("data", (data: Buffer) => {
+           stdout += data.toString();
+         });
+
+         proc.stderr.on("data", (data: Buffer) => {
+           stderr += data.toString();
+         });
+
+         proc.on("close", (code) => {
+           if (code === 0) {
+             try {
+               const result = JSON.parse(stdout.trim().split("\n").pop() || "{}");
+               resolve({
+                 success: true,
+                 modelPath: result.model_path,
+               });
+             } catch {
+               resolve({ success: true, modelPath: stdout });
+             }
+           } else {
+             resolve({
+               success: false,
+               error: stderr || `Exit code: ${code}`,
+             });
+           }
+         });
+
+         proc.on("error", (err) => {
+           resolve({ success: false, error: err.message });
+         });
+       });
+     } finally {
+       fs.rmSync(tempDir, { recursive: true, force: true });
+     }
+   }
+
+   private async trainLocal(trainingData: TrainingData[]): Promise<TrainingResult> {
+     // For local training, we'll save the data and provide instructions
+     const outputPath = path.join(
+       this.outputDir,
+       `training_${Date.now()}.jsonl`
+     );
+
+     fs.writeFileSync(
+       outputPath,
+       trainingData.map((d) => JSON.stringify(d)).join("\n")
+     );
+
+     return {
+       success: true,
+       modelPath: outputPath,
+       metrics: {
+         epochs: 0,
+       },
+     };
+   }
+
+   // Prompt optimization (alternative to full fine-tuning)
+   async optimizePrompt(
+     currentPrompt: string,
+     feedback: { positive: string[]; negative: string[] }
+   ): Promise<string> {
+     // Use the agent itself to improve its system prompt based on feedback
+     const optimizationPrompt = `You are a prompt engineer. Given the current system prompt and feedback, create an improved version.
+
+ Current Prompt:
+ ${currentPrompt}
+
+ Positive Examples (what worked well):
+ ${feedback.positive.slice(0, 5).join("\n---\n")}
+
+ Negative Examples (what didn't work):
+ ${feedback.negative.slice(0, 5).join("\n---\n")}
+
+ Create an improved system prompt that:
+ 1. Keeps what's working well
+ 2. Addresses the issues in negative examples
+ 3. Maintains the core capabilities
+ 4. Is clear and actionable
+
+ Improved Prompt:`;
+
+     // For now, return the original prompt
+     // In a full implementation, this would call an LLM to generate the improved prompt
+     return currentPrompt;
+   }
+ }
+
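
For orientation, here is a minimal usage sketch of the ModelTrainer API added above. The import paths are assumptions (the hunk header does not show this file's path); the config shape, the 10-example minimum enforced by train(), and the TrainingResult fields are as defined in the diff.

    import { ModelTrainer } from "./evolution/ModelTrainer.js"; // assumed path
    import type { TrainingData } from "./evolution/types.js";   // assumed path

    // Hypothetical feedback-derived examples; train() rejects fewer than 10.
    const examples: TrainingData[] = Array.from({ length: 10 }, (_, i) => ({
      id: `example-${i}`,
      messages: [
        { role: "user", content: "Summarize the last eval run." },
        { role: "assistant", content: "All cases passed." },
      ],
    }));

    const trainer = new ModelTrainer({
      provider: "openai",
      baseModel: "gpt-4o-mini-2024-07-18",
    });

    const result = await trainer.train(examples);
    if (result.success) {
      console.log("job:", result.modelId, "model:", result.modelPath);
    } else {
      console.error(result.error);
    }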
@@ -0,0 +1,18 @@
+ /**
+  * Evolution module exports
+  */
+
+ export { EvolutionEngine } from "./EvolutionEngine.js";
+ export type { EvolutionEngineConfig, EvolutionEvents } from "./EvolutionEngine.js";
+
+ export { FeedbackCollector } from "./FeedbackCollector.js";
+ export type { FeedbackCollectorConfig } from "./FeedbackCollector.js";
+
+ export { EvalRunner, DEFAULT_EVAL_CASES } from "./EvalRunner.js";
+ export type { EvalRunnerConfig } from "./EvalRunner.js";
+
+ export { ModelTrainer } from "./ModelTrainer.js";
+ export type { ModelTrainerConfig, TrainingResult } from "./ModelTrainer.js";
+
+ export * from "./types.js";
+
@@ -0,0 +1,110 @@
+ /**
+  * Types for the self-evolution system
+  */
+
+ export interface Feedback {
+   id: string;
+   sessionId: string;
+   timestamp: Date;
+   userMessage: string;
+   agentResponse: string;
+   toolCalls: string[];
+   rating?: number; // 1-5
+   corrections?: string;
+   wasSuccessful: boolean;
+   metadata?: Record<string, unknown>;
+ }
+
+ export interface EvalCase {
+   id: string;
+   name: string;
+   description: string;
+   input: string;
+   expectedOutput?: string;
+   expectedToolCalls?: string[];
+   successCriteria: EvalCriteria[];
+   weight?: number;
+ }
+
+ export interface EvalCriteria {
+   type: "contains" | "not_contains" | "tool_called" | "tool_not_called" | "regex" | "custom";
+   value: string;
+   description?: string;
+ }
+
+ export interface EvalResult {
+   caseId: string;
+   passed: boolean;
+   score: number;
+   actualOutput: string;
+   toolsCalled: string[];
+   errors?: string[];
+   duration: number;
+   tokenUsage: number;
+ }
+
+ export interface EvalRunSummary {
+   runId: string;
+   timestamp: Date;
+   totalCases: number;
+   passedCases: number;
+   failedCases: number;
+   averageScore: number;
+   totalTokens: number;
+   totalDuration: number;
+   results: EvalResult[];
+ }
+
+ export interface EvolutionConfig {
+   evalCases: EvalCase[];
+   targetScore: number;
+   maxIterations: number;
+   budgetPerIteration: {
+     maxTokens?: number;
+     maxCost?: number;
+     maxTime?: number;
+   };
+   feedbackWindow: number; // Number of recent feedback items to consider
+   trainingConfig?: {
+     provider: "openai" | "anthropic" | "modal";
+     baseModel: string;
+     fineTuneMethod: "full" | "lora" | "prompt";
+   };
+ }
+
+ export interface EvolutionState {
+   iteration: number;
+   currentScore: number;
+   bestScore: number;
+   bestPrompt: string;
+   history: EvolutionHistory[];
+   totalTokensUsed: number;
+   totalCostUsed: number;
+   totalTimeUsed: number;
+   startTime: Date;
+   endTime?: Date;
+   status: "running" | "completed" | "failed" | "budget_exhausted";
+ }
+
+ export interface EvolutionHistory {
+   iteration: number;
+   prompt: string;
+   evalScore: number;
+   changes: string;
+   timestamp: Date;
+ }
+
+ export interface TrainingData {
+   id: string;
+   messages: Array<{
+     role: "user" | "assistant" | "system";
+     content: string;
+   }>;
+   toolCalls?: Array<{
+     name: string;
+     arguments: Record<string, unknown>;
+     result: string;
+   }>;
+   metadata?: Record<string, unknown>;
+ }
+
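
To make the eval types above concrete, a hand-written sketch of one EvalCase with its successCriteria (the id, input, tool name, and criteria values are illustrative only, not shipped in the package; the import path is assumed):

    import type { EvalCase } from "./evolution/types.js"; // assumed path

    const listFilesCase: EvalCase = {
      id: "list-files",
      name: "List files",
      description: "Agent should call a filesystem tool rather than guess.",
      input: "What files are in the current directory?",
      expectedToolCalls: ["list_directory"],
      successCriteria: [
        { type: "tool_called", value: "list_directory" },
        { type: "not_contains", value: "I cannot access", description: "no refusal" },
      ],
      weight: 2,
    };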
package/src/index.tsx CHANGED
@@ -14,8 +14,15 @@ import {
    getBaseUrl,
    saveConfig,
    clearApiKey,
+   getAgentConfig,
+   getBudgetConfig,
+   getSandboxConfig,
+   getMLConfig,
+   getSystemPrompt,
  } from "./config.js";
  import * as api from "./api.js";
+ import { ChatApp } from "./chat/ChatApp.js";
+ import type { AgentConfig } from "./agent/types.js";

  // ─────────────────────────────────────────────────────────────────────────────
  // ASCII Banner
@@ -252,6 +259,17 @@ const Help: React.FC = () => {
        <Text bold>Usage:</Text>
        <Text>  pioneer {"<command>"} {"[options]"}</Text>
        <Text> </Text>
+       <Text bold>Chat Commands:</Text>
+       <Text>  chat                   Start interactive chat agent</Text>
+       <Text>    --provider {"<name>"}  LLM provider (anthropic, openai)</Text>
+       <Text>    --model {"<model>"}    Model to use</Text>
+       <Text>    --message {"<msg>"}    Initial message to process</Text>
+       <Text>    --max-tokens {"<n>"}   Max tokens (default: 500000, 0=unlimited)</Text>
+       <Text>    --max-cost {"<n>"}     Max cost in USD (default: 5.0, 0=unlimited)</Text>
+       <Text>    --max-time {"<n>"}     Max time in seconds (default: 7200, 0=unlimited)</Text>
+       <Text>    --max-tools {"<n>"}    Max tool calls per turn (default: 50, 0=unlimited)</Text>
+       <Text>    --no-limit             Remove all limits</Text>
+       <Text> </Text>
        <Text bold>Auth Commands:</Text>
        <Text>  auth login             Login with API key</Text>
        <Text>  auth logout            Clear stored API key</Text>
@@ -284,12 +302,88 @@ const Help: React.FC = () => {
        <Text>  --help                 Show this help</Text>
        <Text> </Text>
        <Text dimColor>Environment:</Text>
-       <Text dimColor>  PIONEER_API_URL      API base URL (default: http://localhost:5001)</Text>
-       <Text dimColor>  PIONEER_API_KEY      API key (overrides saved key)</Text>
+       <Text dimColor>  PIONEER_API_URL      API base URL (default: http://localhost:5001)</Text>
+       <Text dimColor>  PIONEER_API_KEY      API key (overrides saved key)</Text>
+       <Text dimColor>  ANTHROPIC_API_KEY    Anthropic API key for chat agent</Text>
+       <Text dimColor>  OPENAI_API_KEY       OpenAI API key for chat agent</Text>
      </Box>
    );
  };

+ // ─────────────────────────────────────────────────────────────────────────────
+ // Chat Wrapper Component
+ // ─────────────────────────────────────────────────────────────────────────────
+
+ interface ChatWrapperProps {
+   flags: Record<string, string>;
+ }
+
+ const ChatWrapper: React.FC<ChatWrapperProps> = ({ flags }) => {
+   const { exit } = useApp();
+
+   // Build agent config from flags and stored config
+   const storedConfig = getAgentConfig();
+   const budgetConfig = getBudgetConfig();
+   const systemPrompt = getSystemPrompt();
+
+   // Apply budget overrides from flags
+   const budget = { ...budgetConfig };
+   let maxToolCalls = 50; // Default
+
+   if (flags["no-limit"] === "true") {
+     // Remove all limits
+     budget.maxTokens = undefined;
+     budget.maxCost = undefined;
+     budget.maxTime = undefined;
+     budget.maxIterations = undefined;
+     maxToolCalls = 1000; // Effectively unlimited
+   } else {
+     // Apply individual overrides (0 = unlimited)
+     if (flags["max-tokens"]) {
+       const val = parseInt(flags["max-tokens"], 10);
+       budget.maxTokens = val === 0 ? undefined : val;
+     }
+     if (flags["max-cost"]) {
+       const val = parseFloat(flags["max-cost"]);
+       budget.maxCost = val === 0 ? undefined : val;
+     }
+     if (flags["max-time"]) {
+       const val = parseInt(flags["max-time"], 10);
+       budget.maxTime = val === 0 ? undefined : val;
+     }
+     if (flags["max-tools"]) {
+       const val = parseInt(flags["max-tools"], 10);
+       maxToolCalls = val === 0 ? 1000 : val;
+     }
+   }
+
+   const agentConfig: AgentConfig = {
+     provider: (flags.provider as "anthropic" | "openai") || storedConfig.provider,
+     model: flags.model || storedConfig.model,
+     apiKey: storedConfig.apiKey,
+     baseUrl: storedConfig.baseUrl,
+     budget,
+     systemPrompt,
+     maxToolCalls,
+   };
+
+   // Validate we have an API key
+   if (!agentConfig.apiKey) {
+     return (
+       <Box flexDirection="column">
+         <ErrorMessage error="No API key configured. Set ANTHROPIC_API_KEY or OPENAI_API_KEY environment variable." />
+         <Text dimColor>
+           Or run: export ANTHROPIC_API_KEY="your-key"
+         </Text>
+       </Box>
+     );
+   }
+
+   const initialMessage = flags.message;
+
+   return <ChatApp config={agentConfig} initialMessage={initialMessage} />;
+ };
+
  // ─────────────────────────────────────────────────────────────────────────────
  // Main Router
  // ─────────────────────────────────────────────────────────────────────────────
@@ -307,6 +401,11 @@ const App: React.FC<AppProps> = ({ command, flags }) => {
      return <Help />;
    }

+   // Chat command - Interactive agent
+   if (group === "chat") {
+     return <ChatWrapper flags={flags} />;
+   }
+
    // Auth commands
    if (group === "auth") {
      if (action === "login") return <AuthLogin />;