ace-llm-providers-cli 0.27.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/.ace-defaults/llm/providers/claude.yml +24 -0
- data/.ace-defaults/llm/providers/codex.yml +22 -0
- data/.ace-defaults/llm/providers/codexoss.yml +13 -0
- data/.ace-defaults/llm/providers/gemini.yml +32 -0
- data/.ace-defaults/llm/providers/opencode.yml +26 -0
- data/.ace-defaults/llm/providers/pi.yml +43 -0
- data/CHANGELOG.md +457 -0
- data/LICENSE +21 -0
- data/README.md +36 -0
- data/Rakefile +14 -0
- data/exe/ace-llm-providers-cli-check +76 -0
- data/lib/ace/llm/providers/cli/atoms/args_normalizer.rb +82 -0
- data/lib/ace/llm/providers/cli/atoms/auth_checker.rb +74 -0
- data/lib/ace/llm/providers/cli/atoms/command_formatters.rb +19 -0
- data/lib/ace/llm/providers/cli/atoms/command_rewriter.rb +75 -0
- data/lib/ace/llm/providers/cli/atoms/execution_context.rb +28 -0
- data/lib/ace/llm/providers/cli/atoms/provider_detector.rb +48 -0
- data/lib/ace/llm/providers/cli/atoms/session_finders/claude_session_finder.rb +79 -0
- data/lib/ace/llm/providers/cli/atoms/session_finders/codex_session_finder.rb +84 -0
- data/lib/ace/llm/providers/cli/atoms/session_finders/gemini_session_finder.rb +66 -0
- data/lib/ace/llm/providers/cli/atoms/session_finders/open_code_session_finder.rb +119 -0
- data/lib/ace/llm/providers/cli/atoms/session_finders/pi_session_finder.rb +87 -0
- data/lib/ace/llm/providers/cli/atoms/skill_command_rewriter.rb +30 -0
- data/lib/ace/llm/providers/cli/atoms/worktree_dir_resolver.rb +56 -0
- data/lib/ace/llm/providers/cli/claude_code_client.rb +358 -0
- data/lib/ace/llm/providers/cli/claude_oai_client.rb +322 -0
- data/lib/ace/llm/providers/cli/cli_args_support.rb +19 -0
- data/lib/ace/llm/providers/cli/codex_client.rb +291 -0
- data/lib/ace/llm/providers/cli/codex_oai_client.rb +274 -0
- data/lib/ace/llm/providers/cli/gemini_client.rb +346 -0
- data/lib/ace/llm/providers/cli/molecules/health_checker.rb +80 -0
- data/lib/ace/llm/providers/cli/molecules/safe_capture.rb +153 -0
- data/lib/ace/llm/providers/cli/molecules/session_finder.rb +44 -0
- data/lib/ace/llm/providers/cli/molecules/skill_name_reader.rb +64 -0
- data/lib/ace/llm/providers/cli/open_code_client.rb +271 -0
- data/lib/ace/llm/providers/cli/pi_client.rb +331 -0
- data/lib/ace/llm/providers/cli/version.rb +11 -0
- data/lib/ace/llm/providers/cli.rb +47 -0
- metadata +139 -0
|
# frozen_string_literal: true

require "json"
require "open3"
require "shellwords"

require_relative "cli_args_support"
require_relative "atoms/execution_context"
require_relative "atoms/command_rewriter"
require_relative "atoms/command_formatters"
require_relative "molecules/skill_name_reader"

module Ace
  module LLM
    module Providers
      module CLI
        # Client for Claude over Anthropic-compatible APIs (Z.ai, OpenRouter, etc.)
        # Uses the claude CLI subprocess with backend-specific env vars to route
        # requests through alternative Anthropic-compatible endpoints.
        #
        # Routing works in two parts:
        #   1. ANTHROPIC_BASE_URL / ANTHROPIC_AUTH_TOKEN are set from the
        #      configured backend entry (see #backend_env_vars).
        #   2. The claude CLI is invoked with a tier alias it understands
        #      (sonnet/opus/haiku), and ANTHROPIC_DEFAULT_<TIER>_MODEL maps that
        #      alias to the backend's real model name (e.g. "glm-5").
        class ClaudeOaiClient < Ace::LLM::Organisms::BaseClient
          include CliArgsSupport

          # Required by BaseClient; not used directly for CLI subprocess calls.
          API_BASE_URL = "https://api.z.ai"
          DEFAULT_GENERATION_CONFIG = {}.freeze

          # Registry name under which this client is exposed.
          def self.provider_name
            "claudeoai"
          end

          # Default "backend/model" pair used when no model is configured.
          DEFAULT_MODEL = "zai/glm-5"

          # @param model [String, nil] "backend/model" string, e.g. "zai/glm-5"
          # @param options [Hash] recognized keys include :generation_config,
          #   :backends (backend name => {base_url, env_key, model_tiers}),
          #   :timeout, :skills_dir, :cli_args
          def initialize(model: nil, **options)
            @model = model || DEFAULT_MODEL
            @options = options
            @generation_config = options[:generation_config] || {}
            @backends = options[:backends] || {}
            @skill_name_reader = Molecules::SkillNameReader.new
          end

          # Credentials are handled via backend env vars / the claude CLI's own
          # auth, so the BaseClient credential check is bypassed.
          def needs_credentials?
            false
          end

          # Generate a response from the LLM
          # @param messages [Array<Hash>] Conversation messages
          # @param options [Hash] Generation options
          # @return [Hash] Response with text and metadata
          # @raise [Ace::LLM::ProviderError] when the CLI is missing, exits
          #   non-zero, or emits unparseable JSON
          def generate(messages, **options)
            validate_claude_availability!

            prompt = format_messages_as_prompt(messages)
            # Deleted (not just read) so :subprocess_env is not forwarded into
            # the generation options passed to parse_claude_response.
            subprocess_env = options.delete(:subprocess_env)
            working_dir = Atoms::ExecutionContext.resolve_working_dir(
              working_dir: options[:working_dir],
              subprocess_env: subprocess_env
            )
            prompt = rewrite_skill_commands(prompt, working_dir: working_dir)

            cmd = build_claude_command(options)
            stdout, stderr, status = execute_claude_command(
              cmd,
              prompt,
              subprocess_env: subprocess_env,
              working_dir: working_dir
            )

            parse_claude_response(stdout, stderr, status, prompt, options)
          rescue => e
            handle_claude_error(e)
          end

          # List available models
          # @return [Array<Hash>] static model descriptors (id, name,
          #   description, context_size)
          def list_models
            [
              {id: "zai/glm-5", name: "GLM-5", description: "Z.ai flagship model (Anthropic-compatible)", context_size: 128_000},
              {id: "zai/glm-4.7", name: "GLM-4.7", description: "Z.ai balanced model (Anthropic-compatible)", context_size: 128_000},
              {id: "zai/glm-4.6", name: "GLM-4.6", description: "Z.ai fast model (Anthropic-compatible)", context_size: 128_000}
            ]
          end

          # Split "backend/model" into ["backend", "model"]
          # @param model_string [String] e.g. "zai/glm-5"
          # @return [Array<String>] e.g. ["zai", "glm-5"]; [nil, nil] when the
          #   input is nil or has no "/" separator
          def split_backend_model(model_string)
            return [nil, nil] unless model_string

            # Split on the first "/" only, so model names containing "/" survive.
            parts = model_string.split("/", 2)
            return [nil, nil] unless parts.length == 2

            parts
          end

          private

          # Flatten a chat-message array into a single "System:/User:/Assistant:"
          # prefixed text prompt. A String input is passed through untouched.
          # Accepts both symbol and string keys for :role/:content.
          def format_messages_as_prompt(messages)
            return messages if messages.is_a?(String)

            system_msg = messages.find { |m| (m[:role] || m["role"]) == "system" }
            other_msgs = messages.reject { |m| (m[:role] || m["role"]) == "system" }

            formatted = other_msgs.map do |msg|
              role = msg[:role] || msg["role"]
              content = msg[:content] || msg["content"]

              case role
              when "user"
                "User: #{content}"
              when "assistant"
                "Assistant: #{content}"
              else
                # Unknown roles keep their raw content with no prefix.
                content
              end
            end

            # The system message, if any, always leads the prompt.
            if system_msg
              system_content = system_msg[:content] || system_msg["content"]
              formatted.unshift("System: #{system_content}")
            end

            formatted.join("\n\n")
          end

          # True when a `claude` executable is resolvable on PATH.
          # NOTE(review): relies on the `which` shell builtin/binary — not
          # portable to Windows shells; confirm target platforms.
          def claude_available?
            system("which claude > /dev/null 2>&1")
          end

          # @raise [Ace::LLM::ProviderError] when the claude CLI is not installed
          def validate_claude_availability!
            unless claude_available?
              raise Ace::LLM::ProviderError, "Claude CLI not found. Install with: npm install -g @anthropic-ai/claude-cli"
            end
          end

          # Assemble the claude CLI argv (non-interactive print mode, JSON
          # output, tier-aliased model, optional max tokens, then user args).
          def build_claude_command(options)
            cmd = ["claude"]
            cmd << "-p"

            # Always use JSON output for consistent parsing
            cmd << "--output-format" << "json"

            # Use a tier alias (sonnet/opus/haiku) that claude CLI recognizes,
            # rather than the backend model name (e.g. glm-5) which it doesn't.
            tier = resolve_model_tier
            cmd << "--model" << tier if tier

            # Add max tokens if provided
            max_tokens = options[:max_tokens] || @generation_config[:max_tokens]
            if max_tokens
              cmd << "--max-tokens" << max_tokens.to_s
            end

            # User CLI args last so they take precedence
            cmd.concat(normalized_cli_args(options))

            cmd
          end

          # Run the CLI with the prompt on stdin under a timeout.
          # Env precedence (later wins): CLAUDECODE unset < backend vars <
          # caller-provided subprocess_env.
          def execute_claude_command(cmd, prompt, subprocess_env: nil, working_dir: nil)
            timeout_val = @options[:timeout] || 120

            # Build env with backend-specific vars for Anthropic-compatible routing.
            # A nil value removes the variable from the child env (Process.spawn
            # semantics — assumes SafeCapture forwards env to spawn; TODO confirm).
            env = {"CLAUDECODE" => nil}
            env.merge!(backend_env_vars)
            env.merge!(subprocess_env) if subprocess_env

            debug_subprocess("spawn timeout=#{timeout_val}s cmd=#{cmd.join(" ")} prompt_bytes=#{prompt.to_s.bytesize}")
            Molecules::SafeCapture.call(
              cmd,
              timeout: timeout_val,
              stdin_data: prompt.to_s,
              chdir: working_dir,
              env: env,
              provider_name: "Claude OAI"
            )
          end

          # Build env vars hash for the current backend
          # Sets ANTHROPIC_BASE_URL, ANTHROPIC_AUTH_TOKEN, and clears ANTHROPIC_API_KEY
          # Returns {} when the model has no backend prefix or the backend has
          # no configuration, leaving the caller's environment untouched.
          def backend_env_vars
            backend_name, _model_name = split_backend_model(@model)
            return {} unless backend_name

            # Backend config may be keyed by string or symbol.
            backend_config = @backends[backend_name] || @backends[backend_name.to_sym] || {}
            return {} if backend_config.empty?

            env = {}

            # Set the base URL for the Anthropic-compatible endpoint
            if (base_url = backend_config["base_url"] || backend_config[:base_url])
              env["ANTHROPIC_BASE_URL"] = base_url
            end

            # Read the API key from the env var specified in config
            if (env_key = backend_config["env_key"] || backend_config[:env_key])
              env["ANTHROPIC_AUTH_TOKEN"] = ENV[env_key]
            end

            # Clear ANTHROPIC_API_KEY so claude doesn't use cached Anthropic creds
            env["ANTHROPIC_API_KEY"] = ""

            # Map the tier alias to the backend's actual model name so
            # `--model sonnet` resolves to e.g. "glm-5" at the backend
            _bn, model_name = split_backend_model(@model)
            tier = resolve_model_tier
            if tier && model_name
              env_key_for_tier = "ANTHROPIC_DEFAULT_#{tier.upcase}_MODEL"
              env[env_key_for_tier] = model_name
            end

            env
          end

          # Resolve which Claude CLI tier alias to use for --model.
          # Looks up model_tiers in backend config; falls back to "sonnet".
          def resolve_model_tier
            backend_name, model_name = split_backend_model(@model)
            return "sonnet" unless backend_name && model_name

            backend_config = @backends[backend_name] || @backends[backend_name.to_sym] || {}
            tiers = backend_config["model_tiers"] || backend_config[:model_tiers] || {}

            # Find the tier whose value matches the requested model.
            # Note: first matching tier wins when multiple tiers map to the same model.
            matched = tiers.find { |_tier, m| m.to_s == model_name }
            return matched[0].to_s if matched

            # No explicit tier mapping — default to sonnet
            "sonnet"
          end

          # Turn raw CLI output into the {text:, metadata:} response hash.
          # @raise [Ace::LLM::ProviderError] on non-zero exit or invalid JSON
          def parse_claude_response(stdout, stderr, status, prompt, options)
            unless status.success?
              # Some CLI failures print to stdout only.
              error_msg = stderr.empty? ? stdout : stderr
              raise Ace::LLM::ProviderError, "Claude OAI CLI failed: #{error_msg}"
            end

            begin
              # NOTE(review): allow_duplicate_key is only honored by recent json
              # gem releases; older versions silently ignore unknown options —
              # confirm the gem version floor.
              response = JSON.parse(stdout, allow_duplicate_key: true)
            rescue JSON::ParserError => e
              raise Ace::LLM::ProviderError, "Failed to parse Claude OAI response: #{e.message}"
            end

            # claude -p --output-format json puts the text under "result";
            # "response" is a fallback key, then empty string.
            text = response["result"] || response["response"] || ""
            metadata = build_metadata(response, prompt, options)

            {
              text: text,
              metadata: metadata
            }
          end

          # Build the metadata hash (token usage, cost, timing, session info)
          # from the CLI's JSON response. Missing usage fields default to 0.
          def build_metadata(response, prompt, options)
            usage = response["usage"] || {}

            metadata = {
              provider: "claudeoai",
              model: @model || DEFAULT_MODEL,
              input_tokens: usage["input_tokens"] || 0,
              output_tokens: usage["output_tokens"] || 0,
              total_tokens: (usage["input_tokens"] || 0) + (usage["output_tokens"] || 0),
              cached_tokens: usage["cache_read_input_tokens"] || 0,
              finish_reason: response["subtype"] || "success",
              # duration_ms (milliseconds) converted to seconds
              took: (response["duration_ms"] || 0) / 1000.0,
              timestamp: Time.now.utc.iso8601
            }

            # Only the CLI's aggregate cost is available; per-direction costs
            # are reported as 0.0.
            if response["total_cost_usd"]
              metadata[:cost] = {
                input_cost: 0.0,
                output_cost: 0.0,
                total_cost: response["total_cost_usd"],
                currency: "USD"
              }
            end

            metadata[:session_id] = response["session_id"] if response["session_id"]

            # .compact drops any keys the CLI did not report.
            metadata[:provider_specific] = {
              uuid: response["uuid"],
              service_tier: usage["service_tier"],
              duration_api_ms: response["duration_api_ms"],
              cache_creation_tokens: usage["cache_creation_input_tokens"]
            }.compact

            metadata
          end

          # Currently a pass-through re-raise; exists as a hook for future
          # error translation.
          def handle_claude_error(error)
            raise error
          end

          # Rewrite slash-style skill commands in the prompt when a skills
          # directory is available; otherwise the prompt is returned unchanged.
          def rewrite_skill_commands(prompt, working_dir: nil)
            skills_dir = resolve_skills_dir(working_dir: working_dir)
            return prompt unless skills_dir

            skill_names = @skill_name_reader.call(skills_dir)
            return prompt if skill_names.empty?

            # NOTE(review): this Claude client uses CODEX_FORMATTER (same as
            # CodexClient) — confirm a Claude-specific formatter isn't intended.
            Atoms::CommandRewriter.call(prompt, skill_names: skill_names, formatter: Atoms::CommandFormatters::CODEX_FORMATTER)
          end

          # Locate the skills directory: explicit config wins, then
          # .claude/skills, then .agent/skills under the working dir.
          # Returns nil when none exists.
          def resolve_skills_dir(working_dir: nil)
            configured = @options[:skills_dir] || @generation_config[:skills_dir]
            return configured if configured && Dir.exist?(configured)

            working_dir ||= Atoms::ExecutionContext.resolve_working_dir
            candidate_dirs = [
              File.join(working_dir, ".claude", "skills"),
              File.join(working_dir, ".agent", "skills")
            ]
            candidate_dirs.find { |dir| Dir.exist?(dir) }
          end

          # Emit a debug line to stderr, gated on ACE_LLM_DEBUG_SUBPROCESS=1.
          def debug_subprocess(message)
            return unless ENV["ACE_LLM_DEBUG_SUBPROCESS"] == "1"

            warn("[ClaudeOaiClient] #{message}")
          end
        end
      end
    end
  end
end
|
# frozen_string_literal: true

require_relative "atoms/args_normalizer"

module Ace
  module LLM
    module Providers
      module CLI
        # Mixin shared by the CLI provider clients: exposes a single private
        # helper that turns the caller-supplied :cli_args option into a clean
        # argv fragment via Atoms::ArgsNormalizer.
        module CliArgsSupport
          private

          # @param options [Hash] generation options; only :cli_args is read
          # @return [Array<String>] normalized CLI arguments (empty when none)
          def normalized_cli_args(options)
            raw_args = options[:cli_args]
            normalizer = Atoms::ArgsNormalizer.new
            normalizer.normalize_cli_args(raw_args)
          end
        end
      end
    end
  end
end
|
# frozen_string_literal: true

require "json"
require "open3"
require "shellwords"

require_relative "cli_args_support"
require_relative "atoms/execution_context"
require_relative "atoms/command_rewriter"
require_relative "atoms/command_formatters"
require_relative "atoms/worktree_dir_resolver"
require_relative "molecules/skill_name_reader"

module Ace
  module LLM
    module Providers
      module CLI
        # Client for interacting with Codex CLI (OpenAI)
        # Provides access to Codex models through subprocess execution
        # (`codex exec` in non-interactive mode, prompt supplied on stdin).
        class CodexClient < Ace::LLM::Organisms::BaseClient
          include CliArgsSupport

          # Not used for CLI interaction but required by BaseClient
          API_BASE_URL = "https://api.openai.com"
          DEFAULT_GENERATION_CONFIG = {}.freeze

          # Provider registration - auto-registers as "codex"
          def self.provider_name
            "codex"
          end

          # Default model (can be overridden by config)
          DEFAULT_MODEL = "gpt-5"

          # @param model [String, nil] Codex model id, defaults to DEFAULT_MODEL
          # @param options [Hash] recognized keys include :generation_config,
          #   :timeout, :skills_dir, :cli_args
          def initialize(model: nil, **options)
            @model = model || DEFAULT_MODEL
            # Skip normal BaseClient initialization that requires API key
            @options = options
            @generation_config = options[:generation_config] || {}
            @skill_name_reader = Molecules::SkillNameReader.new
          end

          # Override to indicate this client doesn't need API credentials
          def needs_credentials?
            false
          end

          # Generate a response from the LLM
          # @param messages [Array<Hash>] Conversation messages
          # @param options [Hash] Generation options
          # @return [Hash] Response with text and metadata
          # @raise [Ace::LLM::ProviderError, Ace::LLM::AuthenticationError]
          def generate(messages, **options)
            validate_codex_availability!

            # Convert messages to prompt format
            prompt = format_messages_as_prompt(messages)
            # NOTE(review): subprocess_env is only used to resolve the working
            # dir here; unlike the Claude client, it is never exported to the
            # child process (SafeCapture is called without env:) — confirm
            # that asymmetry is intentional.
            subprocess_env = options[:subprocess_env]
            working_dir = Atoms::ExecutionContext.resolve_working_dir(
              working_dir: options[:working_dir],
              subprocess_env: subprocess_env
            )
            prompt = rewrite_skill_commands(prompt, working_dir: working_dir)

            cmd = build_codex_command(prompt, options, working_dir: working_dir)
            stdout, stderr, status = execute_codex_command(cmd, prompt, options)

            parse_codex_response(stdout, stderr, status, prompt, options)
          rescue => e
            handle_codex_error(e)
          end

          # List available Codex models
          # @return [Array<Hash>] static model descriptors
          def list_models
            # Return models based on what the CLI supports
            # Actual models come from YAML config
            [
              {id: "gpt-5", name: "GPT-5", description: "Advanced Codex model", context_size: 128_000},
              {id: "gpt-5-mini", name: "GPT-5 Mini", description: "Smaller, faster model", context_size: 128_000}
            ]
          end

          private

          # Flatten a chat-message array into a "System:/User:/Assistant:"
          # prefixed text prompt; String input passes through unchanged.
          # Accepts both symbol and string keys for :role/:content.
          def format_messages_as_prompt(messages)
            # Handle both array of message hashes and string prompt
            return messages if messages.is_a?(String)

            # Extract system message if present
            system_msg = messages.find { |m| (m[:role] || m["role"]) == "system" }
            other_msgs = messages.reject { |m| (m[:role] || m["role"]) == "system" }

            # Format remaining messages
            formatted = other_msgs.map do |msg|
              role = msg[:role] || msg["role"]
              content = msg[:content] || msg["content"]

              case role
              when "user"
                "User: #{content}"
              when "assistant"
                "Assistant: #{content}"
              else
                # Unknown roles keep their raw content with no prefix.
                content
              end
            end

            # Prepend system message if present
            if system_msg
              system_content = system_msg[:content] || system_msg["content"]
              formatted.unshift("System: #{system_content}")
            end

            formatted.join("\n\n")
          end

          # True when a `codex` executable is resolvable on PATH.
          # NOTE(review): relies on `which` — not portable to Windows shells.
          def codex_available?
            system("which codex > /dev/null 2>&1")
          end

          # Verify the CLI exists and appears usable.
          # @raise [Ace::LLM::ProviderError] when the binary is missing
          # @raise [Ace::LLM::AuthenticationError] when the auth probe fails
          def validate_codex_availability!
            unless codex_available?
              raise Ace::LLM::ProviderError, "Codex CLI not found. Install with: npm install -g @openai/codex or visit https://codex.ai"
            end

            # Check if Codex is authenticated
            unless codex_authenticated?
              raise Ace::LLM::AuthenticationError, "Codex authentication required. Run 'codex login' or configure API key"
            end
          end

          # NOTE(review): this only verifies the binary runs `--version` (or
          # `--help` as a fallback) — it does NOT actually prove the user is
          # authenticated; a logged-out codex would still pass. Confirm intent.
          def codex_authenticated?
            # Quick check if Codex can execute (will fail fast if not authenticated)

            cmd = ["codex", "--version"]
            stdout, _, status = Open3.capture3(*cmd)
            status.success? && (stdout.include?("codex") || stdout.include?("Codex"))
          rescue
            # If version check fails, try help command
            begin
              cmd = ["codex", "--help"]
              _, _, status = Open3.capture3(*cmd)
              status.success?
            rescue
              false
            end
          end

          # Assemble the `codex exec` argv. The model flag is only added for a
          # non-default model, so DEFAULT_MODEL relies on the CLI's own default.
          def build_codex_command(prompt, options, working_dir: nil)
            working_dir ||= Atoms::ExecutionContext.resolve_working_dir(
              working_dir: options[:working_dir],
              subprocess_env: options[:subprocess_env]
            )
            # Use codex exec for non-interactive execution
            cmd = ["codex", "exec"]

            # Add sandbox mode if specified by caller
            if options[:sandbox]
              cmd << "--sandbox" << options[:sandbox].to_s
            end

            # Add model selection if not default
            if @model && @model != DEFAULT_MODEL
              cmd << "--model" << @model
            end

            # Note: Codex exec doesn't support direct system prompts or temperature/max_tokens
            # These would need to be incorporated into the prompt itself

            # Add writable dir for git worktree metadata
            if (git_dir = Atoms::WorktreeDirResolver.call(working_dir: working_dir))
              cmd << "--add-dir" << git_dir
            end

            # Capture last message progressively for timeout resilience
            if options[:last_message_file]
              cmd << "--output-last-message" << options[:last_message_file]
            end

            # User CLI args last so they take precedence (last-wins in most CLIs)
            cmd.concat(normalized_cli_args(options))

            cmd
          end

          # Run the CLI with the (possibly system-prefixed) prompt on stdin
          # under a timeout. Working dir is re-resolved here from options.
          def execute_codex_command(cmd, prompt, options)
            # Prepare the input - combine system prompt with user prompt if needed
            input = prompt.to_s

            # Check for system prompt in options or generation config
            system_content = options[:system_instruction] ||
              options[:system] ||
              options[:system_prompt] ||
              @generation_config[:system_prompt]

            # Skip prefixing when the prompt already carries a "System:" block
            # (e.g. produced by format_messages_as_prompt).
            if system_content && !prompt.include?("System:")
              input = "System: #{system_content}\n\nUser: #{input}"
            end

            timeout_val = @options[:timeout] || 120
            working_dir = Atoms::ExecutionContext.resolve_working_dir(
              working_dir: options[:working_dir],
              subprocess_env: options[:subprocess_env]
            )
            Molecules::SafeCapture.call(
              cmd,
              timeout: timeout_val,
              stdin_data: input,
              chdir: working_dir,
              provider_name: "Codex"
            )
          end

          # Turn raw CLI output into the {text:, metadata:} response hash.
          # @raise [Ace::LLM::ProviderError] on non-zero exit
          def parse_codex_response(stdout, stderr, status, prompt, options)
            unless status.success?
              # Some CLI failures print to stdout only.
              error_msg = stderr.empty? ? stdout : stderr
              raise Ace::LLM::ProviderError, "Codex CLI failed: #{error_msg}"
            end

            # Parse Codex output format to extract the actual response
            # Codex output includes metadata lines and the actual response
            lines = stdout.split("\n")

            # Find where the actual response starts (after "codex" header)
            # NOTE(review): fragile heuristic — any earlier line containing
            # "codex" (e.g. in the prompt echo) shifts the parse point.
            response_start = lines.find_index { |line| line.include?("codex") }

            if response_start && response_start < lines.length - 1
              # Extract text after the "codex" line, skipping empty lines
              response_lines = lines[(response_start + 1)..-1]
              # Remove token usage lines at the end
              response_lines = response_lines.reject { |line| line.include?("tokens used") }
              text = response_lines.join("\n").strip
            else
              # Fallback: use entire output if we can't parse the format
              text = stdout.strip
            end

            # Build metadata
            metadata = build_synthetic_metadata(text, prompt)

            # Return hash compatible with ace-llm format
            {
              text: text,
              metadata: metadata
            }
          end

          # Approximate token accounting (the CLI does not report usage).
          def build_synthetic_metadata(response_text, prompt)
            # Create synthetic metadata since Codex CLI might not provide detailed usage info
            # Rough token estimation
            prompt_tokens = (prompt.to_s.length / 4).round # Rough estimate: 4 chars per token
            response_tokens = (response_text.length / 4).round

            {
              provider: "codex",
              model: @model || DEFAULT_MODEL,
              input_tokens: prompt_tokens,
              output_tokens: response_tokens,
              total_tokens: prompt_tokens + response_tokens,
              finish_reason: "success",
              timestamp: Time.now.utc.iso8601
            }
          end

          def handle_codex_error(error)
            # Re-raise the error for proper handling by the base client error flow
            raise error
          end

          # Rewrite slash-style skill commands in the prompt when a skills
          # directory is available; otherwise the prompt is returned unchanged.
          def rewrite_skill_commands(prompt, working_dir: nil)
            skills_dir = resolve_skills_dir(working_dir: working_dir)
            return prompt unless skills_dir

            skill_names = @skill_name_reader.call(skills_dir)
            return prompt if skill_names.empty?

            Atoms::CommandRewriter.call(prompt, skill_names: skill_names, formatter: Atoms::CommandFormatters::CODEX_FORMATTER)
          end

          # Locate the skills directory: explicit config wins, then
          # .codex/skills under the working dir. Returns nil when none exists.
          def resolve_skills_dir(working_dir: nil)
            configured = @options[:skills_dir] || @generation_config[:skills_dir]
            return configured if configured && Dir.exist?(configured)

            working_dir ||= Atoms::ExecutionContext.resolve_working_dir
            candidate_dir = File.join(working_dir, ".codex", "skills")
            candidate_dir if Dir.exist?(candidate_dir)
          end
        end
      end
    end
  end
end