RubyGems - language-operator - Versions diffs - 0.1.61 → 0.1.62 - Mend

language-operator 0.1.61 → 0.1.62

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (143)

checksums.yaml +4 -4
data/.claude/commands/persona.md +9 -0
data/.claude/commands/task.md +46 -1
data/.rubocop.yml +13 -0
data/.rubocop_custom/use_ux_helper.rb +44 -0
data/CHANGELOG.md +8 -0
data/Gemfile.lock +12 -1
data/Makefile +26 -7
data/Makefile.common +50 -0
data/bin/aictl +8 -1
data/components/agent/Gemfile +1 -1
data/components/agent/bin/langop-agent +7 -0
data/docs/README.md +58 -0
data/docs/{dsl/best-practices.md → best-practices.md} +4 -4
data/docs/cli-reference.md +274 -0
data/docs/{dsl/constraints.md → constraints.md} +5 -5
data/docs/how-agents-work.md +156 -0
data/docs/installation.md +218 -0
data/docs/quickstart.md +299 -0
data/docs/understanding-generated-code.md +265 -0
data/docs/using-tools.md +457 -0
data/docs/webhooks.md +509 -0
data/examples/ux_helpers_demo.rb +296 -0
data/lib/language_operator/agent/base.rb +11 -1
data/lib/language_operator/agent/executor.rb +23 -6
data/lib/language_operator/agent/safety/safe_executor.rb +41 -39
data/lib/language_operator/agent/task_executor.rb +346 -63
data/lib/language_operator/agent/web_server.rb +110 -14
data/lib/language_operator/agent/webhook_authenticator.rb +39 -5
data/lib/language_operator/agent.rb +88 -2
data/lib/language_operator/cli/base_command.rb +17 -11
data/lib/language_operator/cli/command_loader.rb +72 -0
data/lib/language_operator/cli/commands/agent/base.rb +837 -0
data/lib/language_operator/cli/commands/agent/code_operations.rb +102 -0
data/lib/language_operator/cli/commands/agent/helpers/cluster_llm_client.rb +116 -0
data/lib/language_operator/cli/commands/agent/helpers/code_parser.rb +115 -0
data/lib/language_operator/cli/commands/agent/helpers/synthesis_watcher.rb +96 -0
data/lib/language_operator/cli/commands/agent/learning.rb +289 -0
data/lib/language_operator/cli/commands/agent/lifecycle.rb +102 -0
data/lib/language_operator/cli/commands/agent/logs.rb +125 -0
data/lib/language_operator/cli/commands/agent/workspace.rb +327 -0
data/lib/language_operator/cli/commands/cluster.rb +129 -84
data/lib/language_operator/cli/commands/install.rb +1 -1
data/lib/language_operator/cli/commands/model/base.rb +215 -0
data/lib/language_operator/cli/commands/model/test.rb +165 -0
data/lib/language_operator/cli/commands/persona.rb +16 -34
data/lib/language_operator/cli/commands/quickstart.rb +3 -2
data/lib/language_operator/cli/commands/status.rb +40 -67
data/lib/language_operator/cli/commands/system/base.rb +44 -0
data/lib/language_operator/cli/commands/system/exec.rb +147 -0
data/lib/language_operator/cli/commands/system/helpers/llm_synthesis.rb +183 -0
data/lib/language_operator/cli/commands/system/helpers/pod_manager.rb +212 -0
data/lib/language_operator/cli/commands/system/helpers/template_loader.rb +57 -0
data/lib/language_operator/cli/commands/system/helpers/template_validator.rb +174 -0
data/lib/language_operator/cli/commands/system/schema.rb +92 -0
data/lib/language_operator/cli/commands/system/synthesis_template.rb +151 -0
data/lib/language_operator/cli/commands/system/synthesize.rb +224 -0
data/lib/language_operator/cli/commands/system/validate_template.rb +130 -0
data/lib/language_operator/cli/commands/tool/base.rb +271 -0
data/lib/language_operator/cli/commands/tool/install.rb +255 -0
data/lib/language_operator/cli/commands/tool/search.rb +69 -0
data/lib/language_operator/cli/commands/tool/test.rb +115 -0
data/lib/language_operator/cli/commands/use.rb +29 -6
data/lib/language_operator/cli/errors/handler.rb +20 -17
data/lib/language_operator/cli/errors/suggestions.rb +3 -5
data/lib/language_operator/cli/errors/thor_errors.rb +55 -0
data/lib/language_operator/cli/formatters/code_formatter.rb +4 -11
data/lib/language_operator/cli/formatters/log_formatter.rb +8 -15
data/lib/language_operator/cli/formatters/progress_formatter.rb +6 -8
data/lib/language_operator/cli/formatters/status_formatter.rb +26 -7
data/lib/language_operator/cli/formatters/table_formatter.rb +47 -36
data/lib/language_operator/cli/formatters/value_formatter.rb +75 -0
data/lib/language_operator/cli/helpers/cluster_context.rb +5 -3
data/lib/language_operator/cli/helpers/kubeconfig_validator.rb +2 -1
data/lib/language_operator/cli/helpers/label_utils.rb +97 -0
data/lib/language_operator/{ux/concerns/provider_helpers.rb → cli/helpers/provider_helper.rb} +10 -29
data/lib/language_operator/cli/helpers/schedule_builder.rb +21 -1
data/lib/language_operator/cli/helpers/user_prompts.rb +19 -11
data/lib/language_operator/cli/helpers/ux_helper.rb +538 -0
data/lib/language_operator/{ux/concerns/input_validation.rb → cli/helpers/validation_helper.rb} +13 -66
data/lib/language_operator/cli/main.rb +50 -40
data/lib/language_operator/cli/templates/tools/generic.yaml +3 -0
data/lib/language_operator/cli/wizards/agent_wizard.rb +12 -20
data/lib/language_operator/cli/wizards/model_wizard.rb +271 -0
data/lib/language_operator/cli/wizards/quickstart_wizard.rb +8 -34
data/lib/language_operator/client/base.rb +28 -0
data/lib/language_operator/client/config.rb +4 -1
data/lib/language_operator/client/mcp_connector.rb +1 -1
data/lib/language_operator/config/cluster_config.rb +3 -2
data/lib/language_operator/config.rb +38 -11
data/lib/language_operator/constants/kubernetes_labels.rb +80 -0
data/lib/language_operator/constants.rb +13 -0
data/lib/language_operator/dsl/http.rb +127 -10
data/lib/language_operator/dsl.rb +153 -6
data/lib/language_operator/errors.rb +50 -0
data/lib/language_operator/kubernetes/client.rb +11 -6
data/lib/language_operator/kubernetes/resource_builder.rb +58 -84
data/lib/language_operator/templates/schema/agent_dsl_openapi.yaml +1 -1
data/lib/language_operator/templates/schema/agent_dsl_schema.json +1 -1
data/lib/language_operator/type_coercion.rb +118 -34
data/lib/language_operator/utils/secure_path.rb +74 -0
data/lib/language_operator/utils.rb +7 -0
data/lib/language_operator/validators.rb +54 -2
data/lib/language_operator/version.rb +1 -1
data/synth/001/Makefile +10 -2
data/synth/001/agent.rb +16 -15
data/synth/001/output.log +27 -10
data/synth/002/Makefile +10 -2
data/synth/003/Makefile +1 -1
data/synth/003/README.md +205 -133
data/synth/003/agent.optimized.rb +66 -0
data/synth/003/agent.synthesized.rb +41 -0
metadata +111 -35
data/docs/dsl/agent-reference.md +0 -604
data/docs/dsl/mcp-integration.md +0 -1177
data/docs/dsl/webhooks.md +0 -932
data/docs/dsl/workflows.md +0 -744
data/lib/language_operator/cli/commands/agent.rb +0 -1712
data/lib/language_operator/cli/commands/model.rb +0 -366
data/lib/language_operator/cli/commands/system.rb +0 -1259
data/lib/language_operator/cli/commands/tool.rb +0 -654
data/lib/language_operator/cli/formatters/optimization_formatter.rb +0 -226
data/lib/language_operator/cli/helpers/pastel_helper.rb +0 -24
data/lib/language_operator/learning/adapters/base_adapter.rb +0 -149
data/lib/language_operator/learning/adapters/jaeger_adapter.rb +0 -221
data/lib/language_operator/learning/adapters/signoz_adapter.rb +0 -435
data/lib/language_operator/learning/adapters/tempo_adapter.rb +0 -239
data/lib/language_operator/learning/optimizer.rb +0 -319
data/lib/language_operator/learning/pattern_detector.rb +0 -260
data/lib/language_operator/learning/task_synthesizer.rb +0 -288
data/lib/language_operator/learning/trace_analyzer.rb +0 -285
data/lib/language_operator/templates/task_synthesis.tmpl +0 -98
data/lib/language_operator/ux/base.rb +0 -81
data/lib/language_operator/ux/concerns/README.md +0 -155
data/lib/language_operator/ux/concerns/headings.rb +0 -90
data/lib/language_operator/ux/create_agent.rb +0 -255
data/lib/language_operator/ux/create_model.rb +0 -267
data/lib/language_operator/ux/quickstart.rb +0 -594
data/synth/003/agent.rb +0 -41
data/synth/003/output.log +0 -68
/data/docs/{architecture/agent-runtime.md → agent-internals.md} +0 -0
/data/docs/{dsl/chat-endpoints.md → chat-endpoints.md} +0 -0
/data/docs/{dsl/SCHEMA_VERSION.md → schema-versioning.md} +0 -0

data/lib/language_operator/agent/task_executor.rb CHANGED

@@ -25,6 +25,9 @@ module LanguageOperator
     class TaskTimeoutError < TaskExecutionError
     end
+    class TaskNetworkError < TaskExecutionError
+    end
     # Task Executor for DSL v1 organic functions
     #
     # Executes both neural (LLM-based) and symbolic (code-based) tasks.
@@ -74,6 +77,11 @@ module LanguageOperator
         @agent = agent
         @tasks = tasks
         @config = default_config.merge(config)
+        # Pre-cache task lookup and timeout information for performance
+        @task_cache = build_task_cache
+        @task_timeouts = build_timeout_cache
         logger.debug('TaskExecutor initialized',
                      task_count: @tasks.size,
                      timeout_symbolic: @config[:timeout_symbolic],
@@ -104,21 +112,26 @@ module LanguageOperator
                     'task.inputs' => inputs.keys.map(&:to_s).join(','),
                     'task.max_retries' => max_retries
                   }) do
-          # Find task definition
-          task = @tasks[task_name.to_sym]
-          raise ArgumentError, "Task not found: #{task_name}. Available tasks: #{@tasks.keys.join(', ')}" unless task
+          # Fast task lookup using pre-built cache
+          task_name_sym = task_name.to_sym
+          task_info = @task_cache[task_name_sym]
+          raise ArgumentError, "Task not found: #{task_name}. Available tasks: #{@tasks.keys.join(', ')}" unless task_info
-          task_type = determine_task_type(task)
+          task = task_info[:definition]
+          task_type = task_info[:type]
-          # Determine timeout based on task type if not explicitly provided
-          timeout ||= task_timeout_for_type(task)
+          # Use cached timeout if not explicitly provided
+          timeout ||= @task_timeouts[task_name_sym]
-          logger.info('Executing task',
-                      task: task_name,
-                      type: task_type,
-                      timeout: timeout,
-                      max_retries: max_retries,
-                      inputs: summarize_values(inputs))
+          # Optimize logging - only log if debug level enabled or log_executions is true
+          if logger.logger.level <= ::Logger::DEBUG || @config[:log_executions]
+            logger.info('Executing task',
+                        task: task_name,
+                        type: task_type,
+                        timeout: timeout,
+                        max_retries: max_retries,
+                        inputs: summarize_values(inputs))
+          end
           # Add timeout to span attributes after it's determined
           OpenTelemetry::Trace.current_span&.set_attribute('task.timeout', timeout)
@@ -190,10 +203,46 @@ module LanguageOperator
           logger.info('Parsing neural task response',
                       task: task.name)
-          # Parse response within child span
+          # Parse response within child span with retry logic
           parsed_outputs = tracer.in_span('task_executor.parse_response') do |parse_span|
             record_parse_metadata(response_text, parse_span)
-            parse_neural_response(response_text, task)
+            begin
+              parse_neural_response(response_text, task)
+            rescue RuntimeError => e
+              # If parsing fails and this is a JSON parsing error, try one more time with clarified prompt
+              raise e unless e.message.include?('returned invalid JSON') && !defined?(@parsing_retry_attempted)
+              @parsing_retry_attempted = true
+              logger.warn('JSON parsing failed, retrying with clarified prompt',
+                          task: task.name,
+                          original_error: e.message,
+                          response_preview: response_text[0..300])
+              # Build retry prompt with clearer instructions
+              retry_prompt = build_parsing_retry_prompt(task, validated_inputs, response_text, e.message)
+              logger.info('Retrying LLM call with clarified prompt',
+                          task: task.name,
+                          retry_prompt_length: retry_prompt.length)
+              # Retry LLM call
+              retry_response = @agent.send_message(retry_prompt)
+              retry_response_text = retry_response.is_a?(String) ? retry_response : retry_response.content
+              logger.info('Parsing retry response',
+                          task: task.name,
+                          retry_response_length: retry_response_text.length)
+              # Try parsing the retry response
+              parse_neural_response(retry_response_text, task)
+            # Re-raise original error if not a JSON parsing error or already retried
+            ensure
+              # Reset retry flag for next task
+              @parsing_retry_attempted = nil
+            end
           end
           logger.info('Response parsed successfully',
@@ -293,13 +342,19 @@ module LanguageOperator
       def execute_parallel(tasks, in_threads: 4)
         require 'parallel'
+        # Capture current OpenTelemetry context before parallel execution
+        current_context = OpenTelemetry::Context.current
         logger.info('Executing tasks in parallel', count: tasks.size, threads: in_threads)
         results = Parallel.map(tasks, in_threads: in_threads) do |task_spec|
-          task_name = task_spec[:name]
-          task_inputs = task_spec[:inputs] || {}
+          # Restore OpenTelemetry context in worker thread
+          OpenTelemetry::Context.with_current(current_context) do
+            task_name = task_spec[:name]
+            task_inputs = task_spec[:inputs] || {}
-          execute_task(task_name, inputs: task_inputs)
+            execute_task(task_name, inputs: task_inputs)
+          end
         end
         logger.info('Parallel execution complete', results_count: results.size)
@@ -319,22 +374,41 @@ module LanguageOperator
       end
       # Summarize hash values for logging (truncate long strings)
+      # Optimized for performance with lazy computation
       #
       # @param hash [Hash] Hash to summarize
       # @return [Hash] Summarized hash with truncated values
       def summarize_values(hash)
         return {} unless hash.is_a?(Hash)
-        hash.transform_values do |v|
-          case v
-          when String
-            v.length > 100 ? "#{v[0..97]}... (#{v.length} chars)" : v
-          when Array
-            v.length > 5 ? "#{v.first(3).inspect}... (#{v.length} items)" : v.inspect
-          else
-            v.inspect
-          end
+        # OPTIMIZE: only create new hash if values need summarization
+        needs_summarization = false
+        result = {}
+        hash.each do |key, v|
+          summarized_value = case v
+                             when String
+                               if v.length > 100
+                                 needs_summarization = true
+                                 "#{v[0, 97]}... (#{v.length} chars)"
+                               else
+                                 v
+                               end
+                             when Array
+                               if v.length > 5
+                                 needs_summarization = true
+                                 "#{v.first(3).inspect}... (#{v.length} items)"
+                               else
+                                 v.inspect
+                               end
+                             else
+                               v.inspect
+                             end
+          result[key] = summarized_value
         end
+        # Return original if no summarization was needed (rare optimization)
+        needs_summarization ? result : hash
       end
       # Build prompt for neural task execution
@@ -371,6 +445,63 @@ module LanguageOperator
         prompt
       end
+      # Build retry prompt when JSON parsing fails
+      #
+      # @param task [TaskDefinition] The task definition
+      # @param inputs [Hash] Validated input parameters
+      # @param failed_response [String] The previous response that failed to parse
+      # @param error_message [String] The parsing error message
+      # @return [String] Prompt for LLM retry
+      def build_parsing_retry_prompt(task, inputs, failed_response, error_message)
+        prompt = "# Task: #{task.name} (RETRY - JSON Parsing Failed)\n\n"
+        prompt += "## Instructions\n#{task.instructions_text}\n\n"
+        if inputs.any?
+          prompt += "## Inputs\n"
+          inputs.each do |key, value|
+            prompt += "- #{key}: #{value.inspect}\n"
+          end
+          prompt += "\n"
+        end
+        prompt += "## Previous Response (Failed to Parse)\n"
+        prompt += "Your previous response caused a parsing error: #{error_message}\n"
+        prompt += "Previous response preview:\n```\n#{failed_response[0..500]}#{'...' if failed_response.length > 500}\n```\n\n"
+        prompt += "## Output Schema (CRITICAL)\n"
+        prompt += "You MUST return valid JSON with exactly these fields:\n"
+        task.outputs_schema.each do |key, type|
+          prompt += "- #{key} (#{type})\n"
+        end
+        prompt += "\n"
+        prompt += "## Response Format (CRITICAL)\n"
+        prompt += "IMPORTANT: Your response must be ONLY valid JSON. No other text.\n"
+        prompt += "Do NOT use [THINK] tags or any other text.\n"
+        prompt += "Do NOT include code blocks like ```json.\n"
+        prompt += "Return ONLY the JSON object, nothing else.\n"
+        prompt += "The JSON must match the output schema exactly.\n\n"
+        prompt += "Example correct format:\n"
+        prompt += "{\n"
+        task.outputs_schema.each_with_index do |(key, type), index|
+          value_example = case type
+                          when 'string' then '"example"'
+                          when 'integer' then '42'
+                          when 'number' then '3.14'
+                          when 'boolean' then 'true'
+                          when 'array' then '[]'
+                          when 'hash' then '{}'
+                          else '"value"'
+                          end
+          comma = index < task.outputs_schema.length - 1 ? ',' : ''
+          prompt += "  \"#{key}\": #{value_example}#{comma}\n"
+        end
+        prompt += "}\n"
+        prompt
+      end
       # Parse LLM response to extract output values
       #
       # @param response_text [String] LLM response
@@ -390,13 +521,30 @@ module LanguageOperator
         end
         # Strip thinking tags that some models add (e.g., [THINK]...[/THINK] or unclosed [THINK]...)
-        # First try to strip matched pairs, then strip any remaining unclosed [THINK] content
+        # First try to strip matched pairs, then strip unclosed [THINK] only if there's JSON after it
         logger.debug('Parsing neural response', task: task.name, response_length: response_text.length, response_start: response_text[0..100])
         cleaned_text = response_text.gsub(%r{\[THINK\].*?\[/THINK\]}m, '')
-                                    .gsub(/\[THINK\].*?(?=\{|$)/m, '')
+                                    .gsub(/\[THINK\].*?(?=\{)/m, '')
                                     .strip
+        # If cleaned text is empty or still contains unclosed [THINK], try more aggressive cleaning
+        if cleaned_text.empty? || cleaned_text.start_with?('[THINK]')
+          # Strip everything from [THINK] to end if no [/THINK] found
+          cleaned_text = response_text.gsub(/\[THINK\].*$/m, '').strip
+          # If still no JSON found, extract everything after the last [THINK] block
+          if cleaned_text.empty? && response_text.include?('{')
+            last_think = response_text.rindex('[THINK]')
+            if last_think
+              after_think = response_text[last_think..]
+              # Find first JSON-like structure after [THINK]
+              json_start = after_think.index('{')
+              cleaned_text = after_think[json_start..] if json_start
+            end
+          end
+        end
         logger.debug('After stripping THINK tags', cleaned_length: cleaned_text.length, cleaned_start: cleaned_text[0..100])
         # Try to extract JSON from response
@@ -405,9 +553,17 @@ module LanguageOperator
         json_text = if json_match
                       json_match[1]
                     else
-                      # Try to find raw JSON object
+                      # Try to find raw JSON object - be more aggressive about finding JSON
                       json_object_match = cleaned_text.match(/\{.*\}/m)
-                      json_object_match ? json_object_match[0] : cleaned_text
+                      if json_object_match
+                        json_object_match[0]
+                      elsif cleaned_text.include?('{')
+                        # Extract from first { to end of string (handles incomplete responses)
+                        json_start = cleaned_text.index('{')
+                        cleaned_text[json_start..]
+                      else
+                        cleaned_text
+                      end
                     end
         logger.debug('Extracted JSON text', json_length: json_text.length, json_start: json_text[0..100])
@@ -425,13 +581,23 @@ module LanguageOperator
         raise "Neural task '#{task.name}' returned invalid JSON: #{e.message}"
       end
-      # Recursively convert all hash keys to symbols
+      # Recursively convert all hash keys to symbols (optimized for performance)
       def deep_symbolize_keys(obj)
         case obj
         when Hash
-          obj.transform_keys(&:to_sym).transform_values { |v| deep_symbolize_keys(v) }
+          # OPTIMIZE: pre-allocate hash with correct size and avoid double iteration
+          result = {}
+          obj.each do |key, value|
+            result[key.to_sym] = deep_symbolize_keys(value)
+          end
+          result
         when Array
-          obj.map { |item| deep_symbolize_keys(item) }
+          # OPTIMIZE: pre-allocate array with correct size
+          result = Array.new(obj.size)
+          obj.each_with_index do |item, index|
+            result[index] = deep_symbolize_keys(item)
+          end
+          result
         else
           obj
         end
@@ -538,7 +704,11 @@ module LanguageOperator
         raise create_appropriate_error(task_name, last_error)
       end
-      # Execute a single attempt of a task with timeout
+      # Execute a single attempt of a task with timeout and error context preservation
+      #
+      # This method implements timeout handling that preserves original error context
+      # while maintaining error precedence hierarchy. Timeout errors always take
+      # precedence over any nested errors (including network errors).
       #
       # @param task [TaskDefinition] The task definition
       # @param task_name [Symbol] Name of the task
@@ -551,29 +721,63 @@ module LanguageOperator
         attempt_start = Time.now
         result = if timeout.positive?
-                   Timeout.timeout(timeout) do
-                     execute_task_implementation(task, inputs)
-                   end
+                   execute_with_timeout(task, task_name, inputs, timeout)
                  else
                    execute_task_implementation(task, inputs)
                  end
         execution_time = Time.now - attempt_start
-        logger.info('Task completed',
-                    task: task_name,
-                    attempt: attempt + 1,
-                    execution_time: execution_time.round(3),
-                    outputs: summarize_values(result))
+        # Optimize logging - only log if debug level enabled or log_executions is true
+        if logger.logger.level <= ::Logger::DEBUG || @config[:log_executions]
+          logger.info('Task completed',
+                      task: task_name,
+                      attempt: attempt + 1,
+                      execution_time: execution_time.round(3),
+                      outputs: summarize_values(result))
+        end
         result
+      end
+      # Execute task with timeout wrapper that preserves error context
+      #
+      # This method ensures that timeout errors always take precedence over
+      # any nested errors (e.g., network errors), solving the race condition
+      # between timeout detection and error classification.
+      #
+      # @param task [TaskDefinition] The task definition
+      # @param task_name [Symbol] Name of the task
+      # @param inputs [Hash] Input parameters
+      # @param timeout [Numeric] Timeout in seconds
+      # @return [Hash] Task outputs
+      # @raise [TaskTimeoutError] If execution times out (always takes precedence)
+      def execute_with_timeout(task, task_name, inputs, timeout)
+        attempt_start = Time.now
+        Timeout.timeout(timeout) do
+          execute_task_implementation(task, inputs)
+        end
       rescue Timeout::Error => e
+        # Timeout always wins - this solves the race condition
         execution_time = Time.now - attempt_start
         logger.warn('Task execution timed out',
                     task: task_name,
-                    attempt: attempt + 1,
                     timeout: timeout,
-                    execution_time: execution_time.round(3))
-        raise TaskTimeoutError.new(task_name, "timed out after #{timeout}s", e)
+                    execution_time: execution_time.round(3),
+                    timeout_precedence: 'timeout error takes precedence over any nested errors')
+        # Always wrap as TaskTimeoutError, preserving original timeout context
+        raise TaskTimeoutError.new(task_name, "timed out after #{timeout}s (execution_time: #{execution_time.round(3)}s)", e)
+      rescue *RETRYABLE_ERRORS => e
+        # Network errors that escape timeout handling (very rare)
+        # These occur outside the timeout window, so they're genuine network errors
+        logger.debug('Network error outside timeout window',
+                     task: task_name,
+                     error: e.class.name,
+                     message: e.message)
+        raise TaskNetworkError.new(task_name, "network error: #{e.message}", e)
       end
       # Execute the actual task implementation (neural or symbolic)
@@ -613,27 +817,51 @@ module LanguageOperator
       # @param error [Exception] The error that occurred
       # @return [Boolean] Whether the error should be retried
       def retryable_error?(error)
-        RETRYABLE_ERRORS.any? { |error_class| error.is_a?(error_class) }
+        case error
+        when TaskNetworkError
+          # Network errors wrapped in TaskNetworkError are retryable
+          true
+        when TaskTimeoutError, TaskValidationError
+          # Timeout and validation errors are never retryable
+          false
+        when TaskExecutionError
+          # Check the original error for retryability
+          error.original_error ? retryable_error?(error.original_error) : false
+        when RuntimeError
+          # JSON parsing errors from neural tasks are retryable
+          error.message.include?('returned invalid JSON')
+        else
+          # Check against the standard retryable error list
+          RETRYABLE_ERRORS.any? { |error_class| error.is_a?(error_class) }
+        end
       end
-      # Categorize error for logging and operator integration
+      # Categorize error for logging and operator integration with precedence hierarchy
+      #
+      # Error precedence (highest to lowest):
+      # 1. Timeout errors (always win, even if wrapping network errors)
+      # 2. Validation errors (argument/input validation failures)
+      # 3. Network errors (connection, socket, DNS issues)
+      # 4. Execution errors (general task execution failures)
+      # 5. System errors (unexpected/unknown errors)
       #
       # @param error [Exception] The error that occurred
       # @return [Symbol] Error category
       def categorize_error(error)
-        case error
-        when ArgumentError, TaskValidationError
-          :validation
-        when Timeout::Error, TaskTimeoutError
-          :timeout
-        when TaskExecutionError
-          # Check the original error for categorization
-          error.original_error ? categorize_error(error.original_error) : :execution
-        when *RETRYABLE_ERRORS
-          :network
-        else
-          :execution
-        end
+        # Precedence Level 1: Timeout errors always win
+        return :timeout if error.is_a?(Timeout::Error) || error.is_a?(TaskTimeoutError)
+        # Precedence Level 2: Validation errors
+        return :validation if error.is_a?(ArgumentError) || error.is_a?(TaskValidationError)
+        # For wrapped errors, check original error but preserve timeout precedence
+        return categorize_error(error.original_error) if error.is_a?(TaskExecutionError) && error.original_error
+        # Precedence Level 3: Network errors
+        return :network if error.is_a?(TaskNetworkError) || RETRYABLE_ERRORS.any? { |err_class| error.is_a?(err_class) }
+        # Precedence Level 4: General execution errors
+        :execution
       end
       # Calculate retry delay with exponential backoff
@@ -645,19 +873,24 @@ module LanguageOperator
         [delay, @config[:retry_delay_max]].min
       end
-      # Create appropriate error type based on original error
+      # Create appropriate error type based on original error with precedence hierarchy
       #
       # @param task_name [Symbol] Name of the task
       # @param original_error [Exception] The original error
       # @return [TaskExecutionError] Appropriate error type
       def create_appropriate_error(task_name, original_error)
         case original_error
-        when TaskTimeoutError
+        when TaskTimeoutError, TaskValidationError, TaskNetworkError
+          # Already wrapped in appropriate type
           original_error
         when Timeout::Error
-          TaskTimeoutError.new(task_name, 'timed out', original_error)
+          # Always wrap timeout errors, preserving original context
+          TaskTimeoutError.new(task_name, "timed out after timeout (original: #{original_error.message})", original_error)
         when ArgumentError
           TaskValidationError.new(task_name, original_error.message, original_error)
+        when *RETRYABLE_ERRORS
+          # Wrap network errors for clear categorization
+          TaskNetworkError.new(task_name, "network error: #{original_error.message}", original_error)
         else
           TaskExecutionError.new(task_name, original_error.message, original_error)
         end
@@ -683,6 +916,56 @@ module LanguageOperator
                      retryable: retryable_error?(error),
                      backtrace: error.backtrace&.first(5))
       end
+      # Build task lookup cache for O(1) task resolution
+      #
+      # Pre-computes task metadata to avoid repeated type determinations
+      # and provide fast hash-based lookup instead of linear search.
+      #
+      # @return [Hash] Cache mapping task names to metadata
+      def build_task_cache
+        cache = {}
+        @tasks.each do |name, task|
+          # Guard against test doubles that don't respond to task methods
+          cache[name] = if task.respond_to?(:neural?) && task.respond_to?(:symbolic?)
+                          {
+                            definition: task,
+                            type: determine_task_type(task),
+                            neural: task.neural?,
+                            symbolic: task.symbolic?
+                          }
+                        else
+                          # Fallback for test doubles or invalid task objects
+                          {
+                            definition: task,
+                            type: 'unknown',
+                            neural: false,
+                            symbolic: false
+                          }
+                        end
+        end
+        cache
+      end
+      # Build timeout cache for O(1) timeout resolution
+      #
+      # Pre-computes timeouts for all tasks to avoid repeated calculations
+      # during task execution hot path.
+      #
+      # @return [Hash] Cache mapping task names to timeout values
+      def build_timeout_cache
+        cache = {}
+        @tasks.each do |name, task|
+          # Guard against test doubles that don't respond to task methods
+          cache[name] = if task.respond_to?(:neural?) && task.respond_to?(:symbolic?)
+                          task_timeout_for_type(task)
+                        else
+                          # Fallback timeout for test doubles or invalid task objects
+                          @config[:timeout_symbolic]
+                        end
+        end
+        cache
+      end
     end
   end
 end