RubyGems - sage-rails - Versions diffs - 0.0.3 - Mend

sage-rails 0.0.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

checksums.yaml +7 -0
data/README.md +202 -0
data/app/assets/images/chevron-down-zinc-500.svg +1 -0
data/app/assets/images/chevron-right.svg +1 -0
data/app/assets/images/loading.svg +4 -0
data/app/assets/images/sage/chevron-down-zinc-500.svg +1 -0
data/app/assets/images/sage/chevron-right.svg +1 -0
data/app/assets/images/sage/loading.svg +4 -0
data/app/assets/javascripts/sage/application.js +18 -0
data/app/assets/stylesheets/sage/application.css +308 -0
data/app/controllers/sage/actions_controller.rb +5 -0
data/app/controllers/sage/application_controller.rb +4 -0
data/app/controllers/sage/base_controller.rb +10 -0
data/app/controllers/sage/checks_controller.rb +65 -0
data/app/controllers/sage/dashboards_controller.rb +130 -0
data/app/controllers/sage/queries/messages_controller.rb +62 -0
data/app/controllers/sage/queries_controller.rb +596 -0
data/app/helpers/sage/application_helper.rb +30 -0
data/app/helpers/sage/queries_helper.rb +23 -0
data/app/javascript/controllers/element_removal_controller.js +7 -0
data/app/javascript/sage/controllers/clipboard_controller.js +26 -0
data/app/javascript/sage/controllers/dashboard_controller.js +132 -0
data/app/javascript/sage/controllers/reverse_infinite_scroll_controller.js +146 -0
data/app/javascript/sage/controllers/search_controller.js +47 -0
data/app/javascript/sage/controllers/select_controller.js +215 -0
data/app/javascript/sage.js +19 -0
data/app/jobs/sage/application_job.rb +4 -0
data/app/jobs/sage/process_report_job.rb +80 -0
data/app/mailers/sage/application_mailer.rb +6 -0
data/app/models/sage/application_record.rb +5 -0
data/app/models/sage/message.rb +8 -0
data/app/schemas/sage/report_response_schema.rb +8 -0
data/app/views/layouts/application.html.erb +34 -0
data/app/views/layouts/sage/application.html.erb +94 -0
data/app/views/sage/checks/_form.html.erb +81 -0
data/app/views/sage/checks/_search.html.erb +8 -0
data/app/views/sage/checks/edit.html.erb +10 -0
data/app/views/sage/checks/index.html.erb +58 -0
data/app/views/sage/checks/new.html.erb +8 -0
data/app/views/sage/dashboards/_form.html.erb +50 -0
data/app/views/sage/dashboards/_search.html.erb +8 -0
data/app/views/sage/dashboards/index.html.erb +58 -0
data/app/views/sage/dashboards/new.html.erb +8 -0
data/app/views/sage/dashboards/show.html.erb +58 -0
data/app/views/sage/messages/_form.html.erb +14 -0
data/app/views/sage/queries/_caching.html.erb +17 -0
data/app/views/sage/queries/_form.html.erb +72 -0
data/app/views/sage/queries/_input.html.erb +17 -0
data/app/views/sage/queries/_message.html.erb +25 -0
data/app/views/sage/queries/_message.turbo_stream.erb +10 -0
data/app/views/sage/queries/_new_form.html.erb +43 -0
data/app/views/sage/queries/_run.html.erb +232 -0
data/app/views/sage/queries/_search.html.erb +8 -0
data/app/views/sage/queries/_statement_box.html.erb +241 -0
data/app/views/sage/queries/_streaming_message.html.erb +14 -0
data/app/views/sage/queries/create.turbo_stream.erb +114 -0
data/app/views/sage/queries/edit.html.erb +48 -0
data/app/views/sage/queries/index.html.erb +59 -0
data/app/views/sage/queries/messages/create.turbo_stream.erb +22 -0
data/app/views/sage/queries/messages/index.html.erb +44 -0
data/app/views/sage/queries/messages/index.turbo_stream.erb +15 -0
data/app/views/sage/queries/new.html.erb +195 -0
data/app/views/sage/queries/run.html.erb +1 -0
data/app/views/sage/queries/run.turbo_stream.erb +3 -0
data/app/views/sage/queries/show.html.erb +49 -0
data/app/views/sage/queries/table_schema.html.erb +77 -0
data/app/views/sage/shared/_navigation.html.erb +26 -0
data/app/views/sage/shared/_overlay.html.erb +11 -0
data/config/importmap.rb +11 -0
data/config/initializers/pagy.rb +2 -0
data/config/initializers/ransack.rb +152 -0
data/config/routes.rb +31 -0
data/lib/generators/sage/USAGE +13 -0
data/lib/generators/sage/install/install_generator.rb +128 -0
data/lib/generators/sage/install/templates/sage.rb +22 -0
data/lib/sage/database_schema_context.rb +56 -0
data/lib/sage/engine.rb +260 -0
data/lib/sage/model_scopes_context.rb +185 -0
data/lib/sage/report_processor.rb +263 -0
data/lib/sage/version.rb +3 -0
data/lib/sage.rb +25 -0
data/lib/tasks/sage_tasks.rake +4 -0
metadata +245 -0

data/lib/sage/model_scopes_context.rb ADDED Viewed

@@ -0,0 +1,185 @@
+module Sage
+  class ModelScopesContext
+    def initialize
+      # Nothing to initialize for now
+    end
+    def self.call
+      new.build_context
+    end
+    def build_context
+      context_parts = []
+      context_parts << "\n\n## AVAILABLE SCOPES → SQL MAPPINGS\n"
+      context_parts << "CRITICAL: Use these scopes to understand how to query the data!"
+      context_parts << "Each scope name shows the SQL conditions it generates."
+      context_parts << "When a user's request matches a scope's intent, use that scope's SQL pattern.\n"
+      # Get all ActiveRecord models from the host application
+      # Safely attempt to eager load, but continue if there are issues
+      begin
+        Rails.application.eager_load! if Rails.env.development?
+      rescue Zeitwerk::NameError => e
+        Rails.logger.warn "Could not eager load all files: #{e.message}"
+      end
+      models_with_scopes = collect_models_with_scopes
+      # Format the model scopes nicely
+      if models_with_scopes.any?
+        models_with_scopes.each do |model_info|
+          context_parts << "\n### #{model_info[:name]} (table: `#{model_info[:table]}`)"
+          context_parts << "Scopes and their SQL equivalents:"
+          model_info[:scopes].each do |scope|
+            context_parts << scope
+          end
+        end
+      end
+      context_parts.join("\n")
+    end
+    private
+    def collect_models_with_scopes
+      models_with_scopes = []
+      # Find all model files in the app/models directory
+      model_files = Dir.glob(Rails.root.join("app/models/**/*.rb"))
+      model_files.each do |file_path|
+        # Skip concern files and other non-model files
+        next if file_path.include?("/concerns/")
+        # Read the file content
+        file_content = File.read(file_path)
+        # Extract model name from file path
+        model_name = File.basename(file_path, ".rb").camelize
+        # Find all scope definitions using regex
+        # Match various scope patterns:
+        # scope :active, -> { where(active: true) }
+        # scope :recent, lambda { where("created_at > ?", 1.week.ago) }
+        # scope :by_role, ->(role) { where(role: role) }
+        scope_patterns = [
+          # Pattern 1: scope :name, -> { ... } or -> (...) { ... }
+          /scope\s+:(\w+)\s*,\s*->\s*(?:\([^)]*\))?\s*\{([^{}]*(?:\{[^{}]*\}[^{}]*)*)\}/m,
+          # Pattern 2: scope :name, lambda { ... }
+          /scope\s+:(\w+)\s*,\s*lambda\s*(?:\{([^{}]*(?:\{[^{}]*\}[^{}]*)*)\})/m,
+          # Pattern 3: Simple one-liner scopes
+          /scope\s+:(\w+)\s*,\s*(.+?)$/
+        ]
+        scope_matches = []
+        scope_patterns.each do |pattern|
+          matches = file_content.scan(pattern)
+          matches.each do |match|
+            scope_name = match[0]
+            scope_body = match[1] || ""
+            # Avoid duplicate entries
+            unless scope_matches.any? { |s| s[0] == scope_name }
+              scope_matches << [scope_name, scope_body]
+            end
+          end
+        end
+        if scope_matches.any?
+          # Try to get the actual model class and table name
+          begin
+            model_class = model_name.constantize
+            table_name = model_class.table_name rescue model_name.tableize
+          rescue => e
+            table_name = model_name.tableize
+            model_class = nil
+          end
+          model_info = {
+            name: model_name,
+            table: table_name,
+            scopes: []
+          }
+          scope_matches.each do |match|
+            scope_name = match[0]
+            scope_body = match[1]
+            if scope_body
+              # Try to extract SQL-like patterns from the scope body
+              # Look for where conditions, joins, etc.
+              sql_hint = extract_sql_from_scope_body(scope_body)
+              model_info[:scopes] << "  • `#{scope_name}` → SQL: `#{sql_hint}`"
+            else
+              # Scope might be using a lambda with parameters or complex logic
+              model_info[:scopes] << "  • `#{scope_name}` → (check model file for implementation)"
+            end
+          end
+          models_with_scopes << model_info if model_info[:scopes].any?
+        end
+      end
+      models_with_scopes
+    end
+    def extract_sql_from_scope_body(scope_body)
+      # Clean up the scope body
+      cleaned = scope_body.strip
+      sql_parts = []
+      # Extract WHERE conditions
+      if cleaned =~ /where\s*\(["']([^"']+)["'](?:,\s*(.+?))?\)/
+        # String SQL with potential parameters
+        sql_parts << "WHERE #{$1}"
+      elsif cleaned =~ /where\s*\(([^)]+)\)/
+        # Hash or conditions
+        where_conditions = $1.strip
+        # Convert Ruby hash syntax to SQL-like
+        where_conditions = where_conditions.gsub(/(\w+):\s*(\w+)/, '\1 = \2')
+        where_conditions = where_conditions.gsub(/(\w+):\s*["']([^"']+)["']/, '\1 = "\2"')
+        where_conditions = where_conditions.gsub(/(\w+):\s*(true|false|nil)/, '\1 = \2')
+        sql_parts << "WHERE #{where_conditions}"
+      elsif cleaned =~ /where\.not\s*\(([^)]+)\)/
+        # WHERE NOT conditions
+        not_conditions = $1.strip
+        not_conditions = not_conditions.gsub(/(\w+):\s*/, '\1 != ')
+        sql_parts << "WHERE NOT (#{not_conditions})"
+      end
+      # Extract JOINs
+      if cleaned =~ /joins?\s*\(:?(\w+)\)/
+        sql_parts << "JOIN #{$1}"
+      elsif cleaned =~ /includes?\s*\(:?(\w+)\)/
+        sql_parts << "LEFT JOIN #{$1}"
+      end
+      # Extract ORDER
+      if cleaned =~ /order\s*\(["']([^"']+)["']\)/
+        sql_parts << "ORDER BY #{$1}"
+      elsif cleaned =~ /order\s*\(([^)]+)\)/
+        order_clause = $1.strip
+        order_clause = order_clause.gsub(/(\w+):\s*:?(asc|desc)/i, '\1 \2')
+        sql_parts << "ORDER BY #{order_clause}"
+      end
+      # Extract LIMIT
+      if cleaned =~ /limit\s*\((\d+)\)/
+        sql_parts << "LIMIT #{$1}"
+      end
+      # If we found SQL parts, join them
+      if sql_parts.any?
+        sql_parts.join(" ")
+      else
+        # Check if it's a simple scope referencing another scope
+        if cleaned =~ /^(\w+)$/
+          "(uses #{$1} scope)"
+        else
+          # Return a truncated version if we can't parse it
+          cleaned.length > 60 ? "#{cleaned[0..60]}..." : cleaned
+        end
+      end
+    end
+  end
+end

data/lib/sage/report_processor.rb ADDED Viewed

@@ -0,0 +1,263 @@
+require "ruby_llm"
+require_relative "database_schema_context"
+require_relative "model_scopes_context"
+module Sage
+  class ReportProcessor
+    include ActionView::RecordIdentifier
+    attr_reader :query, :prompt, :stream_target_id, :raw_response_content
+    def initialize(query:, prompt:, stream_target_id:)
+      @query = query
+      @prompt = prompt
+      @stream_target_id = stream_target_id
+    end
+    def process
+      response = generate_llm_response
+      Rails.logger.info "LLM Response: #{response.inspect}"
+      Rails.logger.info "LLM Response content: #{response.content.inspect}"
+      @raw_response_content = response.content
+      parsed_response = parse_response(response)
+      Rails.logger.info "Parsed response: #{parsed_response.inspect}"
+      {
+        summary: parsed_response[:summary],
+        sql: parsed_response[:sql]
+      }
+    end
+    def system_prompt
+      build_system_prompt
+    end
+    def database_schema_context
+      Sage::DatabaseSchemaContext.new.build_context
+    end
+    def model_scopes_context
+      Sage::ModelScopesContext.new.build_context
+    end
+    private
+    def generate_llm_response
+      RubyLLM.chat
+        .with_instructions(system_prompt)
+        .with_schema(Sage::ReportResponseSchema)
+        .ask(prompt + ". #{structured_output}")
+    end
+    def parse_response(response)
+      if response.content.is_a?(Hash) && response.content.key?("sql") && response.content.key?("summary")
+        # Direct hash with sql and summary keys
+        {
+          summary: response.content["summary"],
+          sql: response.content["sql"]
+        }
+      elsif response.content.is_a?(String)
+        parse_json_response(response.content)
+      else
+        # Fallback for unexpected response format
+        Rails.logger.warn "Unexpected response format: #{response.content.class}"
+        {
+          summary: "Unexpected response format. Please try again.",
+          sql: nil
+        }
+      end
+    end
+    def parse_json_response(content)
+      begin
+        # First attempt: direct JSON parsing
+        parsed_response = JSON.parse(content)
+        {
+          summary: parsed_response["summary"],
+          sql: parsed_response["sql"]
+        }
+      rescue JSON::ParserError
+        # Second attempt: fix malformed JSON by properly escaping newlines within quoted strings
+        begin
+          fixed_json = content.gsub(/"([^"]*)"/) do |match|
+            # Escape newlines, tabs, and other control characters within the quoted string
+            match.gsub(/\n/, '\\n').gsub(/\t/, '\\t').gsub(/\r/, '\\r')
+          end
+          parsed_response = JSON.parse(fixed_json)
+          {
+            summary: parsed_response["summary"],
+            sql: parsed_response["sql"]
+          }
+        rescue JSON::ParserError => e
+          # Final fallback: extract using regex patterns
+          Rails.logger.warn "Failed to parse JSON even after fixing newlines: #{e.message}"
+          # Extract SQL value (everything between "sql": " and the closing quote before comma or brace)
+          sql_match = content.match(/"sql"\s*:\s*"((?:[^"\\]|\\.)*)"/m)
+          sql = sql_match[1] if sql_match
+          # Extract summary value
+          summary_match = content.match(/"summary"\s*:\s*"((?:[^"\\]|\\.)*)"/m)
+          summary = summary_match[1] if summary_match
+          if sql.nil? || summary.nil?
+            Rails.logger.error "Could not extract sql and summary from response"
+            summary = "Failed to parse response. Please try again." if summary.nil?
+          end
+          {
+            summary: summary || "Failed to parse response. Please try again.",
+            sql: sql
+          }
+        end
+      end
+    end
+    def structured_output
+      <<~INSTRUCTION
+        Return as a JSON object with sql and summary keys and no additional commentary.
+      INSTRUCTION
+    end
+    def build_system_prompt
+      prompt_parts = []
+      # Detect database type
+      database_type = detect_database_type
+      # Base instruction optimized for LLM
+      prompt_parts << <<~INSTRUCTION
+        You are an expert SQL analyst helping users iteratively refine their database queries.
+        DATABASE TYPE: #{database_type}
+        Your task:
+        1. Analyze the user's natural language request
+        2. Determine if you should:
+           a) Modify the most recent SQL query (from Previous Context if available)
+           b) Modify the baseline query (from Current Query section)
+           c) Create an entirely new query if the request is unrelated
+        3. Generate the appropriate SQL query for #{database_type}
+        4. Provide a clear explanation of what changed and why
+        Response format (STRICT JSON):
+        {
+          "summary": "Explain what this query does and what changes were made from the previous version (if any)",
+          "sql": "The complete SQL query statement"
+        }
+        CLARIFICATION REQUIRED: If you're unsure how to query based on certain criteria:
+        - Return a summary asking for clarification
+        - Set sql to null
+        - Example: {"summary": "I need clarification on what you mean by 'activated accounts'. Do you mean users with a specific status, users who have logged in, or users with a certain field set?", "sql": null}
+        IMPORTANT:#{' '}
+        - Always return the COMPLETE query, not just the changes
+        - When producing SQL, exclude ALL comments and extraneous characters - the SQL will be immediately executed against a database
+        - Format SQL to be human readable, per SQL writing best practices, but still executable
+        - When modifying existing queries, preserve the original intent while incorporating the requested changes
+        - If the user asks for adjustments (e.g., "add a filter", "group by X", "sort differently"), modify the most recent query
+        - If the user asks something completely new, create a fresh query
+        Guidelines:
+        - Write efficient, readable SQL using #{database_type}-specific syntax
+        - Use meaningful table aliases and column names
+        - Do NOT include comments in SQL queries - they will be executed directly
+        - Prefer JOINs over subqueries when appropriate
+        - Consider performance implications for large datasets
+        - ROLE HANDLING: When dealing with "roles" (e.g., "candidates", "employers", synonyms of "users"):
+          * ALWAYS check the users model/table/scopes first to understand how roles are established
+          * Look for role-related columns, scopes, or associations in the users table
+          * Map role-related terms to the actual implementation in the database
+        - SCOPE PRIORITIZATION: ALWAYS prioritize matching user requests to available model scopes
+          * FIRST check if any existing scopes match the user's intent
+          * Use scopes as the PRIMARY source for query patterns
+          * Only write custom SQL when no appropriate scope exists
+          * Analyze the intent behind user queries and map them to corresponding scopes
+          * When users describe filters or conditions, identify matching scope patterns
+          * Example: if user asks for "recent items", look for scopes like "recent", "latest", or time-based scopes
+        - JSONB COLUMNS: NEVER guess at JSONB column keys or values
+          * Only query JSONB fields that are explicitly defined in scopes or schema documentation
+          * If JSONB structure is unknown, do NOT attempt to query specific keys
+          * Avoid assumptions about JSONB content unless explicitly documented
+        - PRESENCE CHECKS: For presence/existence checks:
+          * Use "IS NOT NULL" or "IS NULL" for presence/absence checks
+          * Avoid using literal values like 'true' or specific strings unless explicitly required
+          * For boolean presence, check for NOT NULL rather than = true
+          * Example: Use "activated_at IS NOT NULL" instead of "activated = 'true'"
+        - Ensure all table and column names match the schema exactly
+        - Handle NULL values appropriately (prefer IS NULL/IS NOT NULL for presence checks)
+        - Use proper data type casting when needed
+        - Follow #{database_type} best practices and syntax conventions
+        - NEVER make assumptions about data structure - use only what's documented in schema and scopes
+      INSTRUCTION
+      # Add current query as baseline context
+      if query.statement.present?
+        prompt_parts << "\n\n## CURRENT QUERY (BASELINE)\n"
+        prompt_parts << "The currently saved query that we're working with:\n"
+        prompt_parts << "```sql\n#{query.statement}\n```"
+        prompt_parts << "\nThis is the baseline query. You may modify or completely replace it based on the user's request.\n"
+      end
+      # Add latest message as context
+      latest_message = query.messages.order(:created_at).last
+      if latest_message
+        prompt_parts << "\n\n## PREVIOUS CONTEXT\n"
+        prompt_parts << "The most recent message from this conversation:\n"
+        prompt_parts << "\nPrevious response: #{latest_message.body}" if latest_message.body.present?
+        prompt_parts << "\nPrevious SQL: #{latest_message.statement}" if latest_message.statement.present?
+        prompt_parts << "\n\nConsider this context when generating your response.\n"
+      end
+      # Add database schema
+      schema_context = database_schema_context
+      prompt_parts << schema_context if schema_context.present?
+      # Add model scopes from host application
+      scopes_context = model_scopes_context
+      prompt_parts << scopes_context if scopes_context.present?
+      prompt_parts << "\n\n## QUERY GENERATION RULES"
+      prompt_parts << "1. Match table and column names EXACTLY as shown in the schema"
+      prompt_parts << "2. NO COMMENTS OR NEWLINES in SQL - output will be executed directly against database"
+      prompt_parts << "3. SCOPE FIRST: ALWAYS prioritize using available scopes over custom SQL"
+      prompt_parts << "   - Check ALL available scopes before writing custom conditions"
+      prompt_parts << "   - Map user language directly to scope names when possible"
+      prompt_parts << "4. JSONB HANDLING: NEVER guess at JSONB structure"
+      prompt_parts << "   - Only use JSONB keys that are explicitly documented in scopes or schema"
+      prompt_parts << "   - If unsure about JSONB structure, avoid querying it"
+      prompt_parts << "5. PRESENCE/ABSENCE CHECKS:"
+      prompt_parts << "   - Use IS NOT NULL for presence (not = 'true' or = true)"
+      prompt_parts << "   - Use IS NULL for absence"
+      prompt_parts << "   - Example: 'activated users' → 'activated_at IS NOT NULL'"
+      prompt_parts << "6. ROLE HANDLING: When users mention roles like 'candidates' or 'employers':"
+      prompt_parts << "   - Check the users table/model/scopes first to understand role implementation"
+      prompt_parts << "   - Map role terms to actual database structure (columns, associations, etc.)"
+      prompt_parts << "7. Generate ONE query that best answers the user's request"
+      prompt_parts << "8. NEVER make assumptions - use only documented schema and scopes"
+      prompt_parts.join("\n")
+    end
+    def detect_database_type
+      adapter_name = ActiveRecord::Base.connection.adapter_name.downcase
+      case adapter_name
+      when /postgresql/, /postgis/
+        "PostgreSQL"
+      when /mysql/, /mysql2/
+        "MySQL"
+      when /sqlite/
+        "SQLite3"
+      when /sqlserver/, /mssql/
+        "SQL Server"
+      when /oracle/
+        "Oracle"
+      else
+        adapter_name.capitalize
+      end
+    end
+  end
+end

data/lib/sage/version.rb ADDED Viewed

@@ -0,0 +1,3 @@
+module Sage
+  VERSION = "0.0.3"
+end

data/lib/sage.rb ADDED Viewed

@@ -0,0 +1,25 @@
+require "sage/version"
+require "sage/engine"
+require "blazer"
+require "pagy"
+module Sage
+  class << self
+    attr_accessor :configuration
+  end
+  def self.configure
+    self.configuration ||= Configuration.new
+    yield(configuration)
+  end
+  class Configuration
+    attr_accessor :anthropic_api_key, :anthropic_model, :open_ai_key, :open_ai_model, :provider
+    def initialize
+      @provider = :anthropic
+      @anthropic_model = "claude-3-opus-20240229"
+      @open_ai_model = "gpt-4"
+    end
+  end
+end

data/lib/tasks/sage_tasks.rake ADDED Viewed

@@ -0,0 +1,4 @@
+# desc "Explaining what the task does"
+# task :sage do
+#   # Task goes here
+# end