RubyGems - parse-stack-next - Versions diffs - 4.5.0 - Mend

parse-stack-next 4.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (178) hide show

checksums.yaml +7 -0
data/.bundle/config +2 -0
data/.env.sample +112 -0
data/.env.test +10 -0
data/.github/workflows/ruby.yml +36 -0
data/.gitignore +49 -0
data/.ruby-version +1 -0
data/.solargraph.yml +22 -0
data/CHANGELOG.md +5816 -0
data/Gemfile +30 -0
data/Gemfile.lock +175 -0
data/LICENSE.txt +23 -0
data/Makefile +63 -0
data/README.md +5655 -0
data/Rakefile +573 -0
data/bin/console +38 -0
data/bin/parse-console +136 -0
data/bin/server +17 -0
data/bin/setup +7 -0
data/config/parse-config.json +12 -0
data/docs/TEST_SERVER.md +271 -0
data/docs/_config.yml +1 -0
data/docs/mcp_guide.md +3484 -0
data/docs/mongodb_direct_guide.md +1348 -0
data/docs/mongodb_index_optimization_guide.md +631 -0
data/examples/transaction_example.rb +219 -0
data/lib/parse/acl_scope.rb +728 -0
data/lib/parse/agent/cancellation_token.rb +80 -0
data/lib/parse/agent/constraint_translator.rb +480 -0
data/lib/parse/agent/describe.rb +420 -0
data/lib/parse/agent/errors.rb +133 -0
data/lib/parse/agent/mcp_client.rb +557 -0
data/lib/parse/agent/mcp_dispatcher.rb +1023 -0
data/lib/parse/agent/mcp_rack_app.rb +1143 -0
data/lib/parse/agent/mcp_server.rb +376 -0
data/lib/parse/agent/metadata_audit.rb +259 -0
data/lib/parse/agent/metadata_dsl.rb +733 -0
data/lib/parse/agent/metadata_registry.rb +794 -0
data/lib/parse/agent/pipeline_validator.rb +82 -0
data/lib/parse/agent/prompts.rb +351 -0
data/lib/parse/agent/rate_limiter.rb +158 -0
data/lib/parse/agent/relation_graph.rb +162 -0
data/lib/parse/agent/result_formatter.rb +453 -0
data/lib/parse/agent/tools.rb +5489 -0
data/lib/parse/agent.rb +3249 -0
data/lib/parse/api/aggregate.rb +79 -0
data/lib/parse/api/all.rb +26 -0
data/lib/parse/api/analytics.rb +18 -0
data/lib/parse/api/batch.rb +33 -0
data/lib/parse/api/cloud_functions.rb +58 -0
data/lib/parse/api/config.rb +125 -0
data/lib/parse/api/files.rb +29 -0
data/lib/parse/api/hooks.rb +117 -0
data/lib/parse/api/objects.rb +146 -0
data/lib/parse/api/path_segment.rb +75 -0
data/lib/parse/api/push.rb +20 -0
data/lib/parse/api/schema.rb +49 -0
data/lib/parse/api/server.rb +50 -0
data/lib/parse/api/sessions.rb +24 -0
data/lib/parse/api/users.rb +250 -0
data/lib/parse/atlas_search/index_manager.rb +353 -0
data/lib/parse/atlas_search/result.rb +204 -0
data/lib/parse/atlas_search/search_builder.rb +604 -0
data/lib/parse/atlas_search/session.rb +253 -0
data/lib/parse/atlas_search.rb +995 -0
data/lib/parse/client/authentication.rb +97 -0
data/lib/parse/client/batch.rb +234 -0
data/lib/parse/client/body_builder.rb +240 -0
data/lib/parse/client/caching.rb +203 -0
data/lib/parse/client/logging.rb +293 -0
data/lib/parse/client/profiling.rb +181 -0
data/lib/parse/client/protocol.rb +91 -0
data/lib/parse/client/request.rb +233 -0
data/lib/parse/client/response.rb +208 -0
data/lib/parse/client.rb +1104 -0
data/lib/parse/clp_scope.rb +361 -0
data/lib/parse/live_query/circuit_breaker.rb +256 -0
data/lib/parse/live_query/client.rb +1001 -0
data/lib/parse/live_query/configuration.rb +224 -0
data/lib/parse/live_query/event.rb +115 -0
data/lib/parse/live_query/event_queue.rb +272 -0
data/lib/parse/live_query/health_monitor.rb +214 -0
data/lib/parse/live_query/logging.rb +149 -0
data/lib/parse/live_query/subscription.rb +294 -0
data/lib/parse/live_query.rb +163 -0
data/lib/parse/lookup_rewriter.rb +445 -0
data/lib/parse/model/acl.rb +968 -0
data/lib/parse/model/associations/belongs_to.rb +275 -0
data/lib/parse/model/associations/collection_proxy.rb +435 -0
data/lib/parse/model/associations/has_many.rb +597 -0
data/lib/parse/model/associations/has_one.rb +158 -0
data/lib/parse/model/associations/pointer_collection_proxy.rb +134 -0
data/lib/parse/model/associations/relation_collection_proxy.rb +177 -0
data/lib/parse/model/bytes.rb +62 -0
data/lib/parse/model/classes/audience.rb +262 -0
data/lib/parse/model/classes/installation.rb +363 -0
data/lib/parse/model/classes/job_schedule.rb +153 -0
data/lib/parse/model/classes/job_status.rb +264 -0
data/lib/parse/model/classes/product.rb +75 -0
data/lib/parse/model/classes/push_status.rb +263 -0
data/lib/parse/model/classes/role.rb +751 -0
data/lib/parse/model/classes/session.rb +201 -0
data/lib/parse/model/classes/user.rb +943 -0
data/lib/parse/model/clp.rb +544 -0
data/lib/parse/model/core/actions.rb +1268 -0
data/lib/parse/model/core/builder.rb +139 -0
data/lib/parse/model/core/create_lock.rb +386 -0
data/lib/parse/model/core/describe.rb +382 -0
data/lib/parse/model/core/enhanced_change_tracking.rb +159 -0
data/lib/parse/model/core/errors.rb +38 -0
data/lib/parse/model/core/fetching.rb +566 -0
data/lib/parse/model/core/field_guards.rb +220 -0
data/lib/parse/model/core/indexing.rb +382 -0
data/lib/parse/model/core/parse_reference.rb +407 -0
data/lib/parse/model/core/properties.rb +809 -0
data/lib/parse/model/core/querying.rb +491 -0
data/lib/parse/model/core/schema.rb +202 -0
data/lib/parse/model/core/search_indexing.rb +174 -0
data/lib/parse/model/date.rb +88 -0
data/lib/parse/model/email.rb +213 -0
data/lib/parse/model/file.rb +527 -0
data/lib/parse/model/geojson.rb +271 -0
data/lib/parse/model/geopoint.rb +261 -0
data/lib/parse/model/model.rb +260 -0
data/lib/parse/model/object.rb +2068 -0
data/lib/parse/model/phone.rb +520 -0
data/lib/parse/model/pointer.rb +443 -0
data/lib/parse/model/polygon.rb +406 -0
data/lib/parse/model/push.rb +975 -0
data/lib/parse/model/shortnames.rb +8 -0
data/lib/parse/model/time_zone.rb +141 -0
data/lib/parse/model/validations/uniqueness_validator.rb +97 -0
data/lib/parse/model/validations.rb +96 -0
data/lib/parse/mongodb.rb +2300 -0
data/lib/parse/pipeline_security.rb +554 -0
data/lib/parse/query/constraint.rb +198 -0
data/lib/parse/query/constraints.rb +3279 -0
data/lib/parse/query/cursor.rb +434 -0
data/lib/parse/query/n_plus_one_detector.rb +445 -0
data/lib/parse/query/operation.rb +104 -0
data/lib/parse/query/ordering.rb +66 -0
data/lib/parse/query.rb +7028 -0
data/lib/parse/schema/index_migrator.rb +291 -0
data/lib/parse/schema/search_index_migrator.rb +289 -0
data/lib/parse/schema.rb +494 -0
data/lib/parse/stack/generators/rails.rb +40 -0
data/lib/parse/stack/generators/templates/model.erb +51 -0
data/lib/parse/stack/generators/templates/model_installation.rb +4 -0
data/lib/parse/stack/generators/templates/model_role.rb +4 -0
data/lib/parse/stack/generators/templates/model_session.rb +4 -0
data/lib/parse/stack/generators/templates/model_user.rb +11 -0
data/lib/parse/stack/generators/templates/parse.rb +12 -0
data/lib/parse/stack/generators/templates/webhooks.rb +10 -0
data/lib/parse/stack/railtie.rb +18 -0
data/lib/parse/stack/tasks.rb +563 -0
data/lib/parse/stack/version.rb +11 -0
data/lib/parse/stack.rb +455 -0
data/lib/parse/two_factor_auth/user_extension.rb +449 -0
data/lib/parse/two_factor_auth.rb +310 -0
data/lib/parse/webhooks/payload.rb +360 -0
data/lib/parse/webhooks/registration.rb +199 -0
data/lib/parse/webhooks/replay_protection.rb +189 -0
data/lib/parse/webhooks.rb +510 -0
data/lib/parse-stack-next.rb +5 -0
data/lib/parse-stack.rb +5 -0
data/parse-stack-next.gemspec +82 -0
data/parse-stack.png +0 -0
data/scripts/debug-ips.js +35 -0
data/scripts/docker/Dockerfile.parse +13 -0
data/scripts/docker/atlas-init.js +284 -0
data/scripts/docker/docker-compose.atlas.yml +76 -0
data/scripts/docker/docker-compose.test.yml +106 -0
data/scripts/docker/mongo-init.js +21 -0
data/scripts/eval_mcp_with_lm_studio.rb +274 -0
data/scripts/start-parse.sh +90 -0
data/scripts/start_mcp_server.rb +78 -0
data/scripts/test_server_connection.rb +82 -0
metadata +377 -0

data/lib/parse/agent/mcp_server.rb ADDED Viewed

@@ -0,0 +1,376 @@
+# encoding: UTF-8
+# frozen_string_literal: true
+require "webrick"
+require "json"
+require "stringio"
+require "active_support/core_ext/object/blank"
+require "active_support/security_utils"
+require_relative "prompts"
+require_relative "mcp_dispatcher"
+require_relative "mcp_rack_app"
+module Parse
+  class Agent
+    # MCP (Model Context Protocol) HTTP Server for Parse Stack.
+    # Enables external AI agents (Claude, LM Studio, etc.) to interact with
+    # Parse data over HTTP using the MCP protocol specification.
+    #
+    # Since the Rack refactor this class is a thin WEBrick wrapper around
+    # {Parse::Agent::MCPRackApp}. Embedded deployments (Sinatra, Rails) should
+    # mount MCPRackApp directly with their own agent factory; this class
+    # remains for standalone server deployments and back-compat.
+    #
+    # @example Start the server
+    #   Parse::Agent.enable_mcp!
+    #   Parse::Agent::MCPServer.run(port: 3001)
+    #
+    # @example With custom configuration
+    #   server = Parse::Agent::MCPServer.new(
+    #     port: 3001,
+    #     permissions: :readonly,
+    #     session_token: nil
+    #   )
+    #   server.start
+    #
+    # @see https://modelcontextprotocol.io/ MCP Protocol Specification
+    # @see Parse::Agent::MCPRackApp for embedded mounting
+    #
+    class MCPServer
+      # MCP Protocol version
+      PROTOCOL_VERSION = MCPDispatcher::PROTOCOL_VERSION
+      # Server capabilities
+      CAPABILITIES = MCPDispatcher::CAPABILITIES
+      # Default port for the MCP server
+      @default_port = 3001
+      # Maximum allowed request body size (1 MB) — kept as a back-compat constant.
+      MAX_BODY_SIZE = MCPRackApp::DEFAULT_MAX_BODY_SIZE
+      # Maximum JSON nesting depth — kept as a back-compat constant.
+      MAX_JSON_NESTING = MCPRackApp::MAX_JSON_NESTING
+      # HTTP header for MCP API key authentication
+      MCP_API_KEY_HEADER = "X-MCP-API-Key"
+      class << self
+        attr_accessor :default_port
+        # Start the MCP server (blocking)
+        #
+        # @param port [Integer] port to listen on
+        # @param permissions [Symbol] agent permission level
+        # @param session_token [String, nil] optional session token
+        # @param host [String] host to bind to
+        # @param rate_limiter [#check!, nil] optional external rate limiter
+        def run(port: nil, permissions: :readonly, session_token: nil, host: "127.0.0.1", api_key: nil, rate_limiter: nil)
+          unless Parse::Agent.mcp_enabled?
+            raise "MCP server not enabled. Call Parse::Agent.enable_mcp! first"
+          end
+          server = new(
+            port: port || @default_port,
+            permissions: permissions,
+            session_token: session_token,
+            host: host,
+            api_key: api_key,
+            rate_limiter: rate_limiter,
+          )
+          server.start
+        end
+      end
+      # @return [Integer] the port number
+      attr_reader :port
+      # @return [String] the host to bind to
+      attr_reader :host
+      # @return [Parse::Agent] the template agent used by the /tools listing
+      #   endpoint and as a settings source for per-request agents. Hot tools
+      #   in MCP requests run against fresh per-request instances; do NOT
+      #   share this object across threads for mutable state inspection.
+      attr_reader :agent
+      # Create a new MCP server instance
+      #
+      # @param port [Integer] port to listen on
+      # @param host [String] host to bind to
+      # @param permissions [Symbol] agent permission level
+      # @param session_token [String, nil] optional session token
+      # @param rate_limiter [#check!, nil] optional external rate limiter (e.g.
+      #   Redis-backed). When provided, replaces the default in-process
+      #   {Parse::Agent::RateLimiter}. Must respond to `#check!` and raise
+      #   {Parse::Agent::RateLimitExceeded} when the budget is exhausted.
+      # @raise [ArgumentError] if rate_limiter is provided but does not respond to :check!
+      # Loopback hosts that are safe to bind to without an API key.
+      LOOPBACK_HOSTS = %w[127.0.0.1 ::1 localhost].freeze
+      def initialize(port: 3001, host: "127.0.0.1", permissions: :readonly,
+                     session_token: nil, api_key: nil, rate_limiter: nil,
+                     pre_auth_rate_limiter: nil,
+                     allowed_origins: nil, require_custom_header: nil)
+        if rate_limiter && !rate_limiter.respond_to?(:check!)
+          raise ArgumentError, "rate_limiter must respond to #check!"
+        end
+        if pre_auth_rate_limiter && !pre_auth_rate_limiter.respond_to?(:check!)
+          raise ArgumentError, "pre_auth_rate_limiter must respond to #check!"
+        end
+        effective_api_key = api_key || ENV["MCP_API_KEY"]
+        # NEW-MCP-1: a non-loopback bind without an API key is an unauthenticated
+        # network-exposed JSON-RPC endpoint. Refuse to start. Operators who
+        # genuinely want this — e.g., behind a reverse proxy that handles
+        # auth — should bind to localhost and let the proxy forward, or
+        # set MCP_API_KEY explicitly even when "the proxy authenticates"
+        # (defense in depth).
+        if !LOOPBACK_HOSTS.include?(host.to_s) && effective_api_key.to_s.empty?
+          raise ArgumentError,
+                "MCPServer refuses to bind non-loopback host #{host.inspect} without an api_key. " \
+                "Set MCP_API_KEY in the environment, pass api_key: explicitly, or use a loopback " \
+                "host (one of: #{LOOPBACK_HOSTS.join(', ')})."
+        end
+        @port = port
+        @host = host
+        @api_key = effective_api_key
+        @permissions = permissions
+        @session_token = session_token
+        # Shared limiter across requests so per-request agents (built in
+        # agent_factory) don't reset their window on every call. The
+        # rate-limit budget is a server-level resource, not a per-Agent one.
+        @shared_rate_limiter = rate_limiter || RateLimiter.new
+        # Template agent for the /tools listing endpoint and for inspection
+        # via #agent. NOT used for live request dispatch — see agent_factory.
+        @agent = Parse::Agent.new(
+          permissions: @permissions,
+          session_token: @session_token,
+          rate_limiter: @shared_rate_limiter,
+        )
+        @server = nil
+        # The Rack app does the heavy lifting. Its agent_factory enforces the
+        # API key and constructs a FRESH Parse::Agent per request so the
+        # per-instance state (@conversation_history, @operation_log, token
+        # counters) cannot leak between requests.
+        # pre_auth_rate_limiter: closes NEW-MCP-6 — runs before the factory
+        # is invoked so an empty or malformed body can't amplify into a
+        # Parse Server round-trip.
+        @rack_app = MCPRackApp.new(
+          agent_factory: method(:agent_factory),
+          pre_auth_rate_limiter: pre_auth_rate_limiter,
+          allowed_origins: allowed_origins,
+          require_custom_header: require_custom_header,
+        )
+      end
+      # Start the HTTP server (blocking)
+      def start
+        @server = WEBrick::HTTPServer.new(
+          Port: @port,
+          BindAddress: @host,
+          Logger: WEBrick::Log.new($stdout, WEBrick::Log::INFO),
+          AccessLog: [[::File.open(::File::NULL, "w"), ""]], # Suppress access log
+        )
+        setup_routes
+        trap("INT") { stop }
+        trap("TERM") { stop }
+        puts "Parse MCP Server starting on http://#{@host}:#{@port}"
+        puts "Permissions: #{@agent.permissions}"
+        puts "Tools available: #{@agent.allowed_tools.join(", ")}"
+        @server.start
+      end
+      # Stop the server
+      def stop
+        @server&.shutdown
+      end
+      private
+      def setup_routes
+        # MCP endpoint — translated WEBrick request → Rack env → MCPRackApp.
+        @server.mount_proc("/mcp") { |req, res| handle_mcp_request(req, res) }
+        # Health check endpoint (unauthenticated - standard for monitoring)
+        @server.mount_proc("/health") do |_req, res|
+          json_response(res, { status: "ok", mcp_enabled: true })
+        end
+        # Tool list endpoint (requires auth if API key is configured)
+        @server.mount_proc("/tools") do |req, res|
+          if @api_key.present?
+            provided_key = req[MCP_API_KEY_HEADER].to_s
+            unless ActiveSupport::SecurityUtils.secure_compare(@api_key, provided_key)
+              error_response(res, 401, "Unauthorized: invalid or missing API key")
+              next
+            end
+          end
+          json_response(res, @agent.tool_definitions(format: :mcp))
+        end
+      end
+      # Translate a WEBrick request into a minimal Rack env and dispatch to the
+      # MCPRackApp. The agent_factory bound at construction handles API-key
+      # auth and returns the shared @agent for valid requests.
+      #
+      # WEBrick HTTPRequest#body reads lazily from the socket. We must reject
+      # oversized bodies BEFORE calling req.body. Two attack shapes:
+      #   (a) Content-Length > MAX_BODY_SIZE — caught by the explicit check.
+      #   (b) Transfer-Encoding: chunked with no Content-Length — WEBrick's
+      #       read_chunked has no size cap and will dechunk indefinitely.
+      # We refuse (b) entirely: chunked or missing-Content-Length requests
+      # return 411 "Length Required" before req.body is ever called.
+      def handle_mcp_request(req, res)
+        # NEW-MCP-5: WEBrick's mount_proc("/mcp") is prefix-matching, so
+        # `/mcp/anything/at/all` reaches this handler and forwards the
+        # extra path segments into the Rack app via PATH_INFO. Reverse
+        # proxies that enforce ACLs against `^/mcp$` (or that route
+        # `/mcp/admin` to a different upstream) will be defeated by the
+        # prefix match unless we explicitly reject sub-paths here. A
+        # trailing slash is accepted — `/mcp/` is the same endpoint —
+        # but anything beyond is 404.
+        normalized = req.path.to_s.chomp("/")
+        unless normalized == "/mcp"
+          res.status = 404
+          res.content_type = "application/json"
+          res.body = JSON.generate({
+            "jsonrpc" => "2.0",
+            "id" => nil,
+            "error" => { "code" => -32_601, "message" => "Not Found" },
+          })
+          return
+        end
+        # Method gate FIRST. Returning 411 for a GET because it lacks a
+        # Content-Length is semantically wrong (the method itself is not
+        # allowed; body requirements never apply) and surprises Rack
+        # middleware that expects 405 for method-mismatch.
+        unless req.request_method == "POST"
+          res.status = 405
+          res["Allow"] = "POST"
+          res.content_type = "application/json"
+          res.body = JSON.generate({
+            "jsonrpc" => "2.0",
+            "id" => nil,
+            "error" => { "code" => -32_600, "message" => "Method Not Allowed: only POST is accepted" },
+          })
+          return
+        end
+        transfer_encoding = req["Transfer-Encoding"].to_s.downcase
+        content_length_header = req["Content-Length"]
+        if transfer_encoding.include?("chunked") || content_length_header.nil?
+          res.status = 411
+          res.content_type = "application/json"
+          res.body = JSON.generate({
+            "jsonrpc" => "2.0",
+            "id" => nil,
+            "error" => { "code" => -32_700, "message" => "Length Required: Content-Length header is required and Transfer-Encoding: chunked is not accepted" },
+          })
+          return
+        end
+        content_length = content_length_header.to_i
+        if content_length > MCPRackApp::DEFAULT_MAX_BODY_SIZE
+          res.status = 413
+          res.content_type = "application/json"
+          res.body = JSON.generate({
+            "jsonrpc" => "2.0",
+            "id" => nil,
+            "error" => { "code" => -32_700, "message" => "Payload Too Large: body exceeds #{MCPRackApp::DEFAULT_MAX_BODY_SIZE} bytes" },
+          })
+          return
+        end
+        env = build_rack_env(req)
+        status, headers, body_chunks = @rack_app.call(env)
+        res.status = status
+        rack_ct = headers["Content-Type"] || headers["content-type"]
+        headers.each { |k, v| res[k] = v unless k.casecmp("Content-Type").zero? }
+        res.content_type = rack_ct if rack_ct
+        res.body = body_chunks.join
+      end
+      # Agent factory passed to MCPRackApp. Enforces the API-key check (raising
+      # Parse::Agent::Unauthorized so the Rack app renders a sanitized 401)
+      # and then constructs a FRESH Parse::Agent per request, sharing only
+      # the @shared_rate_limiter so the budget persists across calls.
+      #
+      # The per-instance @conversation_history, @operation_log, and token
+      # counters on each returned agent are scoped to that single request
+      # and discarded when it ends, eliminating cross-request leakage.
+      def agent_factory(env)
+        if @api_key.present?
+          provided_key = env["HTTP_X_MCP_API_KEY"].to_s
+          unless ActiveSupport::SecurityUtils.secure_compare(@api_key, provided_key)
+            raise Parse::Agent::Unauthorized.new("invalid or missing API key", reason: :bad_api_key)
+          end
+        end
+        Parse::Agent.new(
+          permissions: @permissions,
+          session_token: @session_token,
+          rate_limiter: @shared_rate_limiter,
+        )
+      end
+      # Build a minimal Rack env from a WEBrick request. We populate the
+      # fields MCPRackApp reads (REQUEST_METHOD, CONTENT_TYPE, rack.input,
+      # HTTP_X_MCP_API_KEY) plus a few Rack-required keys so middleware that
+      # might wrap us still sees a plausible env. Per the Rack SPEC, the
+      # special Content-Type and Content-Length headers are top-level keys
+      # (no HTTP_ prefix), so the header-enumeration loop excludes them.
+      RACK_TOP_LEVEL_HEADERS = %w[Content-Type Content-Length].freeze
+      def build_rack_env(req)
+        env = {
+          "REQUEST_METHOD" => req.request_method,
+          "CONTENT_TYPE" => req["Content-Type"].to_s,
+          "CONTENT_LENGTH" => req["Content-Length"].to_s,
+          "rack.input" => StringIO.new(req.body || ""),
+          "rack.errors" => $stderr,
+          "rack.url_scheme" => "http",
+          "SERVER_NAME" => @host,
+          "SERVER_PORT" => @port.to_s,
+          "PATH_INFO" => req.path,
+          "QUERY_STRING" => req.query_string.to_s,
+        }
+        req.each do |name|
+          next if RACK_TOP_LEVEL_HEADERS.any? { |h| name.casecmp(h).zero? }
+          # NEW-MCP-2: refuse header names that already contain underscores.
+          # `X-MCP-API-Key` and `X_MCP_API_KEY` both collapse to the same
+          # Rack env key (`HTTP_X_MCP_API_KEY`); a reverse proxy that
+          # injects the trusted dash-form can be undermined by an attacker
+          # also sending the underscore-form. Drop the underscore variant
+          # at the transport layer.
+          next if name.include?("_")
+          header_key = "HTTP_#{name.upcase.tr("-", "_")}"
+          env[header_key] = req[name].to_s
+        end
+        env
+      end
+      def json_response(res, data)
+        res.content_type = "application/json"
+        res.body = JSON.generate(data)
+      end
+      def error_response(res, status, message)
+        res.status = status
+        json_response(res, { error: message })
+      end
+    end
+  end
+end

data/lib/parse/agent/metadata_audit.rb ADDED Viewed

@@ -0,0 +1,259 @@
+# encoding: UTF-8
+# frozen_string_literal: true
+module Parse
+  class Agent
+    # Boot-time / on-demand audit of agent metadata declarations across
+    # the application's Parse::Object subclasses. Surfaces the gaps that
+    # silently degrade an LLM's experience of the schema: classes with no
+    # `agent_description`, properties on the allowlist with no
+    # `_description:`, and `agent_fields` entries that don't resolve to
+    # known wire columns.
+    #
+    # Returns structured data so callers can wire it into a boot warning,
+    # a CI gate, or a Rake task. `print_summary` is a convenience for
+    # interactive use (rails console, scripts).
+    #
+    # @example Programmatic use
+    #   audit = Parse::Agent.audit_metadata
+    #   if audit[:missing_class_descriptions].any?
+    #     warn "Classes without descriptions: #{audit[:missing_class_descriptions]}"
+    #   end
+    #
+    # @example Interactive use
+    #   Parse::Agent::MetadataAudit.print_summary
+    module MetadataAudit
+      extend self
+      # System/system-adjacent fields that are always present on every
+      # Parse class and don't benefit from `_description:`. Excluded from
+      # the missing-field-descriptions report.
+      ALWAYS_PRESENT_FIELDS = %i[
+        object_id objectId
+        created_at createdAt
+        updated_at updatedAt
+        acl ACL
+      ].freeze
+      # Run the audit and return structured findings.
+      #
+      # @return [Hash]
+      #   * :classes_audited [Integer] — number of classes inspected
+      #   * :visible_classes_declared [Boolean] — whether the app uses
+      #     opt-in `agent_visible` mode
+      #   * :missing_class_descriptions [Array<String>] — Parse class names
+      #     with no `agent_description`
+      #   * :missing_field_descriptions [Hash<String, Array<Symbol>>] —
+      #     class name -> property symbols missing `_description:`. When
+      #     a class declares `agent_fields`, only allowlisted properties
+      #     are counted; otherwise all declared properties.
+      #   * :unresolvable_allowlist_entries [Hash<String, Array<Symbol>>] —
+      #     `agent_fields` entries that don't appear in the class's
+      #     `field_map` (likely typos that 4.2.1's wire-name translation
+      #     will silently miss).
+      #   * :canonical_filter_summary [Hash<String, Hash>] — per-class
+      #     declared canonical filters, surfaced so the auditor can see
+      #     which classes apply silent row-level predicates by default.
+      def audit
+        classes = audit_target_classes
+        result = {
+          classes_audited: classes.size,
+          visible_classes_declared: Parse::Agent::MetadataRegistry.has_visible_classes?,
+          missing_class_descriptions: [],
+          missing_field_descriptions: {},
+          unresolvable_allowlist_entries: {},
+          canonical_filter_summary: {},
+        }
+        classes.each do |klass|
+          name = parse_class_name_for(klass)
+          next if name.nil?
+          # Skip classes flagged agent_hidden — they're intentionally
+          # opaque to the agent surface, and we shouldn't pretend the
+          # missing description on them is a gap.
+          next if klass.respond_to?(:agent_hidden?) && klass.agent_hidden?
+          # Skip Parse system classes (`_`-prefixed parse_class names:
+          # `_User`, `_Role`, `_Session`, `_Installation`, `_Product`,
+          # `_Audience`). These are framework-supplied by parse-stack and
+          # don't benefit from userland-authored agent_description — the
+          # SDK is responsible for documenting them, not the application.
+          # Without this skip, every app that doesn't opt into
+          # `agent_visible` mode sees the system classes flooding
+          # `missing_class_descriptions`, which discourages adoption of
+          # the audit tool. Apps that DO want to document their system
+          # classes can still call `agent_description` on `Parse::User`
+          # etc. — the skip only suppresses the "missing" reports, not
+          # the legitimate ones.
+          next if name.to_s.start_with?("_")
+          if klass.respond_to?(:agent_description) && klass.agent_description.nil?
+            result[:missing_class_descriptions] << name
+          end
+          missing_fields = missing_field_descriptions_for(klass)
+          result[:missing_field_descriptions][name] = missing_fields if missing_fields.any?
+          unresolvable = unresolvable_allowlist_entries_for(klass)
+          result[:unresolvable_allowlist_entries][name] = unresolvable if unresolvable.any?
+          if klass.respond_to?(:agent_canonical_filter_for_apply) &&
+             (cf = klass.agent_canonical_filter_for_apply) &&
+             cf.any?
+            result[:canonical_filter_summary][name] = cf.dup
+          end
+        end
+        result[:missing_class_descriptions].sort!
+        result
+      end
+      # Print a human-readable summary to the given IO (defaults to $stdout).
+      # The structured data from {#audit} is the source of truth; this is a
+      # convenience for interactive sessions.
+      #
+      # @param io [IO] destination (default $stdout)
+      # @return [Hash] the audit findings (same shape as {#audit})
+      def print_summary(io: $stdout)
+        data = audit
+        io.puts "Parse::Agent metadata audit"
+        io.puts "=" * 40
+        io.puts "Classes audited: #{data[:classes_audited]} " \
+                "(#{data[:visible_classes_declared] ? "agent_visible mode" : "all-subclasses fallback"})"
+        io.puts
+        missing_classes = data[:missing_class_descriptions]
+        io.puts "Missing class descriptions (#{missing_classes.size}):"
+        if missing_classes.empty?
+          io.puts "  (none)"
+        else
+          missing_classes.each { |n| io.puts "  - #{n}" }
+        end
+        io.puts
+        missing_fields = data[:missing_field_descriptions]
+        total_missing_fields = missing_fields.values.sum(&:size)
+        io.puts "Missing field descriptions (#{total_missing_fields} across #{missing_fields.size} classes):"
+        if missing_fields.empty?
+          io.puts "  (none)"
+        else
+          missing_fields.sort.each do |class_name, fields|
+            io.puts "  #{class_name} (#{fields.size}):"
+            io.puts "    #{fields.map(&:to_s).join(", ")}"
+          end
+        end
+        io.puts
+        unresolvable = data[:unresolvable_allowlist_entries]
+        io.puts "Unresolvable allowlist entries:"
+        if unresolvable.empty?
+          io.puts "  (none)"
+        else
+          unresolvable.sort.each do |class_name, entries|
+            io.puts "  #{class_name}: #{entries.map(&:to_s).join(", ")}"
+          end
+        end
+        io.puts
+        filters = data[:canonical_filter_summary]
+        io.puts "Canonical filters declared (#{filters.size}):"
+        if filters.empty?
+          io.puts "  (none)"
+        else
+          filters.sort.each do |class_name, filter|
+            io.puts "  #{class_name}: #{filter.inspect}"
+          end
+        end
+        data
+      end
+      # ----------------------------------------------------------------
+      # Internals
+      # ----------------------------------------------------------------
+      # Resolve the set of classes to audit.
+      #
+      # When the application has opted into `agent_visible` mode, that
+      # registry IS the canonical list — the developer has explicitly said
+      # "these are the agent-facing classes." Otherwise fall back to every
+      # Parse::Object subclass currently loaded (back-compat mode).
+      #
+      # @return [Array<Class>]
+      def audit_target_classes
+        if Parse::Agent::MetadataRegistry.has_visible_classes?
+          Parse::Agent::MetadataRegistry.visible_classes
+        else
+          # `Parse::Object.descendants` is the same iteration path used by
+          # `Parse::Model.find_class` to resolve a Parse class name to a
+          # Ruby class. Walks every loaded subclass without going through
+          # the find_class cache (which raises NameError on miss and would
+          # corrupt the audit's "what's declared" view).
+          Parse::Object.descendants.select do |klass|
+            klass.respond_to?(:parse_class) && klass.parse_class
+          end
+        end
+      end
+      # The Parse-side class name for a Ruby class, or nil when the class
+      # isn't a normal Parse::Object subclass (defensive — every entry in
+      # audit_target_classes should pass this).
+      def parse_class_name_for(klass)
+        return nil unless klass.respond_to?(:parse_class)
+        klass.parse_class
+      end
+      # Build the list of property symbols on a class that have no
+      # `_description:` declaration. When `agent_fields` is declared, the
+      # check is scoped to the allowlist (those are the agent-visible
+      # fields and the ones the LLM will see); otherwise it covers every
+      # declared property on the class.
+      #
+      # Excludes ALWAYS_PRESENT_FIELDS (the four system columns) since
+      # those don't benefit from per-property descriptions.
+      def missing_field_descriptions_for(klass)
+        return [] unless klass.respond_to?(:property_descriptions)
+        return [] unless klass.respond_to?(:field_map)
+        described = klass.property_descriptions.keys.map(&:to_sym).to_set
+        declared_properties = klass.field_map.keys.map(&:to_sym)
+        candidates =
+          if klass.respond_to?(:agent_field_allowlist) && klass.agent_field_allowlist.any?
+            klass.agent_field_allowlist.map(&:to_sym)
+          else
+            declared_properties
+          end
+        candidates - described.to_a - ALWAYS_PRESENT_FIELDS
+      end
+      # `agent_fields` entries that don't resolve to a known property on
+      # the class. These would silently miss after the 4.2.1 wire-name
+      # translation — the symbol would columnize to a column the schema
+      # doesn't carry, and the filter would strip nothing.
+      def unresolvable_allowlist_entries_for(klass)
+        return [] unless klass.respond_to?(:agent_field_allowlist)
+        allowlist = klass.agent_field_allowlist
+        return [] if allowlist.empty?
+        return [] unless klass.respond_to?(:field_map)
+        known = klass.field_map.keys.map(&:to_sym).to_set
+        allowlist.map(&:to_sym).reject { |sym| known.include?(sym) }
+      end
+    end
+    class << self
+      # Convenience class-method form of {Parse::Agent::MetadataAudit#audit}.
+      # See {MetadataAudit} for the full contract.
+      #
+      # @return [Hash] structured audit findings
+      def audit_metadata
+        Parse::Agent::MetadataAudit.audit
+      end
+    end
+  end
+end