PyPI - openhack - Versions diffs - 0.1.0__py3-none-any.whl - Mend

openhack 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113) hide show

openhack/__init__.py +2 -0
openhack/__main__.py +225 -0
openhack/agents/__init__.py +30 -0
openhack/agents/base.py +230 -0
openhack/agents/browser_verifier.py +679 -0
openhack/agents/browser_verifier_swarm.py +256 -0
openhack/agents/checkpoint.py +89 -0
openhack/agents/context_manager.py +356 -0
openhack/agents/coordinator.py +1105 -0
openhack/agents/endpoint_analyst.py +307 -0
openhack/agents/feature_hunter.py +93 -0
openhack/agents/hunter.py +481 -0
openhack/agents/hunter_swarm.py +385 -0
openhack/agents/llm.py +334 -0
openhack/agents/recon.py +19 -0
openhack/agents/sandbox_verifier.py +396 -0
openhack/agents/sandbox_verifier_swarm.py +250 -0
openhack/agents/session.py +286 -0
openhack/agents/validator.py +217 -0
openhack/agents/validator_swarm.py +106 -0
openhack/auth.py +175 -0
openhack/browser/__init__.py +12 -0
openhack/browser/runner.py +385 -0
openhack/categories.py +130 -0
openhack/config.py +201 -0
openhack/deterministic_recon.py +464 -0
openhack/entry_points.py +745 -0
openhack/framework_classifier.py +515 -0
openhack/framework_detection.py +269 -0
openhack/headless_scan.py +179 -0
openhack/prompts/__init__.py +108 -0
openhack/prompts/browser_verifier.py +171 -0
openhack/prompts/coordinator.py +31 -0
openhack/prompts/django/__init__.py +32 -0
openhack/prompts/django/auth_bypass.py +76 -0
openhack/prompts/django/csrf.py +62 -0
openhack/prompts/django/data_exposure.py +67 -0
openhack/prompts/django/idor.py +74 -0
openhack/prompts/django/injection.py +67 -0
openhack/prompts/django/misconfiguration.py +70 -0
openhack/prompts/django/ssrf.py +64 -0
openhack/prompts/endpoint_analyst.py +122 -0
openhack/prompts/express/__init__.py +29 -0
openhack/prompts/express/auth_bypass.py +71 -0
openhack/prompts/express/data_exposure.py +77 -0
openhack/prompts/express/idor.py +69 -0
openhack/prompts/express/injection.py +75 -0
openhack/prompts/express/misconfiguration.py +72 -0
openhack/prompts/express/ssrf.py +63 -0
openhack/prompts/feature_hunter.py +140 -0
openhack/prompts/flask/__init__.py +29 -0
openhack/prompts/flask/auth_bypass.py +86 -0
openhack/prompts/flask/data_exposure.py +78 -0
openhack/prompts/flask/idor.py +83 -0
openhack/prompts/flask/injection.py +77 -0
openhack/prompts/flask/misconfiguration.py +73 -0
openhack/prompts/flask/ssrf.py +65 -0
openhack/prompts/hunter.py +362 -0
openhack/prompts/hunter_continuation_loop.py +12 -0
openhack/prompts/hunter_continuation_no_findings.py +19 -0
openhack/prompts/hunter_continuation_no_progress.py +22 -0
openhack/prompts/hunter_tool_instructions.py +55 -0
openhack/prompts/nextjs/__init__.py +42 -0
openhack/prompts/nextjs/auth_bypass.py +80 -0
openhack/prompts/nextjs/csrf.py +71 -0
openhack/prompts/nextjs/data_exposure.py +88 -0
openhack/prompts/nextjs/idor.py +64 -0
openhack/prompts/nextjs/injection.py +65 -0
openhack/prompts/nextjs/middleware_bypass.py +75 -0
openhack/prompts/nextjs/misconfiguration.py +92 -0
openhack/prompts/nextjs/server_actions.py +97 -0
openhack/prompts/nextjs/ssrf.py +66 -0
openhack/prompts/nextjs/xss.py +69 -0
openhack/prompts/pr_analysis_system.py +80 -0
openhack/prompts/pr_analysis_user.py +11 -0
openhack/prompts/project_context.py +89 -0
openhack/prompts/recon.py +199 -0
openhack/prompts/reporter.py +88 -0
openhack/prompts/researchers.py +434 -0
openhack/prompts/sandbox_verifier.py +128 -0
openhack/prompts/supabase/__init__.py +39 -0
openhack/prompts/supabase/auth_tokens.py +131 -0
openhack/prompts/supabase/edge_functions.py +150 -0
openhack/prompts/supabase/graphql.py +102 -0
openhack/prompts/supabase/postgrest.py +99 -0
openhack/prompts/supabase/realtime.py +93 -0
openhack/prompts/supabase/rls.py +110 -0
openhack/prompts/supabase/rpc_functions.py +127 -0
openhack/prompts/supabase/storage.py +110 -0
openhack/prompts/supabase/tenant_isolation.py +118 -0
openhack/prompts/validator.py +319 -0
openhack/prompts/validator_continuation_incomplete.py +12 -0
openhack/prompts/validator_tool_instructions.py +29 -0
openhack/quality.py +231 -0
openhack/sandbox/__init__.py +12 -0
openhack/sandbox/orchestrator.py +517 -0
openhack/sandbox/runner.py +177 -0
openhack/scan_session.py +245 -0
openhack/setup.py +452 -0
openhack/static_validator.py +612 -0
openhack/tools/__init__.py +1 -0
openhack/tools/ast_tools.py +307 -0
openhack/tools/coverage.py +1078 -0
openhack/tools/filesystem.py +404 -0
openhack/tools/nextjs.py +258 -0
openhack/tools/registry.py +52 -0
openhack/tui.py +3450 -0
openhack/updates.py +170 -0
openhack-0.1.0.dist-info/METADATA +189 -0
openhack-0.1.0.dist-info/RECORD +113 -0
openhack-0.1.0.dist-info/WHEEL +4 -0
openhack-0.1.0.dist-info/entry_points.txt +2 -0
openhack-0.1.0.dist-info/licenses/LICENSE +661 -0

openhack/prompts/supabase/rpc_functions.py ADDED Viewed

@@ -0,0 +1,127 @@
+"""
+Supabase RPC function security detection prompt: Markdown guidance on SECURITY DEFINER, search_path, and anon-callable functions.
+"""
+SUPABASE_RPC_PROMPT = """## RPC Function Security in Supabase
+### Pre-Computed Recon Available
+The `supabase_recon` context already contains:
+- `supabase_recon.rpc_functions` -- all SQL functions found in migrations with their security mode (DEFINER/INVOKER), parameters, and whether they reference `auth.uid()`
+- `supabase_recon.rpc_access` -- runtime test showing which RPC functions are callable by anon (with status codes)
+- `supabase_recon.schema.functions` -- functions exposed via PostgREST OpenAPI spec
+**Critical cross-reference: a function with `security_mode: "DEFINER"` + `has_auth_uid_check: False` + `callable: True` in `rpc_access` is likely a privilege escalation vector.**
+### What to Look For
+1. **SECURITY DEFINER without ownership checks**
+   - `SECURITY DEFINER` functions execute with the privileges of the function owner (usually `postgres`), bypassing RLS entirely
+   - If the function doesn't internally verify `auth.uid()`, any caller (including anon) can access/modify any data
+   - This is the most common and dangerous Supabase misconfiguration
+2. **Unsafe search_path**
+   - Functions with `search_path` set to `public` or not set at all
+   - Malicious users could create objects in the public schema that the function resolves instead of intended objects
+3. **Client-supplied IDs trusted over JWT**
+   - Function parameters like `p_user_id` used directly in queries instead of `auth.uid()`
+   - Caller can pass any user ID to access other users' data
+4. **Anon-callable sensitive functions**
+   - Functions that should require authentication but are callable by the anon role
+   - Check `supabase_recon.rpc_access` for functions with `callable: True`
+### Vulnerable Patterns
+```sql
+-- VULNERABLE: SECURITY DEFINER with no auth check
+CREATE OR REPLACE FUNCTION get_user_stats(p_user_id uuid)
+RETURNS json
+LANGUAGE plpgsql
+SECURITY DEFINER
+AS $$
+BEGIN
+  -- Trusts client-supplied user_id, bypasses RLS
+  RETURN (SELECT row_to_json(u) FROM users u WHERE u.id = p_user_id);
+END;
+$$;
+```
+```sql
+-- VULNERABLE: Unsafe search_path
+CREATE OR REPLACE FUNCTION admin_action()
+RETURNS void
+LANGUAGE plpgsql
+SECURITY DEFINER
+SET search_path = public  -- Attacker can shadow objects in public schema
+AS $$
+BEGIN
+  -- ...
+END;
+$$;
+```
+```sql
+-- VULNERABLE: No ownership check, any user can call
+CREATE OR REPLACE FUNCTION delete_account(p_user_id uuid)
+RETURNS void
+LANGUAGE plpgsql
+SECURITY DEFINER
+AS $$
+BEGIN
+  DELETE FROM users WHERE id = p_user_id;  -- Any anon user can delete any account!
+END;
+$$;
+```
+### Safe Patterns
+```sql
+-- SAFE: SECURITY INVOKER respects caller's RLS
+CREATE OR REPLACE FUNCTION get_my_stats()
+RETURNS json
+LANGUAGE plpgsql
+SECURITY INVOKER
+AS $$
+BEGIN
+  RETURN (SELECT row_to_json(u) FROM users u WHERE u.id = auth.uid());
+END;
+$$;
+```
+```sql
+-- SAFE: DEFINER with explicit auth check and safe search_path
+CREATE OR REPLACE FUNCTION admin_get_user(p_user_id uuid)
+RETURNS json
+LANGUAGE plpgsql
+SECURITY DEFINER
+SET search_path = ''
+AS $$
+BEGIN
+  -- Verify caller is admin via server-controlled app metadata (user metadata is user-editable)
+  IF NOT EXISTS (SELECT 1 FROM auth.users WHERE id = auth.uid() AND raw_app_meta_data->>'role' = 'admin') THEN
+    RAISE EXCEPTION 'Unauthorized';
+  END IF;
+  RETURN (SELECT row_to_json(u) FROM public.users u WHERE u.id = p_user_id);
+END;
+$$;
+```
+### Search Patterns
+1. Check `supabase_recon.rpc_functions` for `security_mode: "DEFINER"` + `has_auth_uid_check: False`
+2. Cross-reference with `supabase_recon.rpc_access` for `callable: True`
+3. `grep` migrations for `SECURITY DEFINER` to find all definer functions
+4. `grep` for `search_path` settings in function definitions
+5. Read function bodies to check for `auth.uid()` usage
+6. For targeted probing: use `supabase_call_rpc` with foreign user IDs to test horizontal access
+### Severity Assessment
+- **Critical**: SECURITY DEFINER function callable by anon with no auth check, accessing sensitive data
+- **High**: SECURITY DEFINER function callable by authenticated users but trusting client-supplied user_id
+- **High**: Function with unsafe search_path allowing object shadowing
+- **Medium**: Function missing tenant isolation checks
+- **Low**: SECURITY INVOKER function with minor input validation gaps
+"""

openhack/prompts/supabase/storage.py ADDED Viewed

@@ -0,0 +1,110 @@
+"""
+Supabase Storage security detection prompt: Markdown guidance on bucket exposure, storage policies, signed URLs, and uploads.
+"""
+SUPABASE_STORAGE_PROMPT = """## Storage Security in Supabase
+### Pre-Computed Recon Available
+The `supabase_recon` context already contains:
+- `supabase_recon.storage_policies.buckets` -- all storage buckets found in migrations with public/private status
+- `supabase_recon.storage_policies.policies` -- RLS policies on `storage.objects`
+- `supabase_recon.storage_access` -- runtime test showing which buckets are listable by anon
+**Cross-reference: a bucket marked `public: True` in migrations + `listable: True` in `storage_access` that contains sensitive files is a finding.**
+### What to Look For
+1. **Public buckets with sensitive content**
+   - Buckets marked as public serve files without authentication
+   - If the bucket holds user uploads, documents, or exports, this is a data leak
+   - Check bucket names: `documents`, `exports`, `reports`, `private`, `internal` suggest sensitive content
+2. **Missing storage policies**
+   - `storage.objects` has RLS just like regular tables
+   - Without policies, default behavior depends on bucket public/private setting
+   - Private buckets without policies may still be accessible via signed URLs that never expire
+3. **Signed URL reuse across tenants/users**
+   - Signed URLs generated for one user may be valid for any user
+   - Check if URL generation includes user-specific scoping
+   - Look for `createSignedUrl` calls without tenant/user path prefixes
+4. **Content-type abuse**
+   - Uploading HTML or SVG files that are served as `text/html` or `image/svg+xml`
+   - These can contain JavaScript and enable XSS attacks
+   - Check for `Content-Type` validation on upload and `X-Content-Type-Options: nosniff` on download
+5. **Path confusion**
+   - Mixed case, URL-encoding, or `..` segments may bypass client-side validation
+   - Server and client may normalize paths differently
+   - Users might access files outside their intended directory
+6. **Bucket listing exposure**
+   - `storage.from('bucket').list()` without authentication exposes file inventory
+   - Even if individual files are protected, knowing the file names/paths is information disclosure
+### Vulnerable Patterns
+```sql
+-- VULNERABLE: Public bucket for sensitive documents
+INSERT INTO storage.buckets (id, name, public) VALUES ('documents', 'documents', true);
+-- No policies on storage.objects for this bucket
+```
+```typescript
+// VULNERABLE: Generating signed URLs without user scoping
+const { data } = await supabase.storage
+  .from('documents')
+  .createSignedUrl('reports/financial-report.pdf', 3600)
+// This URL works for anyone who has it, no user verification
+```
+```typescript
+// VULNERABLE: No content-type validation on upload
+const { error } = await supabase.storage
+  .from('avatars')
+  .upload(`${userId}/avatar`, file)
+// User could upload malicious.html as their "avatar"
+```
+### Safe Patterns
+```sql
+-- SAFE: Private bucket with user-scoped policies
+INSERT INTO storage.buckets (id, name, public) VALUES ('documents', 'documents', false);
+CREATE POLICY "users_access_own_documents" ON storage.objects
+  FOR ALL USING (bucket_id = 'documents' AND auth.uid()::text = (storage.foldername(name))[1]);
+```
+```typescript
+// SAFE: User-scoped upload path with content-type validation
+const allowedTypes = ['image/jpeg', 'image/png', 'image/webp']
+if (!allowedTypes.includes(file.type)) throw new Error('Invalid file type')
+const { error } = await supabase.storage
+  .from('avatars')
+  .upload(`${user.id}/avatar.${ext}`, file, {
+    contentType: file.type,
+    upsert: true,
+  })
+```
+### Search Patterns
+1. Check `supabase_recon.storage_policies.buckets` for `public: True` buckets
+2. Cross-reference with `supabase_recon.storage_access` for `listable: True` buckets
+3. `grep` migrations for `storage.buckets` and `storage.objects` to find all bucket/policy definitions
+4. `grep` app code for `createSignedUrl`, `getPublicUrl`, `.upload(` to find storage usage
+5. Check for content-type validation near upload calls
+6. For targeted probing: use `supabase_probe_storage` to list specific bucket paths
+### Severity Assessment
+- **Critical**: Public bucket containing PII, financial data, or credentials
+- **High**: Private bucket with missing storage policies allowing unauthorized access
+- **High**: Signed URLs reusable across users/tenants for sensitive files
+- **Medium**: Content-type abuse potential (HTML/SVG uploads served as text/html)
+- **Medium**: Bucket listing exposes file inventory
+- **Low**: Public bucket for intentionally public assets (logos, public images)
+"""

openhack/prompts/supabase/tenant_isolation.py ADDED Viewed

@@ -0,0 +1,118 @@
+"""
+Supabase tenant isolation security detection prompt: Markdown guidance on tenant-scoped queries and RLS policies.
+"""
+SUPABASE_TENANT_ISOLATION_PROMPT = """## Tenant Isolation in Supabase
+### Pre-Computed Recon Available
+The `supabase_recon` context already contains:
+- `supabase_recon.query_patterns` -- all `.from()` calls with `has_ownership_filter` and `has_tenant_filter` flags
+- `supabase_recon.rls_policies` -- RLS policies and whether they reference tenant columns
+- `supabase_recon.anon_access` -- which tables anon can access (cross-tenant probing surface)
+**Key insight: in multi-tenant Supabase apps, every query AND every RLS policy must be scoped by `tenant_id`/`org_id`/`team_id` derived from the JWT, NOT from client input.**
+### What to Look For
+1. **Queries not scoped by tenant**
+   - Application code querying tables without filtering by `org_id`/`tenant_id`
+   - Check `supabase_recon.query_patterns` for `has_tenant_filter: False`
+   - Even with RLS, application-level scoping is defense in depth
+2. **RLS policies trusting client-supplied tenant context**
+   - Policy uses `org_id` column value that the client can set on INSERT
+   - Correct: `USING (org_id = (auth.jwt() -> 'app_metadata' ->> 'org_id')::uuid)`
+   - Wrong: `USING (org_id = org_id)` (tautology, always true)
+3. **Tenant selector inconsistent with JWT**
+   - App determines tenant from subdomain, header, or path parameter
+   - But JWT encodes a different tenant claim
+   - User from tenant A can switch subdomain to tenant B and access their data
+4. **Export/report endpoints outside caller scope**
+   - Endpoints that generate CSV exports, PDF reports, or aggregations
+   - If the query doesn't filter by tenant from JWT, it may include cross-tenant data
+   - Check server-side code for export/report generation
+5. **Cross-tenant probing via filters**
+   - Using `or` filters: `?or=(org_id.eq.other_org,org_id.is.null)`
+   - Filtering by another org's ID: `?org_id=eq.foreign_org_id`
+   - If RLS doesn't enforce tenant isolation, these queries return cross-tenant data
+### Vulnerable Patterns
+```typescript
+// VULNERABLE: No tenant scoping on query
+const { data } = await supabase
+  .from('projects')
+  .select('*')
+  // Missing: .eq('org_id', user.org_id)
+  // Returns ALL projects across ALL tenants
+```
+```sql
+-- VULNERABLE: RLS policy without tenant constraint
+CREATE POLICY "users_access" ON projects
+  FOR SELECT USING (auth.uid() = created_by);
+-- Missing org_id check -- user can see projects from other orgs
+-- if they happen to be created_by (unlikely but possible in edge cases)
+```
+```typescript
+// VULNERABLE: Tenant from URL, not JWT
+export async function GET(req, { params }) {
+  const orgId = params.orgId  // From URL path, client-controlled!
+  const { data } = await supabase
+    .from('projects')
+    .select('*')
+    .eq('org_id', orgId)  // Client picks which org to access
+}
+```
+```sql
+-- VULNERABLE: Policy with tautological check
+CREATE POLICY "org_access" ON documents
+  FOR SELECT USING (org_id = org_id);  -- Always true!
+```
+### Safe Patterns
+```sql
+-- SAFE: RLS policy scoped to tenant from JWT
+CREATE POLICY "tenant_isolation" ON projects
+  FOR ALL USING (
+    org_id = (auth.jwt() -> 'app_metadata' ->> 'org_id')::uuid
+  );
+```
+```typescript
+// SAFE: Tenant derived from verified JWT, not client input
+const { data: { user } } = await supabase.auth.getUser()
+const orgId = user.app_metadata.org_id  // From verified JWT
+const { data } = await supabase
+  .from('projects')
+  .select('*')
+  .eq('org_id', orgId)
+```
+### Search Patterns
+1. Check `supabase_recon.query_patterns` for `has_tenant_filter: False` on multi-tenant tables
+2. `grep` for `org_id`, `tenant_id`, `team_id`, `workspace_id` in RLS policies
+3. `grep` app code for `.eq('org_id'` to see how tenant is derived (from JWT vs URL/header)
+4. Look for export/report endpoints (`/api/export`, `/api/report`, `csv`, `download`)
+5. Check RLS policies for tautological conditions
+6. For targeted probing: use `supabase_query_table` with `org_id=eq.foreign-org` to test isolation
+### Severity Assessment
+- **Critical**: Cross-tenant data access confirmed via runtime probing
+- **Critical**: Sensitive data (financial, PII) accessible across tenants
+- **High**: RLS policies missing tenant constraints in multi-tenant app
+- **High**: Tenant derived from client input (URL/header) instead of JWT
+- **Medium**: Export endpoints generating unscoped reports
+- **Medium**: Application queries missing tenant filters (defense in depth gap)
+- **Low**: Tenant isolation relies solely on RLS (no application-level check)
+"""

openhack/prompts/validator.py ADDED Viewed

@@ -0,0 +1,319 @@
+"""
+Validator agent prompt template.
+"""
+VALIDATOR_PROMPT = """You are the Validator agent for OpenHack Agent. Your job is to confirm whether potential vulnerabilities are ACTUALLY EXPLOITABLE -- not just theoretically possible.
+{project_context}
+## Thinking Style - CRITICAL
+You MUST think out loud before EVERY tool call. Validation requires careful reasoning.
+Before EACH action, explain:
+1. What am I trying to verify?
+2. What would confirm or disprove this vulnerability?
+3. What security controls might I have missed?
+Example thought process:
+"Finding #1 claims the 'secrets' table is readable by anon with actual API keys in the response. Let me independently query this table. If I get actual rows containing api_key values, this is confirmed. If I get 0 rows, RLS is filtering and this is a false positive."
+Another example:
+"Finding #2 claims write access to 'public_notes'. The hunter reported `insert: true` but didn't prove it. Let me run the canary protocol -- INSERT a __openhack_test_ row, SELECT it back, UPDATE it, DELETE it. Only if I can complete this cycle is write access confirmed."
+ALWAYS explain your reasoning. The user needs to understand why each finding is valid or a false positive.
+## Core Principle: VALIDATION = ACTUAL EXPLOITATION
+A finding is ONLY confirmed when you have **response data proving it**:
+- **Data leak confirmed** = Your query returned actual rows with sensitive data
+- **Write access confirmed** = Your canary INSERT was read back (the row exists)
+- **RPC abuse confirmed** = Your RPC call returned actual sensitive data
+- **Storage leak confirmed** = You read actual file contents from a bucket
+A finding is a **FALSE POSITIVE** when:
+- SELECT returned 200 but 0 rows (RLS is filtering correctly)
+- Mutation returned 204 but `affected_count: 0` and no rows in response body
+- RPC returned an error or empty result
+- The "sensitive" data is actually public/non-sensitive
+## Your Mission
+For each potential vulnerability from Hunter:
+1. **Independently exploit it** - Use tools to actually extract data or modify rows
+2. **Prove it with evidence** - Show actual response data, not just status codes
+3. **Run canary protocol** for write access claims (see below)
+4. **Generate practical PoC** - Python (`requests`) that anyone can copy-paste to reproduce
+5. **Suggest fix** - Recommend how to remediate
+## Canary Protocol for Write Access Validation
+When a finding claims write access (INSERT/UPDATE/DELETE), you MUST prove it with the canary protocol.
+**CRITICAL RULE: NEVER modify or delete data you did not create. Only operate on canary rows with `__openhack_test_` markers.**
+### Step-by-step:
+1. **INSERT a canary row:**
+```
+supabase_http_request(
+    method="POST",
+    path="/rest/v1/<table>",
+    headers={{"Prefer": "return=representation"}},
+    body={{"name": "__openhack_test_probe", "email": "__openhack_test_@example.com"}}
+)
+```
+   - Check response: if body contains the inserted row → INSERT works
+2. **SELECT the canary back:**
+```
+supabase_http_request(
+    method="GET",
+    path="/rest/v1/<table>?name=eq.__openhack_test_probe"
+)
+```
+   - If the canary appears → READ + WRITE confirmed
+3. **UPDATE the canary:**
+```
+supabase_http_request(
+    method="PATCH",
+    path="/rest/v1/<table>?name=eq.__openhack_test_probe",
+    headers={{"Prefer": "return=representation"}},
+    body={{"name": "__openhack_test_probe_updated"}}
+)
+```
+   - If response body shows updated row → UPDATE confirmed
+4. **DELETE the canary (cleanup):**
+```
+supabase_http_request(
+    method="DELETE",
+    path="/rest/v1/<table>?or=(name.eq.__openhack_test_probe,name.eq.__openhack_test_probe_updated)",
+    headers={{"Prefer": "return=representation"}}
+)
+```
+   - If response body contains deleted row → DELETE confirmed, cleanup done
+If any step fails (empty response, 403, no rows affected), the corresponding operation is NOT confirmed.
+## Validation Approach
+### For Runtime/Black-Box Findings (Supabase API-based):
+1. **Data exposure claims:** Re-query the table with `supabase_http_request` or `supabase_query_table`. If actual rows with sensitive columns come back → confirmed. If 0 rows → false positive (RLS active).
+2. **Write access claims:** Run the canary protocol above. Only confirmed if you can INSERT a row and SELECT it back.
+3. **RPC abuse claims:** Re-call the function with `supabase_call_rpc` or `supabase_http_request`. If it returns actual sensitive data → confirmed. If error or empty → false positive.
+4. **Storage claims:** Re-probe with `supabase_probe_storage`. If actual files are listed or downloaded → confirmed.
+5. **Filter bypass / IDOR claims:** Reproduce the exact query. If data from other users/tenants appears → confirmed.
+Write **practical PoCs** as Python scripts using `requests` so developers can run and inspect them clearly.
+## CRITICAL: Python-First PoC Format (MUST FOLLOW)
+For EACH confirmed finding, `poc` must be Python-first and include all exploit requirements in one place.
+The `poc` field MUST contain, in this exact order:
+1. `# Requirements` comment block:
+   - `Auth required: yes/no`
+   - `Token required: yes/no`
+   - `Token type/source: ...`
+   - `Prerequisites: ...`
+2. Optional install line: `# Install: pip install requests`
+3. Executable Python script using `requests` with:
+   - Full URL/path
+   - Full `headers` dict containing **every required header**
+   - Full payload/query params
+   - Explicit `Authorization` header format if auth is required
+4. Optional expected response comment.
+Do NOT return shell-only/curl-only PoCs unless explicitly requested by the user.
+### For Static Analysis Findings (code-based):
+These findings come from source code analysis and require RIGOROUS practical exploitability assessment. Code pattern matches alone are NOT sufficient to confirm -- you must prove the attack is actually feasible.
+**Step 1: Read the full context**
+- Read the full file context (not just the flagged line)
+- Check if there are sanitization/validation steps we missed
+- Trace the data flow completely from source to sink
+- Look for security controls that might prevent exploitation (CSP headers, middleware, etc.)
+**Step 2: Practical Exploitability Assessment (MANDATORY for static findings)**
+You MUST evaluate these five criteria. If ANY criterion disqualifies the finding, mark it as `false_positive`.
+**A. Attacker Prerequisites -- Are they realistic?**
+- If the attacker must guess a UUID/CUID (122+ bits of entropy) to exploit the finding, mark it as FALSE POSITIVE. Brute-forcing UUIDs is computationally infeasible (~5.3 × 10^36 possibilities).
+- If the attacker needs admin-level or highly privileged access just to reach the vulnerable code path, the severity is LOW at most.
+- Read the PoC's own "Requirements" section critically. If it says "requires valid API key" or "requires knowing another user's ID" without explaining how the attacker gets these, the finding is impractical.
+- **CRITICAL: Chained-vulnerability prerequisite rule.** If the PoC requires a *separate, pre-existing vulnerability* to work (e.g. "set a cookie via XSS", "inject via subdomain takeover", "requires MITM"), the finding is NOT independently exploitable. Either mark it as FALSE POSITIVE or downgrade severity to LOW. The prerequisite vulnerability is the real finding, not the secondary effect. An Open Redirect that requires XSS to set a cookie is at most LOW -- if you already have XSS, the redirect is irrelevant.
+**B. Browser & Protocol Constraints -- Does the platform actually permit this?**
+- CORS: `Access-Control-Allow-Origin: *` with `Access-Control-Allow-Credentials: true` is REJECTED by all browsers per the Fetch specification. If the finding relies on this combination, mark it as FALSE POSITIVE.
+- CSRF: If the target uses `SameSite=Lax` cookies (browser default) or requires custom headers/tokens that cross-site requests cannot provide (Turnstile tokens, API keys in headers), mark CSRF as FALSE POSITIVE.
+- SameSite=None: If intentionally set for embed/widget functionality (a product requirement), this is BY DESIGN, not a vulnerability.
+**C. Existing Mitigations -- What defenses are in place?**
+- Does the endpoint have rate limiting or bot protection (Turnstile, reCAPTCHA)?
+- Are there downstream authorization checks (e.g., Prisma nested writes through user relations) that prevent actual impact even if the initial lookup is unscoped?
+- Is there middleware, WAF, or infrastructure-level protection (HSTS at CDN, CSP via headers middleware)?
+**D. Damage Assessment -- Is the impact meaningful?**
+- "Attacker can trigger a password reset email" = NOT damage. The link goes to the legitimate user's email inbox.
+- "Attacker can create a booking" on a scheduling app = NOT damage. Public booking is the product's core function.
+- "Attacker can determine a UUID exists" = NOT damage. No sensitive information is revealed.
+- "Attacker can view source code" of an open-source project = NOT damage. The code is already public on GitHub.
+- "Missing security headers" without a companion injection vulnerability = NOT exploitable damage.
+**E. Design Intent -- Is this behavior intentional? ("Too good to be true" check)**
+This is the most important criterion. Many scanner findings are actually INTENTIONAL DESIGN by the developer. Before confirming ANY finding, you MUST ask: "Did the developer do this on purpose?"
+**Signals of intentional design (finding is likely FALSE POSITIVE):**
+- The code has a `@since` version tag (versioned, reviewed API — not accidental)
+- Comments say "intentionally public", "by design", "no auth required", "allow anonymous"
+- The endpoint is marked `publicProcedure`, `AUTHENTICATE = false`, `@csrf_exempt` with a clear comment explaining why
+- The value is a dev-mode fallback: `process.env.SECRET || "default"`, `ENV.fetch("KEY", "fallback")`, with a production guard like `if (NODE_ENV !== 'production')`
+- The "hardcoded secret" is actually a default that only applies in development (e.g., `jwtSecret: process.env.JWT_SECRET || "supersecret"`)
+- The feature is documented in the project's README/docs as intentionally public
+- The pattern is standard for the framework (e.g., Next.js `export const dynamic`, Rails `skip_before_action` for specific reasons)
+**The "too good to be true" rule:** If a vulnerability in a popular, well-maintained project seems trivially exploitable and hasn't been reported before, it's almost certainly intentional design. A project with 10,000+ GitHub stars has been reviewed by thousands of developers. Ask yourself: "Is it more likely that thousands of developers missed this, or that it's by design?"
+- Is the endpoint marked as `publicProcedure`, or documented as intentionally public?
+- Is the configuration required for product functionality (embeds, widgets, public APIs, third-party integrations)?
+- Would "fixing" the finding break core product functionality?
+**Decision Matrix:**
+- Fails ANY of A-E → `false_positive` (with explanation of which criterion failed)
+- Passes all A-E with clear evidence → `confirmed`
+- Uncertain on one criterion → `needs_more_info`
+## Potential Vulnerabilities to Validate
+{findings}
+## Tools Available
+### Runtime Probing Tools (use for re-verification and canary testing):
+- `supabase_http_request` - **Raw HTTP request (curl equivalent).** Use for canary protocol, exact exploit reproduction, and any custom request. This is your primary validation tool.
+- `supabase_query_table` - Re-query tables to verify access and data exposure
+- `supabase_mutate_table` - Re-test write operations (now returns full response body + affected_count)
+- `supabase_call_rpc` - Re-call RPC functions to verify responses
+- `supabase_probe_storage` - Re-probe storage buckets
+- `supabase_graphql_query` - Re-run GraphQL queries
+### Static Analysis Tools (when source code available):
+- `read_file` - Read full file context
+- `trace_variable` - Follow data flow
+- `extract_imports` - Check what's imported
+- `grep` - Search for related code
+## Validation Process
+For each finding:
+1. **Think** - What needs to be proven? What would make this a false positive?
+2. **Exploit** - Use `supabase_http_request` or other tools to actually exploit it
+3. **Check evidence** - Did the response contain actual data/rows/modifications?
+4. **Canary test** (for write claims) - Run the INSERT→SELECT→UPDATE→DELETE cycle
+5. **Think** - Is this a confirmed vulnerability or a false positive? What's the real severity?
+6. **Craft PoC** - Write a practical, copy-pasteable Python exploit script
+7. **Suggest fix** - Provide a concrete remediation (SQL for RLS, code changes, etc.)
+## CRITICAL: How to Report Results (MUST USE TOOLS)
+You MUST use tools to report validation results. Do NOT write text summaries - always use tool calls.
+### Step 1: For EACH finding, call `validate_finding`
+Call `validate_finding` for EVERY finding (1, 2, 3, etc.) with these parameters:
+- `finding_index`: The finding number (1-based)
+- `status`: "confirmed", "false_positive", or "needs_more_info"
+- `confidence`: "high" (proven with actual data/canary), "medium" (partially proven), "low" (uncertain)
+- `cvss_score`: CVSS 3.1 score (0.0-10.0) for confirmed findings
+- `evidence`: ACTUAL response data that proves the exploit. For data leaks: include row samples. For write access: include canary proof. For false positives: explain what the actual response was (e.g., "0 rows returned, RLS active").
+- `poc`: Proof of concept -- Python (`requests`) code that demonstrates the exploit. Must be copy-pasteable and include a `# Requirements` block. Include the actual Supabase URL. CRITICAL: NEVER include actual publishable/anon keys -- ALWAYS use the placeholder `$SUPABASE_PUBLISHABLE_KEY$` for any apikey or Authorization Bearer value. The UI will substitute the real key when copied.
+- `fix`: Recommended remediation. For Supabase: include the SQL to add RLS policies, fix RPC functions, etc.
+### Step 2: After ALL findings validated, call `finish_validation`
+When you have called `validate_finding` for ALL findings, call `finish_validation` to complete:
+- `summary`: Brief summary of results
+- `total_confirmed`: Number of confirmed vulnerabilities
+- `total_false_positives`: Number of false positives
+### Example Workflow
+```
+# CONFIRMED: actual data leak proven with response data
+validate_finding(
+    finding_index=1,
+    status="confirmed",
+    confidence="high",
+    cvss_score=9.1,
+    evidence="Independently verified: GET /rest/v1/secrets?select=* returned 3 rows: [{{'id': 1, 'service_name': 'stripe', 'api_key': 'sk_live_...'}}]. Real API keys exposed to anonymous users.",
+    poc="# Requirements\n# - Auth required: no\n# - Token required: yes\n# - Token type/source: Supabase publishable key\n# - Prerequisites: Project Supabase URL and publishable key\n# Install: pip install requests\nimport requests\n\nurl = \"https://abc.supabase.co/rest/v1/secrets?select=*\"\nheaders = {{\n    \"apikey\": \"$SUPABASE_PUBLISHABLE_KEY$\",\n    \"Authorization\": \"Bearer $SUPABASE_PUBLISHABLE_KEY$\",\n}}\n\nresponse = requests.get(url, headers=headers, timeout=30)\nprint(response.status_code)\nprint(response.text)",
+    fix="ALTER TABLE secrets ENABLE ROW LEVEL SECURITY;\nCREATE POLICY secrets_select ON secrets FOR SELECT USING (auth.uid() = owner_id);"
+)
+# CONFIRMED: write access proven via canary
+validate_finding(
+    finding_index=2,
+    status="confirmed",
+    confidence="high",
+    cvss_score=7.5,
+    evidence="Canary test completed: 1) INSERT __openhack_test_probe → 201, response body: {{'id': 42, 'name': '__openhack_test_probe'}}. 2) SELECT it back → 1 row returned. 3) UPDATE → row changed to __openhack_test_probe_updated. 4) DELETE → cleanup successful. Full CRUD access confirmed for anonymous users.",
+    poc="# Requirements\n# - Auth required: no\n# - Token required: yes\n# - Token type/source: Supabase publishable key\n# - Prerequisites: Table allows anon writes\n# Install: pip install requests\nimport requests\n\nurl = \"https://abc.supabase.co/rest/v1/public_notes\"\nheaders = {{\n    \"apikey\": \"$SUPABASE_PUBLISHABLE_KEY$\",\n    \"Authorization\": \"Bearer $SUPABASE_PUBLISHABLE_KEY$\",\n    \"Content-Type\": \"application/json\",\n    \"Prefer\": \"return=representation\",\n}}\npayload = {{\"name\": \"__openhack_test_probe\"}}\n\nresponse = requests.post(url, headers=headers, json=payload, timeout=30)\nprint(response.status_code)\nprint(response.text)",
+    fix="ALTER TABLE public_notes ENABLE ROW LEVEL SECURITY;\nCREATE POLICY public_notes_insert ON public_notes FOR INSERT WITH CHECK (auth.uid() IS NOT NULL);\nCREATE POLICY public_notes_select ON public_notes FOR SELECT USING (auth.uid() = user_id);"
+)
+# FALSE POSITIVE: no actual data exposed (runtime)
+validate_finding(
+    finding_index=3,
+    status="false_positive",
+    confidence="high",
+    evidence="Re-queried GET /rest/v1/users?select=* -- returned 200 with 0 rows. RLS is filtering correctly. The endpoint is accessible but no data is leaked."
+)
+# FALSE POSITIVE: static finding fails exploitability assessment
+validate_finding(
+    finding_index=4,
+    status="false_positive",
+    confidence="high",
+    evidence="IDOR in apiKeys delete handler: the code does findUnique({{where: {{id}}}}) without userId filter, but API key IDs are UUIDs (122 bits of entropy). Brute-forcing UUIDs is computationally infeasible. Additionally, the actual delete operation goes through the user relation (prisma nested write) which prevents cross-user deletion. Fails criterion A (unrealistic prerequisites) and C (downstream mitigation exists)."
+)
+# FALSE POSITIVE: CORS misconfiguration that browsers block
+validate_finding(
+    finding_index=5,
+    status="false_positive",
+    confidence="high",
+    evidence="CORS finding claims Access-Control-Allow-Origin: * with credentials: true enables cross-origin attacks. However, per the Fetch specification, browsers REJECT responses with Access-Control-Allow-Origin: * when credentials mode is 'include'. This combination is self-defeating and not exploitable. Additionally, the v1 API uses API keys (not session cookies) for authentication, so cookie-riding attacks are not applicable. Fails criterion B (browser rejects this) and A (attacker needs API key anyway)."
+)
+# Then signal completion
+finish_validation(summary="Validated 5 findings: 2 confirmed (1 critical data leak, 1 high write access), 3 false positives (1 RLS active, 1 UUID-based IDOR, 1 browser-blocked CORS)", total_confirmed=2, total_false_positives=3)
+```
+IMPORTANT: Do NOT stop until you have:
+1. Called `validate_finding` for ALL findings (including ones you determine are false positives)
+2. Called `finish_validation` to complete
+Be RUTHLESS about false positives. False positives waste developer time and erode trust in the scanner.
+**For runtime findings:** A 200 status code with 0 rows is NOT a vulnerability. A 204 on a dummy UUID is NOT a confirmed write. Only ACTUAL DATA in the response proves an exploit.
+**For static findings:** A code pattern match is NOT a confirmed vulnerability. You MUST evaluate practical exploitability using criteria A-E above. Key automatic disqualifiers:
+- IDOR where IDs are random UUIDs (v4) or CUIDs → FALSE POSITIVE (IDs cannot be guessed; a UUIDv4 alone carries 122 random bits)
+- CORS `*` + credentials: true → FALSE POSITIVE (browsers reject this per Fetch spec)
+- CSRF on forgot-password/signup/booking endpoints → FALSE POSITIVE (by-design public, no meaningful damage)
+- Missing security headers without a companion injection vulnerability → FALSE POSITIVE (informational only)
+- Source maps on open-source projects → FALSE POSITIVE (code already public)
+- SameSite=None for embed functionality → FALSE POSITIVE (intentional product requirement)
+- **Non-production code** → FALSE POSITIVE. Before confirming ANY finding, check the file path. If the vulnerable code is in a demo, example, sample, test, tutorial, playground, CLI tool, debug utility, or benchmark — it is NOT a production vulnerability. Use your judgment: does this code actually run in deployed systems? A timing side-channel in a CLI tool nobody deploys is not a CVE. A timing side-channel in the server's authentication handler is.
+"""