@jaguilar87/gaia 5.0.2 → 5.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/marketplace.json +2 -2
- package/.claude-plugin/plugin.json +1 -1
- package/ARCHITECTURE.md +0 -1
- package/CHANGELOG.md +110 -0
- package/INSTALL.md +0 -2
- package/README.md +1 -6
- package/bin/README.md +0 -1
- package/bin/cli/_install_helpers.py +1 -1
- package/bin/cli/approvals.py +23 -21
- package/bin/cli/cleanup.py +0 -1
- package/bin/cli/doctor.py +1 -1
- package/bin/cli/memory.py +2 -0
- package/bin/cli/update.py +1 -1
- package/bin/pre-publish-validate.js +48 -5
- package/config/README.md +22 -44
- package/config/surface-routing.json +0 -2
- package/dist/gaia-ops/.claude-plugin/plugin.json +1 -1
- package/dist/gaia-ops/config/README.md +22 -44
- package/dist/gaia-ops/config/surface-routing.json +0 -2
- package/dist/gaia-ops/hooks/modules/agents/contract_validator.py +18 -0
- package/dist/gaia-ops/hooks/modules/agents/handoff_persister.py +214 -2
- package/dist/gaia-ops/hooks/modules/agents/response_contract.py +26 -0
- package/dist/gaia-ops/hooks/modules/agents/transcript_reader.py +15 -0
- package/dist/gaia-ops/hooks/modules/security/__init__.py +0 -5
- package/dist/gaia-ops/hooks/modules/security/approval_grants.py +124 -19
- package/dist/gaia-ops/hooks/modules/security/mutative_verbs.py +99 -7
- package/dist/gaia-ops/hooks/modules/tools/bash_validator.py +127 -24
- package/dist/gaia-ops/hooks/modules/validation/commit_validator.py +90 -55
- package/dist/gaia-ops/skills/README.md +1 -1
- package/dist/gaia-ops/skills/agent-contract-handoff/SKILL.md +3 -0
- package/dist/gaia-ops/skills/agent-response/SKILL.md +4 -2
- package/dist/gaia-ops/skills/gaia-patterns/SKILL.md +1 -1
- package/dist/gaia-ops/skills/gaia-patterns/reference.md +2 -3
- package/dist/gaia-ops/skills/gaia-release/SKILL.md +60 -24
- package/dist/gaia-ops/skills/gaia-release/reference.md +35 -11
- package/dist/gaia-ops/skills/git-conventions/SKILL.md +6 -2
- package/dist/gaia-ops/skills/orchestrator-present-approval/SKILL.md +30 -7
- package/dist/gaia-ops/skills/orchestrator-present-approval/reference.md +32 -15
- package/dist/gaia-ops/skills/readme-writing/SKILL.md +1 -1
- package/dist/gaia-ops/skills/readme-writing/reference.md +0 -1
- package/dist/gaia-ops/skills/security-tiers/SKILL.md +5 -1
- package/dist/gaia-ops/skills/security-tiers/reference.md +3 -1
- package/dist/gaia-ops/skills/subagent-request-approval/SKILL.md +43 -6
- package/dist/gaia-ops/skills/subagent-request-approval/reference.md +66 -16
- package/dist/gaia-ops/tools/context/README.md +1 -1
- package/dist/gaia-ops/tools/gaia_simulator/extractor.py +0 -1
- package/dist/gaia-ops/tools/scan/ui.py +20 -4
- package/dist/gaia-ops/tools/scan/verify.py +3 -3
- package/dist/gaia-ops/tools/validation/README.md +15 -24
- package/dist/gaia-security/.claude-plugin/plugin.json +1 -1
- package/dist/gaia-security/hooks/modules/agents/contract_validator.py +18 -0
- package/dist/gaia-security/hooks/modules/agents/handoff_persister.py +214 -2
- package/dist/gaia-security/hooks/modules/agents/response_contract.py +26 -0
- package/dist/gaia-security/hooks/modules/agents/transcript_reader.py +15 -0
- package/dist/gaia-security/hooks/modules/security/__init__.py +0 -5
- package/dist/gaia-security/hooks/modules/security/approval_grants.py +124 -19
- package/dist/gaia-security/hooks/modules/security/mutative_verbs.py +99 -7
- package/dist/gaia-security/hooks/modules/tools/bash_validator.py +127 -24
- package/dist/gaia-security/hooks/modules/validation/commit_validator.py +90 -55
- package/gaia/state/transitions.py +4 -4
- package/gaia/store/writer.py +56 -0
- package/hooks/modules/README.md +2 -4
- package/hooks/modules/agents/contract_validator.py +18 -0
- package/hooks/modules/agents/handoff_persister.py +214 -2
- package/hooks/modules/agents/response_contract.py +26 -0
- package/hooks/modules/agents/transcript_reader.py +15 -0
- package/hooks/modules/security/__init__.py +0 -5
- package/hooks/modules/security/approval_grants.py +124 -19
- package/hooks/modules/security/mutative_verbs.py +99 -7
- package/hooks/modules/tools/bash_validator.py +127 -24
- package/hooks/modules/validation/commit_validator.py +90 -55
- package/index.js +2 -12
- package/package.json +4 -6
- package/pyproject.toml +3 -3
- package/scripts/bootstrap_database.sh +88 -439
- package/scripts/check_schema_drift.py +208 -0
- package/scripts/migrations/README.md +78 -28
- package/scripts/migrations/schema.checksum +8 -0
- package/scripts/release-prepare.mjs +199 -0
- package/skills/README.md +1 -1
- package/skills/agent-contract-handoff/SKILL.md +3 -0
- package/skills/agent-response/SKILL.md +4 -2
- package/skills/gaia-patterns/SKILL.md +1 -1
- package/skills/gaia-patterns/reference.md +2 -3
- package/skills/gaia-release/SKILL.md +60 -24
- package/skills/gaia-release/reference.md +35 -11
- package/skills/git-conventions/SKILL.md +6 -2
- package/skills/orchestrator-present-approval/SKILL.md +30 -7
- package/skills/orchestrator-present-approval/reference.md +32 -15
- package/skills/readme-writing/SKILL.md +1 -1
- package/skills/readme-writing/reference.md +0 -1
- package/skills/security-tiers/SKILL.md +5 -1
- package/skills/security-tiers/reference.md +3 -1
- package/skills/subagent-request-approval/SKILL.md +43 -6
- package/skills/subagent-request-approval/reference.md +66 -16
- package/tools/context/README.md +1 -1
- package/tools/gaia_simulator/extractor.py +0 -1
- package/tools/scan/ui.py +20 -4
- package/tools/scan/verify.py +3 -3
- package/tools/validation/README.md +15 -24
- package/commands/README.md +0 -64
- package/commands/gaia.md +0 -37
- package/commands/scan-project.md +0 -74
- package/config/crons-schema.md +0 -81
- package/config/git_standards.json +0 -72
- package/dist/gaia-ops/commands/gaia.md +0 -37
- package/dist/gaia-ops/config/crons-schema.md +0 -81
- package/dist/gaia-ops/config/git_standards.json +0 -72
- package/dist/gaia-ops/hooks/modules/security/gitops_validator.py +0 -179
- package/dist/gaia-ops/tools/agentic-loop/decide-status.py +0 -210
- package/dist/gaia-ops/tools/agentic-loop/parse-metric.py +0 -106
- package/dist/gaia-ops/tools/agentic-loop/record-iteration.py +0 -223
- package/dist/gaia-security/hooks/modules/security/gitops_validator.py +0 -179
- package/git-hooks/commit-msg +0 -41
- package/hooks/modules/security/gitops_validator.py +0 -179
- package/scripts/migrations/v10_to_v11.sql +0 -170
- package/scripts/migrations/v10_to_v11_fresh.sql +0 -18
- package/scripts/migrations/v11_to_v12.sql +0 -195
- package/scripts/migrations/v11_to_v12_fresh.sql +0 -19
- package/scripts/migrations/v12_to_v13.sql +0 -48
- package/scripts/migrations/v12_to_v13_fresh.sql +0 -17
- package/scripts/migrations/v13_to_v14.sql +0 -44
- package/scripts/migrations/v13_to_v14_fresh.sql +0 -17
- package/scripts/migrations/v14_to_v15.sql +0 -71
- package/scripts/migrations/v14_to_v15_fresh.sql +0 -19
- package/scripts/migrations/v15_to_v16.sql +0 -57
- package/scripts/migrations/v15_to_v16_fresh.sql +0 -18
- package/scripts/migrations/v16_to_v17.sql +0 -51
- package/scripts/migrations/v16_to_v17_fresh.sql +0 -18
- package/scripts/migrations/v17_to_v18.sql +0 -66
- package/scripts/migrations/v17_to_v18_fresh.sql +0 -24
- package/scripts/migrations/v1_to_v2.sql +0 -97
- package/scripts/migrations/v2_to_v3.sql +0 -68
- package/scripts/migrations/v2_to_v3_merge.sql +0 -69
- package/scripts/migrations/v3_to_v4.sql +0 -67
- package/scripts/migrations/v3_to_v4_fresh.sql +0 -20
- package/scripts/migrations/v4_to_v5.sql +0 -55
- package/scripts/migrations/v4_to_v5_fresh.sql +0 -20
- package/scripts/migrations/v5_to_v6.sql +0 -48
- package/scripts/migrations/v5_to_v6_fresh.sql +0 -17
- package/scripts/migrations/v6_to_v7.sql +0 -26
- package/scripts/migrations/v6_to_v7_fresh.sql +0 -13
- package/scripts/migrations/v7_to_v8.sql +0 -44
- package/scripts/migrations/v7_to_v8_fresh.sql +0 -14
- package/scripts/migrations/v8_to_v9.sql +0 -87
- package/scripts/migrations/v8_to_v9_fresh.sql +0 -15
- package/scripts/migrations/v9_to_v10.sql +0 -109
- package/scripts/migrations/v9_to_v10_episodes_workspace.sql +0 -109
- package/scripts/migrations/v9_to_v10_fresh.sql +0 -18
- package/templates/README.md +0 -70
- package/templates/managed-settings.template.json +0 -43
- package/tools/agentic-loop/decide-status.py +0 -210
- package/tools/agentic-loop/parse-metric.py +0 -106
- package/tools/agentic-loop/record-iteration.py +0 -223
package/gaia/store/writer.py
CHANGED
|
@@ -2822,6 +2822,62 @@ def list_approval_grants(
|
|
|
2822
2822
|
con.close()
|
|
2823
2823
|
|
|
2824
2824
|
|
|
2825
|
+
def list_command_set_grants_agnostic(
    *,
    status: str = "PENDING",
    limit: int = 100,
    db_path: Path | None = None,
) -> list[dict]:
    """Fetch COMMAND_SET approval grants with no session_id filter (Brief 71).

    Runs one query against ``approval_grants`` selecting rows whose scope is
    ``'COMMAND_SET'`` and whose status equals ``status``, newest first
    (``created_at DESC``), capped at ``limit`` rows.

    Why there is no session constraint: the block-approve-retry flow spans
    sessions. A command is blocked under the subagent session, approved under
    the orchestrator session, and retried under whichever session the bash
    subprocess sees -- possibly the literal ``"default"`` fallback when
    CLAUDE_SESSION_ID is not exported. A session_id filter would therefore miss
    the very grant the approval created. This is the COMMAND_SET counterpart of
    the session-agnostic lookup done by ``check_db_semantic_grant``.

    What this function does NOT do: it does not compare command text, inspect
    ``consumed_indexes_json`` or evaluate ``expires_at``. Per the design, the
    caller applies those checks to each returned row:

    * byte-for-byte command match against each unconsumed command_set item;
    * single-use replay guard via status plus per-index consumption;
    * TTL via ``expires_at``.

    None of those depend on the asking session, which is why dropping the
    session filter does not widen what a grant can authorize.

    Args:
        status: Status value to match (default ``'PENDING'``).
        limit: Maximum number of rows to return.
        db_path: Optional explicit database path (used by tests).

    Returns:
        One dict per row keyed by column name, ordered by ``created_at``
        descending. An empty list is returned if the query raises.
    """
    query = (
        "SELECT * FROM approval_grants "
        "WHERE scope = 'COMMAND_SET' AND status = ? "
        "ORDER BY created_at DESC LIMIT ?"
    )
    connection = _connect(db_path)
    try:
        cursor = connection.execute(query, (status, limit))
        return list(map(dict, cursor.fetchall()))
    except Exception:
        # Best-effort read: any failure is reported to the caller as "no grants".
        return []
    finally:
        # Always release the connection, on success and on failure alike.
        connection.close()
|
|
2879
|
+
|
|
2880
|
+
|
|
2825
2881
|
# ---------------------------------------------------------------------------
|
|
2826
2882
|
# Public API: insert_semantic_grant / check_db_semantic_grant /
|
|
2827
2883
|
# consume_db_semantic_grant (CHECK-side DB cutover, Brief 71)
|
package/hooks/modules/README.md
CHANGED
|
@@ -45,8 +45,7 @@ modules/
|
|
|
45
45
|
│ ├── approval_constants.py # Approval system constants
|
|
46
46
|
│ ├── approval_messages.py # Approval denial message formatting
|
|
47
47
|
│ ├── approval_scopes.py # Approval scope definitions
|
|
48
|
-
│
|
|
49
|
-
│ └── gitops_validator.py # kubectl/helm/flux validation
|
|
48
|
+
│ └── command_semantics.py # Command semantic analysis
|
|
50
49
|
│
|
|
51
50
|
├── tools/ # Tool-specific validators
|
|
52
51
|
│ ├── __init__.py
|
|
@@ -179,8 +178,7 @@ bash_validator checks commands in this order (short-circuit on first match):
|
|
|
179
178
|
3. **Commit message validation** — conventional commits enforcement
|
|
180
179
|
4. **Cloud pipe/redirect/chain check** (cloud_pipe_validator.py) — corrective deny
|
|
181
180
|
5. **Mutative verbs** (mutative_verbs.py) — CLI-agnostic verb detector, native `ask` dialog
|
|
182
|
-
6. **
|
|
183
|
-
7. **Everything else** — SAFE by elimination (auto-approved)
|
|
181
|
+
6. **Everything else** — SAFE by elimination (auto-approved)
|
|
184
182
|
|
|
185
183
|
### Tier Classification
|
|
186
184
|
- **T0**: Read-only (get, list, describe, show)
|
|
@@ -19,6 +19,7 @@ Provides:
|
|
|
19
19
|
- parse_rollback_executed(): Parse rollback_executed clause (advisory)
|
|
20
20
|
- parse_context_consumption(): Parse context_consumption clause (advisory)
|
|
21
21
|
- parse_memory_suggestions(): Parse memory_suggestions clause (advisory)
|
|
22
|
+
- parse_user_facing_summary(): Parse user_facing_summary clause (advisory)
|
|
22
23
|
"""
|
|
23
24
|
|
|
24
25
|
import json
|
|
@@ -655,6 +656,23 @@ def parse_memory_suggestions(contract: dict) -> List[str]:
|
|
|
655
656
|
return [str(item) for item in raw if item is not None]
|
|
656
657
|
|
|
657
658
|
|
|
659
|
+
def parse_user_facing_summary(contract: dict) -> Optional[str]:
    """Extract the optional top-level ``user_facing_summary`` clause (advisory).

    This is the contract's single human-audience field: a short prose summary
    the subagent writes once for the user. On a single-agent COMPLETE (N=1) the
    orchestrator relays it near-verbatim rather than re-synthesizing
    ``key_outputs``.

    The clause is additive and advisory -- this parser only reads the field and
    never signals a validation failure.

    Args:
        contract: Parsed contract mapping to read the field from.

    Returns:
        The summary with surrounding whitespace removed, or ``None`` when the
        field is absent, not a string, or blank after trimming.
    """
    summary = contract.get("user_facing_summary")
    if isinstance(summary, str):
        trimmed = summary.strip()
        if trimmed:
            return trimmed
    # Absent, null, non-string, or whitespace-only.
    return None
|
|
674
|
+
|
|
675
|
+
|
|
658
676
|
def extract_plan_status_from_output(agent_output: str) -> str:
|
|
659
677
|
"""Extract the effective plan_status string from agent output.
|
|
660
678
|
|
|
@@ -10,11 +10,187 @@ arise if the adapter imported _persist_handoff directly from subagent_stop
|
|
|
10
10
|
(which itself imports from the adapter's dependency tree).
|
|
11
11
|
"""
|
|
12
12
|
|
|
13
|
+
from __future__ import annotations
|
|
14
|
+
|
|
13
15
|
import logging
|
|
14
16
|
|
|
15
17
|
logger = logging.getLogger(__name__)
|
|
16
18
|
|
|
17
19
|
|
|
20
|
+
def _normalize_command_set(raw) -> list:
|
|
21
|
+
"""Coerce a raw ``command_set`` into the canonical ``[{command, rationale}]``.
|
|
22
|
+
|
|
23
|
+
Mirrors the normalization in ``bash_validator._build_sealed_payload`` and
|
|
24
|
+
``approval_grants.activate_db_pending_by_prefix`` so the intake writes the
|
|
25
|
+
exact shape the activation/consume sides expect. Items without a non-empty
|
|
26
|
+
``command`` are dropped; ``rationale`` defaults to "".
|
|
27
|
+
"""
|
|
28
|
+
out: list = []
|
|
29
|
+
if isinstance(raw, list):
|
|
30
|
+
for item in raw:
|
|
31
|
+
if isinstance(item, dict) and item.get("command"):
|
|
32
|
+
out.append(
|
|
33
|
+
{
|
|
34
|
+
"command": item["command"],
|
|
35
|
+
"rationale": item.get("rationale", ""),
|
|
36
|
+
}
|
|
37
|
+
)
|
|
38
|
+
return out
|
|
39
|
+
|
|
40
|
+
|
|
41
|
+
def _filter_mutative_command_set(items: list) -> list:
|
|
42
|
+
"""Keep only the command_set items whose command is mutative/T3.
|
|
43
|
+
|
|
44
|
+
The consume side (``bash_validator._validate_single_command``) gates the
|
|
45
|
+
whole COMMAND_SET match path on ``detect_mutative_command(command).is_mutative``:
|
|
46
|
+
a command that the matcher does not see as mutative NEVER reaches
|
|
47
|
+
``match_command_set_grant`` and its index is therefore NEVER consumed. If
|
|
48
|
+
such a command is included in the grant's ``command_set``, ``len(consumed)``
|
|
49
|
+
can never reach ``len(command_set)`` and the grant is stuck PENDING forever
|
|
50
|
+
(it never flips to CONSUMED). To stay in lockstep with the consume gate, the
|
|
51
|
+
intake filters with the EXACT same predicate, dropping non-mutative commands
|
|
52
|
+
(e.g. ``touch``, ``ls``, ``cat``) before the grant is ever minted.
|
|
53
|
+
|
|
54
|
+
Items that fail to classify (import error, unexpected exception) are kept --
|
|
55
|
+
failing open here is safer than silently dropping a command from a consent
|
|
56
|
+
batch the user is about to approve.
|
|
57
|
+
"""
|
|
58
|
+
try:
|
|
59
|
+
from modules.security.mutative_verbs import detect_mutative_command
|
|
60
|
+
except ImportError:
|
|
61
|
+
import pathlib as _pl
|
|
62
|
+
import sys as _sys
|
|
63
|
+
|
|
64
|
+
_hooks_root = _pl.Path(__file__).resolve().parent.parent.parent
|
|
65
|
+
_sys.path.insert(0, str(_hooks_root))
|
|
66
|
+
from modules.security.mutative_verbs import detect_mutative_command
|
|
67
|
+
|
|
68
|
+
kept: list = []
|
|
69
|
+
for item in items:
|
|
70
|
+
command = item.get("command", "")
|
|
71
|
+
try:
|
|
72
|
+
if detect_mutative_command(command).is_mutative:
|
|
73
|
+
kept.append(item)
|
|
74
|
+
except Exception:
|
|
75
|
+
# Fail open: if classification raises, keep the item rather than
|
|
76
|
+
# silently dropping a command from the user's consent batch.
|
|
77
|
+
kept.append(item)
|
|
78
|
+
return kept
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
def _intake_command_set_pending(
|
|
82
|
+
approval_req: dict,
|
|
83
|
+
*,
|
|
84
|
+
agent_id,
|
|
85
|
+
session_id: str,
|
|
86
|
+
) -> str | None:
|
|
87
|
+
"""INTAKE bridge: plan-first COMMAND_SET envelope -> ONE pending row.
|
|
88
|
+
|
|
89
|
+
When a subagent emits an ``APPROVAL_REQUEST`` whose ``approval_request``
|
|
90
|
+
carries a ``command_set`` of >= 2 ``{command, rationale}`` items and NO
|
|
91
|
+
``approval_id`` (plan-first: the batch is declared up-front, before any
|
|
92
|
+
command was attempted/blocked), this persists exactly ONE pending approval
|
|
93
|
+
whose ``payload_json`` contains the ``command_set`` key. That is the signal
|
|
94
|
+
``activate_db_pending_by_prefix`` reads (Step 3b) to branch into
|
|
95
|
+
``create_command_set_grant`` on user approval.
|
|
96
|
+
|
|
97
|
+
Mutative filtering (Thread a): the command_set is first reduced to ONLY the
|
|
98
|
+
commands the consume side will treat as mutative/T3 -- see
|
|
99
|
+
``_filter_mutative_command_set``. Non-mutative commands (``touch``, ``ls``,
|
|
100
|
+
...) never reach the bash_validator matcher, so leaving them in the grant
|
|
101
|
+
would strand its ``consumed_indexes_json`` short of completion and pin the
|
|
102
|
+
grant at PENDING forever. After filtering:
|
|
103
|
+
|
|
104
|
+
* >= 2 mutative items -> mint the COMMAND_SET over exactly those items.
|
|
105
|
+
* exactly 1 mutative -> NOT a batch. Return None; the caller falls
|
|
106
|
+
through to the singular ``approval_id`` path and the lone command is
|
|
107
|
+
gated by the normal hook-block / SCOPE_SEMANTIC_SIGNATURE flow when the
|
|
108
|
+
agent attempts it. We deliberately do NOT degrade-to-singular here: this
|
|
109
|
+
function's contract is "mint a COMMAND_SET or stand aside", and the
|
|
110
|
+
singular flow is owned end-to-end by the hook block path -- minting a
|
|
111
|
+
singular row from here would duplicate that ownership.
|
|
112
|
+
* 0 mutative -> nothing to approve. Return None (no pending).
|
|
113
|
+
|
|
114
|
+
A raw ``command_set`` of <= 1 item is likewise not a batch and returns None
|
|
115
|
+
before filtering, preserving the original contract (never mint for one
|
|
116
|
+
command, never degrade a batch the other way) and the working plan-first
|
|
117
|
+
flow for genuine multi-command mutative batches.
|
|
118
|
+
|
|
119
|
+
Returns the minted ``approval_id`` (``P-{uuid4hex}``) on success, or None
|
|
120
|
+
when this is not a plan-first command_set envelope (no action taken).
|
|
121
|
+
"""
|
|
122
|
+
if not isinstance(approval_req, dict):
|
|
123
|
+
return None
|
|
124
|
+
# Plan-first is defined by command_set present AND no approval_id. A request
|
|
125
|
+
# that already carries an approval_id was minted by the hook block path; it
|
|
126
|
+
# is the singular flow and must not be re-intaken here.
|
|
127
|
+
if approval_req.get("approval_id"):
|
|
128
|
+
return None
|
|
129
|
+
|
|
130
|
+
raw_items = _normalize_command_set(approval_req.get("command_set"))
|
|
131
|
+
if len(raw_items) < 2:
|
|
132
|
+
# 0 or 1 item: not a batch. Singular path owns it.
|
|
133
|
+
return None
|
|
134
|
+
|
|
135
|
+
# Reduce to the mutative/T3 commands only -- the exact predicate the consume
|
|
136
|
+
# side uses to decide whether a command reaches the COMMAND_SET matcher.
|
|
137
|
+
command_set_items = _filter_mutative_command_set(raw_items)
|
|
138
|
+
if len(command_set_items) < 2:
|
|
139
|
+
# After filtering there is no batch left: either every command was
|
|
140
|
+
# non-mutative (0 -> nothing to approve) or just one mutative command
|
|
141
|
+
# remained (1 -> singular path owns it). Either way, no COMMAND_SET.
|
|
142
|
+
logger.info(
|
|
143
|
+
"INTAKE: command_set not minted -- %d/%d items mutative after filter "
|
|
144
|
+
"(need >= 2 for a batch)",
|
|
145
|
+
len(command_set_items), len(raw_items),
|
|
146
|
+
)
|
|
147
|
+
return None
|
|
148
|
+
|
|
149
|
+
# Build a sealed_payload that mirrors bash_validator._build_sealed_payload's
|
|
150
|
+
# COMMAND_SET shape: command_set verbatim + commands listing every string.
|
|
151
|
+
# Carry through the subagent's operation/risk fields when present so the
|
|
152
|
+
# orchestrator's presentation has real values, falling back to neutral
|
|
153
|
+
# COMMAND_SET defaults otherwise.
|
|
154
|
+
first_command = command_set_items[0]["command"]
|
|
155
|
+
sealed_payload = {
|
|
156
|
+
"operation": approval_req.get("operation")
|
|
157
|
+
or f"COMMAND_SET intercepted: {len(command_set_items)} commands under one consent",
|
|
158
|
+
"exact_content": approval_req.get("exact_content") or first_command,
|
|
159
|
+
"scope": approval_req.get("scope")
|
|
160
|
+
or (first_command.split()[0] if first_command.strip() else "unknown"),
|
|
161
|
+
"risk_level": approval_req.get("risk_level") or "medium",
|
|
162
|
+
"rollback_hint": approval_req.get("rollback") or approval_req.get("rollback_hint"),
|
|
163
|
+
"rationale": approval_req.get("rationale")
|
|
164
|
+
or (
|
|
165
|
+
f"A batch of {len(command_set_items)} related T3 commands requires user "
|
|
166
|
+
"approval under one consent per the COMMAND_SET policy."
|
|
167
|
+
),
|
|
168
|
+
"commands": [it["command"] for it in command_set_items],
|
|
169
|
+
"command_set": command_set_items,
|
|
170
|
+
}
|
|
171
|
+
|
|
172
|
+
try:
|
|
173
|
+
from gaia.approvals.store import insert_requested
|
|
174
|
+
except ImportError:
|
|
175
|
+
import pathlib as _pl
|
|
176
|
+
import sys as _sys
|
|
177
|
+
|
|
178
|
+
_repo_root = _pl.Path(__file__).resolve().parent.parent.parent.parent
|
|
179
|
+
_sys.path.insert(0, str(_repo_root))
|
|
180
|
+
from gaia.approvals.store import insert_requested
|
|
181
|
+
|
|
182
|
+
approval_id = insert_requested(
|
|
183
|
+
sealed_payload,
|
|
184
|
+
agent_id=agent_id,
|
|
185
|
+
session_id=session_id or None,
|
|
186
|
+
)
|
|
187
|
+
logger.info(
|
|
188
|
+
"INTAKE: plan-first COMMAND_SET pending created approval_id=%s items=%d",
|
|
189
|
+
(approval_id or "")[:16], len(command_set_items),
|
|
190
|
+
)
|
|
191
|
+
return approval_id
|
|
192
|
+
|
|
193
|
+
|
|
18
194
|
def persist_handoff(
|
|
19
195
|
parsed_contract,
|
|
20
196
|
agent_output: str,
|
|
@@ -38,6 +214,38 @@ def persist_handoff(
|
|
|
38
214
|
import pathlib as _pl
|
|
39
215
|
import sys as _sys
|
|
40
216
|
|
|
217
|
+
agent_id = task_info.get("agent_id") or task_info.get("agent") or "unknown"
|
|
218
|
+
|
|
219
|
+
# ---------------------------------------------------------------------
|
|
220
|
+
# INTAKE bridge (plan-first COMMAND_SET) -- run FIRST and INDEPENDENTLY.
|
|
221
|
+
#
|
|
222
|
+
# Minting the pending COMMAND_SET approval is the security-critical path:
|
|
223
|
+
# it is the consent the user must act on. It must not be coupled to the
|
|
224
|
+
# audit handoff-row write below -- if insert_agent_contract_handoff fails
|
|
225
|
+
# for any reason, the user must still get the approval to review. So the
|
|
226
|
+
# intake runs in its own isolated try, before the handoff-row write.
|
|
227
|
+
#
|
|
228
|
+
# Only plan-first envelopes act here: command_set >= 2 items AND no
|
|
229
|
+
# approval_id. A <= 1 item set or a request that already carries an
|
|
230
|
+
# approval_id (hook-block / singular path) is a no-op for the intake.
|
|
231
|
+
# ---------------------------------------------------------------------
|
|
232
|
+
minted_command_set_id = None
|
|
233
|
+
if parsed_contract is not None:
|
|
234
|
+
_env = parsed_contract if isinstance(parsed_contract, dict) else {}
|
|
235
|
+
_approval_req = _env.get("approval_request")
|
|
236
|
+
if isinstance(_approval_req, dict):
|
|
237
|
+
try:
|
|
238
|
+
minted_command_set_id = _intake_command_set_pending(
|
|
239
|
+
_approval_req,
|
|
240
|
+
agent_id=agent_id,
|
|
241
|
+
session_id=session_id,
|
|
242
|
+
)
|
|
243
|
+
except Exception as _intake_exc:
|
|
244
|
+
logger.warning(
|
|
245
|
+
"M4: COMMAND_SET intake failed (non-blocking): %s",
|
|
246
|
+
_intake_exc,
|
|
247
|
+
)
|
|
248
|
+
|
|
41
249
|
try:
|
|
42
250
|
# Prefer a sibling gaia package if installed; fall back to the repo
|
|
43
251
|
# layout where gaia/ lives two levels above hooks/.
|
|
@@ -48,7 +256,6 @@ def persist_handoff(
|
|
|
48
256
|
_sys.path.insert(0, str(_repo_root))
|
|
49
257
|
from gaia.store import writer as _writer
|
|
50
258
|
|
|
51
|
-
agent_id = task_info.get("agent_id") or task_info.get("agent") or "unknown"
|
|
52
259
|
workspace = task_info.get("workspace") or _os.environ.get("GAIA_WORKSPACE") or "global"
|
|
53
260
|
db_path_str = task_info.get("db_path")
|
|
54
261
|
db_path = _pl.Path(db_path_str) if db_path_str else None
|
|
@@ -99,7 +306,12 @@ def persist_handoff(
|
|
|
99
306
|
envelope = parsed_contract if isinstance(parsed_contract, dict) else {}
|
|
100
307
|
approval_req = envelope.get("approval_request")
|
|
101
308
|
if approval_req and isinstance(approval_req, dict):
|
|
102
|
-
approval_id
|
|
309
|
+
# The approval_id is either the one the subagent relayed (hook-block
|
|
310
|
+
# / singular path) or the one the INTAKE bridge just minted for a
|
|
311
|
+
# plan-first COMMAND_SET. Either way it points at the pending row
|
|
312
|
+
# the handoff_approvals audit row should link to.
|
|
313
|
+
approval_id = approval_req.get("approval_id") or minted_command_set_id
|
|
314
|
+
|
|
103
315
|
if approval_id:
|
|
104
316
|
# Look up the grant to determine the decision at stop time.
|
|
105
317
|
try:
|
|
@@ -402,6 +402,31 @@ def parse_memorialize_suggestions(
|
|
|
402
402
|
return _extract_memorialize_suggestions(contract)
|
|
403
403
|
|
|
404
404
|
|
|
405
|
+
def parse_user_facing_summary(
    agent_output: str,
    parsed_contract: Optional[dict] = None,
) -> Optional[str]:
    """Parse the optional top-level ``user_facing_summary`` field (Option A).

    This is the ONE human-audience field in the contract: a brief prose summary
    the subagent writes once, intended for the user. The orchestrator relays it
    near-verbatim on a single-agent COMPLETE (N=1) instead of re-synthesizing
    ``key_outputs``; for N>1 it is ignored and synthesis proceeds.

    Strictly additive and advisory: the field is never required and never
    affects contract validity. To honour that, a contract that is not a dict
    (for example a list or string produced from malformed output) is treated
    as "no summary" rather than raising.

    Args:
        agent_output: Raw agent output; parsed with ``parse_contract`` only
            when ``parsed_contract`` is ``None``.
        parsed_contract: An already-parsed contract, used as-is when given.

    Returns:
        The trimmed summary when present and non-empty, otherwise ``None``
        (no contract, non-dict contract, field absent, null, blank, or
        non-string).
    """
    contract = parsed_contract if parsed_contract is not None else parse_contract(agent_output)
    if not isinstance(contract, dict):
        # Covers both "no contract" (None) and malformed non-dict contracts.
        return None
    raw = contract.get("user_facing_summary")
    if not isinstance(raw, str):
        return None
    return raw.strip() or None
|
|
428
|
+
|
|
429
|
+
|
|
405
430
|
def _is_resume_agent_id(value: str) -> bool:
|
|
406
431
|
return bool(_AGENT_ID_PATTERN.match(value or ""))
|
|
407
432
|
|
|
@@ -659,6 +684,7 @@ __all__ = [
|
|
|
659
684
|
"parse_evidence_report",
|
|
660
685
|
"parse_consolidation_report",
|
|
661
686
|
"parse_memorialize_suggestions",
|
|
687
|
+
"parse_user_facing_summary",
|
|
662
688
|
"validate_response_contract",
|
|
663
689
|
"save_validation_result",
|
|
664
690
|
"load_last_validation",
|
|
@@ -139,10 +139,25 @@ def extract_injected_context_payload_from_transcript(
|
|
|
139
139
|
"""
|
|
140
140
|
import os
|
|
141
141
|
|
|
142
|
+
# Empty/None path guard. Without it, Path("").stem == "" and the substring
|
|
143
|
+
# match below (``candidate.stem in "" or "" in candidate.stem``) is ALWAYS
|
|
144
|
+
# True because ``"" in any_string`` is True -- so an empty path would match
|
|
145
|
+
# (and return) the FIRST payload sitting in gaia-context-payloads/, making
|
|
146
|
+
# the result depend on whatever happens to be in that directory. Mirror the
|
|
147
|
+
# guard in read_first_user_content_from_transcript: no path, no match.
|
|
148
|
+
if not transcript_path:
|
|
149
|
+
return {}
|
|
150
|
+
|
|
142
151
|
try:
|
|
143
152
|
payload_dir = Path(os.environ.get("TMPDIR", "/tmp")) / "gaia-context-payloads"
|
|
144
153
|
if payload_dir.exists():
|
|
145
154
|
agent_file = Path(transcript_path).stem # e.g. "agent-ae190a4da68d626d4"
|
|
155
|
+
# A stem that came out empty (e.g. path was "/" or "."): nothing to
|
|
156
|
+
# match against, so the substring test would again degrade to the
|
|
157
|
+
# always-true ``"" in candidate.stem``. Bail rather than grab an
|
|
158
|
+
# arbitrary payload.
|
|
159
|
+
if not agent_file:
|
|
160
|
+
return {}
|
|
146
161
|
# Match by agent ID substring
|
|
147
162
|
for candidate in payload_dir.glob("*.json"):
|
|
148
163
|
if candidate.stem in agent_file or agent_file in candidate.stem:
|
|
@@ -5,7 +5,6 @@ Provides:
|
|
|
5
5
|
- tiers: SecurityTier enum and classification
|
|
6
6
|
- blocked_commands: Permanently blocked pattern matching
|
|
7
7
|
- mutative_verbs: Mutative verb detection (user approval workflow)
|
|
8
|
-
- gitops_validator: kubectl/helm/flux validation
|
|
9
8
|
- approval_constants: Approval token patterns (legacy APPROVE: and ElicitationResult)
|
|
10
9
|
- approval_grants: Time-limited T3 command passthrough after user approval
|
|
11
10
|
- shell_unwrapper: Detect and strip wrapper shells for inner command classification
|
|
@@ -21,7 +20,6 @@ from .blocked_commands import (
|
|
|
21
20
|
get_blocked_patterns,
|
|
22
21
|
BlockedCommandResult,
|
|
23
22
|
)
|
|
24
|
-
from .gitops_validator import validate_gitops_workflow, GitOpsValidationResult
|
|
25
23
|
from .mutative_verbs import (
|
|
26
24
|
CLI_FAMILY_LOOKUP,
|
|
27
25
|
CATEGORY_MUTATIVE,
|
|
@@ -73,9 +71,6 @@ __all__ = [
|
|
|
73
71
|
"is_blocked_command",
|
|
74
72
|
"get_blocked_patterns",
|
|
75
73
|
"BlockedCommandResult",
|
|
76
|
-
# GitOps
|
|
77
|
-
"validate_gitops_workflow",
|
|
78
|
-
"GitOpsValidationResult",
|
|
79
74
|
# Mutative verbs
|
|
80
75
|
"CLI_FAMILY_LOOKUP",
|
|
81
76
|
"CATEGORY_MUTATIVE",
|