ai-execution-protocol 0.3.1 → 0.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +5 -1
- package/README.md +41 -2
- package/behavior/audit-checklist.yaml +55 -0
- package/behavior/contract.yaml +156 -0
- package/dataset/README.md +38 -0
- package/dataset/raw-examples.md +36 -0
- package/dataset/train.jsonl +3 -0
- package/dataset/validation.jsonl +2 -0
- package/dist/minimal/AGENTS.md +4 -1
- package/dist/minimal/README.md +3 -0
- package/dist/minimal/behavior/audit-checklist.yaml +15 -0
- package/dist/minimal/behavior/contract.yaml +29 -0
- package/dist/minimal/canonical-state.yaml +1 -1
- package/dist/minimal/capabilities/registry.yaml +1 -1
- package/dist/minimal/context-map.yaml +1 -1
- package/dist/minimal/ide-rules/instruction-block.md +23 -0
- package/dist/minimal/memory/INDEX.yaml +1 -1
- package/dist/minimal/protocol/README.yaml +9 -1
- package/dist/minimal/protocol/capability-gate.yaml +56 -0
- package/dist/minimal/protocol/capability-router.yaml +1 -1
- package/dist/minimal/protocol/context-rules.yaml +2 -1
- package/dist/minimal/protocol/fast-path.yaml +6 -1
- package/dist/minimal/protocol/intelligence-router.yaml +63 -0
- package/dist/minimal/protocol/route-packs.yaml +38 -1
- package/dist/minimal/protocol/router.yaml +28 -1
- package/docs/00-visao-geral.md +41 -0
- package/docs/01-modelo-de-execucao.md +25 -0
- package/docs/02-niveis-de-risco.md +62 -0
- package/docs/03-mapeamento-antes-de-alterar.md +48 -0
- package/docs/04-janela-de-contexto.md +56 -0
- package/docs/05-validacao-e-entrega.md +48 -0
- package/docs/06-memoria-e-continuidade.md +27 -0
- package/docs/07-legibilidade-para-ia.md +47 -0
- package/docs/08-posicionamento.md +48 -0
- package/docs/09-governanca-de-mudancas.md +48 -0
- package/docs/10-economia-de-prompt.md +79 -0
- package/docs/11-retencao-de-resultados.md +26 -0
- package/docs/12-instalacao-em-outro-projeto.md +254 -0
- package/docs/13-uso-em-ides.md +137 -0
- package/docs/14-publicacao.md +128 -0
- package/docs/15-contexto-persistente.md +204 -0
- package/docs/16-release-e-atualizacao.md +146 -0
- package/docs/17-documentacao-atomica.md +117 -0
- package/docs/18-memoria-adaptativa.md +107 -0
- package/docs/19-orcamento-de-contexto.md +63 -0
- package/docs/20-validacao-seletiva.md +46 -0
- package/docs/21-roteamento-de-capacidades.md +121 -0
- package/docs/22-roadmap-v1.md +163 -0
- package/docs/23-contrato-comportamental.md +116 -0
- package/docs/24-gate-de-capacidades-e-inteligencia.md +109 -0
- package/docs/README.md +58 -0
- package/eval/README.md +27 -0
- package/eval/rubric.yaml +57 -0
- package/eval/sample-result.yaml +28 -0
- package/install-manifest.json +27 -2
- package/package.json +9 -2
- package/protocol/README.yaml +9 -1
- package/protocol/capability-gate.yaml +56 -0
- package/protocol/capability-router.yaml +1 -1
- package/protocol/context-rules.yaml +2 -1
- package/protocol/fast-path.yaml +6 -1
- package/protocol/intelligence-router.yaml +63 -0
- package/protocol/route-packs.yaml +38 -1
- package/protocol/router.yaml +28 -1
- package/roadmap/v1.yaml +139 -0
- package/schema/README.md +26 -0
- package/schema/behavior-contract.schema.json +31 -0
- package/schema/capability-registry.schema.json +51 -0
- package/schema/evaluated-response.schema.json +27 -0
- package/schema/evaluation-result.schema.json +32 -0
- package/schema/memory-entry.schema.json +55 -0
- package/schema/protocol-rule.schema.json +16 -0
- package/schema/protocol-rule.schema.yaml +28 -0
- package/schema/test-case.schema.json +44 -0
- package/schema/test-case.schema.yaml +37 -0
- package/scripts/README.md +46 -0
- package/scripts/build_dist.py +3 -0
- package/scripts/npm_install_protocol.js +60 -1
- package/scripts/verify_install.py +25 -0
- package/templates/minimal/AGENTS.md +4 -1
- package/templates/minimal/behavior/audit-checklist.yaml +15 -0
- package/templates/minimal/behavior/contract.yaml +29 -0
- package/templates/minimal/canonical-state.yaml +1 -1
- package/templates/minimal/capabilities/registry.yaml +1 -1
- package/templates/minimal/context-map.yaml +1 -1
- package/templates/minimal/ide-rules/instruction-block.md +23 -0
- package/templates/minimal/memory/INDEX.yaml +1 -1
- package/templates/minimal/protocol/capability-gate.yaml +10 -0
- package/templates/minimal/protocol/intelligence-router.yaml +10 -0
package/install-manifest.json
CHANGED
|
@@ -16,6 +16,8 @@
|
|
|
16
16
|
"persistent-context.yaml",
|
|
17
17
|
"adaptive-memory.yaml",
|
|
18
18
|
"capability-router.yaml",
|
|
19
|
+
"capability-gate.yaml",
|
|
20
|
+
"intelligence-router.yaml",
|
|
19
21
|
"formatting-rules.yaml",
|
|
20
22
|
"prompt-economy.yaml",
|
|
21
23
|
"spec-driven.yaml"
|
|
@@ -28,7 +30,9 @@
|
|
|
28
30
|
"decisions/README.md",
|
|
29
31
|
"memory/INDEX.yaml",
|
|
30
32
|
"candidate-memory/README.md",
|
|
31
|
-
"capabilities/registry.yaml"
|
|
33
|
+
"capabilities/registry.yaml",
|
|
34
|
+
"behavior/contract.yaml",
|
|
35
|
+
"behavior/audit-checklist.yaml"
|
|
32
36
|
],
|
|
33
37
|
"aiignore_lines": [
|
|
34
38
|
"results/",
|
|
@@ -45,7 +49,8 @@
|
|
|
45
49
|
"protocol/router.yaml",
|
|
46
50
|
"protocol/route-packs.yaml",
|
|
47
51
|
"Classifique o risco antes de agir",
|
|
48
|
-
"protocol/capability-router.yaml"
|
|
52
|
+
"protocol/capability-router.yaml",
|
|
53
|
+
"behavior/contract.yaml"
|
|
49
54
|
],
|
|
50
55
|
"memory/INDEX.yaml": [
|
|
51
56
|
"memory_index",
|
|
@@ -67,9 +72,29 @@
|
|
|
67
72
|
"minimum_capability_set",
|
|
68
73
|
"higher_risk_means_stricter_permissions_not_more_tools"
|
|
69
74
|
],
|
|
75
|
+
"protocol/capability-gate.yaml": [
|
|
76
|
+
"capability_gate",
|
|
77
|
+
"plan_before_use_audit_after_use",
|
|
78
|
+
"unplanned_use_is_protocol_failure"
|
|
79
|
+
],
|
|
80
|
+
"protocol/intelligence-router.yaml": [
|
|
81
|
+
"intelligence_router",
|
|
82
|
+
"cheapest_sufficient_intelligence",
|
|
83
|
+
"critical"
|
|
84
|
+
],
|
|
70
85
|
"capabilities/registry.yaml": [
|
|
71
86
|
"capability_registry",
|
|
72
87
|
"runtime_availability_must_be_verified"
|
|
88
|
+
],
|
|
89
|
+
"behavior/contract.yaml": [
|
|
90
|
+
"behavior_contract",
|
|
91
|
+
"Behavioral execution framework for safer AI agents",
|
|
92
|
+
"claimed_validation_must_match_performed_validation"
|
|
93
|
+
],
|
|
94
|
+
"behavior/audit-checklist.yaml": [
|
|
95
|
+
"behavior_audit_checklist",
|
|
96
|
+
"validation_truth",
|
|
97
|
+
"capability_economy"
|
|
73
98
|
]
|
|
74
99
|
}
|
|
75
100
|
}
|
package/package.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "ai-execution-protocol",
|
|
3
|
-
"version": "0.3.1",
|
|
3
|
+
"version": "0.4.0",
|
|
4
4
|
"private": false,
|
|
5
|
-
"description": "
|
|
5
|
+
"description": "Behavioral execution framework for safer AI agents, minimal context, risk control, validation, and evidence-based delivery.",
|
|
6
6
|
"license": "MIT",
|
|
7
7
|
"author": "AI Execution Protocol",
|
|
8
8
|
"homepage": "https://github.com/rodneigk2/ai-execution-protocol#readme",
|
|
@@ -35,6 +35,12 @@
|
|
|
35
35
|
"scripts/verify_install.py",
|
|
36
36
|
"install-manifest.json",
|
|
37
37
|
"protocol/",
|
|
38
|
+
"behavior/",
|
|
39
|
+
"dataset/",
|
|
40
|
+
"docs/",
|
|
41
|
+
"eval/",
|
|
42
|
+
"schema/",
|
|
43
|
+
"roadmap/",
|
|
38
44
|
"templates/minimal/",
|
|
39
45
|
"dist/minimal/"
|
|
40
46
|
],
|
|
@@ -43,6 +49,7 @@
|
|
|
43
49
|
"init-protocol": "node scripts/npm_install_protocol.js init",
|
|
44
50
|
"install-protocol": "node scripts/npm_install_protocol.js install",
|
|
45
51
|
"dry-run-protocol": "node scripts/npm_install_protocol.js install --dry-run",
|
|
52
|
+
"integrate-protocol": "node scripts/npm_install_protocol.js integrate",
|
|
46
53
|
"verify-protocol": "node scripts/npm_install_protocol.js verify"
|
|
47
54
|
}
|
|
48
55
|
}
|
package/protocol/README.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
id: protocol_index
|
|
2
2
|
type: index
|
|
3
3
|
format: yaml
|
|
4
|
-
protocol_version: 0.
|
|
4
|
+
protocol_version: 0.4.0
|
|
5
5
|
purpose: ai_operational_rules
|
|
6
6
|
source_docs: ../docs
|
|
7
7
|
constraints:
|
|
@@ -39,6 +39,14 @@ files:
|
|
|
39
39
|
purpose: maintain_verified_user_and_project_memory
|
|
40
40
|
- path: capability-router.yaml
|
|
41
41
|
purpose: select_minimum_skills_mcps_and_tools_by_value_cost_and_risk
|
|
42
|
+
- path: capability-gate.yaml
|
|
43
|
+
purpose: require_plan_before_capability_use_and_audit_after_use
|
|
44
|
+
- path: intelligence-router.yaml
|
|
45
|
+
purpose: choose_model_reasoning_effort_by_risk_and_complexity
|
|
46
|
+
- path: ../behavior/contract.yaml
|
|
47
|
+
purpose: define_observable_behavior_for_agent_adherence
|
|
48
|
+
- path: ../behavior/audit-checklist.yaml
|
|
49
|
+
purpose: final_self_audit_for_agent_adherence
|
|
42
50
|
- path: formatting-rules.yaml
|
|
43
51
|
purpose: ai_readable_file_format
|
|
44
52
|
- path: prompt-economy.yaml
|
package/protocol/capability-gate.yaml
ADDED
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
id: capability_gate
|
|
2
|
+
type: operational_rules
|
|
3
|
+
version: 0.4.0
|
|
4
|
+
purpose: gate_capability_use_before_skill_mcp_or_tool_invocation
|
|
5
|
+
principle: plan_before_use_audit_after_use
|
|
6
|
+
guarantee_boundary:
|
|
7
|
+
framework_can:
|
|
8
|
+
- require_capability_plan_before_use
|
|
9
|
+
- mark_unplanned_use_as_protocol_failure
|
|
10
|
+
- compare_used_capabilities_with_selected_capabilities
|
|
11
|
+
- block_high_risk_workflow_when_plan_is_missing
|
|
12
|
+
host_must:
|
|
13
|
+
- hide_or_disable_tools_for_physical_enforcement
|
|
14
|
+
- enforce_runtime_permissions
|
|
15
|
+
required_before_use:
|
|
16
|
+
- task_objective
|
|
17
|
+
- risk_level
|
|
18
|
+
- operation_scope
|
|
19
|
+
- requested_operations
|
|
20
|
+
- required_outcome_tags
|
|
21
|
+
- selected_capabilities
|
|
22
|
+
- confirmation_status_when_required
|
|
23
|
+
allowed_states:
|
|
24
|
+
planned:
|
|
25
|
+
meaning: selected_but_not_invoked
|
|
26
|
+
used:
|
|
27
|
+
meaning: invoked_within_plan_and_scope
|
|
28
|
+
blocked:
|
|
29
|
+
meaning: needed_but_missing_or_unconfirmed
|
|
30
|
+
violation:
|
|
31
|
+
meaning: used_without_plan_or_outside_scope
|
|
32
|
+
rules:
|
|
33
|
+
- no_skill_mcp_or_remote_tool_before_capability_plan
|
|
34
|
+
- local_read_can_be_implicit_only_for_level_0_or_1_basic_navigation
|
|
35
|
+
- level_2_or_3_requires_explicit_capability_plan
|
|
36
|
+
- publish_write_or_destructive_requires_confirmation_when_policy_requires
|
|
37
|
+
- used_capability_must_be_subset_of_selected_capabilities
|
|
38
|
+
- unplanned_use_is_protocol_failure
|
|
39
|
+
- missing_required_capability_blocks_high_risk_workflow
|
|
40
|
+
audit:
|
|
41
|
+
compare:
|
|
42
|
+
- selected_capabilities
|
|
43
|
+
- used_capabilities
|
|
44
|
+
- operation_scope
|
|
45
|
+
- confirmation_status
|
|
46
|
+
fail_when:
|
|
47
|
+
- used_not_selected
|
|
48
|
+
- used_for_unapproved_operation
|
|
49
|
+
- used_after_blocked_status
|
|
50
|
+
- publish_without_confirmation
|
|
51
|
+
delivery:
|
|
52
|
+
include_for_level_2_or_3:
|
|
53
|
+
- capability_plan_summary
|
|
54
|
+
- used_capabilities
|
|
55
|
+
- gate_status
|
|
56
|
+
- violations_if_any
|
package/protocol/context-rules.yaml
CHANGED
|
@@ -70,6 +70,7 @@ existing_project_files:
|
|
|
70
70
|
- .cursorrules
|
|
71
71
|
- CLAUDE.md
|
|
72
72
|
- .github/copilot-instructions.md
|
|
73
|
+
- .cursor/rules/ai-execution-protocol.mdc
|
|
73
74
|
- package_docs
|
|
74
75
|
- framework_configs
|
|
75
76
|
behavior:
|
|
@@ -78,7 +79,7 @@ existing_project_files:
|
|
|
78
79
|
- treat_generated_or_old_docs_as_untrusted_until_verified
|
|
79
80
|
- keep_protocol_rules_in_AGENTS_and_protocol_folder
|
|
80
81
|
- use_framework_configs_as_technical_source_when_task_touches_framework
|
|
81
|
-
-
|
|
82
|
+
- duplicate_protocol_rules_across_ide_files_only_with_marked_integration
|
|
82
83
|
conflict_order:
|
|
83
84
|
- current_user_request
|
|
84
85
|
- AGENTS_protocol_block
|
package/protocol/fast-path.yaml
CHANGED
|
@@ -1,12 +1,14 @@
|
|
|
1
1
|
id: fast_path
|
|
2
2
|
type: agent_entrypoint
|
|
3
|
-
version: 0.
|
|
3
|
+
version: 0.4.0
|
|
4
4
|
purpose: minimum_rules_to_start_any_task
|
|
5
5
|
read_next:
|
|
6
6
|
- router.yaml
|
|
7
7
|
- route-packs.yaml
|
|
8
8
|
- context-budget.yaml
|
|
9
9
|
- capability-router.yaml
|
|
10
|
+
- capability-gate.yaml
|
|
11
|
+
- intelligence-router.yaml
|
|
10
12
|
- modes.yaml
|
|
11
13
|
core_rules:
|
|
12
14
|
- classify_risk_before_action
|
|
@@ -26,6 +28,9 @@ core_rules:
|
|
|
26
28
|
- check_memory_update_result_after_task
|
|
27
29
|
- use_selective_validation_by_blast_radius
|
|
28
30
|
- select_minimum_capability_set_before_loading_skills_or_mcps
|
|
31
|
+
- require_capability_plan_before_skill_mcp_or_remote_tool_use
|
|
32
|
+
- choose_intelligence_level_proportional_to_risk_and_complexity
|
|
33
|
+
- follow_behavioral_execution_contract
|
|
29
34
|
risk_short:
|
|
30
35
|
level_0: answer_only
|
|
31
36
|
level_1: small_clear_reversible_isolated_change
|
package/protocol/intelligence-router.yaml
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
1
|
+
id: intelligence_router
|
|
2
|
+
type: operational_rules
|
|
3
|
+
version: 0.4.0
|
|
4
|
+
purpose: choose_model_reasoning_and_effort_proportional_to_task_need
|
|
5
|
+
principle: use_the_cheapest_sufficient_intelligence_without_trading_correctness
|
|
6
|
+
levels:
|
|
7
|
+
minimal:
|
|
8
|
+
use_when:
|
|
9
|
+
- level_0_direct_answer
|
|
10
|
+
- no_current_external_data_needed
|
|
11
|
+
- no_file_change
|
|
12
|
+
model_need: low_cost_fast
|
|
13
|
+
reasoning_depth: low
|
|
14
|
+
tools: none
|
|
15
|
+
standard:
|
|
16
|
+
use_when:
|
|
17
|
+
- level_1_small_change
|
|
18
|
+
- focused_file_read
|
|
19
|
+
- simple_validation
|
|
20
|
+
model_need: default
|
|
21
|
+
reasoning_depth: medium
|
|
22
|
+
tools: local_only
|
|
23
|
+
deep:
|
|
24
|
+
use_when:
|
|
25
|
+
- level_2_flow_bug
|
|
26
|
+
- refactor
|
|
27
|
+
- ambiguous_impact
|
|
28
|
+
- failed_first_validation
|
|
29
|
+
model_need: stronger_or_more_reasoning
|
|
30
|
+
reasoning_depth: high
|
|
31
|
+
tools: selected_local_or_targeted_remote
|
|
32
|
+
critical:
|
|
33
|
+
use_when:
|
|
34
|
+
- level_3_data_auth_security_deploy_publish_destructive
|
|
35
|
+
- high_blast_radius
|
|
36
|
+
- irreversible_or_external_side_effect
|
|
37
|
+
model_need: strongest_available_for_task
|
|
38
|
+
reasoning_depth: high_with_audit
|
|
39
|
+
tools: least_privilege_confirmed
|
|
40
|
+
escalate_when:
|
|
41
|
+
- risk_level_increases
|
|
42
|
+
- ambiguity_blocks_safe_action
|
|
43
|
+
- validation_fails
|
|
44
|
+
- context_conflict_detected
|
|
45
|
+
- external_current_data_is_required
|
|
46
|
+
- specialized_modality_is_required
|
|
47
|
+
deescalate_when:
|
|
48
|
+
- task_is_direct_answer
|
|
49
|
+
- no_code_or_external_state_needed
|
|
50
|
+
- validation_plan_is_trivial
|
|
51
|
+
- previous_high_risk_assumption_is_not_supported_by_evidence
|
|
52
|
+
never_trade:
|
|
53
|
+
- security
|
|
54
|
+
- correctness
|
|
55
|
+
- required_validation
|
|
56
|
+
- explicit_user_scope
|
|
57
|
+
delivery:
|
|
58
|
+
include_when_level_2_or_3:
|
|
59
|
+
- intelligence_level
|
|
60
|
+
- escalation_reason_if_any
|
|
61
|
+
- why_lower_level_was_not_enough
|
|
62
|
+
omit_for_level_0:
|
|
63
|
+
- model_discussion_unless_user_asks
|
package/protocol/route-packs.yaml
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
id: route_packs
|
|
2
2
|
type: route_summary_index
|
|
3
|
-
version: 0.
|
|
3
|
+
version: 0.4.0
|
|
4
4
|
purpose: compact_first_read_before_full_route_files
|
|
5
5
|
principle: read_pack_first_expand_only_when_needed
|
|
6
6
|
use:
|
|
@@ -120,10 +120,12 @@ packs:
|
|
|
120
120
|
- run_post_deploy_check_if_executed
|
|
121
121
|
evaluate_response:
|
|
122
122
|
read_if_pack_insufficient:
|
|
123
|
+
- ../behavior/contract.yaml
|
|
123
124
|
- ../eval/rubric.yaml
|
|
124
125
|
- ../schema/evaluated-response.schema.json
|
|
125
126
|
do:
|
|
126
127
|
- score_risk_behavior_avoidance_delivery_clarity
|
|
128
|
+
- check_behavior_contract_alignment
|
|
127
129
|
- apply_automatic_fail_rules
|
|
128
130
|
create_or_edit_yaml:
|
|
129
131
|
read_if_pack_insufficient:
|
|
@@ -186,10 +188,45 @@ packs:
|
|
|
186
188
|
risk: adaptive
|
|
187
189
|
read_if_pack_insufficient:
|
|
188
190
|
- capability-router.yaml
|
|
191
|
+
- capability-gate.yaml
|
|
189
192
|
- context-budget.yaml
|
|
190
193
|
do:
|
|
191
194
|
- define_required_outcomes_and_operations
|
|
192
195
|
- select_smallest_available_capability_set
|
|
193
196
|
- load_only_selected_skill_or_mcp
|
|
194
197
|
- require_confirmation_for_sensitive_remote_effect
|
|
198
|
+
- audit_used_capabilities_against_selected_plan
|
|
195
199
|
- stop_discovery_when_quality_coverage_is_complete
|
|
200
|
+
intelligence_selection:
|
|
201
|
+
risk: adaptive
|
|
202
|
+
read_if_pack_insufficient:
|
|
203
|
+
- intelligence-router.yaml
|
|
204
|
+
- context-budget.yaml
|
|
205
|
+
do:
|
|
206
|
+
- choose_cheapest_sufficient_intelligence_level
|
|
207
|
+
- escalate_for_risk_ambiguity_validation_failure_or_large_context
|
|
208
|
+
- deescalate_when_task_is_direct_and_low_risk
|
|
209
|
+
- do_not_trade_security_correctness_or_validation_for_cost
|
|
210
|
+
behavior_evaluation:
|
|
211
|
+
risk: 1
|
|
212
|
+
read_if_pack_insufficient:
|
|
213
|
+
- ../behavior/contract.yaml
|
|
214
|
+
- ../behavior/audit-checklist.yaml
|
|
215
|
+
- ../eval/rubric.yaml
|
|
216
|
+
do:
|
|
217
|
+
- compare_response_to_observable_behaviors
|
|
218
|
+
- verify_simple_tasks_are_not_overprocessed
|
|
219
|
+
- verify_critical_tasks_are_not_undercontrolled
|
|
220
|
+
- apply_behavior_automatic_fail_rules
|
|
221
|
+
dataset_preparation:
|
|
222
|
+
risk: 1
|
|
223
|
+
read_if_pack_insufficient:
|
|
224
|
+
- ../behavior/contract.yaml
|
|
225
|
+
- ../behavior/audit-checklist.yaml
|
|
226
|
+
- prompt-economy.yaml
|
|
227
|
+
- ../dataset/README.md
|
|
228
|
+
do:
|
|
229
|
+
- create_examples_from_observable_behavior
|
|
230
|
+
- include_good_bad_and_reason
|
|
231
|
+
- keep_training_examples_consistent
|
|
232
|
+
- avoid_rewarding_bureaucracy
|
package/protocol/router.yaml
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
id: protocol_router
|
|
2
2
|
type: read_router
|
|
3
|
-
version: 0.
|
|
3
|
+
version: 0.4.0
|
|
4
4
|
purpose: choose_minimum_protocol_files_by_task
|
|
5
5
|
default_read:
|
|
6
6
|
- fast-path.yaml
|
|
@@ -76,8 +76,17 @@ routes:
|
|
|
76
76
|
evaluate_response:
|
|
77
77
|
read:
|
|
78
78
|
- fast-path.yaml
|
|
79
|
+
- ../behavior/contract.yaml
|
|
79
80
|
- ../eval/rubric.yaml
|
|
80
81
|
- ../schema/evaluated-response.schema.json
|
|
82
|
+
behavior_evaluation:
|
|
83
|
+
risk: 1
|
|
84
|
+
read:
|
|
85
|
+
- fast-path.yaml
|
|
86
|
+
- ../behavior/contract.yaml
|
|
87
|
+
- ../behavior/audit-checklist.yaml
|
|
88
|
+
- ../eval/rubric.yaml
|
|
89
|
+
- ../dataset/README.md
|
|
81
90
|
create_or_edit_yaml:
|
|
82
91
|
read:
|
|
83
92
|
- fast-path.yaml
|
|
@@ -118,7 +127,22 @@ routes:
|
|
|
118
127
|
read:
|
|
119
128
|
- fast-path.yaml
|
|
120
129
|
- capability-router.yaml
|
|
130
|
+
- capability-gate.yaml
|
|
131
|
+
- context-budget.yaml
|
|
132
|
+
intelligence_selection:
|
|
133
|
+
risk: adaptive
|
|
134
|
+
read:
|
|
135
|
+
- fast-path.yaml
|
|
136
|
+
- intelligence-router.yaml
|
|
121
137
|
- context-budget.yaml
|
|
138
|
+
dataset_preparation:
|
|
139
|
+
risk: 1
|
|
140
|
+
read:
|
|
141
|
+
- fast-path.yaml
|
|
142
|
+
- ../behavior/contract.yaml
|
|
143
|
+
- ../behavior/audit-checklist.yaml
|
|
144
|
+
- prompt-economy.yaml
|
|
145
|
+
- ../dataset/README.md
|
|
122
146
|
rules:
|
|
123
147
|
- start_with_default_read
|
|
124
148
|
- choose_one_route_if_task_type_is_clear
|
|
@@ -127,6 +151,9 @@ rules:
|
|
|
127
151
|
- apply_context_budget_to_selected_route
|
|
128
152
|
- retrieve_only_matching_memory_subjects
|
|
129
153
|
- select_capabilities_before_loading_skill_or_connecting_mcp
|
|
154
|
+
- require_capability_gate_before_invocation
|
|
155
|
+
- route_model_or_reasoning_effort_by_risk_and_complexity
|
|
156
|
+
- use_behavior_contract_when_task_is_about_adherence_dataset_or_training
|
|
130
157
|
- if_route_unclear_read_risk_levels_then_choose_route
|
|
131
158
|
- do_not_read_docs_unless_protocol_is_insufficient
|
|
132
159
|
- do_not_read_cases_unless_testing_or_comparing_behavior
|
package/roadmap/v1.yaml
ADDED
|
@@ -0,0 +1,139 @@
|
|
|
1
|
+
id: roadmap_v1
|
|
2
|
+
type: release_roadmap
|
|
3
|
+
version: 0.1
|
|
4
|
+
target_release: 1.0.0
|
|
5
|
+
purpose: guide_each_update_until_public_v1
|
|
6
|
+
status: active
|
|
7
|
+
principle:
|
|
8
|
+
- do_not_market_as_stable_before_v1
|
|
9
|
+
- each_release_must_close_one_maturity_gap
|
|
10
|
+
- prove_context_economy_quality_and_safety_with_examples
|
|
11
|
+
- keep_protocol_core_stable_before_broad_public_launch
|
|
12
|
+
current_position:
|
|
13
|
+
current_series: 0.4.x
|
|
14
|
+
maturity: behavioral_execution_layer
|
|
15
|
+
public_positioning: experimental_until_v1
|
|
16
|
+
publish_strategy: publish_packages_for_testing_not_broad_marketing
|
|
17
|
+
v1_success_criteria:
|
|
18
|
+
protocol_stability:
|
|
19
|
+
- risk_levels_stable
|
|
20
|
+
- context_budget_stable
|
|
21
|
+
- adaptive_memory_stable
|
|
22
|
+
- capability_routing_stable
|
|
23
|
+
- selective_validation_stable
|
|
24
|
+
evidence:
|
|
25
|
+
- real_cases_documented
|
|
26
|
+
- before_after_examples_available
|
|
27
|
+
- benchmark_report_current
|
|
28
|
+
- install_and_update_flow_verified
|
|
29
|
+
adoption:
|
|
30
|
+
- codex_guide_clear
|
|
31
|
+
- other_agent_portability_documented
|
|
32
|
+
- troubleshooting_documented
|
|
33
|
+
- contribution_rules_clear
|
|
34
|
+
safety:
|
|
35
|
+
- secret_handling_documented
|
|
36
|
+
- sensitive_actions_require_confirmation
|
|
37
|
+
- memory_deduplication_and_replacement_validated
|
|
38
|
+
- capability_permissions_follow_least_privilege
|
|
39
|
+
release_path:
|
|
40
|
+
- version: 0.3.x
|
|
41
|
+
goal: harden_current_capability_context_memory_stack
|
|
42
|
+
status: completed
|
|
43
|
+
exit_criteria:
|
|
44
|
+
- capability_routing_documented_and_tested
|
|
45
|
+
- docs_commands_and_install_flow_stay_synced
|
|
46
|
+
- no_known_packaging_gap_blocks_testing
|
|
47
|
+
- version: 0.4.0
|
|
48
|
+
goal: add_behavioral_execution_contract_and_economy_reports
|
|
49
|
+
status: current
|
|
50
|
+
focus:
|
|
51
|
+
- behavioral_contract
|
|
52
|
+
- trainable_behavior_units
|
|
53
|
+
- token_and_file_read_savings
|
|
54
|
+
- tools_avoided
|
|
55
|
+
- validation_cost_by_risk
|
|
56
|
+
- quality_preserved_examples
|
|
57
|
+
exit_criteria:
|
|
58
|
+
- behavior_contract_is_installed_and_validated
|
|
59
|
+
- benchmark_report_has_clear_before_after_numbers
|
|
60
|
+
- benchmark_can_be_reproduced_locally
|
|
61
|
+
- version: 0.5.0
|
|
62
|
+
goal: add_real_world_cases
|
|
63
|
+
focus:
|
|
64
|
+
- simple_task
|
|
65
|
+
- medium_risk_bug
|
|
66
|
+
- docs_update
|
|
67
|
+
- capability_or_mcp_task
|
|
68
|
+
- memory_update_task
|
|
69
|
+
- release_task
|
|
70
|
+
exit_criteria:
|
|
71
|
+
- at_least_6_real_or_realistic_cases
|
|
72
|
+
- each_case_has_context_used_validation_and_outcome
|
|
73
|
+
- version: 0.6.0
|
|
74
|
+
goal: document_portability_beyond_codex
|
|
75
|
+
focus:
|
|
76
|
+
- codex_primary_flow
|
|
77
|
+
- cursor_adaptation
|
|
78
|
+
- claude_or_generic_agent_adaptation
|
|
79
|
+
- mcp_capability_boundaries
|
|
80
|
+
exit_criteria:
|
|
81
|
+
- portability_limits_are_explicit
|
|
82
|
+
- codex_specific_rules_are_separated_from_generic_rules
|
|
83
|
+
- version: 0.7.0
|
|
84
|
+
goal: harden_schemas_validation_and_health_checks
|
|
85
|
+
focus:
|
|
86
|
+
- schema_coverage
|
|
87
|
+
- health_check_coverage
|
|
88
|
+
- install_manifest_consistency
|
|
89
|
+
- package_content_checks
|
|
90
|
+
exit_criteria:
|
|
91
|
+
- health_check_catches_missing_core_files
|
|
92
|
+
- release_checks_cover_docs_protocol_templates_and_packages
|
|
93
|
+
- version: 0.8.0
|
|
94
|
+
goal: finish_adoption_documentation
|
|
95
|
+
focus:
|
|
96
|
+
- getting_started
|
|
97
|
+
- install_update_verify
|
|
98
|
+
- project_adaptation
|
|
99
|
+
- troubleshooting
|
|
100
|
+
- contribution_guidelines
|
|
101
|
+
exit_criteria:
|
|
102
|
+
- new_user_can_install_verify_and_understand_core_flow
|
|
103
|
+
- docs_are_atomic_and_indexed
|
|
104
|
+
- version: 0.9.0
|
|
105
|
+
goal: release_candidate
|
|
106
|
+
focus:
|
|
107
|
+
- freeze_core_contracts
|
|
108
|
+
- remove_or_mark_unstable_experimental_parts
|
|
109
|
+
- run_full_validation
|
|
110
|
+
- prepare_v1_release_notes
|
|
111
|
+
exit_criteria:
|
|
112
|
+
- no_known_blocker_for_v1
|
|
113
|
+
- docs_and_protocol_are_consistent
|
|
114
|
+
- packages_install_cleanly
|
|
115
|
+
- version: 1.0.0
|
|
116
|
+
goal: stable_public_release
|
|
117
|
+
focus:
|
|
118
|
+
- stable_protocol_core
|
|
119
|
+
- clear_public_positioning
|
|
120
|
+
- reproducible_evidence
|
|
121
|
+
- safe_installation
|
|
122
|
+
exit_criteria:
|
|
123
|
+
- v1_success_criteria_met
|
|
124
|
+
update_rule:
|
|
125
|
+
before_each_release:
|
|
126
|
+
- read_this_roadmap
|
|
127
|
+
- choose_next_smallest_maturity_gap
|
|
128
|
+
- update_docs_protocol_tests_when_behavior_changes
|
|
129
|
+
- record_completed_and_remaining_exit_criteria
|
|
130
|
+
after_each_release:
|
|
131
|
+
- update_current_position
|
|
132
|
+
- mark_exit_criteria_done_or_pending
|
|
133
|
+
- update_docs_22_roadmap_v1
|
|
134
|
+
- keep_changelog_release_notes_synced
|
|
135
|
+
avoid:
|
|
136
|
+
- broad_marketing_before_v1
|
|
137
|
+
- claiming_security_guarantees
|
|
138
|
+
- changing_core_terms_without_migration_note
|
|
139
|
+
- adding_new_surfaces_without_tests_or_docs
|
package/schema/README.md
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
# Schemas
|
|
2
|
+
|
|
3
|
+
Esta pasta descreve o formato esperado dos arquivos YAML.
|
|
4
|
+
|
|
5
|
+
Os schemas sao leves e servem como contrato de organizacao. Eles ajudam a IA a
|
|
6
|
+
manter arquivos parecidos entre si.
|
|
7
|
+
|
|
8
|
+
## Arquivos
|
|
9
|
+
|
|
10
|
+
- [protocol-rule.schema.yaml](./protocol-rule.schema.yaml): formato de regra
|
|
11
|
+
operacional.
|
|
12
|
+
- [test-case.schema.yaml](./test-case.schema.yaml): formato de caso de teste.
|
|
13
|
+
- [protocol-rule.schema.json](./protocol-rule.schema.json): JSON Schema
|
|
14
|
+
validavel para regras operacionais.
|
|
15
|
+
- [test-case.schema.json](./test-case.schema.json): JSON Schema validavel para
|
|
16
|
+
casos.
|
|
17
|
+
- [evaluated-response.schema.json](./evaluated-response.schema.json): JSON
|
|
18
|
+
Schema validavel para respostas avaliaveis.
|
|
19
|
+
- [evaluation-result.schema.json](./evaluation-result.schema.json): JSON Schema
|
|
20
|
+
validavel para resultados.
|
|
21
|
+
- [memory-entry.schema.json](./memory-entry.schema.json): contrato de uma
|
|
22
|
+
entrada de memoria adaptativa.
|
|
23
|
+
- [capability-registry.schema.json](./capability-registry.schema.json):
|
|
24
|
+
contrato do registro de skills, MCPs e ferramentas.
|
|
25
|
+
- [behavior-contract.schema.json](./behavior-contract.schema.json): contrato
|
|
26
|
+
da camada comportamental observavel.
|
package/schema/behavior-contract.schema.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://ai-research.local/schema/behavior-contract.schema.json",
|
|
4
|
+
"title": "Behavior contract",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"required": [
|
|
7
|
+
"id",
|
|
8
|
+
"type",
|
|
9
|
+
"version",
|
|
10
|
+
"purpose",
|
|
11
|
+
"principle",
|
|
12
|
+
"automatic_fail_when"
|
|
13
|
+
],
|
|
14
|
+
"properties": {
|
|
15
|
+
"id": { "type": "string" },
|
|
16
|
+
"type": { "const": "behavior_contract" },
|
|
17
|
+
"version": { "type": ["string", "number"] },
|
|
18
|
+
"purpose": { "type": "string" },
|
|
19
|
+
"subtitle": { "type": "string" },
|
|
20
|
+
"status": { "type": "string" },
|
|
21
|
+
"principle": { "type": "array", "items": { "type": "string" } },
|
|
22
|
+
"scope": { "type": "object" },
|
|
23
|
+
"behavior_sets": { "type": "array" },
|
|
24
|
+
"core_behaviors": { "type": "array", "items": { "type": "string" } },
|
|
25
|
+
"trainable_units": { "type": "array" },
|
|
26
|
+
"evaluation_dimensions": { "type": "array" },
|
|
27
|
+
"automatic_fail_when": { "type": "array", "items": { "type": "string" } },
|
|
28
|
+
"dataset_policy": { "type": "object" }
|
|
29
|
+
},
|
|
30
|
+
"additionalProperties": false
|
|
31
|
+
}
|
package/schema/capability-registry.schema.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
1
|
+
{
|
|
2
|
+
"$schema": "https://json-schema.org/draft/2020-12/schema",
|
|
3
|
+
"$id": "https://ai-research.local/schema/capability-registry.schema.json",
|
|
4
|
+
"title": "Capability registry",
|
|
5
|
+
"type": "object",
|
|
6
|
+
"required": ["id", "type", "version", "capabilities"],
|
|
7
|
+
"properties": {
|
|
8
|
+
"id": { "type": "string" },
|
|
9
|
+
"type": { "const": "capability_registry" },
|
|
10
|
+
"version": { "type": ["string", "number"] },
|
|
11
|
+
"purpose": { "type": "string" },
|
|
12
|
+
"policy": { "type": "object" },
|
|
13
|
+
"capabilities": {
|
|
14
|
+
"type": "array",
|
|
15
|
+
"items": {
|
|
16
|
+
"type": "object",
|
|
17
|
+
"required": [
|
|
18
|
+
"id",
|
|
19
|
+
"type",
|
|
20
|
+
"available",
|
|
21
|
+
"tags",
|
|
22
|
+
"operations",
|
|
23
|
+
"cost",
|
|
24
|
+
"side_effect",
|
|
25
|
+
"confirmation"
|
|
26
|
+
],
|
|
27
|
+
"properties": {
|
|
28
|
+
"id": { "type": "string" },
|
|
29
|
+
"type": {
|
|
30
|
+
"enum": [
|
|
31
|
+
"built_in_reasoning",
|
|
32
|
+
"local_tool",
|
|
33
|
+
"skill",
|
|
34
|
+
"mcp",
|
|
35
|
+
"remote_service"
|
|
36
|
+
]
|
|
37
|
+
},
|
|
38
|
+
"available": { "type": ["boolean", "string"] },
|
|
39
|
+
"tags": { "type": "array", "items": { "type": "string" } },
|
|
40
|
+
"operations": { "type": "array", "items": { "type": "string" } },
|
|
41
|
+
"cost": { "type": "object" },
|
|
42
|
+
"side_effect": { "type": "string" },
|
|
43
|
+
"confirmation": { "type": "string" },
|
|
44
|
+
"depends_on": { "type": "array", "items": { "type": "string" } }
|
|
45
|
+
},
|
|
46
|
+
"additionalProperties": false
|
|
47
|
+
}
|
|
48
|
+
}
|
|
49
|
+
},
|
|
50
|
+
"additionalProperties": false
|
|
51
|
+
}
|