agent-os-kernel 1.1.0__py3-none-any.whl → 1.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agent_os/__init__.py +66 -4
- agent_os/agents_compat.py +286 -0
- agent_os/base_agent.py +308 -0
- agent_os/cli.py +1079 -19
- agent_os/integrations/__init__.py +37 -2
- agent_os/integrations/openai_adapter.py +502 -0
- agent_os/integrations/semantic_kernel_adapter.py +569 -0
- agent_os/stateless.py +349 -0
- agent_os_kernel-1.2.0.dist-info/METADATA +676 -0
- agent_os_kernel-1.2.0.dist-info/RECORD +1053 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/entry_points.txt +0 -1
- modules/amb/.github/workflows/ci.yml +102 -0
- modules/amb/.github/workflows/publish.yml +146 -0
- modules/amb/.gitignore +134 -0
- modules/amb/CHANGELOG.md +118 -0
- modules/amb/CONTRIBUTING.md +141 -0
- modules/amb/LICENSE +21 -0
- modules/amb/README.md +188 -0
- modules/amb/amb_core/__init__.py +175 -0
- modules/amb/amb_core/adapters/__init__.py +55 -0
- modules/amb/amb_core/adapters/aws_sqs_broker.py +374 -0
- modules/amb/amb_core/adapters/azure_servicebus_broker.py +338 -0
- modules/amb/amb_core/adapters/kafka_broker.py +258 -0
- modules/amb/amb_core/adapters/nats_broker.py +283 -0
- modules/amb/amb_core/adapters/rabbitmq_broker.py +233 -0
- modules/amb/amb_core/adapters/redis_broker.py +260 -0
- modules/amb/amb_core/broker.py +143 -0
- modules/amb/amb_core/bus.py +479 -0
- modules/amb/amb_core/cloudevents.py +507 -0
- modules/amb/amb_core/dlq.py +343 -0
- modules/amb/amb_core/hf_utils.py +534 -0
- modules/amb/amb_core/memory_broker.py +408 -0
- modules/amb/amb_core/models.py +139 -0
- modules/amb/amb_core/persistence.py +527 -0
- modules/amb/amb_core/schema.py +292 -0
- modules/amb/amb_core/tracing.py +356 -0
- modules/amb/examples/advanced_features.py +223 -0
- modules/amb/examples/backpressure_demo.py +225 -0
- modules/amb/examples/basic_usage.py +117 -0
- modules/amb/examples/tracing_demo.py +104 -0
- modules/amb/experiments/README.md +52 -0
- modules/amb/experiments/reproduce_results.py +467 -0
- modules/amb/experiments/results.json +324 -0
- modules/amb/paper/README.md +40 -0
- modules/amb/paper/paper.tex +365 -0
- modules/amb/paper/whitepaper.md +377 -0
- modules/amb/pyproject.toml +117 -0
- modules/amb/tests/__init__.py +1 -0
- modules/amb/tests/test_backpressure_priority.py +280 -0
- modules/amb/tests/test_bus.py +198 -0
- modules/amb/tests/test_cloudevents.py +443 -0
- modules/amb/tests/test_features.py +531 -0
- modules/amb/tests/test_models.py +74 -0
- modules/amb/tests/test_tracing.py +254 -0
- modules/atr/.github/workflows/ci.yml +101 -0
- modules/atr/.github/workflows/publish.yml +140 -0
- modules/atr/.gitignore +134 -0
- modules/atr/.pre-commit-config.yaml +37 -0
- modules/atr/CHANGELOG.md +39 -0
- modules/atr/CONTRIBUTING.md +96 -0
- modules/atr/IMPLEMENTATION_SUMMARY.md +143 -0
- modules/atr/README.md +180 -0
- modules/atr/atr/__init__.py +638 -0
- modules/atr/atr/access.py +346 -0
- modules/atr/atr/composition.py +643 -0
- modules/atr/atr/decorator.py +355 -0
- modules/atr/atr/executor.py +382 -0
- modules/atr/atr/health.py +555 -0
- modules/atr/atr/hf_utils.py +447 -0
- modules/atr/atr/injection.py +420 -0
- modules/atr/atr/metrics.py +438 -0
- modules/atr/atr/policies.py +401 -0
- modules/atr/atr/py.typed +2 -0
- modules/atr/atr/registry.py +450 -0
- modules/atr/atr/schema.py +478 -0
- modules/atr/atr/tools/safe/__init__.py +73 -0
- modules/atr/atr/tools/safe/calculator.py +380 -0
- modules/atr/atr/tools/safe/datetime_tool.py +441 -0
- modules/atr/atr/tools/safe/file_reader.py +400 -0
- modules/atr/atr/tools/safe/http_client.py +314 -0
- modules/atr/atr/tools/safe/json_parser.py +372 -0
- modules/atr/atr/tools/safe/text_tool.py +526 -0
- modules/atr/atr/tools/safe/toolkit.py +173 -0
- modules/atr/docs/PYPI_SETUP.md +113 -0
- modules/atr/examples/README.md +27 -0
- modules/atr/examples/demo.py +144 -0
- modules/atr/examples/sandbox_demo.py +218 -0
- modules/atr/experiments/README.md +69 -0
- modules/atr/experiments/reproduce_results.py +509 -0
- modules/atr/experiments/results/.gitkeep +0 -0
- modules/atr/experiments/results/results_20260123_140334.json +71 -0
- modules/atr/paper/README.md +36 -0
- modules/atr/paper/figures/.gitkeep +0 -0
- modules/atr/paper/references.bib +84 -0
- modules/atr/paper/structure.tex +293 -0
- modules/atr/paper/whitepaper.md +234 -0
- modules/atr/pyproject.toml +148 -0
- modules/atr/requirements.txt +1 -0
- modules/atr/setup.py +30 -0
- modules/atr/tests/__init__.py +1 -0
- modules/atr/tests/test_decorator.py +317 -0
- modules/atr/tests/test_executor.py +245 -0
- modules/atr/tests/test_integration_executor.py +184 -0
- modules/atr/tests/test_registry.py +312 -0
- modules/atr/tests/test_schema.py +182 -0
- modules/atr/tests/test_v2_features.py +708 -0
- modules/caas/.dockerignore +63 -0
- modules/caas/.github/ISSUE_TEMPLATE/bug_report.md +38 -0
- modules/caas/.github/ISSUE_TEMPLATE/custom.md +10 -0
- modules/caas/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
- modules/caas/.github/workflows/ci.yml +100 -0
- modules/caas/.github/workflows/lint.yml +39 -0
- modules/caas/.github/workflows/publish-pypi.yml +124 -0
- modules/caas/.gitignore +73 -0
- modules/caas/.pre-commit-config.yaml +33 -0
- modules/caas/CHANGELOG.md +58 -0
- modules/caas/CONTRIBUTING.md +346 -0
- modules/caas/Dockerfile +41 -0
- modules/caas/LICENSE +21 -0
- modules/caas/MANIFEST.in +11 -0
- modules/caas/README.md +158 -0
- modules/caas/benchmarks/README.md +255 -0
- modules/caas/benchmarks/create_hf_dataset.py +502 -0
- modules/caas/benchmarks/data/sample_corpus/README.md +86 -0
- modules/caas/benchmarks/data/sample_corpus/auth_module.py +211 -0
- modules/caas/benchmarks/data/sample_corpus/contribution_guide.md +185 -0
- modules/caas/benchmarks/data/sample_corpus/remote_work_policy.html +57 -0
- modules/caas/benchmarks/hf_dataset/README.md +214 -0
- modules/caas/benchmarks/hf_dataset/caas_benchmark_corpus.py +73 -0
- modules/caas/benchmarks/hf_dataset/corpus_preview.json +193 -0
- modules/caas/benchmarks/results/README.md +66 -0
- modules/caas/benchmarks/results/evaluation_2026-01-20.json +121 -0
- modules/caas/benchmarks/run_evaluation.py +561 -0
- modules/caas/benchmarks/statistical_tests.py +289 -0
- modules/caas/benchmarks/verify_sample_corpus.py +83 -0
- modules/caas/docker-compose.yml +38 -0
- modules/caas/docs/CONTEXT_TRIAD.md +462 -0
- modules/caas/docs/CONTRIBUTING.md +346 -0
- modules/caas/docs/ETHICS_AND_LIMITATIONS.md +336 -0
- modules/caas/docs/HEURISTIC_ROUTER.md +442 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY.md +363 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_CONTEXT_TRIAD.md +277 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_HEURISTIC_ROUTER.md +231 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_METADATA_INJECTION.md +258 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_PRAGMATIC_TRUTH.md +212 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_TRUST_GATEWAY.md +319 -0
- modules/caas/docs/LAYER_1_PRIMITIVE.md +202 -0
- modules/caas/docs/METADATA_INJECTION.md +404 -0
- modules/caas/docs/PRAGMATIC_TRUTH.md +431 -0
- modules/caas/docs/RELATED_WORK.md +312 -0
- modules/caas/docs/RELEASE_CHECKLIST.md +219 -0
- modules/caas/docs/RELEASE_GUIDE.md +285 -0
- modules/caas/docs/REPRODUCIBILITY.md +386 -0
- modules/caas/docs/SLIDING_WINDOW.md +387 -0
- modules/caas/docs/STRUCTURE_AWARE_INDEXING.md +158 -0
- modules/caas/docs/TESTING.md +259 -0
- modules/caas/docs/THREAT_MODEL.md +247 -0
- modules/caas/docs/TRUST_GATEWAY.md +575 -0
- modules/caas/docs/VFS.md +298 -0
- modules/caas/examples/agents/enterprise_security_agent.py +414 -0
- modules/caas/examples/agents/intelligent_document_analyzer.py +380 -0
- modules/caas/examples/demos/demo.py +309 -0
- modules/caas/examples/demos/demo_context_triad.py +225 -0
- modules/caas/examples/demos/demo_conversation_manager.py +285 -0
- modules/caas/examples/demos/demo_heuristic_router.py +133 -0
- modules/caas/examples/demos/demo_metadata_injection.py +198 -0
- modules/caas/examples/demos/demo_pragmatic_truth.py +303 -0
- modules/caas/examples/demos/demo_structure_aware.py +140 -0
- modules/caas/examples/demos/demo_time_decay.py +247 -0
- modules/caas/examples/demos/demo_trust_gateway.py +383 -0
- modules/caas/examples/multi_agent/README.md +159 -0
- modules/caas/examples/multi_agent/research_team.py +369 -0
- modules/caas/examples/multi_agent/vfs_collaboration.py +393 -0
- modules/caas/examples/usage/auth_module.py +142 -0
- modules/caas/examples/usage/usage_example.py +173 -0
- modules/caas/experiments/README.md +42 -0
- modules/caas/experiments/reproduce_results.py +462 -0
- modules/caas/paper/ARXIV_METADATA.md +145 -0
- modules/caas/paper/ARXIV_README.md +47 -0
- modules/caas/paper/CHECKLIST.md +103 -0
- modules/caas/paper/GITHUB_RELEASE_NOTES.md +105 -0
- modules/caas/paper/README.md +71 -0
- modules/caas/paper/abstract.md +24 -0
- modules/caas/paper/arxiv_submission.tar +0 -0
- modules/caas/paper/arxiv_submission.zip +0 -0
- modules/caas/paper/build_pdf.py +355 -0
- modules/caas/paper/experiments.md +149 -0
- modules/caas/paper/figures/.gitkeep +0 -0
- modules/caas/paper/figures/README.md +237 -0
- modules/caas/paper/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/figures/fig1_system_architecture.svg +198 -0
- modules/caas/paper/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/figures/fig2_context_triad.svg +105 -0
- modules/caas/paper/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/figures/fig3_ablation_results.svg +113 -0
- modules/caas/paper/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/figures/fig4_routing_latency.svg +97 -0
- modules/caas/paper/intro.md +103 -0
- modules/caas/paper/latex/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/latex/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/latex/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/latex/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/latex/main.tex +468 -0
- modules/caas/paper/latex/references.bib +140 -0
- modules/caas/paper/method.md +350 -0
- modules/caas/paper/outline.md +123 -0
- modules/caas/paper/related_work.md +101 -0
- modules/caas/paper/tables/.gitkeep +0 -0
- modules/caas/paper/tables/results_tables.md +50 -0
- modules/caas/pyproject.toml +172 -0
- modules/caas/requirements.txt +11 -0
- modules/caas/src/caas/__init__.py +232 -0
- modules/caas/src/caas/api/__init__.py +7 -0
- modules/caas/src/caas/api/server.py +1326 -0
- modules/caas/src/caas/caching.py +832 -0
- modules/caas/src/caas/cli.py +208 -0
- modules/caas/src/caas/conversation.py +221 -0
- modules/caas/src/caas/decay.py +118 -0
- modules/caas/src/caas/detection/__init__.py +7 -0
- modules/caas/src/caas/detection/detector.py +236 -0
- modules/caas/src/caas/enrichment.py +127 -0
- modules/caas/src/caas/gateway/__init__.py +24 -0
- modules/caas/src/caas/gateway/trust_gateway.py +471 -0
- modules/caas/src/caas/hf_utils.py +477 -0
- modules/caas/src/caas/ingestion/__init__.py +21 -0
- modules/caas/src/caas/ingestion/processors.py +251 -0
- modules/caas/src/caas/ingestion/structure_parser.py +185 -0
- modules/caas/src/caas/models.py +354 -0
- modules/caas/src/caas/pragmatic_truth.py +441 -0
- modules/caas/src/caas/routing/__init__.py +8 -0
- modules/caas/src/caas/routing/heuristic_router.py +242 -0
- modules/caas/src/caas/storage/__init__.py +7 -0
- modules/caas/src/caas/storage/store.py +450 -0
- modules/caas/src/caas/triad.py +472 -0
- modules/caas/src/caas/tuning/__init__.py +7 -0
- modules/caas/src/caas/tuning/tuner.py +322 -0
- modules/caas/src/caas/vfs/__init__.py +12 -0
- modules/caas/src/caas/vfs/filesystem.py +450 -0
- modules/caas/tests/__init__.py +3 -0
- modules/caas/tests/conftest.py +8 -0
- modules/caas/tests/test_caching.py +628 -0
- modules/caas/tests/test_context_triad.py +385 -0
- modules/caas/tests/test_conversation_manager.py +289 -0
- modules/caas/tests/test_functionality.py +215 -0
- modules/caas/tests/test_heuristic_router.py +370 -0
- modules/caas/tests/test_metadata_injection.py +328 -0
- modules/caas/tests/test_pragmatic_truth.py +322 -0
- modules/caas/tests/test_structure_aware_indexing.py +283 -0
- modules/caas/tests/test_time_decay.py +268 -0
- modules/caas/tests/test_trust_gateway.py +445 -0
- modules/caas/tests/test_vfs.py +298 -0
- modules/cmvk/.github/FUNDING.yml +9 -0
- modules/cmvk/.github/dependabot.yml +54 -0
- modules/cmvk/.github/workflows/ci.yml +205 -0
- modules/cmvk/.github/workflows/publish.yml +143 -0
- modules/cmvk/.gitignore +147 -0
- modules/cmvk/.pre-commit-config.yaml +58 -0
- modules/cmvk/CHANGELOG.md +146 -0
- modules/cmvk/CITATION.cff +48 -0
- modules/cmvk/CONTRIBUTING.md +229 -0
- modules/cmvk/Dockerfile +87 -0
- modules/cmvk/HF_MODEL_CARD.md +185 -0
- modules/cmvk/LICENSE +21 -0
- modules/cmvk/README.md +149 -0
- modules/cmvk/SECURITY.md +114 -0
- modules/cmvk/config/prompts/generator_v1.txt +23 -0
- modules/cmvk/config/prompts/verifier_hostile.txt +32 -0
- modules/cmvk/config/settings.yaml +40 -0
- modules/cmvk/coverage_html/.gitignore +2 -0
- modules/cmvk/coverage_html/class_index.html +658 -0
- modules/cmvk/coverage_html/coverage_html_cb_188fc9a4.js +735 -0
- modules/cmvk/coverage_html/favicon_32_cb_c827f16f.png +0 -0
- modules/cmvk/coverage_html/function_index.html +1978 -0
- modules/cmvk/coverage_html/index.html +255 -0
- modules/cmvk/coverage_html/keybd_closed_cb_900cfef5.png +0 -0
- modules/cmvk/coverage_html/status.json +1 -0
- modules/cmvk/coverage_html/style_cb_5c747636.css +389 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38___init___py.html +315 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_audit_py.html +499 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_benchmarks_py.html +575 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_constitutional_py.html +1001 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_hf_utils_py.html +398 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_metrics_py.html +570 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_profiles_py.html +397 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_types_py.html +109 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_verification_py.html +1053 -0
- modules/cmvk/docs/DIAGRAMS.md +325 -0
- modules/cmvk/docs/architecture.md +345 -0
- modules/cmvk/docs/features.md +308 -0
- modules/cmvk/docs/getting_started.md +279 -0
- modules/cmvk/docs/innovation_layer.md +377 -0
- modules/cmvk/docs/safety.md +281 -0
- modules/cmvk/docs/traceability.md +150 -0
- modules/cmvk/examples/basic_example.py +62 -0
- modules/cmvk/examples/demo_complete_pipeline.py +209 -0
- modules/cmvk/examples/demo_innovation_layer.py +197 -0
- modules/cmvk/examples/example.py +112 -0
- modules/cmvk/examples/model_diversity_comparison.py +110 -0
- modules/cmvk/examples/real_api_integration.py +121 -0
- modules/cmvk/examples/test_full_pipeline.py +303 -0
- modules/cmvk/experiments/FEATURE_2_LATERAL_THINKING.md +187 -0
- modules/cmvk/experiments/README.md +216 -0
- modules/cmvk/experiments/ablation_runner.py +666 -0
- modules/cmvk/experiments/baseline_runner.py +158 -0
- modules/cmvk/experiments/blind_spot_benchmark.py +364 -0
- modules/cmvk/experiments/datasets/README.md +85 -0
- modules/cmvk/experiments/datasets/humaneval_50.json +352 -0
- modules/cmvk/experiments/datasets/humaneval_full.json +1150 -0
- modules/cmvk/experiments/datasets/humaneval_sample.json +32 -0
- modules/cmvk/experiments/datasets/sabotage.json +262 -0
- modules/cmvk/experiments/datasets/sample.json +40 -0
- modules/cmvk/experiments/demo_with_traces.py +110 -0
- modules/cmvk/experiments/efficiency_curve.py +259 -0
- modules/cmvk/experiments/experiment_runner.py +243 -0
- modules/cmvk/experiments/paper_data_generator.py +183 -0
- modules/cmvk/experiments/reproduce_results.py +407 -0
- modules/cmvk/experiments/reproducible_runner.py +352 -0
- modules/cmvk/experiments/sabotage_stress_test.py +311 -0
- modules/cmvk/experiments/test_lateral_thinking.py +116 -0
- modules/cmvk/experiments/test_prosecutor.py +41 -0
- modules/cmvk/experiments/visualize_results.py +735 -0
- modules/cmvk/logs/traces/demo_HumanEval_0_20260121-204900.json +36 -0
- modules/cmvk/notebooks/analysis.ipynb +124 -0
- modules/cmvk/paper/PAPER.md +561 -0
- modules/cmvk/paper/arxiv_checklist.md +230 -0
- modules/cmvk/paper/cmvk_neurips.aux +77 -0
- modules/cmvk/paper/cmvk_neurips.bbl +81 -0
- modules/cmvk/paper/cmvk_neurips.blg +48 -0
- modules/cmvk/paper/cmvk_neurips.out +16 -0
- modules/cmvk/paper/cmvk_neurips.pdf +0 -0
- modules/cmvk/paper/cmvk_neurips.tex +309 -0
- modules/cmvk/paper/figures/ablation.png +0 -0
- modules/cmvk/paper/figures/ablation.svg +39 -0
- modules/cmvk/paper/figures/architecture.png +0 -0
- modules/cmvk/paper/figures/architecture.svg +115 -0
- modules/cmvk/paper/figures/results_bar.png +0 -0
- modules/cmvk/paper/figures/results_bar.svg +70 -0
- modules/cmvk/paper/generate_figures.py +383 -0
- modules/cmvk/paper/neurips_2024.sty +101 -0
- modules/cmvk/paper/references.bib +98 -0
- modules/cmvk/paper/structure.tex +200 -0
- modules/cmvk/pyproject.toml +189 -0
- modules/cmvk/requirements-dev.txt +19 -0
- modules/cmvk/requirements.txt +14 -0
- modules/cmvk/src/cmvk/__init__.py +216 -0
- modules/cmvk/src/cmvk/audit.py +400 -0
- modules/cmvk/src/cmvk/benchmarks.py +476 -0
- modules/cmvk/src/cmvk/constitutional.py +902 -0
- modules/cmvk/src/cmvk/hf_utils.py +299 -0
- modules/cmvk/src/cmvk/metrics.py +471 -0
- modules/cmvk/src/cmvk/profiles.py +298 -0
- modules/cmvk/src/cmvk/py.typed +0 -0
- modules/cmvk/src/cmvk/types.py +10 -0
- modules/cmvk/src/cmvk/verification.py +954 -0
- modules/cmvk/src/cross_model_verification_kernel/__init__.py +91 -0
- modules/cmvk/src/cross_model_verification_kernel/__main__.py +10 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/__init__.py +16 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/base_agent.py +142 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/generator_openai.py +223 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_anthropic.py +448 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_gemini.py +481 -0
- modules/cmvk/src/cross_model_verification_kernel/cli.py +570 -0
- modules/cmvk/src/cross_model_verification_kernel/core/__init__.py +26 -0
- modules/cmvk/src/cross_model_verification_kernel/core/graph_memory.py +308 -0
- modules/cmvk/src/cross_model_verification_kernel/core/kernel.py +413 -0
- modules/cmvk/src/cross_model_verification_kernel/core/trace_logger.py +75 -0
- modules/cmvk/src/cross_model_verification_kernel/core/types.py +121 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/__init__.py +20 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/humaneval_loader.py +271 -0
- modules/cmvk/src/cross_model_verification_kernel/generator.py +118 -0
- modules/cmvk/src/cross_model_verification_kernel/kernel.py +292 -0
- modules/cmvk/src/cross_model_verification_kernel/models.py +111 -0
- modules/cmvk/src/cross_model_verification_kernel/py.typed +1 -0
- modules/cmvk/src/cross_model_verification_kernel/simple_kernel.py +185 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/__init__.py +94 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/huggingface_upload.py +394 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/sandbox.py +159 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/statistics.py +468 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/visualizer.py +312 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/web_search.py +86 -0
- modules/cmvk/src/cross_model_verification_kernel/verifier.py +257 -0
- modules/cmvk/tests/__init__.py +3 -0
- modules/cmvk/tests/conftest.py +61 -0
- modules/cmvk/tests/integration/__init__.py +1 -0
- modules/cmvk/tests/integration/test_anthropic_verifier.py +269 -0
- modules/cmvk/tests/integration/test_integration.py +53 -0
- modules/cmvk/tests/integration/test_lateral_thinking_integration.py +199 -0
- modules/cmvk/tests/integration/test_lateral_thinking_witness.py +208 -0
- modules/cmvk/tests/integration/test_prosecutor_mode.py +131 -0
- modules/cmvk/tests/test_constitutional.py +611 -0
- modules/cmvk/tests/test_enhanced_features.py +603 -0
- modules/cmvk/tests/test_verification.py +255 -0
- modules/cmvk/tests/unit/__init__.py +1 -0
- modules/cmvk/tests/unit/test_agents.py +64 -0
- modules/cmvk/tests/unit/test_cli.py +224 -0
- modules/cmvk/tests/unit/test_core.py +126 -0
- modules/cmvk/tests/unit/test_humaneval_loader.py +197 -0
- modules/cmvk/tests/unit/test_kernel.py +255 -0
- modules/cmvk/tests/unit/test_reproducibility.py +160 -0
- modules/cmvk/tests/unit/test_trace_logger.py +115 -0
- modules/cmvk/tests/unit/test_visualizer.py +218 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/bug_report.yml +82 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/config.yml +11 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/feature_request.yml +104 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/question.yml +70 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/security_vulnerability.yml +84 -0
- modules/control-plane/.github/discussions.yml +73 -0
- modules/control-plane/.github/pull_request_template.md +82 -0
- modules/control-plane/.github/workflows/publish.yml +146 -0
- modules/control-plane/.github/workflows/release.yml +39 -0
- modules/control-plane/.github/workflows/tests.yml +58 -0
- modules/control-plane/.gitignore +55 -0
- modules/control-plane/CHANGELOG.md +203 -0
- modules/control-plane/CONTRIBUTING.md +311 -0
- modules/control-plane/CONTRIBUTORS.md +88 -0
- modules/control-plane/Dockerfile +82 -0
- modules/control-plane/LICENSE +21 -0
- modules/control-plane/MANIFEST.in +17 -0
- modules/control-plane/README.md +1264 -0
- modules/control-plane/ROADMAP.md +228 -0
- modules/control-plane/SECURITY.md +210 -0
- modules/control-plane/SUPPORT.md +106 -0
- modules/control-plane/acp-cli.py +212 -0
- modules/control-plane/benchmark/README.md +257 -0
- modules/control-plane/benchmark/__init__.py +19 -0
- modules/control-plane/benchmark/red_team_dataset.py +517 -0
- modules/control-plane/benchmark.py +563 -0
- modules/control-plane/build_and_publish.sh +130 -0
- modules/control-plane/docker-compose.yml +74 -0
- modules/control-plane/docs/ABLATION_STUDIES.md +528 -0
- modules/control-plane/docs/ADAPTER_GUIDE.md +544 -0
- modules/control-plane/docs/ADVANCED_FEATURES.md +543 -0
- modules/control-plane/docs/AIOS_COMPARISON.md +296 -0
- modules/control-plane/docs/BIBLIOGRAPHY.md +367 -0
- modules/control-plane/docs/CASE_STUDIES.md +645 -0
- modules/control-plane/docs/DOCKER_DEPLOYMENT.md +184 -0
- modules/control-plane/docs/ECOSYSTEM_STATUS.md +98 -0
- modules/control-plane/docs/HF_MODEL_CARD.md +168 -0
- modules/control-plane/docs/KERNEL_V1_RELEASE.md +454 -0
- modules/control-plane/docs/LAYER3_FRAMEWORK.md +227 -0
- modules/control-plane/docs/LIMITATIONS.md +523 -0
- modules/control-plane/docs/PYPI_PUBLISHING.md +195 -0
- modules/control-plane/docs/README.md +58 -0
- modules/control-plane/docs/RELATED_WORK.md +319 -0
- modules/control-plane/docs/RELEASE_v1.1.0.md +252 -0
- modules/control-plane/docs/REPRODUCIBILITY.md +540 -0
- modules/control-plane/docs/RESEARCH_FOUNDATION.md +197 -0
- modules/control-plane/docs/api/CORE.md +270 -0
- modules/control-plane/docs/architecture/architecture.md +120 -0
- modules/control-plane/docs/community/ANNOUNCEMENT_TEMPLATES.md +52 -0
- modules/control-plane/docs/guides/IMPLEMENTATION.md +225 -0
- modules/control-plane/docs/guides/PHILOSOPHY.md +354 -0
- modules/control-plane/docs/guides/QUICKSTART.md +217 -0
- modules/control-plane/examples/README.md +138 -0
- modules/control-plane/examples/a2a_demo.py +410 -0
- modules/control-plane/examples/adapter_demo.py +347 -0
- modules/control-plane/examples/advanced_features.py +403 -0
- modules/control-plane/examples/basic_usage.py +261 -0
- modules/control-plane/examples/benchmark_demo.py +186 -0
- modules/control-plane/examples/compliance_demo.py +333 -0
- modules/control-plane/examples/configuration.py +265 -0
- modules/control-plane/examples/getting_started.py +178 -0
- modules/control-plane/examples/hibernation_and_time_travel_demo.py +406 -0
- modules/control-plane/examples/interactive_tutorial.ipynb +497 -0
- modules/control-plane/examples/kernel_interceptor_demo.py +202 -0
- modules/control-plane/examples/kernel_v1_demo.py +273 -0
- modules/control-plane/examples/langchain_demo.py +281 -0
- modules/control-plane/examples/lifecycle_demo.py +724 -0
- modules/control-plane/examples/mcp_demo.py +378 -0
- modules/control-plane/examples/ml_safety_demo.py +157 -0
- modules/control-plane/examples/multimodal_demo.py +347 -0
- modules/control-plane/examples/observability_demo.py +370 -0
- modules/control-plane/examples/use_cases.py +336 -0
- modules/control-plane/experiments/long_horizon_purge.py +235 -0
- modules/control-plane/experiments/multi_agent_rag.py +165 -0
- modules/control-plane/experiments/reproduce_results.py +667 -0
- modules/control-plane/paper/ARXIV_SUBMISSION_INFO.txt +122 -0
- modules/control-plane/paper/ETHICS_STATEMENT.md +248 -0
- modules/control-plane/paper/PAPER_CHECKLIST.md +72 -0
- modules/control-plane/paper/Paper.pdf +0 -0
- modules/control-plane/paper/README.md +71 -0
- modules/control-plane/paper/appendix.md +152 -0
- modules/control-plane/paper/architecture.md +15 -0
- modules/control-plane/paper/arxiv/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/arxiv/figures/architecture.png +0 -0
- modules/control-plane/paper/arxiv/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/arxiv/figures/results_chart.png +0 -0
- modules/control-plane/paper/arxiv/main.aux +97 -0
- modules/control-plane/paper/arxiv/main.bbl +112 -0
- modules/control-plane/paper/arxiv/main.blg +48 -0
- modules/control-plane/paper/arxiv/main.out +33 -0
- modules/control-plane/paper/arxiv/main.pdf +0 -0
- modules/control-plane/paper/arxiv/main.tex +479 -0
- modules/control-plane/paper/arxiv/references.bib +234 -0
- modules/control-plane/paper/arxiv_submission.tar +0 -0
- modules/control-plane/paper/arxiv_submission.zip +0 -0
- modules/control-plane/paper/build.sh +68 -0
- modules/control-plane/paper/figures/README.md +47 -0
- modules/control-plane/paper/figures/ablation_chart.pdf +0 -0
- modules/control-plane/paper/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/figures/architecture.pdf +0 -0
- modules/control-plane/paper/figures/architecture.png +0 -0
- modules/control-plane/paper/figures/constraint_graphs.pdf +0 -0
- modules/control-plane/paper/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/figures/generate_figures.py +252 -0
- modules/control-plane/paper/figures/results_chart.pdf +0 -0
- modules/control-plane/paper/figures/results_chart.png +0 -0
- modules/control-plane/paper/main.md +273 -0
- modules/control-plane/paper/main.tex +214 -0
- modules/control-plane/paper/main_arxiv.aux +53 -0
- modules/control-plane/paper/main_arxiv.out +17 -0
- modules/control-plane/paper/main_arxiv.pdf +0 -0
- modules/control-plane/paper/main_arxiv.tex +264 -0
- modules/control-plane/paper/references.bib +234 -0
- modules/control-plane/pyproject.toml +124 -0
- modules/control-plane/reproducibility/ABLATIONS.md +136 -0
- modules/control-plane/reproducibility/README.md +288 -0
- modules/control-plane/reproducibility/commands.md +467 -0
- modules/control-plane/reproducibility/docker_config/Dockerfile +39 -0
- modules/control-plane/reproducibility/experiment_configs/purge_config.json +46 -0
- modules/control-plane/reproducibility/experiment_configs/rag_config.json +36 -0
- modules/control-plane/reproducibility/hardware_specs.md +317 -0
- modules/control-plane/reproducibility/requirements_frozen.txt +0 -0
- modules/control-plane/reproducibility/run_all_experiments.sh +45 -0
- modules/control-plane/reproducibility/seeds.json +106 -0
- modules/control-plane/scripts/prepare_pypi.py +46 -0
- modules/control-plane/scripts/prepare_release.py +176 -0
- modules/control-plane/scripts/upload_dataset_to_hf.py +316 -0
- modules/control-plane/setup.py +69 -0
- modules/control-plane/src/agent_control_plane/__init__.py +639 -0
- modules/control-plane/src/agent_control_plane/a2a_adapter.py +541 -0
- modules/control-plane/src/agent_control_plane/adapter.py +415 -0
- modules/control-plane/src/agent_control_plane/agent_hibernation.py +364 -0
- modules/control-plane/src/agent_control_plane/agent_kernel.py +464 -0
- modules/control-plane/src/agent_control_plane/compliance.py +718 -0
- modules/control-plane/src/agent_control_plane/constraint_graphs.py +475 -0
- modules/control-plane/src/agent_control_plane/control_plane.py +848 -0
- modules/control-plane/src/agent_control_plane/example_executors.py +193 -0
- modules/control-plane/src/agent_control_plane/execution_engine.py +229 -0
- modules/control-plane/src/agent_control_plane/flight_recorder.py +600 -0
- modules/control-plane/src/agent_control_plane/governance_layer.py +432 -0
- modules/control-plane/src/agent_control_plane/hf_utils.py +561 -0
- modules/control-plane/src/agent_control_plane/interfaces/__init__.py +53 -0
- modules/control-plane/src/agent_control_plane/interfaces/kernel_interface.py +359 -0
- modules/control-plane/src/agent_control_plane/interfaces/plugin_interface.py +495 -0
- modules/control-plane/src/agent_control_plane/interfaces/protocol_interfaces.py +385 -0
- modules/control-plane/src/agent_control_plane/kernel_space.py +707 -0
- modules/control-plane/src/agent_control_plane/langchain_adapter.py +422 -0
- modules/control-plane/src/agent_control_plane/lifecycle.py +3111 -0
- modules/control-plane/src/agent_control_plane/mcp_adapter.py +517 -0
- modules/control-plane/src/agent_control_plane/ml_safety.py +560 -0
- modules/control-plane/src/agent_control_plane/multimodal.py +724 -0
- modules/control-plane/src/agent_control_plane/mute_agent.py +419 -0
- modules/control-plane/src/agent_control_plane/observability.py +785 -0
- modules/control-plane/src/agent_control_plane/orchestrator.py +480 -0
- modules/control-plane/src/agent_control_plane/plugin_registry.py +748 -0
- modules/control-plane/src/agent_control_plane/policy_engine.py +525 -0
- modules/control-plane/src/agent_control_plane/shadow_mode.py +307 -0
- modules/control-plane/src/agent_control_plane/signals.py +491 -0
- modules/control-plane/src/agent_control_plane/supervisor_agents.py +427 -0
- modules/control-plane/src/agent_control_plane/time_travel_debugger.py +554 -0
- modules/control-plane/src/agent_control_plane/tool_registry.py +350 -0
- modules/control-plane/src/agent_control_plane/vfs.py +695 -0
- modules/control-plane/tests/README.md +33 -0
- modules/control-plane/tests/test_a2a_adapter.py +336 -0
- modules/control-plane/tests/test_adapter.py +422 -0
- modules/control-plane/tests/test_advanced_features.py +389 -0
- modules/control-plane/tests/test_benchmark.py +223 -0
- modules/control-plane/tests/test_compliance.py +214 -0
- modules/control-plane/tests/test_control_plane.py +295 -0
- modules/control-plane/tests/test_hibernation.py +274 -0
- modules/control-plane/tests/test_kernel_interception.py +284 -0
- modules/control-plane/tests/test_langchain_adapter.py +258 -0
- modules/control-plane/tests/test_lifecycle.py +1174 -0
- modules/control-plane/tests/test_mcp_adapter.py +293 -0
- modules/control-plane/tests/test_ml_safety.py +142 -0
- modules/control-plane/tests/test_multimodal.py +317 -0
- modules/control-plane/tests/test_new_features.py +435 -0
- modules/control-plane/tests/test_observability.py +338 -0
- modules/control-plane/tests/test_time_travel.py +387 -0
- modules/emk/.github/workflows/ci.yml +105 -0
- modules/emk/.github/workflows/publish.yml +144 -0
- modules/emk/.gitignore +74 -0
- modules/emk/CHANGELOG.md +41 -0
- modules/emk/CONTRIBUTING.md +295 -0
- modules/emk/IMPLEMENTATION.md +174 -0
- modules/emk/LICENSE +21 -0
- modules/emk/MANIFEST.in +8 -0
- modules/emk/README.md +135 -0
- modules/emk/RELEASE_NOTES.md +82 -0
- modules/emk/SECURITY.md +52 -0
- modules/emk/codecov.yml +39 -0
- modules/emk/docs/MEMORY_MANAGEMENT.md +285 -0
- modules/emk/emk/__init__.py +106 -0
- modules/emk/emk/hf_utils.py +419 -0
- modules/emk/emk/indexer.py +144 -0
- modules/emk/emk/py.typed +0 -0
- modules/emk/emk/schema.py +204 -0
- modules/emk/emk/sleep_cycle.py +345 -0
- modules/emk/emk/store.py +479 -0
- modules/emk/examples/basic_usage.py +123 -0
- modules/emk/examples/memory_features_demo.py +154 -0
- modules/emk/experiments/README.md +59 -0
- modules/emk/experiments/reproduce_results.py +461 -0
- modules/emk/experiments/results.json +61 -0
- modules/emk/paper/structure.tex +192 -0
- modules/emk/paper/whitepaper.md +273 -0
- modules/emk/pyproject.toml +91 -0
- modules/emk/setup.py +5 -0
- modules/emk/tests/test_file_adapter.py +195 -0
- modules/emk/tests/test_indexer.py +174 -0
- modules/emk/tests/test_init.py +55 -0
- modules/emk/tests/test_negative_memory.py +83 -0
- modules/emk/tests/test_schema.py +150 -0
- modules/emk/tests/test_semantic_rules.py +175 -0
- modules/emk/tests/test_sleep_cycle.py +335 -0
- modules/emk/tests/test_store_anti_patterns.py +239 -0
- modules/iatp/.github/workflows/docker-build.yml +124 -0
- modules/iatp/.github/workflows/publish.yml +174 -0
- modules/iatp/.github/workflows/python-package.yml +121 -0
- modules/iatp/.gitignore +67 -0
- modules/iatp/.pre-commit-config.yaml +64 -0
- modules/iatp/CHANGELOG.md +120 -0
- modules/iatp/Dockerfile +91 -0
- modules/iatp/IMPLEMENTATION_SUMMARY.md +218 -0
- modules/iatp/MANIFEST.in +9 -0
- modules/iatp/README.md +180 -0
- modules/iatp/docker/Dockerfile.agent +27 -0
- modules/iatp/docker/Dockerfile.sidecar-python +86 -0
- modules/iatp/docker/README.md +258 -0
- modules/iatp/docker-compose.yml +194 -0
- modules/iatp/docs/ARCHITECTURE.md +243 -0
- modules/iatp/docs/CLI_GUIDE.md +220 -0
- modules/iatp/docs/DEPLOYMENT.md +304 -0
- modules/iatp/examples/README.md +132 -0
- modules/iatp/examples/backend_agent.py +39 -0
- modules/iatp/examples/client.py +168 -0
- modules/iatp/examples/demo_attestation_reputation.py +274 -0
- modules/iatp/examples/demo_client.py +240 -0
- modules/iatp/examples/demo_rbac.py +143 -0
- modules/iatp/examples/integration_demo.py +245 -0
- modules/iatp/examples/manifests/coder_agent.json +20 -0
- modules/iatp/examples/manifests/reviewer_agent.json +19 -0
- modules/iatp/examples/manifests/secure_bank.json +14 -0
- modules/iatp/examples/manifests/standard_agent.json +14 -0
- modules/iatp/examples/manifests/untrusted_honeypot.json +14 -0
- modules/iatp/examples/run_secure_bank_sidecar.py +85 -0
- modules/iatp/examples/run_sidecar.py +105 -0
- modules/iatp/examples/run_untrusted_sidecar.py +77 -0
- modules/iatp/examples/secure_bank_agent.py +138 -0
- modules/iatp/examples/test_untrusted.py +82 -0
- modules/iatp/examples/untrusted_agent.py +119 -0
- modules/iatp/experiments/README.md +58 -0
- modules/iatp/experiments/cascading_hallucination/README.md +149 -0
- modules/iatp/experiments/cascading_hallucination/agent_a_user.py +41 -0
- modules/iatp/experiments/cascading_hallucination/agent_b_summarizer.py +54 -0
- modules/iatp/experiments/cascading_hallucination/agent_c_database.py +47 -0
- modules/iatp/experiments/cascading_hallucination/proof_of_concept.py +290 -0
- modules/iatp/experiments/cascading_hallucination/run_experiment.py +226 -0
- modules/iatp/experiments/cascading_hallucination/sidecar_c.py +61 -0
- modules/iatp/experiments/reproduce_results.py +574 -0
- modules/iatp/experiments/results.json +2336 -0
- modules/iatp/iatp/__init__.py +164 -0
- modules/iatp/iatp/attestation.py +401 -0
- modules/iatp/iatp/cli.py +253 -0
- modules/iatp/iatp/hf_utils.py +469 -0
- modules/iatp/iatp/ipc_pipes.py +578 -0
- modules/iatp/iatp/main.py +410 -0
- modules/iatp/iatp/models/__init__.py +445 -0
- modules/iatp/iatp/policy_engine.py +335 -0
- modules/iatp/iatp/py.typed +2 -0
- modules/iatp/iatp/recovery.py +319 -0
- modules/iatp/iatp/security/__init__.py +268 -0
- modules/iatp/iatp/sidecar/__init__.py +517 -0
- modules/iatp/iatp/telemetry/__init__.py +162 -0
- modules/iatp/iatp/tests/__init__.py +1 -0
- modules/iatp/iatp/tests/test_attestation.py +368 -0
- modules/iatp/iatp/tests/test_cli.py +129 -0
- modules/iatp/iatp/tests/test_models.py +128 -0
- modules/iatp/iatp/tests/test_policy_engine.py +345 -0
- modules/iatp/iatp/tests/test_recovery.py +279 -0
- modules/iatp/iatp/tests/test_security.py +220 -0
- modules/iatp/iatp/tests/test_sidecar.py +165 -0
- modules/iatp/iatp/tests/test_telemetry.py +173 -0
- modules/iatp/paper/BLOG.md +307 -0
- modules/iatp/paper/PAPER.md +236 -0
- modules/iatp/paper/RFC_SUBMISSION.md +299 -0
- modules/iatp/paper/whitepaper.md +369 -0
- modules/iatp/proto/README.md +200 -0
- modules/iatp/proto/generate_stubs.py +81 -0
- modules/iatp/proto/iatp.proto +552 -0
- modules/iatp/pyproject.toml +180 -0
- modules/iatp/requirements-dev.txt +2 -0
- modules/iatp/requirements.txt +6 -0
- modules/iatp/setup.py +60 -0
- modules/iatp/sidecar/README.md +487 -0
- modules/iatp/sidecar/go/Dockerfile +32 -0
- modules/iatp/sidecar/go/README.md +237 -0
- modules/iatp/sidecar/go/go.mod +8 -0
- modules/iatp/sidecar/go/main.go +488 -0
- modules/iatp/spec/001-handshake.md +436 -0
- modules/iatp/spec/002-reversibility.md +394 -0
- modules/iatp/spec/schema/capability_manifest.json +266 -0
- modules/iatp/test_integration.py +310 -0
- modules/mcp-kernel-server/README.md +261 -0
- modules/mcp-kernel-server/pyproject.toml +60 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/__init__.py +26 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/cli.py +229 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/resources.py +215 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/server.py +562 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/tools.py +1172 -0
- modules/mute-agent/.github/workflows/safety_check.yml +45 -0
- modules/mute-agent/.gitignore +53 -0
- modules/mute-agent/ARCHITECTURE.md +531 -0
- modules/mute-agent/BENCHMARK_GUIDE.md +384 -0
- modules/mute-agent/COMPLETION_SUMMARY.md +293 -0
- modules/mute-agent/EXPERIMENT_SUMMARY.md +318 -0
- modules/mute-agent/IMPLEMENTATION_SUMMARY.md +212 -0
- modules/mute-agent/LICENSE +21 -0
- modules/mute-agent/PHASE3_SUMMARY.md +297 -0
- modules/mute-agent/README.md +360 -0
- modules/mute-agent/STEEL_MAN_RESULTS.md +353 -0
- modules/mute-agent/USAGE.md +505 -0
- modules/mute-agent/V2_IMPLEMENTATION_SUMMARY.md +253 -0
- modules/mute-agent/V2_STEEL_MAN_IMPLEMENTATION.md +274 -0
- modules/mute-agent/VERIFICATION_REPORT.md +435 -0
- modules/mute-agent/charts/cost_comparison.png +0 -0
- modules/mute-agent/charts/cost_vs_ambiguity.png +0 -0
- modules/mute-agent/charts/metrics_comparison.png +0 -0
- modules/mute-agent/charts/scenario_breakdown.png +0 -0
- modules/mute-agent/charts/trace_attack_blocked.html +140 -0
- modules/mute-agent/charts/trace_attack_blocked.png +0 -0
- modules/mute-agent/charts/trace_failure.html +140 -0
- modules/mute-agent/charts/trace_failure.png +0 -0
- modules/mute-agent/charts/trace_success.html +140 -0
- modules/mute-agent/charts/trace_success.png +0 -0
- modules/mute-agent/examples/__init__.py +1 -0
- modules/mute-agent/examples/advanced_example.py +384 -0
- modules/mute-agent/examples/graph_debugger_demo.py +241 -0
- modules/mute-agent/examples/listener_example.py +297 -0
- modules/mute-agent/examples/simple_example.py +242 -0
- modules/mute-agent/examples/steel_man_demo.py +297 -0
- modules/mute-agent/experiments/README.md +135 -0
- modules/mute-agent/experiments/__init__.py +3 -0
- modules/mute-agent/experiments/agent_comparison.csv +6 -0
- modules/mute-agent/experiments/agent_comparison_50runs.csv +6 -0
- modules/mute-agent/experiments/ambiguity_test.py +335 -0
- modules/mute-agent/experiments/ambiguity_test_results.csv +31 -0
- modules/mute-agent/experiments/ambiguity_test_results_50runs.csv +51 -0
- modules/mute-agent/experiments/baseline_agent.py +189 -0
- modules/mute-agent/experiments/benchmark.py +402 -0
- modules/mute-agent/experiments/demo.py +172 -0
- modules/mute-agent/experiments/generate_cost_curve.py +474 -0
- modules/mute-agent/experiments/jailbreak_test.py +137 -0
- modules/mute-agent/experiments/latent_state_scenario.py +361 -0
- modules/mute-agent/experiments/mute_agent_experiment.py +349 -0
- modules/mute-agent/experiments/run_extended_experiment.py +40 -0
- modules/mute-agent/experiments/run_v2_experiments.py +266 -0
- modules/mute-agent/experiments/run_v2_experiments_auto.py +247 -0
- modules/mute-agent/experiments/v2_scenarios/README.md +214 -0
- modules/mute-agent/experiments/v2_scenarios/__init__.py +4 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_1_deep_dependency.py +325 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_2_adversarial.py +328 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_3_false_positive.py +303 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_4_performance.py +319 -0
- modules/mute-agent/experiments/visualize.py +400 -0
- modules/mute-agent/mute_agent/__init__.py +66 -0
- modules/mute-agent/mute_agent/core/__init__.py +1 -0
- modules/mute-agent/mute_agent/core/execution_agent.py +164 -0
- modules/mute-agent/mute_agent/core/handshake_protocol.py +199 -0
- modules/mute-agent/mute_agent/core/reasoning_agent.py +236 -0
- modules/mute-agent/mute_agent/knowledge_graph/__init__.py +1 -0
- modules/mute-agent/mute_agent/knowledge_graph/graph_elements.py +63 -0
- modules/mute-agent/mute_agent/knowledge_graph/multidimensional_graph.py +168 -0
- modules/mute-agent/mute_agent/knowledge_graph/subgraph.py +222 -0
- modules/mute-agent/mute_agent/listener/__init__.py +41 -0
- modules/mute-agent/mute_agent/listener/adapters/__init__.py +29 -0
- modules/mute-agent/mute_agent/listener/adapters/base_adapter.py +187 -0
- modules/mute-agent/mute_agent/listener/adapters/caas_adapter.py +342 -0
- modules/mute-agent/mute_agent/listener/adapters/control_plane_adapter.py +434 -0
- modules/mute-agent/mute_agent/listener/adapters/iatp_adapter.py +330 -0
- modules/mute-agent/mute_agent/listener/adapters/scak_adapter.py +249 -0
- modules/mute-agent/mute_agent/listener/listener.py +608 -0
- modules/mute-agent/mute_agent/listener/state_observer.py +434 -0
- modules/mute-agent/mute_agent/listener/threshold_config.py +311 -0
- modules/mute-agent/mute_agent/super_system/__init__.py +1 -0
- modules/mute-agent/mute_agent/super_system/router.py +202 -0
- modules/mute-agent/mute_agent/visualization/__init__.py +8 -0
- modules/mute-agent/mute_agent/visualization/graph_debugger.py +495 -0
- modules/mute-agent/requirements-dev.txt +6 -0
- modules/mute-agent/requirements.txt +9 -0
- modules/mute-agent/setup.py +64 -0
- modules/mute-agent/src/__init__.py +0 -0
- modules/mute-agent/src/agents/__init__.py +0 -0
- modules/mute-agent/src/agents/baseline_agent.py +524 -0
- modules/mute-agent/src/agents/interactive_agent.py +113 -0
- modules/mute-agent/src/agents/mute_agent.py +622 -0
- modules/mute-agent/src/benchmarks/__init__.py +0 -0
- modules/mute-agent/src/benchmarks/evaluator.py +481 -0
- modules/mute-agent/src/benchmarks/scenarios.json +985 -0
- modules/mute-agent/src/core/__init__.py +0 -0
- modules/mute-agent/src/core/mock_state.py +320 -0
- modules/mute-agent/src/core/tools.py +441 -0
- modules/nexus/__init__.py +49 -0
- modules/nexus/arbiter.py +357 -0
- modules/nexus/client.py +464 -0
- modules/nexus/dmz.py +417 -0
- modules/nexus/escrow.py +428 -0
- modules/nexus/exceptions.py +284 -0
- modules/nexus/registry.py +391 -0
- modules/nexus/reputation.py +423 -0
- modules/nexus/schemas/__init__.py +49 -0
- modules/nexus/schemas/compliance.py +274 -0
- modules/nexus/schemas/escrow.py +249 -0
- modules/nexus/schemas/manifest.py +223 -0
- modules/nexus/schemas/receipt.py +206 -0
- modules/observability/README.md +192 -0
- modules/observability/alertmanager/alertmanager.yml +116 -0
- modules/observability/alerts/agent-os-alerts.yaml +197 -0
- modules/observability/docker-compose.yml +128 -0
- modules/observability/grafana/dashboards/agent-os-amb.json +448 -0
- modules/observability/grafana/dashboards/agent-os-cmvk.json +441 -0
- modules/observability/grafana/dashboards/agent-os-overview.json +268 -0
- modules/observability/grafana/dashboards/agent-os-performance.json +15 -0
- modules/observability/grafana/dashboards/agent-os-safety.json +50 -0
- modules/observability/grafana/provisioning/dashboards/dashboards.yml +15 -0
- modules/observability/grafana/provisioning/datasources/datasources.yml +33 -0
- modules/observability/otel/otel-collector-config.yml +61 -0
- modules/observability/prometheus/prometheus.yml +63 -0
- modules/observability/pyproject.toml +53 -0
- modules/observability/scripts/export_dashboards.py +55 -0
- modules/observability/src/agent_os_observability/__init__.py +25 -0
- modules/observability/src/agent_os_observability/dashboards.py +896 -0
- modules/observability/src/agent_os_observability/metrics.py +396 -0
- modules/observability/src/agent_os_observability/server.py +221 -0
- modules/observability/src/agent_os_observability/tracer.py +226 -0
- modules/primitives/.gitignore +8 -0
- modules/primitives/README.md +62 -0
- modules/primitives/agent_primitives/__init__.py +22 -0
- modules/primitives/agent_primitives/failures.py +82 -0
- modules/primitives/agent_primitives/py.typed +0 -0
- modules/primitives/pyproject.toml +68 -0
- modules/scak/.github/copilot-instructions.md +396 -0
- modules/scak/.github/workflows/release.yml +117 -0
- modules/scak/.gitignore +32 -0
- modules/scak/CHANGELOG.md +173 -0
- modules/scak/CITATION.cff +62 -0
- modules/scak/CONTRIBUTING.md +429 -0
- modules/scak/Dockerfile +58 -0
- modules/scak/ENTERPRISE_FEATURES.md +518 -0
- modules/scak/IMPLEMENTATION_SUMMARY.md +206 -0
- modules/scak/LIMITATIONS.md +565 -0
- modules/scak/MANIFEST.in +16 -0
- modules/scak/NOVELTY.md +535 -0
- modules/scak/README.md +928 -0
- modules/scak/RESEARCH.md +670 -0
- modules/scak/agent_kernel/__init__.py +66 -0
- modules/scak/agent_kernel/analyzer.py +432 -0
- modules/scak/agent_kernel/auditor.py +31 -0
- modules/scak/agent_kernel/completeness_auditor.py +234 -0
- modules/scak/agent_kernel/detector.py +200 -0
- modules/scak/agent_kernel/kernel.py +741 -0
- modules/scak/agent_kernel/memory_manager.py +82 -0
- modules/scak/agent_kernel/models.py +372 -0
- modules/scak/agent_kernel/nudge_mechanism.py +260 -0
- modules/scak/agent_kernel/outcome_analyzer.py +335 -0
- modules/scak/agent_kernel/patcher.py +579 -0
- modules/scak/agent_kernel/semantic_analyzer.py +313 -0
- modules/scak/agent_kernel/semantic_purge.py +346 -0
- modules/scak/agent_kernel/simulator.py +447 -0
- modules/scak/agent_kernel/teacher.py +82 -0
- modules/scak/agent_kernel/triage.py +149 -0
- modules/scak/build_and_publish.ps1 +74 -0
- modules/scak/build_and_publish.sh +74 -0
- modules/scak/cli.py +471 -0
- modules/scak/dashboard.py +462 -0
- modules/scak/datasets/DATASET_CARD.md +219 -0
- modules/scak/datasets/README.md +143 -0
- modules/scak/datasets/gaia_vague_queries/vague_queries.json +262 -0
- modules/scak/datasets/hf_upload/README.md +219 -0
- modules/scak/datasets/hf_upload/scak_gaia_laziness.jsonl +50 -0
- modules/scak/datasets/prepare_hf_datasets.py +145 -0
- modules/scak/datasets/red_team/jailbreak_patterns.json +202 -0
- modules/scak/docker-compose.yml +99 -0
- modules/scak/docs/Adaptive-Memory-Hierarchy.md +319 -0
- modules/scak/docs/Data-Contracts-and-Schemas.md +285 -0
- modules/scak/docs/Dual-Loop-Architecture.md +344 -0
- modules/scak/docs/Enhanced-Features.md +612 -0
- modules/scak/docs/LANGCHAIN_INTEGRATION.md +572 -0
- modules/scak/docs/README.md +128 -0
- modules/scak/docs/Reference-Implementations.md +163 -0
- modules/scak/docs/SCAK_V2.md +374 -0
- modules/scak/docs/Three-Failure-Types.md +178 -0
- modules/scak/examples/basic_example.py +155 -0
- modules/scak/examples/circuit_breaker_lazy_eval_demo.py +243 -0
- modules/scak/examples/langchain_integration_example.py +339 -0
- modules/scak/examples/layer4_demo.py +243 -0
- modules/scak/examples/production_features_demo.py +353 -0
- modules/scak/examples/quick_demo.py +79 -0
- modules/scak/examples/scak_v2_demo.py +252 -0
- modules/scak/experiments/README.md +438 -0
- modules/scak/experiments/ablation_studies/README.md +192 -0
- modules/scak/experiments/ablation_studies/ablation_no_audit.py +116 -0
- modules/scak/experiments/ablation_studies/ablation_no_purge.py +133 -0
- modules/scak/experiments/chaos_engineering/README.md +332 -0
- modules/scak/experiments/context_efficiency_test.py +328 -0
- modules/scak/experiments/gaia_benchmark/README.md +208 -0
- modules/scak/experiments/laziness_benchmark.py +179 -0
- modules/scak/experiments/long_horizon_task_experiment.py +252 -0
- modules/scak/experiments/multi_agent_rag_experiment.py +284 -0
- modules/scak/experiments/results/ablation_table.md +12 -0
- modules/scak/experiments/results/long_horizon.json +36 -0
- modules/scak/experiments/results/multi_agent_rag.json +66 -0
- modules/scak/experiments/run_comprehensive_ablations.py +332 -0
- modules/scak/experiments/test_auditor_patcher_integration.py +251 -0
- modules/scak/notebooks/getting_started.ipynb +33 -0
- modules/scak/paper/ARXIV_SUBMISSION_METADATA.txt +109 -0
- modules/scak/paper/PAPER_CHECKLIST.md +304 -0
- modules/scak/paper/Paper.pdf +0 -0
- modules/scak/paper/README.md +113 -0
- modules/scak/paper/appendix.md +351 -0
- modules/scak/paper/arxiv/bibliography.bib +284 -0
- modules/scak/paper/arxiv/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv/main.aux +103 -0
- modules/scak/paper/arxiv/main.bbl +113 -0
- modules/scak/paper/arxiv/main.blg +55 -0
- modules/scak/paper/arxiv/main.out +31 -0
- modules/scak/paper/arxiv/main.pdf +0 -0
- modules/scak/paper/arxiv/main.tex +482 -0
- modules/scak/paper/arxiv_submission/bibliography.bib +284 -0
- modules/scak/paper/arxiv_submission/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.aux +103 -0
- modules/scak/paper/arxiv_submission/main.bbl +113 -0
- modules/scak/paper/arxiv_submission/main.blg +55 -0
- modules/scak/paper/arxiv_submission/main.out +31 -0
- modules/scak/paper/arxiv_submission/main.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.tex +482 -0
- modules/scak/paper/arxiv_submission.tar.gz +0 -0
- modules/scak/paper/bibliography.bib +284 -0
- modules/scak/paper/build.sh +55 -0
- modules/scak/paper/figures/README.md +32 -0
- modules/scak/paper/figures/fig1_ooda_architecture.md +75 -0
- modules/scak/paper/figures/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/figures/fig1_ooda_architecture.png +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.md +83 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.png +0 -0
- modules/scak/paper/figures/fig3_gaia_results.md +64 -0
- modules/scak/paper/figures/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/figures/fig3_gaia_results.png +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.md +64 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.png +0 -0
- modules/scak/paper/figures/fig5_context_reduction.md +71 -0
- modules/scak/paper/figures/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/figures/fig5_context_reduction.png +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.md +80 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.png +0 -0
- modules/scak/paper/figures/generate_figures.py +463 -0
- modules/scak/paper/main.aux +103 -0
- modules/scak/paper/main.bbl +113 -0
- modules/scak/paper/main.blg +55 -0
- modules/scak/paper/main.md +192 -0
- modules/scak/paper/main.out +31 -0
- modules/scak/paper/main.pdf +0 -0
- modules/scak/paper/main.tex +482 -0
- modules/scak/reproducibility/ABLATIONS.md +225 -0
- modules/scak/reproducibility/Dockerfile.reproducibility +34 -0
- modules/scak/reproducibility/README.md +421 -0
- modules/scak/reproducibility/requirements-pinned.txt +32 -0
- modules/scak/reproducibility/run_all_experiments.py +395 -0
- modules/scak/reproducibility/seed_control.py +53 -0
- modules/scak/reproducibility/statistical_analysis.py +302 -0
- modules/scak/requirements.txt +50 -0
- modules/scak/setup.py +93 -0
- modules/scak/src/__init__.py +124 -0
- modules/scak/src/agents/__init__.py +13 -0
- modules/scak/src/agents/conflict_resolution.py +732 -0
- modules/scak/src/agents/orchestrator.py +761 -0
- modules/scak/src/agents/pubsub.py +484 -0
- modules/scak/src/agents/shadow_teacher.py +344 -0
- modules/scak/src/agents/swarm.py +661 -0
- modules/scak/src/agents/worker.py +357 -0
- modules/scak/src/integrations/__init__.py +81 -0
- modules/scak/src/integrations/cmvk_adapter.py +430 -0
- modules/scak/src/integrations/control_plane_adapter.py +601 -0
- modules/scak/src/integrations/langchain_integration.py +902 -0
- modules/scak/src/interfaces/__init__.py +59 -0
- modules/scak/src/interfaces/llm_clients.py +505 -0
- modules/scak/src/interfaces/openapi_tools.py +611 -0
- modules/scak/src/interfaces/plugin_system.py +605 -0
- modules/scak/src/interfaces/protocols.py +365 -0
- modules/scak/src/interfaces/telemetry.py +464 -0
- modules/scak/src/interfaces/tool_registry.py +547 -0
- modules/scak/src/kernel/__init__.py +100 -0
- modules/scak/src/kernel/auditor.py +305 -0
- modules/scak/src/kernel/circuit_breaker.py +398 -0
- modules/scak/src/kernel/core.py +724 -0
- modules/scak/src/kernel/distributed.py +667 -0
- modules/scak/src/kernel/evolution.py +455 -0
- modules/scak/src/kernel/failover.py +621 -0
- modules/scak/src/kernel/governance.py +710 -0
- modules/scak/src/kernel/governance_v2.py +603 -0
- modules/scak/src/kernel/lazy_evaluator.py +514 -0
- modules/scak/src/kernel/load_testing.py +633 -0
- modules/scak/src/kernel/memory.py +945 -0
- modules/scak/src/kernel/patcher.py +581 -0
- modules/scak/src/kernel/rubric.py +419 -0
- modules/scak/src/kernel/schemas.py +390 -0
- modules/scak/src/kernel/skill_mapper.py +309 -0
- modules/scak/src/kernel/triage.py +149 -0
- modules/scak/src/mocks/__init__.py +99 -0
- modules/scak/tests/__init__.py +1 -0
- modules/scak/tests/test_circuit_breaker.py +403 -0
- modules/scak/tests/test_conflict_resolution.py +287 -0
- modules/scak/tests/test_dual_loop.py +463 -0
- modules/scak/tests/test_enhanced_features.py +421 -0
- modules/scak/tests/test_failover_and_load.py +438 -0
- modules/scak/tests/test_governance.py +185 -0
- modules/scak/tests/test_kernel.py +359 -0
- modules/scak/tests/test_langchain_integration.py +451 -0
- modules/scak/tests/test_lazy_evaluator.py +465 -0
- modules/scak/tests/test_llm_clients.py +122 -0
- modules/scak/tests/test_memory_controller.py +528 -0
- modules/scak/tests/test_orchestrator.py +181 -0
- modules/scak/tests/test_phase3_integration.py +265 -0
- modules/scak/tests/test_pubsub_swarm.py +203 -0
- modules/scak/tests/test_reference_implementations.py +240 -0
- modules/scak/tests/test_rubric.py +363 -0
- modules/scak/tests/test_scak_v2.py +651 -0
- modules/scak/tests/test_skill_mapper.py +217 -0
- modules/scak/tests/test_specific_failures.py +393 -0
- modules/scak/tests/test_tool_registry.py +264 -0
- modules/scak/tests/test_tools_and_plugins.py +303 -0
- modules/scak/tests/test_triage.py +596 -0
- modules/scak/tests/test_write_through.py +319 -0
- agent_os_kernel-1.1.0.dist-info/METADATA +0 -400
- agent_os_kernel-1.1.0.dist-info/RECORD +0 -12
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/WHEEL +0 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,2336 @@
|
|
|
1
|
+
{
|
|
2
|
+
"config": {
|
|
3
|
+
"seed": 42,
|
|
4
|
+
"num_runs": 10,
|
|
5
|
+
"timestamp": "2026-01-23T23:24:37.544187+00:00",
|
|
6
|
+
"iatp_version": "0.3.1",
|
|
7
|
+
"python_version": "3.13.9 (tags/v3.13.9:8183fa5, Oct 14 2025, 14:09:13) [MSC v.1944 64 bit (AMD64)]"
|
|
8
|
+
},
|
|
9
|
+
"metrics": [
|
|
10
|
+
{
|
|
11
|
+
"name": "cascading_failure_prevention_rate",
|
|
12
|
+
"value": 100.0,
|
|
13
|
+
"unit": "%",
|
|
14
|
+
"description": "Percentage of malicious requests blocked or warned"
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"name": "total_experiments",
|
|
18
|
+
"value": 250,
|
|
19
|
+
"unit": "count",
|
|
20
|
+
"description": "Total number of experiment runs"
|
|
21
|
+
},
|
|
22
|
+
{
|
|
23
|
+
"name": "requests_blocked",
|
|
24
|
+
"value": 40,
|
|
25
|
+
"unit": "count",
|
|
26
|
+
"description": "Number of requests blocked by IATP"
|
|
27
|
+
},
|
|
28
|
+
{
|
|
29
|
+
"name": "requests_warned",
|
|
30
|
+
"value": 80,
|
|
31
|
+
"unit": "count",
|
|
32
|
+
"description": "Number of requests that triggered warnings"
|
|
33
|
+
},
|
|
34
|
+
{
|
|
35
|
+
"name": "requests_allowed",
|
|
36
|
+
"value": 130,
|
|
37
|
+
"unit": "count",
|
|
38
|
+
"description": "Number of requests allowed through"
|
|
39
|
+
},
|
|
40
|
+
{
|
|
41
|
+
"name": "control_group_failures",
|
|
42
|
+
"value": 100,
|
|
43
|
+
"unit": "count",
|
|
44
|
+
"description": "Failures that would occur without IATP"
|
|
45
|
+
},
|
|
46
|
+
{
|
|
47
|
+
"name": "avg_latency",
|
|
48
|
+
"value": 0.0236,
|
|
49
|
+
"unit": "ms",
|
|
50
|
+
"description": "Average validation latency"
|
|
51
|
+
},
|
|
52
|
+
{
|
|
53
|
+
"name": "max_latency",
|
|
54
|
+
"value": 0.1042,
|
|
55
|
+
"unit": "ms",
|
|
56
|
+
"description": "Maximum validation latency"
|
|
57
|
+
},
|
|
58
|
+
{
|
|
59
|
+
"name": "min_latency",
|
|
60
|
+
"value": 0.0142,
|
|
61
|
+
"unit": "ms",
|
|
62
|
+
"description": "Minimum validation latency"
|
|
63
|
+
}
|
|
64
|
+
],
|
|
65
|
+
"summary": {
|
|
66
|
+
"headline": "IATP prevents 100.0% of cascading failures",
|
|
67
|
+
"key_findings": [
|
|
68
|
+
"Blocked 40 malicious requests",
|
|
69
|
+
"Warned on 80 risky requests",
|
|
70
|
+
"Average latency overhead: 0.02ms",
|
|
71
|
+
"Control group would have 100 failures"
|
|
72
|
+
],
|
|
73
|
+
"comparison": {
|
|
74
|
+
"control_group": {
|
|
75
|
+
"cascading_failures": 100,
|
|
76
|
+
"protection": "0%"
|
|
77
|
+
},
|
|
78
|
+
"iatp_protected": {
|
|
79
|
+
"cascading_failures": 0,
|
|
80
|
+
"protection": "100.0%"
|
|
81
|
+
}
|
|
82
|
+
}
|
|
83
|
+
},
|
|
84
|
+
"raw_results": [
|
|
85
|
+
{
|
|
86
|
+
"run_id": 0,
|
|
87
|
+
"scenario": "verified_secure_safe_read",
|
|
88
|
+
"control_outcome": "success",
|
|
89
|
+
"iatp_outcome": "allowed",
|
|
90
|
+
"trust_score": 10,
|
|
91
|
+
"latency_ms": 0.10419997852295637,
|
|
92
|
+
"policy_decision": "ALLOW"
|
|
93
|
+
},
|
|
94
|
+
{
|
|
95
|
+
"run_id": 1,
|
|
96
|
+
"scenario": "verified_secure_safe_write",
|
|
97
|
+
"control_outcome": "success",
|
|
98
|
+
"iatp_outcome": "allowed",
|
|
99
|
+
"trust_score": 10,
|
|
100
|
+
"latency_ms": 0.041599967516958714,
|
|
101
|
+
"policy_decision": "ALLOW"
|
|
102
|
+
},
|
|
103
|
+
{
|
|
104
|
+
"run_id": 2,
|
|
105
|
+
"scenario": "verified_secure_destructive",
|
|
106
|
+
"control_outcome": "success",
|
|
107
|
+
"iatp_outcome": "allowed",
|
|
108
|
+
"trust_score": 10,
|
|
109
|
+
"latency_ms": 0.024499953724443913,
|
|
110
|
+
"policy_decision": "ALLOW"
|
|
111
|
+
},
|
|
112
|
+
{
|
|
113
|
+
"run_id": 3,
|
|
114
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
115
|
+
"control_outcome": "success",
|
|
116
|
+
"iatp_outcome": "allowed",
|
|
117
|
+
"trust_score": 10,
|
|
118
|
+
"latency_ms": 0.0868999632075429,
|
|
119
|
+
"policy_decision": "ALLOW"
|
|
120
|
+
},
|
|
121
|
+
{
|
|
122
|
+
"run_id": 4,
|
|
123
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
124
|
+
"control_outcome": "success",
|
|
125
|
+
"iatp_outcome": "allowed",
|
|
126
|
+
"trust_score": 10,
|
|
127
|
+
"latency_ms": 0.029099988751113415,
|
|
128
|
+
"policy_decision": "ALLOW"
|
|
129
|
+
},
|
|
130
|
+
{
|
|
131
|
+
"run_id": 5,
|
|
132
|
+
"scenario": "trusted_partial_safe_read",
|
|
133
|
+
"control_outcome": "success",
|
|
134
|
+
"iatp_outcome": "allowed",
|
|
135
|
+
"trust_score": 10,
|
|
136
|
+
"latency_ms": 0.03290001768618822,
|
|
137
|
+
"policy_decision": "ALLOW"
|
|
138
|
+
},
|
|
139
|
+
{
|
|
140
|
+
"run_id": 6,
|
|
141
|
+
"scenario": "trusted_partial_safe_write",
|
|
142
|
+
"control_outcome": "success",
|
|
143
|
+
"iatp_outcome": "allowed",
|
|
144
|
+
"trust_score": 10,
|
|
145
|
+
"latency_ms": 0.02289994154125452,
|
|
146
|
+
"policy_decision": "ALLOW"
|
|
147
|
+
},
|
|
148
|
+
{
|
|
149
|
+
"run_id": 7,
|
|
150
|
+
"scenario": "trusted_partial_destructive",
|
|
151
|
+
"control_outcome": "success",
|
|
152
|
+
"iatp_outcome": "allowed",
|
|
153
|
+
"trust_score": 10,
|
|
154
|
+
"latency_ms": 0.018300022929906845,
|
|
155
|
+
"policy_decision": "ALLOW"
|
|
156
|
+
},
|
|
157
|
+
{
|
|
158
|
+
"run_id": 8,
|
|
159
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
160
|
+
"control_outcome": "success",
|
|
161
|
+
"iatp_outcome": "blocked",
|
|
162
|
+
"trust_score": 10,
|
|
163
|
+
"latency_ms": 0.043199979700148106,
|
|
164
|
+
"policy_decision": "ALLOW"
|
|
165
|
+
},
|
|
166
|
+
{
|
|
167
|
+
"run_id": 9,
|
|
168
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
169
|
+
"control_outcome": "success",
|
|
170
|
+
"iatp_outcome": "allowed",
|
|
171
|
+
"trust_score": 10,
|
|
172
|
+
"latency_ms": 0.026499968953430653,
|
|
173
|
+
"policy_decision": "ALLOW"
|
|
174
|
+
},
|
|
175
|
+
{
|
|
176
|
+
"run_id": 10,
|
|
177
|
+
"scenario": "standard_unknown_safe_read",
|
|
178
|
+
"control_outcome": "failure",
|
|
179
|
+
"iatp_outcome": "warned",
|
|
180
|
+
"trust_score": 1,
|
|
181
|
+
"latency_ms": 0.04099996294826269,
|
|
182
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
183
|
+
},
|
|
184
|
+
{
|
|
185
|
+
"run_id": 11,
|
|
186
|
+
"scenario": "standard_unknown_safe_write",
|
|
187
|
+
"control_outcome": "failure",
|
|
188
|
+
"iatp_outcome": "warned",
|
|
189
|
+
"trust_score": 1,
|
|
190
|
+
"latency_ms": 0.029999995604157448,
|
|
191
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
192
|
+
},
|
|
193
|
+
{
|
|
194
|
+
"run_id": 12,
|
|
195
|
+
"scenario": "standard_unknown_destructive",
|
|
196
|
+
"control_outcome": "failure",
|
|
197
|
+
"iatp_outcome": "warned",
|
|
198
|
+
"trust_score": 1,
|
|
199
|
+
"latency_ms": 0.021000043489038944,
|
|
200
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
201
|
+
},
|
|
202
|
+
{
|
|
203
|
+
"run_id": 13,
|
|
204
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
205
|
+
"control_outcome": "failure",
|
|
206
|
+
"iatp_outcome": "blocked",
|
|
207
|
+
"trust_score": 1,
|
|
208
|
+
"latency_ms": 0.03720005042850971,
|
|
209
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
210
|
+
},
|
|
211
|
+
{
|
|
212
|
+
"run_id": 14,
|
|
213
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
214
|
+
"control_outcome": "failure",
|
|
215
|
+
"iatp_outcome": "warned",
|
|
216
|
+
"trust_score": 1,
|
|
217
|
+
"latency_ms": 0.026600086130201817,
|
|
218
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
219
|
+
},
|
|
220
|
+
{
|
|
221
|
+
"run_id": 15,
|
|
222
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
223
|
+
"control_outcome": "failure",
|
|
224
|
+
"iatp_outcome": "warned",
|
|
225
|
+
"trust_score": 0,
|
|
226
|
+
"latency_ms": 0.026999972760677338,
|
|
227
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
228
|
+
},
|
|
229
|
+
{
|
|
230
|
+
"run_id": 16,
|
|
231
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
232
|
+
"control_outcome": "failure",
|
|
233
|
+
"iatp_outcome": "warned",
|
|
234
|
+
"trust_score": 0,
|
|
235
|
+
"latency_ms": 0.02329994458705187,
|
|
236
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
237
|
+
},
|
|
238
|
+
{
|
|
239
|
+
"run_id": 17,
|
|
240
|
+
"scenario": "untrusted_malicious_destructive",
|
|
241
|
+
"control_outcome": "failure",
|
|
242
|
+
"iatp_outcome": "warned",
|
|
243
|
+
"trust_score": 0,
|
|
244
|
+
"latency_ms": 0.018700025975704193,
|
|
245
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
246
|
+
},
|
|
247
|
+
{
|
|
248
|
+
"run_id": 18,
|
|
249
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
250
|
+
"control_outcome": "failure",
|
|
251
|
+
"iatp_outcome": "blocked",
|
|
252
|
+
"trust_score": 0,
|
|
253
|
+
"latency_ms": 0.03300001844763756,
|
|
254
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
255
|
+
},
|
|
256
|
+
{
|
|
257
|
+
"run_id": 19,
|
|
258
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
259
|
+
"control_outcome": "failure",
|
|
260
|
+
"iatp_outcome": "warned",
|
|
261
|
+
"trust_score": 0,
|
|
262
|
+
"latency_ms": 0.028399983420968056,
|
|
263
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
264
|
+
},
|
|
265
|
+
{
|
|
266
|
+
"run_id": 20,
|
|
267
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
268
|
+
"control_outcome": "success",
|
|
269
|
+
"iatp_outcome": "allowed",
|
|
270
|
+
"trust_score": 7,
|
|
271
|
+
"latency_ms": 0.02259993925690651,
|
|
272
|
+
"policy_decision": "ALLOW"
|
|
273
|
+
},
|
|
274
|
+
{
|
|
275
|
+
"run_id": 21,
|
|
276
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
277
|
+
"control_outcome": "success",
|
|
278
|
+
"iatp_outcome": "allowed",
|
|
279
|
+
"trust_score": 7,
|
|
280
|
+
"latency_ms": 0.02220005262643099,
|
|
281
|
+
"policy_decision": "ALLOW"
|
|
282
|
+
},
|
|
283
|
+
{
|
|
284
|
+
"run_id": 22,
|
|
285
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
286
|
+
"control_outcome": "success",
|
|
287
|
+
"iatp_outcome": "allowed",
|
|
288
|
+
"trust_score": 7,
|
|
289
|
+
"latency_ms": 0.017400016076862812,
|
|
290
|
+
"policy_decision": "ALLOW"
|
|
291
|
+
},
|
|
292
|
+
{
|
|
293
|
+
"run_id": 23,
|
|
294
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
295
|
+
"control_outcome": "success",
|
|
296
|
+
"iatp_outcome": "blocked",
|
|
297
|
+
"trust_score": 7,
|
|
298
|
+
"latency_ms": 0.030800001695752144,
|
|
299
|
+
"policy_decision": "ALLOW"
|
|
300
|
+
},
|
|
301
|
+
{
|
|
302
|
+
"run_id": 24,
|
|
303
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
304
|
+
"control_outcome": "success",
|
|
305
|
+
"iatp_outcome": "allowed",
|
|
306
|
+
"trust_score": 7,
|
|
307
|
+
"latency_ms": 0.024399952962994576,
|
|
308
|
+
"policy_decision": "ALLOW"
|
|
309
|
+
},
|
|
310
|
+
{
|
|
311
|
+
"run_id": 25,
|
|
312
|
+
"scenario": "verified_secure_safe_read",
|
|
313
|
+
"control_outcome": "success",
|
|
314
|
+
"iatp_outcome": "allowed",
|
|
315
|
+
"trust_score": 10,
|
|
316
|
+
"latency_ms": 0.020700041204690933,
|
|
317
|
+
"policy_decision": "ALLOW"
|
|
318
|
+
},
|
|
319
|
+
{
|
|
320
|
+
"run_id": 26,
|
|
321
|
+
"scenario": "verified_secure_safe_write",
|
|
322
|
+
"control_outcome": "success",
|
|
323
|
+
"iatp_outcome": "allowed",
|
|
324
|
+
"trust_score": 10,
|
|
325
|
+
"latency_ms": 0.021699932403862476,
|
|
326
|
+
"policy_decision": "ALLOW"
|
|
327
|
+
},
|
|
328
|
+
{
|
|
329
|
+
"run_id": 27,
|
|
330
|
+
"scenario": "verified_secure_destructive",
|
|
331
|
+
"control_outcome": "success",
|
|
332
|
+
"iatp_outcome": "allowed",
|
|
333
|
+
"trust_score": 10,
|
|
334
|
+
"latency_ms": 0.017700018361210823,
|
|
335
|
+
"policy_decision": "ALLOW"
|
|
336
|
+
},
|
|
337
|
+
{
|
|
338
|
+
"run_id": 28,
|
|
339
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
340
|
+
"control_outcome": "success",
|
|
341
|
+
"iatp_outcome": "allowed",
|
|
342
|
+
"trust_score": 10,
|
|
343
|
+
"latency_ms": 0.031000003218650818,
|
|
344
|
+
"policy_decision": "ALLOW"
|
|
345
|
+
},
|
|
346
|
+
{
|
|
347
|
+
"run_id": 29,
|
|
348
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
349
|
+
"control_outcome": "success",
|
|
350
|
+
"iatp_outcome": "allowed",
|
|
351
|
+
"trust_score": 10,
|
|
352
|
+
"latency_ms": 0.024099950678646564,
|
|
353
|
+
"policy_decision": "ALLOW"
|
|
354
|
+
},
|
|
355
|
+
{
|
|
356
|
+
"run_id": 30,
|
|
357
|
+
"scenario": "trusted_partial_safe_read",
|
|
358
|
+
"control_outcome": "success",
|
|
359
|
+
"iatp_outcome": "allowed",
|
|
360
|
+
"trust_score": 10,
|
|
361
|
+
"latency_ms": 0.02110004425048828,
|
|
362
|
+
"policy_decision": "ALLOW"
|
|
363
|
+
},
|
|
364
|
+
{
|
|
365
|
+
"run_id": 31,
|
|
366
|
+
"scenario": "trusted_partial_safe_write",
|
|
367
|
+
"control_outcome": "success",
|
|
368
|
+
"iatp_outcome": "allowed",
|
|
369
|
+
"trust_score": 10,
|
|
370
|
+
"latency_ms": 0.021400046534836292,
|
|
371
|
+
"policy_decision": "ALLOW"
|
|
372
|
+
},
|
|
373
|
+
{
|
|
374
|
+
"run_id": 32,
|
|
375
|
+
"scenario": "trusted_partial_destructive",
|
|
376
|
+
"control_outcome": "success",
|
|
377
|
+
"iatp_outcome": "allowed",
|
|
378
|
+
"trust_score": 10,
|
|
379
|
+
"latency_ms": 0.018600025214254856,
|
|
380
|
+
"policy_decision": "ALLOW"
|
|
381
|
+
},
|
|
382
|
+
{
|
|
383
|
+
"run_id": 33,
|
|
384
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
385
|
+
"control_outcome": "success",
|
|
386
|
+
"iatp_outcome": "blocked",
|
|
387
|
+
"trust_score": 10,
|
|
388
|
+
"latency_ms": 0.03250001464039087,
|
|
389
|
+
"policy_decision": "ALLOW"
|
|
390
|
+
},
|
|
391
|
+
{
|
|
392
|
+
"run_id": 34,
|
|
393
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
394
|
+
"control_outcome": "success",
|
|
395
|
+
"iatp_outcome": "allowed",
|
|
396
|
+
"trust_score": 10,
|
|
397
|
+
"latency_ms": 0.023400061763823032,
|
|
398
|
+
"policy_decision": "ALLOW"
|
|
399
|
+
},
|
|
400
|
+
{
|
|
401
|
+
"run_id": 35,
|
|
402
|
+
"scenario": "standard_unknown_safe_read",
|
|
403
|
+
"control_outcome": "failure",
|
|
404
|
+
"iatp_outcome": "warned",
|
|
405
|
+
"trust_score": 1,
|
|
406
|
+
"latency_ms": 0.023499946109950542,
|
|
407
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
408
|
+
},
|
|
409
|
+
{
|
|
410
|
+
"run_id": 36,
|
|
411
|
+
"scenario": "standard_unknown_safe_write",
|
|
412
|
+
"control_outcome": "failure",
|
|
413
|
+
"iatp_outcome": "warned",
|
|
414
|
+
"trust_score": 1,
|
|
415
|
+
"latency_ms": 0.02359994687139988,
|
|
416
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
417
|
+
},
|
|
418
|
+
{
|
|
419
|
+
"run_id": 37,
|
|
420
|
+
"scenario": "standard_unknown_destructive",
|
|
421
|
+
"control_outcome": "failure",
|
|
422
|
+
"iatp_outcome": "warned",
|
|
423
|
+
"trust_score": 1,
|
|
424
|
+
"latency_ms": 0.019000028260052204,
|
|
425
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
426
|
+
},
|
|
427
|
+
{
|
|
428
|
+
"run_id": 38,
|
|
429
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
430
|
+
"control_outcome": "failure",
|
|
431
|
+
"iatp_outcome": "blocked",
|
|
432
|
+
"trust_score": 1,
|
|
433
|
+
"latency_ms": 0.031400006264448166,
|
|
434
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
435
|
+
},
|
|
436
|
+
{
|
|
437
|
+
"run_id": 39,
|
|
438
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
439
|
+
"control_outcome": "failure",
|
|
440
|
+
"iatp_outcome": "warned",
|
|
441
|
+
"trust_score": 1,
|
|
442
|
+
"latency_ms": 0.02629996743053198,
|
|
443
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
444
|
+
},
|
|
445
|
+
{
|
|
446
|
+
"run_id": 40,
|
|
447
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
448
|
+
"control_outcome": "failure",
|
|
449
|
+
"iatp_outcome": "warned",
|
|
450
|
+
"trust_score": 0,
|
|
451
|
+
"latency_ms": 0.02189993392676115,
|
|
452
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
453
|
+
},
|
|
454
|
+
{
|
|
455
|
+
"run_id": 41,
|
|
456
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
457
|
+
"control_outcome": "failure",
|
|
458
|
+
"iatp_outcome": "warned",
|
|
459
|
+
"trust_score": 0,
|
|
460
|
+
"latency_ms": 0.02320006024092436,
|
|
461
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
462
|
+
},
|
|
463
|
+
{
|
|
464
|
+
"run_id": 42,
|
|
465
|
+
"scenario": "untrusted_malicious_destructive",
|
|
466
|
+
"control_outcome": "failure",
|
|
467
|
+
"iatp_outcome": "warned",
|
|
468
|
+
"trust_score": 0,
|
|
469
|
+
"latency_ms": 0.018399907276034355,
|
|
470
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
471
|
+
},
|
|
472
|
+
{
|
|
473
|
+
"run_id": 43,
|
|
474
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
475
|
+
"control_outcome": "failure",
|
|
476
|
+
"iatp_outcome": "blocked",
|
|
477
|
+
"trust_score": 0,
|
|
478
|
+
"latency_ms": 0.030700000934302807,
|
|
479
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
480
|
+
},
|
|
481
|
+
{
|
|
482
|
+
"run_id": 44,
|
|
483
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
484
|
+
"control_outcome": "failure",
|
|
485
|
+
"iatp_outcome": "warned",
|
|
486
|
+
"trust_score": 0,
|
|
487
|
+
"latency_ms": 0.024699955247342587,
|
|
488
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
489
|
+
},
|
|
490
|
+
{
|
|
491
|
+
"run_id": 45,
|
|
492
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
493
|
+
"control_outcome": "success",
|
|
494
|
+
"iatp_outcome": "allowed",
|
|
495
|
+
"trust_score": 7,
|
|
496
|
+
"latency_ms": 0.022500054910779,
|
|
497
|
+
"policy_decision": "ALLOW"
|
|
498
|
+
},
|
|
499
|
+
{
|
|
500
|
+
"run_id": 46,
|
|
501
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
502
|
+
"control_outcome": "success",
|
|
503
|
+
"iatp_outcome": "allowed",
|
|
504
|
+
"trust_score": 7,
|
|
505
|
+
"latency_ms": 0.021799933165311813,
|
|
506
|
+
"policy_decision": "ALLOW"
|
|
507
|
+
},
|
|
508
|
+
{
|
|
509
|
+
"run_id": 47,
|
|
510
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
511
|
+
"control_outcome": "success",
|
|
512
|
+
"iatp_outcome": "allowed",
|
|
513
|
+
"trust_score": 7,
|
|
514
|
+
"latency_ms": 0.03890006337314844,
|
|
515
|
+
"policy_decision": "ALLOW"
|
|
516
|
+
},
|
|
517
|
+
{
|
|
518
|
+
"run_id": 48,
|
|
519
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
520
|
+
"control_outcome": "success",
|
|
521
|
+
"iatp_outcome": "blocked",
|
|
522
|
+
"trust_score": 7,
|
|
523
|
+
"latency_ms": 0.031100003980100155,
|
|
524
|
+
"policy_decision": "ALLOW"
|
|
525
|
+
},
|
|
526
|
+
{
|
|
527
|
+
"run_id": 49,
|
|
528
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
529
|
+
"control_outcome": "success",
|
|
530
|
+
"iatp_outcome": "allowed",
|
|
531
|
+
"trust_score": 7,
|
|
532
|
+
"latency_ms": 0.02420006785541773,
|
|
533
|
+
"policy_decision": "ALLOW"
|
|
534
|
+
},
|
|
535
|
+
{
|
|
536
|
+
"run_id": 50,
|
|
537
|
+
"scenario": "verified_secure_safe_read",
|
|
538
|
+
"control_outcome": "success",
|
|
539
|
+
"iatp_outcome": "allowed",
|
|
540
|
+
"trust_score": 10,
|
|
541
|
+
"latency_ms": 0.01950003206729889,
|
|
542
|
+
"policy_decision": "ALLOW"
|
|
543
|
+
},
|
|
544
|
+
{
|
|
545
|
+
"run_id": 51,
|
|
546
|
+
"scenario": "verified_secure_safe_write",
|
|
547
|
+
"control_outcome": "success",
|
|
548
|
+
"iatp_outcome": "allowed",
|
|
549
|
+
"trust_score": 10,
|
|
550
|
+
"latency_ms": 0.021200045011937618,
|
|
551
|
+
"policy_decision": "ALLOW"
|
|
552
|
+
},
|
|
553
|
+
{
|
|
554
|
+
"run_id": 52,
|
|
555
|
+
"scenario": "verified_secure_destructive",
|
|
556
|
+
"control_outcome": "success",
|
|
557
|
+
"iatp_outcome": "allowed",
|
|
558
|
+
"trust_score": 10,
|
|
559
|
+
"latency_ms": 0.016399892047047615,
|
|
560
|
+
"policy_decision": "ALLOW"
|
|
561
|
+
},
|
|
562
|
+
{
|
|
563
|
+
"run_id": 53,
|
|
564
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
565
|
+
"control_outcome": "success",
|
|
566
|
+
"iatp_outcome": "allowed",
|
|
567
|
+
"trust_score": 10,
|
|
568
|
+
"latency_ms": 0.0295999925583601,
|
|
569
|
+
"policy_decision": "ALLOW"
|
|
570
|
+
},
|
|
571
|
+
{
|
|
572
|
+
"run_id": 54,
|
|
573
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
574
|
+
"control_outcome": "success",
|
|
575
|
+
"iatp_outcome": "allowed",
|
|
576
|
+
"trust_score": 10,
|
|
577
|
+
"latency_ms": 0.023700064048171043,
|
|
578
|
+
"policy_decision": "ALLOW"
|
|
579
|
+
},
|
|
580
|
+
{
|
|
581
|
+
"run_id": 55,
|
|
582
|
+
"scenario": "trusted_partial_safe_read",
|
|
583
|
+
"control_outcome": "success",
|
|
584
|
+
"iatp_outcome": "allowed",
|
|
585
|
+
"trust_score": 10,
|
|
586
|
+
"latency_ms": 0.02059992402791977,
|
|
587
|
+
"policy_decision": "ALLOW"
|
|
588
|
+
},
|
|
589
|
+
{
|
|
590
|
+
"run_id": 56,
|
|
591
|
+
"scenario": "trusted_partial_safe_write",
|
|
592
|
+
"control_outcome": "success",
|
|
593
|
+
"iatp_outcome": "allowed",
|
|
594
|
+
"trust_score": 10,
|
|
595
|
+
"latency_ms": 0.021600048057734966,
|
|
596
|
+
"policy_decision": "ALLOW"
|
|
597
|
+
},
|
|
598
|
+
{
|
|
599
|
+
"run_id": 57,
|
|
600
|
+
"scenario": "trusted_partial_destructive",
|
|
601
|
+
"control_outcome": "success",
|
|
602
|
+
"iatp_outcome": "allowed",
|
|
603
|
+
"trust_score": 10,
|
|
604
|
+
"latency_ms": 0.01989991869777441,
|
|
605
|
+
"policy_decision": "ALLOW"
|
|
606
|
+
},
|
|
607
|
+
{
|
|
608
|
+
"run_id": 58,
|
|
609
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
610
|
+
"control_outcome": "success",
|
|
611
|
+
"iatp_outcome": "blocked",
|
|
612
|
+
"trust_score": 10,
|
|
613
|
+
"latency_ms": 0.0295999925583601,
|
|
614
|
+
"policy_decision": "ALLOW"
|
|
615
|
+
},
|
|
616
|
+
{
|
|
617
|
+
"run_id": 59,
|
|
618
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
619
|
+
"control_outcome": "success",
|
|
620
|
+
"iatp_outcome": "allowed",
|
|
621
|
+
"trust_score": 10,
|
|
622
|
+
"latency_ms": 0.024000066332519054,
|
|
623
|
+
"policy_decision": "ALLOW"
|
|
624
|
+
},
|
|
625
|
+
{
|
|
626
|
+
"run_id": 60,
|
|
627
|
+
"scenario": "standard_unknown_safe_read",
|
|
628
|
+
"control_outcome": "failure",
|
|
629
|
+
"iatp_outcome": "warned",
|
|
630
|
+
"trust_score": 1,
|
|
631
|
+
"latency_ms": 0.024700071662664413,
|
|
632
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
633
|
+
},
|
|
634
|
+
{
|
|
635
|
+
"run_id": 61,
|
|
636
|
+
"scenario": "standard_unknown_safe_write",
|
|
637
|
+
"control_outcome": "failure",
|
|
638
|
+
"iatp_outcome": "warned",
|
|
639
|
+
"trust_score": 1,
|
|
640
|
+
"latency_ms": 0.024000066332519054,
|
|
641
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
642
|
+
},
|
|
643
|
+
{
|
|
644
|
+
"run_id": 62,
|
|
645
|
+
"scenario": "standard_unknown_destructive",
|
|
646
|
+
"control_outcome": "failure",
|
|
647
|
+
"iatp_outcome": "warned",
|
|
648
|
+
"trust_score": 1,
|
|
649
|
+
"latency_ms": 0.019099912606179714,
|
|
650
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
651
|
+
},
|
|
652
|
+
{
|
|
653
|
+
"run_id": 63,
|
|
654
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
655
|
+
"control_outcome": "failure",
|
|
656
|
+
"iatp_outcome": "blocked",
|
|
657
|
+
"trust_score": 1,
|
|
658
|
+
"latency_ms": 0.031400006264448166,
|
|
659
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
660
|
+
},
|
|
661
|
+
{
|
|
662
|
+
"run_id": 64,
|
|
663
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
664
|
+
"control_outcome": "failure",
|
|
665
|
+
"iatp_outcome": "warned",
|
|
666
|
+
"trust_score": 1,
|
|
667
|
+
"latency_ms": 0.025499961338937283,
|
|
668
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
669
|
+
},
|
|
670
|
+
{
|
|
671
|
+
"run_id": 65,
|
|
672
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
673
|
+
"control_outcome": "failure",
|
|
674
|
+
"iatp_outcome": "warned",
|
|
675
|
+
"trust_score": 0,
|
|
676
|
+
"latency_ms": 0.021900050342082977,
|
|
677
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
678
|
+
},
|
|
679
|
+
{
|
|
680
|
+
"run_id": 66,
|
|
681
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
682
|
+
"control_outcome": "failure",
|
|
683
|
+
"iatp_outcome": "warned",
|
|
684
|
+
"trust_score": 0,
|
|
685
|
+
"latency_ms": 0.026999972760677338,
|
|
686
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
687
|
+
},
|
|
688
|
+
{
|
|
689
|
+
"run_id": 67,
|
|
690
|
+
"scenario": "untrusted_malicious_destructive",
|
|
691
|
+
"control_outcome": "failure",
|
|
692
|
+
"iatp_outcome": "warned",
|
|
693
|
+
"trust_score": 0,
|
|
694
|
+
"latency_ms": 0.018000020645558834,
|
|
695
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
696
|
+
},
|
|
697
|
+
{
|
|
698
|
+
"run_id": 68,
|
|
699
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
700
|
+
"control_outcome": "failure",
|
|
701
|
+
"iatp_outcome": "blocked",
|
|
702
|
+
"trust_score": 0,
|
|
703
|
+
"latency_ms": 0.030399998649954796,
|
|
704
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
705
|
+
},
|
|
706
|
+
{
|
|
707
|
+
"run_id": 69,
|
|
708
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
709
|
+
"control_outcome": "failure",
|
|
710
|
+
"iatp_outcome": "warned",
|
|
711
|
+
"trust_score": 0,
|
|
712
|
+
"latency_ms": 0.02680008765310049,
|
|
713
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
714
|
+
},
|
|
715
|
+
{
|
|
716
|
+
"run_id": 70,
|
|
717
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
718
|
+
"control_outcome": "success",
|
|
719
|
+
"iatp_outcome": "allowed",
|
|
720
|
+
"trust_score": 7,
|
|
721
|
+
"latency_ms": 0.020300038158893585,
|
|
722
|
+
"policy_decision": "ALLOW"
|
|
723
|
+
},
|
|
724
|
+
{
|
|
725
|
+
"run_id": 71,
|
|
726
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
727
|
+
"control_outcome": "success",
|
|
728
|
+
"iatp_outcome": "allowed",
|
|
729
|
+
"trust_score": 7,
|
|
730
|
+
"latency_ms": 0.02110004425048828,
|
|
731
|
+
"policy_decision": "ALLOW"
|
|
732
|
+
},
|
|
733
|
+
{
|
|
734
|
+
"run_id": 72,
|
|
735
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
736
|
+
"control_outcome": "success",
|
|
737
|
+
"iatp_outcome": "allowed",
|
|
738
|
+
"trust_score": 7,
|
|
739
|
+
"latency_ms": 0.016999896615743637,
|
|
740
|
+
"policy_decision": "ALLOW"
|
|
741
|
+
},
|
|
742
|
+
{
|
|
743
|
+
"run_id": 73,
|
|
744
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
745
|
+
"control_outcome": "success",
|
|
746
|
+
"iatp_outcome": "blocked",
|
|
747
|
+
"trust_score": 7,
|
|
748
|
+
"latency_ms": 0.028699985705316067,
|
|
749
|
+
"policy_decision": "ALLOW"
|
|
750
|
+
},
|
|
751
|
+
{
|
|
752
|
+
"run_id": 74,
|
|
753
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
754
|
+
"control_outcome": "success",
|
|
755
|
+
"iatp_outcome": "allowed",
|
|
756
|
+
"trust_score": 7,
|
|
757
|
+
"latency_ms": 0.023000058718025684,
|
|
758
|
+
"policy_decision": "ALLOW"
|
|
759
|
+
},
|
|
760
|
+
{
|
|
761
|
+
"run_id": 75,
|
|
762
|
+
"scenario": "verified_secure_safe_read",
|
|
763
|
+
"control_outcome": "success",
|
|
764
|
+
"iatp_outcome": "allowed",
|
|
765
|
+
"trust_score": 10,
|
|
766
|
+
"latency_ms": 0.0195999164134264,
|
|
767
|
+
"policy_decision": "ALLOW"
|
|
768
|
+
},
|
|
769
|
+
{
|
|
770
|
+
"run_id": 76,
|
|
771
|
+
"scenario": "verified_secure_safe_write",
|
|
772
|
+
"control_outcome": "success",
|
|
773
|
+
"iatp_outcome": "allowed",
|
|
774
|
+
"trust_score": 10,
|
|
775
|
+
"latency_ms": 0.021000043489038944,
|
|
776
|
+
"policy_decision": "ALLOW"
|
|
777
|
+
},
|
|
778
|
+
{
|
|
779
|
+
"run_id": 77,
|
|
780
|
+
"scenario": "verified_secure_destructive",
|
|
781
|
+
"control_outcome": "success",
|
|
782
|
+
"iatp_outcome": "allowed",
|
|
783
|
+
"trust_score": 10,
|
|
784
|
+
"latency_ms": 0.0168998958542943,
|
|
785
|
+
"policy_decision": "ALLOW"
|
|
786
|
+
},
|
|
787
|
+
{
|
|
788
|
+
"run_id": 78,
|
|
789
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
790
|
+
"control_outcome": "success",
|
|
791
|
+
"iatp_outcome": "allowed",
|
|
792
|
+
"trust_score": 10,
|
|
793
|
+
"latency_ms": 0.02819998189806938,
|
|
794
|
+
"policy_decision": "ALLOW"
|
|
795
|
+
},
|
|
796
|
+
{
|
|
797
|
+
"run_id": 79,
|
|
798
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
799
|
+
"control_outcome": "success",
|
|
800
|
+
"iatp_outcome": "allowed",
|
|
801
|
+
"trust_score": 10,
|
|
802
|
+
"latency_ms": 0.02320006024092436,
|
|
803
|
+
"policy_decision": "ALLOW"
|
|
804
|
+
},
|
|
805
|
+
{
|
|
806
|
+
"run_id": 80,
|
|
807
|
+
"scenario": "trusted_partial_safe_read",
|
|
808
|
+
"control_outcome": "success",
|
|
809
|
+
"iatp_outcome": "allowed",
|
|
810
|
+
"trust_score": 10,
|
|
811
|
+
"latency_ms": 0.02089992631226778,
|
|
812
|
+
"policy_decision": "ALLOW"
|
|
813
|
+
},
|
|
814
|
+
{
|
|
815
|
+
"run_id": 81,
|
|
816
|
+
"scenario": "trusted_partial_safe_write",
|
|
817
|
+
"control_outcome": "success",
|
|
818
|
+
"iatp_outcome": "allowed",
|
|
819
|
+
"trust_score": 10,
|
|
820
|
+
"latency_ms": 0.021400046534836292,
|
|
821
|
+
"policy_decision": "ALLOW"
|
|
822
|
+
},
|
|
823
|
+
{
|
|
824
|
+
"run_id": 82,
|
|
825
|
+
"scenario": "trusted_partial_destructive",
|
|
826
|
+
"control_outcome": "success",
|
|
827
|
+
"iatp_outcome": "allowed",
|
|
828
|
+
"trust_score": 10,
|
|
829
|
+
"latency_ms": 0.018499908037483692,
|
|
830
|
+
"policy_decision": "ALLOW"
|
|
831
|
+
},
|
|
832
|
+
{
|
|
833
|
+
"run_id": 83,
|
|
834
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
835
|
+
"control_outcome": "success",
|
|
836
|
+
"iatp_outcome": "blocked",
|
|
837
|
+
"trust_score": 10,
|
|
838
|
+
"latency_ms": 0.0295999925583601,
|
|
839
|
+
"policy_decision": "ALLOW"
|
|
840
|
+
},
|
|
841
|
+
{
|
|
842
|
+
"run_id": 84,
|
|
843
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
844
|
+
"control_outcome": "success",
|
|
845
|
+
"iatp_outcome": "allowed",
|
|
846
|
+
"trust_score": 10,
|
|
847
|
+
"latency_ms": 0.023400061763823032,
|
|
848
|
+
"policy_decision": "ALLOW"
|
|
849
|
+
},
|
|
850
|
+
{
|
|
851
|
+
"run_id": 85,
|
|
852
|
+
"scenario": "standard_unknown_safe_read",
|
|
853
|
+
"control_outcome": "failure",
|
|
854
|
+
"iatp_outcome": "warned",
|
|
855
|
+
"trust_score": 1,
|
|
856
|
+
"latency_ms": 0.022999942302703857,
|
|
857
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
858
|
+
},
|
|
859
|
+
{
|
|
860
|
+
"run_id": 86,
|
|
861
|
+
"scenario": "standard_unknown_safe_write",
|
|
862
|
+
"control_outcome": "failure",
|
|
863
|
+
"iatp_outcome": "warned",
|
|
864
|
+
"trust_score": 1,
|
|
865
|
+
"latency_ms": 0.023099943064153194,
|
|
866
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
867
|
+
},
|
|
868
|
+
{
|
|
869
|
+
"run_id": 87,
|
|
870
|
+
"scenario": "standard_unknown_destructive",
|
|
871
|
+
"control_outcome": "failure",
|
|
872
|
+
"iatp_outcome": "warned",
|
|
873
|
+
"trust_score": 1,
|
|
874
|
+
"latency_ms": 0.019300030544400215,
|
|
875
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
876
|
+
},
|
|
877
|
+
{
|
|
878
|
+
"run_id": 88,
|
|
879
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
880
|
+
"control_outcome": "failure",
|
|
881
|
+
"iatp_outcome": "blocked",
|
|
882
|
+
"trust_score": 1,
|
|
883
|
+
"latency_ms": 0.03029999788850546,
|
|
884
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
885
|
+
},
|
|
886
|
+
{
|
|
887
|
+
"run_id": 89,
|
|
888
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
889
|
+
"control_outcome": "failure",
|
|
890
|
+
"iatp_outcome": "warned",
|
|
891
|
+
"trust_score": 1,
|
|
892
|
+
"latency_ms": 0.025499961338937283,
|
|
893
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
894
|
+
},
|
|
895
|
+
{
|
|
896
|
+
"run_id": 90,
|
|
897
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
898
|
+
"control_outcome": "failure",
|
|
899
|
+
"iatp_outcome": "warned",
|
|
900
|
+
"trust_score": 0,
|
|
901
|
+
"latency_ms": 0.021499930880963802,
|
|
902
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
903
|
+
},
|
|
904
|
+
{
|
|
905
|
+
"run_id": 91,
|
|
906
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
907
|
+
"control_outcome": "failure",
|
|
908
|
+
"iatp_outcome": "warned",
|
|
909
|
+
"trust_score": 0,
|
|
910
|
+
"latency_ms": 0.02280005719512701,
|
|
911
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
912
|
+
},
|
|
913
|
+
{
|
|
914
|
+
"run_id": 92,
|
|
915
|
+
"scenario": "untrusted_malicious_destructive",
|
|
916
|
+
"control_outcome": "failure",
|
|
917
|
+
"iatp_outcome": "warned",
|
|
918
|
+
"trust_score": 0,
|
|
919
|
+
"latency_ms": 0.021399930119514465,
|
|
920
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
921
|
+
},
|
|
922
|
+
{
|
|
923
|
+
"run_id": 93,
|
|
924
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
925
|
+
"control_outcome": "failure",
|
|
926
|
+
"iatp_outcome": "blocked",
|
|
927
|
+
"trust_score": 0,
|
|
928
|
+
"latency_ms": 0.030800001695752144,
|
|
929
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
930
|
+
},
|
|
931
|
+
{
|
|
932
|
+
"run_id": 94,
|
|
933
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
934
|
+
"control_outcome": "failure",
|
|
935
|
+
"iatp_outcome": "warned",
|
|
936
|
+
"trust_score": 0,
|
|
937
|
+
"latency_ms": 0.025799963623285294,
|
|
938
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
939
|
+
},
|
|
940
|
+
{
|
|
941
|
+
"run_id": 95,
|
|
942
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
943
|
+
"control_outcome": "success",
|
|
944
|
+
"iatp_outcome": "allowed",
|
|
945
|
+
"trust_score": 7,
|
|
946
|
+
"latency_ms": 0.02080004196614027,
|
|
947
|
+
"policy_decision": "ALLOW"
|
|
948
|
+
},
|
|
949
|
+
{
|
|
950
|
+
"run_id": 96,
|
|
951
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
952
|
+
"control_outcome": "success",
|
|
953
|
+
"iatp_outcome": "allowed",
|
|
954
|
+
"trust_score": 7,
|
|
955
|
+
"latency_ms": 0.021099927835166454,
|
|
956
|
+
"policy_decision": "ALLOW"
|
|
957
|
+
},
|
|
958
|
+
{
|
|
959
|
+
"run_id": 97,
|
|
960
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
961
|
+
"control_outcome": "success",
|
|
962
|
+
"iatp_outcome": "allowed",
|
|
963
|
+
"trust_score": 7,
|
|
964
|
+
"latency_ms": 0.0171000137925148,
|
|
965
|
+
"policy_decision": "ALLOW"
|
|
966
|
+
},
|
|
967
|
+
{
|
|
968
|
+
"run_id": 98,
|
|
969
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
970
|
+
"control_outcome": "success",
|
|
971
|
+
"iatp_outcome": "blocked",
|
|
972
|
+
"trust_score": 7,
|
|
973
|
+
"latency_ms": 0.031400006264448166,
|
|
974
|
+
"policy_decision": "ALLOW"
|
|
975
|
+
},
|
|
976
|
+
{
|
|
977
|
+
"run_id": 99,
|
|
978
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
979
|
+
"control_outcome": "success",
|
|
980
|
+
"iatp_outcome": "allowed",
|
|
981
|
+
"trust_score": 7,
|
|
982
|
+
"latency_ms": 0.023699947632849216,
|
|
983
|
+
"policy_decision": "ALLOW"
|
|
984
|
+
},
|
|
985
|
+
{
|
|
986
|
+
"run_id": 100,
|
|
987
|
+
"scenario": "verified_secure_safe_read",
|
|
988
|
+
"control_outcome": "success",
|
|
989
|
+
"iatp_outcome": "allowed",
|
|
990
|
+
"trust_score": 10,
|
|
991
|
+
"latency_ms": 0.019200029782950878,
|
|
992
|
+
"policy_decision": "ALLOW"
|
|
993
|
+
},
|
|
994
|
+
{
|
|
995
|
+
"run_id": 101,
|
|
996
|
+
"scenario": "verified_secure_safe_write",
|
|
997
|
+
"control_outcome": "success",
|
|
998
|
+
"iatp_outcome": "allowed",
|
|
999
|
+
"trust_score": 10,
|
|
1000
|
+
"latency_ms": 0.02089992631226778,
|
|
1001
|
+
"policy_decision": "ALLOW"
|
|
1002
|
+
},
|
|
1003
|
+
{
|
|
1004
|
+
"run_id": 102,
|
|
1005
|
+
"scenario": "verified_secure_destructive",
|
|
1006
|
+
"control_outcome": "success",
|
|
1007
|
+
"iatp_outcome": "allowed",
|
|
1008
|
+
"trust_score": 10,
|
|
1009
|
+
"latency_ms": 0.01650000922381878,
|
|
1010
|
+
"policy_decision": "ALLOW"
|
|
1011
|
+
},
|
|
1012
|
+
{
|
|
1013
|
+
"run_id": 103,
|
|
1014
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
1015
|
+
"control_outcome": "success",
|
|
1016
|
+
"iatp_outcome": "allowed",
|
|
1017
|
+
"trust_score": 10,
|
|
1018
|
+
"latency_ms": 0.028699985705316067,
|
|
1019
|
+
"policy_decision": "ALLOW"
|
|
1020
|
+
},
|
|
1021
|
+
{
|
|
1022
|
+
"run_id": 104,
|
|
1023
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
1024
|
+
"control_outcome": "success",
|
|
1025
|
+
"iatp_outcome": "allowed",
|
|
1026
|
+
"trust_score": 10,
|
|
1027
|
+
"latency_ms": 0.022699940018355846,
|
|
1028
|
+
"policy_decision": "ALLOW"
|
|
1029
|
+
},
|
|
1030
|
+
{
|
|
1031
|
+
"run_id": 105,
|
|
1032
|
+
"scenario": "trusted_partial_safe_read",
|
|
1033
|
+
"control_outcome": "success",
|
|
1034
|
+
"iatp_outcome": "allowed",
|
|
1035
|
+
"trust_score": 10,
|
|
1036
|
+
"latency_ms": 0.020200037397444248,
|
|
1037
|
+
"policy_decision": "ALLOW"
|
|
1038
|
+
},
|
|
1039
|
+
{
|
|
1040
|
+
"run_id": 106,
|
|
1041
|
+
"scenario": "trusted_partial_safe_write",
|
|
1042
|
+
"control_outcome": "success",
|
|
1043
|
+
"iatp_outcome": "allowed",
|
|
1044
|
+
"trust_score": 10,
|
|
1045
|
+
"latency_ms": 0.022699940018355846,
|
|
1046
|
+
"policy_decision": "ALLOW"
|
|
1047
|
+
},
|
|
1048
|
+
{
|
|
1049
|
+
"run_id": 107,
|
|
1050
|
+
"scenario": "trusted_partial_destructive",
|
|
1051
|
+
"control_outcome": "success",
|
|
1052
|
+
"iatp_outcome": "allowed",
|
|
1053
|
+
"trust_score": 10,
|
|
1054
|
+
"latency_ms": 0.016700010746717453,
|
|
1055
|
+
"policy_decision": "ALLOW"
|
|
1056
|
+
},
|
|
1057
|
+
{
|
|
1058
|
+
"run_id": 108,
|
|
1059
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
1060
|
+
"control_outcome": "success",
|
|
1061
|
+
"iatp_outcome": "blocked",
|
|
1062
|
+
"trust_score": 10,
|
|
1063
|
+
"latency_ms": 0.028999987989664078,
|
|
1064
|
+
"policy_decision": "ALLOW"
|
|
1065
|
+
},
|
|
1066
|
+
{
|
|
1067
|
+
"run_id": 109,
|
|
1068
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
1069
|
+
"control_outcome": "success",
|
|
1070
|
+
"iatp_outcome": "allowed",
|
|
1071
|
+
"trust_score": 10,
|
|
1072
|
+
"latency_ms": 0.0241999514400959,
|
|
1073
|
+
"policy_decision": "ALLOW"
|
|
1074
|
+
},
|
|
1075
|
+
{
|
|
1076
|
+
"run_id": 110,
|
|
1077
|
+
"scenario": "standard_unknown_safe_read",
|
|
1078
|
+
"control_outcome": "failure",
|
|
1079
|
+
"iatp_outcome": "warned",
|
|
1080
|
+
"trust_score": 1,
|
|
1081
|
+
"latency_ms": 0.02219993621110916,
|
|
1082
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1083
|
+
},
|
|
1084
|
+
{
|
|
1085
|
+
"run_id": 111,
|
|
1086
|
+
"scenario": "standard_unknown_safe_write",
|
|
1087
|
+
"control_outcome": "failure",
|
|
1088
|
+
"iatp_outcome": "warned",
|
|
1089
|
+
"trust_score": 1,
|
|
1090
|
+
"latency_ms": 0.024000066332519054,
|
|
1091
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1092
|
+
},
|
|
1093
|
+
{
|
|
1094
|
+
"run_id": 112,
|
|
1095
|
+
"scenario": "standard_unknown_destructive",
|
|
1096
|
+
"control_outcome": "failure",
|
|
1097
|
+
"iatp_outcome": "warned",
|
|
1098
|
+
"trust_score": 1,
|
|
1099
|
+
"latency_ms": 0.018799910321831703,
|
|
1100
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1101
|
+
},
|
|
1102
|
+
{
|
|
1103
|
+
"run_id": 113,
|
|
1104
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
1105
|
+
"control_outcome": "failure",
|
|
1106
|
+
"iatp_outcome": "blocked",
|
|
1107
|
+
"trust_score": 1,
|
|
1108
|
+
"latency_ms": 0.03060000017285347,
|
|
1109
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1110
|
+
},
|
|
1111
|
+
{
|
|
1112
|
+
"run_id": 114,
|
|
1113
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
1114
|
+
"control_outcome": "failure",
|
|
1115
|
+
"iatp_outcome": "warned",
|
|
1116
|
+
"trust_score": 1,
|
|
1117
|
+
"latency_ms": 0.024799956008791924,
|
|
1118
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1119
|
+
},
|
|
1120
|
+
{
|
|
1121
|
+
"run_id": 115,
|
|
1122
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
1123
|
+
"control_outcome": "failure",
|
|
1124
|
+
"iatp_outcome": "warned",
|
|
1125
|
+
"trust_score": 0,
|
|
1126
|
+
"latency_ms": 0.021600048057734966,
|
|
1127
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1128
|
+
},
|
|
1129
|
+
{
|
|
1130
|
+
"run_id": 116,
|
|
1131
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
1132
|
+
"control_outcome": "failure",
|
|
1133
|
+
"iatp_outcome": "warned",
|
|
1134
|
+
"trust_score": 0,
|
|
1135
|
+
"latency_ms": 0.022099935449659824,
|
|
1136
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1137
|
+
},
|
|
1138
|
+
{
|
|
1139
|
+
"run_id": 117,
|
|
1140
|
+
"scenario": "untrusted_malicious_destructive",
|
|
1141
|
+
"control_outcome": "failure",
|
|
1142
|
+
"iatp_outcome": "warned",
|
|
1143
|
+
"trust_score": 0,
|
|
1144
|
+
"latency_ms": 0.01910002902150154,
|
|
1145
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1146
|
+
},
|
|
1147
|
+
{
|
|
1148
|
+
"run_id": 118,
|
|
1149
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
1150
|
+
"control_outcome": "failure",
|
|
1151
|
+
"iatp_outcome": "blocked",
|
|
1152
|
+
"trust_score": 0,
|
|
1153
|
+
"latency_ms": 0.03090000245720148,
|
|
1154
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1155
|
+
},
|
|
1156
|
+
{
|
|
1157
|
+
"run_id": 119,
|
|
1158
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
1159
|
+
"control_outcome": "failure",
|
|
1160
|
+
"iatp_outcome": "warned",
|
|
1161
|
+
"trust_score": 0,
|
|
1162
|
+
"latency_ms": 0.029699993319809437,
|
|
1163
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1164
|
+
},
|
|
1165
|
+
{
|
|
1166
|
+
"run_id": 120,
|
|
1167
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
1168
|
+
"control_outcome": "success",
|
|
1169
|
+
"iatp_outcome": "allowed",
|
|
1170
|
+
"trust_score": 7,
|
|
1171
|
+
"latency_ms": 0.021000043489038944,
|
|
1172
|
+
"policy_decision": "ALLOW"
|
|
1173
|
+
},
|
|
1174
|
+
{
|
|
1175
|
+
"run_id": 121,
|
|
1176
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
1177
|
+
"control_outcome": "success",
|
|
1178
|
+
"iatp_outcome": "allowed",
|
|
1179
|
+
"trust_score": 7,
|
|
1180
|
+
"latency_ms": 0.021499930880963802,
|
|
1181
|
+
"policy_decision": "ALLOW"
|
|
1182
|
+
},
|
|
1183
|
+
{
|
|
1184
|
+
"run_id": 122,
|
|
1185
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
1186
|
+
"control_outcome": "success",
|
|
1187
|
+
"iatp_outcome": "allowed",
|
|
1188
|
+
"trust_score": 7,
|
|
1189
|
+
"latency_ms": 0.01650000922381878,
|
|
1190
|
+
"policy_decision": "ALLOW"
|
|
1191
|
+
},
|
|
1192
|
+
{
|
|
1193
|
+
"run_id": 123,
|
|
1194
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
1195
|
+
"control_outcome": "success",
|
|
1196
|
+
"iatp_outcome": "blocked",
|
|
1197
|
+
"trust_score": 7,
|
|
1198
|
+
"latency_ms": 0.0295999925583601,
|
|
1199
|
+
"policy_decision": "ALLOW"
|
|
1200
|
+
},
|
|
1201
|
+
{
|
|
1202
|
+
"run_id": 124,
|
|
1203
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
1204
|
+
"control_outcome": "success",
|
|
1205
|
+
"iatp_outcome": "allowed",
|
|
1206
|
+
"trust_score": 7,
|
|
1207
|
+
"latency_ms": 0.023300061002373695,
|
|
1208
|
+
"policy_decision": "ALLOW"
|
|
1209
|
+
},
|
|
1210
|
+
{
|
|
1211
|
+
"run_id": 125,
|
|
1212
|
+
"scenario": "verified_secure_safe_read",
|
|
1213
|
+
"control_outcome": "success",
|
|
1214
|
+
"iatp_outcome": "allowed",
|
|
1215
|
+
"trust_score": 10,
|
|
1216
|
+
"latency_ms": 0.03170000854879618,
|
|
1217
|
+
"policy_decision": "ALLOW"
|
|
1218
|
+
},
|
|
1219
|
+
{
|
|
1220
|
+
"run_id": 126,
|
|
1221
|
+
"scenario": "verified_secure_safe_write",
|
|
1222
|
+
"control_outcome": "success",
|
|
1223
|
+
"iatp_outcome": "allowed",
|
|
1224
|
+
"trust_score": 10,
|
|
1225
|
+
"latency_ms": 0.022000051103532314,
|
|
1226
|
+
"policy_decision": "ALLOW"
|
|
1227
|
+
},
|
|
1228
|
+
{
|
|
1229
|
+
"run_id": 127,
|
|
1230
|
+
"scenario": "verified_secure_destructive",
|
|
1231
|
+
"control_outcome": "success",
|
|
1232
|
+
"iatp_outcome": "allowed",
|
|
1233
|
+
"trust_score": 10,
|
|
1234
|
+
"latency_ms": 0.01650000922381878,
|
|
1235
|
+
"policy_decision": "ALLOW"
|
|
1236
|
+
},
|
|
1237
|
+
{
|
|
1238
|
+
"run_id": 128,
|
|
1239
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
1240
|
+
"control_outcome": "success",
|
|
1241
|
+
"iatp_outcome": "allowed",
|
|
1242
|
+
"trust_score": 10,
|
|
1243
|
+
"latency_ms": 0.034800032153725624,
|
|
1244
|
+
"policy_decision": "ALLOW"
|
|
1245
|
+
},
|
|
1246
|
+
{
|
|
1247
|
+
"run_id": 129,
|
|
1248
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
1249
|
+
"control_outcome": "success",
|
|
1250
|
+
"iatp_outcome": "allowed",
|
|
1251
|
+
"trust_score": 10,
|
|
1252
|
+
"latency_ms": 0.02319994382560253,
|
|
1253
|
+
"policy_decision": "ALLOW"
|
|
1254
|
+
},
|
|
1255
|
+
{
|
|
1256
|
+
"run_id": 130,
|
|
1257
|
+
"scenario": "trusted_partial_safe_read",
|
|
1258
|
+
"control_outcome": "success",
|
|
1259
|
+
"iatp_outcome": "allowed",
|
|
1260
|
+
"trust_score": 10,
|
|
1261
|
+
"latency_ms": 0.019300030544400215,
|
|
1262
|
+
"policy_decision": "ALLOW"
|
|
1263
|
+
},
|
|
1264
|
+
{
|
|
1265
|
+
"run_id": 131,
|
|
1266
|
+
"scenario": "trusted_partial_safe_write",
|
|
1267
|
+
"control_outcome": "success",
|
|
1268
|
+
"iatp_outcome": "allowed",
|
|
1269
|
+
"trust_score": 10,
|
|
1270
|
+
"latency_ms": 0.021499930880963802,
|
|
1271
|
+
"policy_decision": "ALLOW"
|
|
1272
|
+
},
|
|
1273
|
+
{
|
|
1274
|
+
"run_id": 132,
|
|
1275
|
+
"scenario": "trusted_partial_destructive",
|
|
1276
|
+
"control_outcome": "success",
|
|
1277
|
+
"iatp_outcome": "allowed",
|
|
1278
|
+
"trust_score": 10,
|
|
1279
|
+
"latency_ms": 0.015700003132224083,
|
|
1280
|
+
"policy_decision": "ALLOW"
|
|
1281
|
+
},
|
|
1282
|
+
{
|
|
1283
|
+
"run_id": 133,
|
|
1284
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
1285
|
+
"control_outcome": "success",
|
|
1286
|
+
"iatp_outcome": "blocked",
|
|
1287
|
+
"trust_score": 10,
|
|
1288
|
+
"latency_ms": 0.02829998265951872,
|
|
1289
|
+
"policy_decision": "ALLOW"
|
|
1290
|
+
},
|
|
1291
|
+
{
|
|
1292
|
+
"run_id": 134,
|
|
1293
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
1294
|
+
"control_outcome": "success",
|
|
1295
|
+
"iatp_outcome": "allowed",
|
|
1296
|
+
"trust_score": 10,
|
|
1297
|
+
"latency_ms": 0.02210005186498165,
|
|
1298
|
+
"policy_decision": "ALLOW"
|
|
1299
|
+
},
|
|
1300
|
+
{
|
|
1301
|
+
"run_id": 135,
|
|
1302
|
+
"scenario": "standard_unknown_safe_read",
|
|
1303
|
+
"control_outcome": "failure",
|
|
1304
|
+
"iatp_outcome": "warned",
|
|
1305
|
+
"trust_score": 1,
|
|
1306
|
+
"latency_ms": 0.022799940779805183,
|
|
1307
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1308
|
+
},
|
|
1309
|
+
{
|
|
1310
|
+
"run_id": 136,
|
|
1311
|
+
"scenario": "standard_unknown_safe_write",
|
|
1312
|
+
"control_outcome": "failure",
|
|
1313
|
+
"iatp_outcome": "warned",
|
|
1314
|
+
"trust_score": 1,
|
|
1315
|
+
"latency_ms": 0.022400054149329662,
|
|
1316
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1317
|
+
},
|
|
1318
|
+
{
|
|
1319
|
+
"run_id": 137,
|
|
1320
|
+
"scenario": "standard_unknown_destructive",
|
|
1321
|
+
"control_outcome": "failure",
|
|
1322
|
+
"iatp_outcome": "warned",
|
|
1323
|
+
"trust_score": 1,
|
|
1324
|
+
"latency_ms": 0.01780001912266016,
|
|
1325
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1326
|
+
},
|
|
1327
|
+
{
|
|
1328
|
+
"run_id": 138,
|
|
1329
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
1330
|
+
"control_outcome": "failure",
|
|
1331
|
+
"iatp_outcome": "blocked",
|
|
1332
|
+
"trust_score": 1,
|
|
1333
|
+
"latency_ms": 0.029199989512562752,
|
|
1334
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1335
|
+
},
|
|
1336
|
+
{
|
|
1337
|
+
"run_id": 139,
|
|
1338
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
1339
|
+
"control_outcome": "failure",
|
|
1340
|
+
"iatp_outcome": "warned",
|
|
1341
|
+
"trust_score": 1,
|
|
1342
|
+
"latency_ms": 0.023999949917197227,
|
|
1343
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1344
|
+
},
|
|
1345
|
+
{
|
|
1346
|
+
"run_id": 140,
|
|
1347
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
1348
|
+
"control_outcome": "failure",
|
|
1349
|
+
"iatp_outcome": "warned",
|
|
1350
|
+
"trust_score": 0,
|
|
1351
|
+
"latency_ms": 0.02010003663599491,
|
|
1352
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1353
|
+
},
|
|
1354
|
+
{
|
|
1355
|
+
"run_id": 141,
|
|
1356
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
1357
|
+
"control_outcome": "failure",
|
|
1358
|
+
"iatp_outcome": "warned",
|
|
1359
|
+
"trust_score": 0,
|
|
1360
|
+
"latency_ms": 0.02189993392676115,
|
|
1361
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1362
|
+
},
|
|
1363
|
+
{
|
|
1364
|
+
"run_id": 142,
|
|
1365
|
+
"scenario": "untrusted_malicious_destructive",
|
|
1366
|
+
"control_outcome": "failure",
|
|
1367
|
+
"iatp_outcome": "warned",
|
|
1368
|
+
"trust_score": 0,
|
|
1369
|
+
"latency_ms": 0.017300015315413475,
|
|
1370
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1371
|
+
},
|
|
1372
|
+
{
|
|
1373
|
+
"run_id": 143,
|
|
1374
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
1375
|
+
"control_outcome": "failure",
|
|
1376
|
+
"iatp_outcome": "blocked",
|
|
1377
|
+
"trust_score": 0,
|
|
1378
|
+
"latency_ms": 0.029799994081258774,
|
|
1379
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1380
|
+
},
|
|
1381
|
+
{
|
|
1382
|
+
"run_id": 144,
|
|
1383
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
1384
|
+
"control_outcome": "failure",
|
|
1385
|
+
"iatp_outcome": "warned",
|
|
1386
|
+
"trust_score": 0,
|
|
1387
|
+
"latency_ms": 0.02289994154125452,
|
|
1388
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1389
|
+
},
|
|
1390
|
+
{
|
|
1391
|
+
"run_id": 145,
|
|
1392
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
1393
|
+
"control_outcome": "success",
|
|
1394
|
+
"iatp_outcome": "allowed",
|
|
1395
|
+
"trust_score": 7,
|
|
1396
|
+
"latency_ms": 0.01910002902150154,
|
|
1397
|
+
"policy_decision": "ALLOW"
|
|
1398
|
+
},
|
|
1399
|
+
{
|
|
1400
|
+
"run_id": 146,
|
|
1401
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
1402
|
+
"control_outcome": "success",
|
|
1403
|
+
"iatp_outcome": "allowed",
|
|
1404
|
+
"trust_score": 7,
|
|
1405
|
+
"latency_ms": 0.020200037397444248,
|
|
1406
|
+
"policy_decision": "ALLOW"
|
|
1407
|
+
},
|
|
1408
|
+
{
|
|
1409
|
+
"run_id": 147,
|
|
1410
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
1411
|
+
"control_outcome": "success",
|
|
1412
|
+
"iatp_outcome": "allowed",
|
|
1413
|
+
"trust_score": 7,
|
|
1414
|
+
"latency_ms": 0.015900004655122757,
|
|
1415
|
+
"policy_decision": "ALLOW"
|
|
1416
|
+
},
|
|
1417
|
+
{
|
|
1418
|
+
"run_id": 148,
|
|
1419
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
1420
|
+
"control_outcome": "success",
|
|
1421
|
+
"iatp_outcome": "blocked",
|
|
1422
|
+
"trust_score": 7,
|
|
1423
|
+
"latency_ms": 0.026600086130201817,
|
|
1424
|
+
"policy_decision": "ALLOW"
|
|
1425
|
+
},
|
|
1426
|
+
{
|
|
1427
|
+
"run_id": 149,
|
|
1428
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
1429
|
+
"control_outcome": "success",
|
|
1430
|
+
"iatp_outcome": "allowed",
|
|
1431
|
+
"trust_score": 7,
|
|
1432
|
+
"latency_ms": 0.02280005719512701,
|
|
1433
|
+
"policy_decision": "ALLOW"
|
|
1434
|
+
},
|
|
1435
|
+
{
|
|
1436
|
+
"run_id": 150,
|
|
1437
|
+
"scenario": "verified_secure_safe_read",
|
|
1438
|
+
"control_outcome": "success",
|
|
1439
|
+
"iatp_outcome": "allowed",
|
|
1440
|
+
"trust_score": 10,
|
|
1441
|
+
"latency_ms": 0.018499908037483692,
|
|
1442
|
+
"policy_decision": "ALLOW"
|
|
1443
|
+
},
|
|
1444
|
+
{
|
|
1445
|
+
"run_id": 151,
|
|
1446
|
+
"scenario": "verified_secure_safe_write",
|
|
1447
|
+
"control_outcome": "success",
|
|
1448
|
+
"iatp_outcome": "allowed",
|
|
1449
|
+
"trust_score": 10,
|
|
1450
|
+
"latency_ms": 0.01950003206729889,
|
|
1451
|
+
"policy_decision": "ALLOW"
|
|
1452
|
+
},
|
|
1453
|
+
{
|
|
1454
|
+
"run_id": 152,
|
|
1455
|
+
"scenario": "verified_secure_destructive",
|
|
1456
|
+
"control_outcome": "success",
|
|
1457
|
+
"iatp_outcome": "allowed",
|
|
1458
|
+
"trust_score": 10,
|
|
1459
|
+
"latency_ms": 0.015500001609325409,
|
|
1460
|
+
"policy_decision": "ALLOW"
|
|
1461
|
+
},
|
|
1462
|
+
{
|
|
1463
|
+
"run_id": 153,
|
|
1464
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
1465
|
+
"control_outcome": "success",
|
|
1466
|
+
"iatp_outcome": "allowed",
|
|
1467
|
+
"trust_score": 10,
|
|
1468
|
+
"latency_ms": 0.026699970476329327,
|
|
1469
|
+
"policy_decision": "ALLOW"
|
|
1470
|
+
},
|
|
1471
|
+
{
|
|
1472
|
+
"run_id": 154,
|
|
1473
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
1474
|
+
"control_outcome": "success",
|
|
1475
|
+
"iatp_outcome": "allowed",
|
|
1476
|
+
"trust_score": 10,
|
|
1477
|
+
"latency_ms": 0.021300045773386955,
|
|
1478
|
+
"policy_decision": "ALLOW"
|
|
1479
|
+
},
|
|
1480
|
+
{
|
|
1481
|
+
"run_id": 155,
|
|
1482
|
+
"scenario": "trusted_partial_safe_read",
|
|
1483
|
+
"control_outcome": "success",
|
|
1484
|
+
"iatp_outcome": "allowed",
|
|
1485
|
+
"trust_score": 10,
|
|
1486
|
+
"latency_ms": 0.02080004196614027,
|
|
1487
|
+
"policy_decision": "ALLOW"
|
|
1488
|
+
},
|
|
1489
|
+
{
|
|
1490
|
+
"run_id": 156,
|
|
1491
|
+
"scenario": "trusted_partial_safe_write",
|
|
1492
|
+
"control_outcome": "success",
|
|
1493
|
+
"iatp_outcome": "allowed",
|
|
1494
|
+
"trust_score": 10,
|
|
1495
|
+
"latency_ms": 0.019900035113096237,
|
|
1496
|
+
"policy_decision": "ALLOW"
|
|
1497
|
+
},
|
|
1498
|
+
{
|
|
1499
|
+
"run_id": 157,
|
|
1500
|
+
"scenario": "trusted_partial_destructive",
|
|
1501
|
+
"control_outcome": "success",
|
|
1502
|
+
"iatp_outcome": "allowed",
|
|
1503
|
+
"trust_score": 10,
|
|
1504
|
+
"latency_ms": 0.016900012269616127,
|
|
1505
|
+
"policy_decision": "ALLOW"
|
|
1506
|
+
},
|
|
1507
|
+
{
|
|
1508
|
+
"run_id": 158,
|
|
1509
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
1510
|
+
"control_outcome": "success",
|
|
1511
|
+
"iatp_outcome": "blocked",
|
|
1512
|
+
"trust_score": 10,
|
|
1513
|
+
"latency_ms": 0.02720009069889784,
|
|
1514
|
+
"policy_decision": "ALLOW"
|
|
1515
|
+
},
|
|
1516
|
+
{
|
|
1517
|
+
"run_id": 159,
|
|
1518
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
1519
|
+
"control_outcome": "success",
|
|
1520
|
+
"iatp_outcome": "allowed",
|
|
1521
|
+
"trust_score": 10,
|
|
1522
|
+
"latency_ms": 0.022399937734007835,
|
|
1523
|
+
"policy_decision": "ALLOW"
|
|
1524
|
+
},
|
|
1525
|
+
{
|
|
1526
|
+
"run_id": 160,
|
|
1527
|
+
"scenario": "standard_unknown_safe_read",
|
|
1528
|
+
"control_outcome": "failure",
|
|
1529
|
+
"iatp_outcome": "warned",
|
|
1530
|
+
"trust_score": 1,
|
|
1531
|
+
"latency_ms": 0.021400046534836292,
|
|
1532
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1533
|
+
},
|
|
1534
|
+
{
|
|
1535
|
+
"run_id": 161,
|
|
1536
|
+
"scenario": "standard_unknown_safe_write",
|
|
1537
|
+
"control_outcome": "failure",
|
|
1538
|
+
"iatp_outcome": "warned",
|
|
1539
|
+
"trust_score": 1,
|
|
1540
|
+
"latency_ms": 0.02450007013976574,
|
|
1541
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1542
|
+
},
|
|
1543
|
+
{
|
|
1544
|
+
"run_id": 162,
|
|
1545
|
+
"scenario": "standard_unknown_destructive",
|
|
1546
|
+
"control_outcome": "failure",
|
|
1547
|
+
"iatp_outcome": "warned",
|
|
1548
|
+
"trust_score": 1,
|
|
1549
|
+
"latency_ms": 0.017600017599761486,
|
|
1550
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1551
|
+
},
|
|
1552
|
+
{
|
|
1553
|
+
"run_id": 163,
|
|
1554
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
1555
|
+
"control_outcome": "failure",
|
|
1556
|
+
"iatp_outcome": "blocked",
|
|
1557
|
+
"trust_score": 1,
|
|
1558
|
+
"latency_ms": 0.028700102120637894,
|
|
1559
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1560
|
+
},
|
|
1561
|
+
{
|
|
1562
|
+
"run_id": 164,
|
|
1563
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
1564
|
+
"control_outcome": "failure",
|
|
1565
|
+
"iatp_outcome": "warned",
|
|
1566
|
+
"trust_score": 1,
|
|
1567
|
+
"latency_ms": 0.024000066332519054,
|
|
1568
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1569
|
+
},
|
|
1570
|
+
{
|
|
1571
|
+
"run_id": 165,
|
|
1572
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
1573
|
+
"control_outcome": "failure",
|
|
1574
|
+
"iatp_outcome": "warned",
|
|
1575
|
+
"trust_score": 0,
|
|
1576
|
+
"latency_ms": 0.020699924789369106,
|
|
1577
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1578
|
+
},
|
|
1579
|
+
{
|
|
1580
|
+
"run_id": 166,
|
|
1581
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
1582
|
+
"control_outcome": "failure",
|
|
1583
|
+
"iatp_outcome": "warned",
|
|
1584
|
+
"trust_score": 0,
|
|
1585
|
+
"latency_ms": 0.02110004425048828,
|
|
1586
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1587
|
+
},
|
|
1588
|
+
{
|
|
1589
|
+
"run_id": 167,
|
|
1590
|
+
"scenario": "untrusted_malicious_destructive",
|
|
1591
|
+
"control_outcome": "failure",
|
|
1592
|
+
"iatp_outcome": "warned",
|
|
1593
|
+
"trust_score": 0,
|
|
1594
|
+
"latency_ms": 0.017200014553964138,
|
|
1595
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1596
|
+
},
|
|
1597
|
+
{
|
|
1598
|
+
"run_id": 168,
|
|
1599
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
1600
|
+
"control_outcome": "failure",
|
|
1601
|
+
"iatp_outcome": "blocked",
|
|
1602
|
+
"trust_score": 0,
|
|
1603
|
+
"latency_ms": 0.03790005575865507,
|
|
1604
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1605
|
+
},
|
|
1606
|
+
{
|
|
1607
|
+
"run_id": 169,
|
|
1608
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
1609
|
+
"control_outcome": "failure",
|
|
1610
|
+
"iatp_outcome": "warned",
|
|
1611
|
+
"trust_score": 0,
|
|
1612
|
+
"latency_ms": 0.023499946109950542,
|
|
1613
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1614
|
+
},
|
|
1615
|
+
{
|
|
1616
|
+
"run_id": 170,
|
|
1617
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
1618
|
+
"control_outcome": "success",
|
|
1619
|
+
"iatp_outcome": "allowed",
|
|
1620
|
+
"trust_score": 7,
|
|
1621
|
+
"latency_ms": 0.01950003206729889,
|
|
1622
|
+
"policy_decision": "ALLOW"
|
|
1623
|
+
},
|
|
1624
|
+
{
|
|
1625
|
+
"run_id": 171,
|
|
1626
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
1627
|
+
"control_outcome": "success",
|
|
1628
|
+
"iatp_outcome": "allowed",
|
|
1629
|
+
"trust_score": 7,
|
|
1630
|
+
"latency_ms": 0.02019992098212242,
|
|
1631
|
+
"policy_decision": "ALLOW"
|
|
1632
|
+
},
|
|
1633
|
+
{
|
|
1634
|
+
"run_id": 172,
|
|
1635
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
1636
|
+
"control_outcome": "success",
|
|
1637
|
+
"iatp_outcome": "allowed",
|
|
1638
|
+
"trust_score": 7,
|
|
1639
|
+
"latency_ms": 0.016300007700920105,
|
|
1640
|
+
"policy_decision": "ALLOW"
|
|
1641
|
+
},
|
|
1642
|
+
{
|
|
1643
|
+
"run_id": 173,
|
|
1644
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
1645
|
+
"control_outcome": "success",
|
|
1646
|
+
"iatp_outcome": "blocked",
|
|
1647
|
+
"trust_score": 7,
|
|
1648
|
+
"latency_ms": 0.027699978090822697,
|
|
1649
|
+
"policy_decision": "ALLOW"
|
|
1650
|
+
},
|
|
1651
|
+
{
|
|
1652
|
+
"run_id": 174,
|
|
1653
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
1654
|
+
"control_outcome": "success",
|
|
1655
|
+
"iatp_outcome": "allowed",
|
|
1656
|
+
"trust_score": 7,
|
|
1657
|
+
"latency_ms": 0.022300053387880325,
|
|
1658
|
+
"policy_decision": "ALLOW"
|
|
1659
|
+
},
|
|
1660
|
+
{
|
|
1661
|
+
"run_id": 175,
|
|
1662
|
+
"scenario": "verified_secure_safe_read",
|
|
1663
|
+
"control_outcome": "success",
|
|
1664
|
+
"iatp_outcome": "allowed",
|
|
1665
|
+
"trust_score": 10,
|
|
1666
|
+
"latency_ms": 0.01880002673715353,
|
|
1667
|
+
"policy_decision": "ALLOW"
|
|
1668
|
+
},
|
|
1669
|
+
{
|
|
1670
|
+
"run_id": 176,
|
|
1671
|
+
"scenario": "verified_secure_safe_write",
|
|
1672
|
+
"control_outcome": "success",
|
|
1673
|
+
"iatp_outcome": "allowed",
|
|
1674
|
+
"trust_score": 10,
|
|
1675
|
+
"latency_ms": 0.019300030544400215,
|
|
1676
|
+
"policy_decision": "ALLOW"
|
|
1677
|
+
},
|
|
1678
|
+
{
|
|
1679
|
+
"run_id": 177,
|
|
1680
|
+
"scenario": "verified_secure_destructive",
|
|
1681
|
+
"control_outcome": "success",
|
|
1682
|
+
"iatp_outcome": "allowed",
|
|
1683
|
+
"trust_score": 10,
|
|
1684
|
+
"latency_ms": 0.015900004655122757,
|
|
1685
|
+
"policy_decision": "ALLOW"
|
|
1686
|
+
},
|
|
1687
|
+
{
|
|
1688
|
+
"run_id": 178,
|
|
1689
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
1690
|
+
"control_outcome": "success",
|
|
1691
|
+
"iatp_outcome": "allowed",
|
|
1692
|
+
"trust_score": 10,
|
|
1693
|
+
"latency_ms": 0.02720009069889784,
|
|
1694
|
+
"policy_decision": "ALLOW"
|
|
1695
|
+
},
|
|
1696
|
+
{
|
|
1697
|
+
"run_id": 179,
|
|
1698
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
1699
|
+
"control_outcome": "success",
|
|
1700
|
+
"iatp_outcome": "allowed",
|
|
1701
|
+
"trust_score": 10,
|
|
1702
|
+
"latency_ms": 0.02189993392676115,
|
|
1703
|
+
"policy_decision": "ALLOW"
|
|
1704
|
+
},
|
|
1705
|
+
{
|
|
1706
|
+
"run_id": 180,
|
|
1707
|
+
"scenario": "trusted_partial_safe_read",
|
|
1708
|
+
"control_outcome": "success",
|
|
1709
|
+
"iatp_outcome": "allowed",
|
|
1710
|
+
"trust_score": 10,
|
|
1711
|
+
"latency_ms": 0.02050003968179226,
|
|
1712
|
+
"policy_decision": "ALLOW"
|
|
1713
|
+
},
|
|
1714
|
+
{
|
|
1715
|
+
"run_id": 181,
|
|
1716
|
+
"scenario": "trusted_partial_safe_write",
|
|
1717
|
+
"control_outcome": "success",
|
|
1718
|
+
"iatp_outcome": "allowed",
|
|
1719
|
+
"trust_score": 10,
|
|
1720
|
+
"latency_ms": 0.020099920220673084,
|
|
1721
|
+
"policy_decision": "ALLOW"
|
|
1722
|
+
},
|
|
1723
|
+
{
|
|
1724
|
+
"run_id": 182,
|
|
1725
|
+
"scenario": "trusted_partial_destructive",
|
|
1726
|
+
"control_outcome": "success",
|
|
1727
|
+
"iatp_outcome": "allowed",
|
|
1728
|
+
"trust_score": 10,
|
|
1729
|
+
"latency_ms": 0.015900004655122757,
|
|
1730
|
+
"policy_decision": "ALLOW"
|
|
1731
|
+
},
|
|
1732
|
+
{
|
|
1733
|
+
"run_id": 183,
|
|
1734
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
1735
|
+
"control_outcome": "success",
|
|
1736
|
+
"iatp_outcome": "blocked",
|
|
1737
|
+
"trust_score": 10,
|
|
1738
|
+
"latency_ms": 0.026899971999228,
|
|
1739
|
+
"policy_decision": "ALLOW"
|
|
1740
|
+
},
|
|
1741
|
+
{
|
|
1742
|
+
"run_id": 184,
|
|
1743
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
1744
|
+
"control_outcome": "success",
|
|
1745
|
+
"iatp_outcome": "allowed",
|
|
1746
|
+
"trust_score": 10,
|
|
1747
|
+
"latency_ms": 0.021900050342082977,
|
|
1748
|
+
"policy_decision": "ALLOW"
|
|
1749
|
+
},
|
|
1750
|
+
{
|
|
1751
|
+
"run_id": 185,
|
|
1752
|
+
"scenario": "standard_unknown_safe_read",
|
|
1753
|
+
"control_outcome": "failure",
|
|
1754
|
+
"iatp_outcome": "warned",
|
|
1755
|
+
"trust_score": 1,
|
|
1756
|
+
"latency_ms": 0.021099927835166454,
|
|
1757
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1758
|
+
},
|
|
1759
|
+
{
|
|
1760
|
+
"run_id": 186,
|
|
1761
|
+
"scenario": "standard_unknown_safe_write",
|
|
1762
|
+
"control_outcome": "failure",
|
|
1763
|
+
"iatp_outcome": "warned",
|
|
1764
|
+
"trust_score": 1,
|
|
1765
|
+
"latency_ms": 0.02210005186498165,
|
|
1766
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1767
|
+
},
|
|
1768
|
+
{
|
|
1769
|
+
"run_id": 187,
|
|
1770
|
+
"scenario": "standard_unknown_destructive",
|
|
1771
|
+
"control_outcome": "failure",
|
|
1772
|
+
"iatp_outcome": "warned",
|
|
1773
|
+
"trust_score": 1,
|
|
1774
|
+
"latency_ms": 0.01780001912266016,
|
|
1775
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1776
|
+
},
|
|
1777
|
+
{
|
|
1778
|
+
"run_id": 188,
|
|
1779
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
1780
|
+
"control_outcome": "failure",
|
|
1781
|
+
"iatp_outcome": "blocked",
|
|
1782
|
+
"trust_score": 1,
|
|
1783
|
+
"latency_ms": 0.031100003980100155,
|
|
1784
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1785
|
+
},
|
|
1786
|
+
{
|
|
1787
|
+
"run_id": 189,
|
|
1788
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
1789
|
+
"control_outcome": "failure",
|
|
1790
|
+
"iatp_outcome": "warned",
|
|
1791
|
+
"trust_score": 1,
|
|
1792
|
+
"latency_ms": 0.023799948394298553,
|
|
1793
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1794
|
+
},
|
|
1795
|
+
{
|
|
1796
|
+
"run_id": 190,
|
|
1797
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
1798
|
+
"control_outcome": "failure",
|
|
1799
|
+
"iatp_outcome": "warned",
|
|
1800
|
+
"trust_score": 0,
|
|
1801
|
+
"latency_ms": 0.019900035113096237,
|
|
1802
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1803
|
+
},
|
|
1804
|
+
{
|
|
1805
|
+
"run_id": 191,
|
|
1806
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
1807
|
+
"control_outcome": "failure",
|
|
1808
|
+
"iatp_outcome": "warned",
|
|
1809
|
+
"trust_score": 0,
|
|
1810
|
+
"latency_ms": 0.02159993164241314,
|
|
1811
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1812
|
+
},
|
|
1813
|
+
{
|
|
1814
|
+
"run_id": 192,
|
|
1815
|
+
"scenario": "untrusted_malicious_destructive",
|
|
1816
|
+
"control_outcome": "failure",
|
|
1817
|
+
"iatp_outcome": "warned",
|
|
1818
|
+
"trust_score": 0,
|
|
1819
|
+
"latency_ms": 0.018400023691356182,
|
|
1820
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1821
|
+
},
|
|
1822
|
+
{
|
|
1823
|
+
"run_id": 193,
|
|
1824
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
1825
|
+
"control_outcome": "failure",
|
|
1826
|
+
"iatp_outcome": "blocked",
|
|
1827
|
+
"trust_score": 0,
|
|
1828
|
+
"latency_ms": 0.031200004741549492,
|
|
1829
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1830
|
+
},
|
|
1831
|
+
{
|
|
1832
|
+
"run_id": 194,
|
|
1833
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
1834
|
+
"control_outcome": "failure",
|
|
1835
|
+
"iatp_outcome": "warned",
|
|
1836
|
+
"trust_score": 0,
|
|
1837
|
+
"latency_ms": 0.023099943064153194,
|
|
1838
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
1839
|
+
},
|
|
1840
|
+
{
|
|
1841
|
+
"run_id": 195,
|
|
1842
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
1843
|
+
"control_outcome": "success",
|
|
1844
|
+
"iatp_outcome": "allowed",
|
|
1845
|
+
"trust_score": 7,
|
|
1846
|
+
"latency_ms": 0.019700033590197563,
|
|
1847
|
+
"policy_decision": "ALLOW"
|
|
1848
|
+
},
|
|
1849
|
+
{
|
|
1850
|
+
"run_id": 196,
|
|
1851
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
1852
|
+
"control_outcome": "success",
|
|
1853
|
+
"iatp_outcome": "allowed",
|
|
1854
|
+
"trust_score": 7,
|
|
1855
|
+
"latency_ms": 0.019900035113096237,
|
|
1856
|
+
"policy_decision": "ALLOW"
|
|
1857
|
+
},
|
|
1858
|
+
{
|
|
1859
|
+
"run_id": 197,
|
|
1860
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
1861
|
+
"control_outcome": "success",
|
|
1862
|
+
"iatp_outcome": "allowed",
|
|
1863
|
+
"trust_score": 7,
|
|
1864
|
+
"latency_ms": 0.01580000389367342,
|
|
1865
|
+
"policy_decision": "ALLOW"
|
|
1866
|
+
},
|
|
1867
|
+
{
|
|
1868
|
+
"run_id": 198,
|
|
1869
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
1870
|
+
"control_outcome": "success",
|
|
1871
|
+
"iatp_outcome": "blocked",
|
|
1872
|
+
"trust_score": 7,
|
|
1873
|
+
"latency_ms": 0.026600086130201817,
|
|
1874
|
+
"policy_decision": "ALLOW"
|
|
1875
|
+
},
|
|
1876
|
+
{
|
|
1877
|
+
"run_id": 199,
|
|
1878
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
1879
|
+
"control_outcome": "success",
|
|
1880
|
+
"iatp_outcome": "allowed",
|
|
1881
|
+
"trust_score": 7,
|
|
1882
|
+
"latency_ms": 0.02180004958063364,
|
|
1883
|
+
"policy_decision": "ALLOW"
|
|
1884
|
+
},
|
|
1885
|
+
{
|
|
1886
|
+
"run_id": 200,
|
|
1887
|
+
"scenario": "verified_secure_safe_read",
|
|
1888
|
+
"control_outcome": "success",
|
|
1889
|
+
"iatp_outcome": "allowed",
|
|
1890
|
+
"trust_score": 10,
|
|
1891
|
+
"latency_ms": 0.018400023691356182,
|
|
1892
|
+
"policy_decision": "ALLOW"
|
|
1893
|
+
},
|
|
1894
|
+
{
|
|
1895
|
+
"run_id": 201,
|
|
1896
|
+
"scenario": "verified_secure_safe_write",
|
|
1897
|
+
"control_outcome": "success",
|
|
1898
|
+
"iatp_outcome": "allowed",
|
|
1899
|
+
"trust_score": 10,
|
|
1900
|
+
"latency_ms": 0.019900035113096237,
|
|
1901
|
+
"policy_decision": "ALLOW"
|
|
1902
|
+
},
|
|
1903
|
+
{
|
|
1904
|
+
"run_id": 202,
|
|
1905
|
+
"scenario": "verified_secure_destructive",
|
|
1906
|
+
"control_outcome": "success",
|
|
1907
|
+
"iatp_outcome": "allowed",
|
|
1908
|
+
"trust_score": 10,
|
|
1909
|
+
"latency_ms": 0.015400000847876072,
|
|
1910
|
+
"policy_decision": "ALLOW"
|
|
1911
|
+
},
|
|
1912
|
+
{
|
|
1913
|
+
"run_id": 203,
|
|
1914
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
1915
|
+
"control_outcome": "success",
|
|
1916
|
+
"iatp_outcome": "allowed",
|
|
1917
|
+
"trust_score": 10,
|
|
1918
|
+
"latency_ms": 0.026999972760677338,
|
|
1919
|
+
"policy_decision": "ALLOW"
|
|
1920
|
+
},
|
|
1921
|
+
{
|
|
1922
|
+
"run_id": 204,
|
|
1923
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
1924
|
+
"control_outcome": "success",
|
|
1925
|
+
"iatp_outcome": "allowed",
|
|
1926
|
+
"trust_score": 10,
|
|
1927
|
+
"latency_ms": 0.02150004729628563,
|
|
1928
|
+
"policy_decision": "ALLOW"
|
|
1929
|
+
},
|
|
1930
|
+
{
|
|
1931
|
+
"run_id": 205,
|
|
1932
|
+
"scenario": "trusted_partial_safe_read",
|
|
1933
|
+
"control_outcome": "success",
|
|
1934
|
+
"iatp_outcome": "allowed",
|
|
1935
|
+
"trust_score": 10,
|
|
1936
|
+
"latency_ms": 0.020400038920342922,
|
|
1937
|
+
"policy_decision": "ALLOW"
|
|
1938
|
+
},
|
|
1939
|
+
{
|
|
1940
|
+
"run_id": 206,
|
|
1941
|
+
"scenario": "trusted_partial_safe_write",
|
|
1942
|
+
"control_outcome": "success",
|
|
1943
|
+
"iatp_outcome": "allowed",
|
|
1944
|
+
"trust_score": 10,
|
|
1945
|
+
"latency_ms": 0.020200037397444248,
|
|
1946
|
+
"policy_decision": "ALLOW"
|
|
1947
|
+
},
|
|
1948
|
+
{
|
|
1949
|
+
"run_id": 207,
|
|
1950
|
+
"scenario": "trusted_partial_destructive",
|
|
1951
|
+
"control_outcome": "success",
|
|
1952
|
+
"iatp_outcome": "allowed",
|
|
1953
|
+
"trust_score": 10,
|
|
1954
|
+
"latency_ms": 0.01619989052414894,
|
|
1955
|
+
"policy_decision": "ALLOW"
|
|
1956
|
+
},
|
|
1957
|
+
{
|
|
1958
|
+
"run_id": 208,
|
|
1959
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
1960
|
+
"control_outcome": "success",
|
|
1961
|
+
"iatp_outcome": "blocked",
|
|
1962
|
+
"trust_score": 10,
|
|
1963
|
+
"latency_ms": 0.02750009298324585,
|
|
1964
|
+
"policy_decision": "ALLOW"
|
|
1965
|
+
},
|
|
1966
|
+
{
|
|
1967
|
+
"run_id": 209,
|
|
1968
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
1969
|
+
"control_outcome": "success",
|
|
1970
|
+
"iatp_outcome": "allowed",
|
|
1971
|
+
"trust_score": 10,
|
|
1972
|
+
"latency_ms": 0.03370002377778292,
|
|
1973
|
+
"policy_decision": "ALLOW"
|
|
1974
|
+
},
|
|
1975
|
+
{
|
|
1976
|
+
"run_id": 210,
|
|
1977
|
+
"scenario": "standard_unknown_safe_read",
|
|
1978
|
+
"control_outcome": "failure",
|
|
1979
|
+
"iatp_outcome": "warned",
|
|
1980
|
+
"trust_score": 1,
|
|
1981
|
+
"latency_ms": 0.021300045773386955,
|
|
1982
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1983
|
+
},
|
|
1984
|
+
{
|
|
1985
|
+
"run_id": 211,
|
|
1986
|
+
"scenario": "standard_unknown_safe_write",
|
|
1987
|
+
"control_outcome": "failure",
|
|
1988
|
+
"iatp_outcome": "warned",
|
|
1989
|
+
"trust_score": 1,
|
|
1990
|
+
"latency_ms": 0.020999927073717117,
|
|
1991
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
1992
|
+
},
|
|
1993
|
+
{
|
|
1994
|
+
"run_id": 212,
|
|
1995
|
+
"scenario": "standard_unknown_destructive",
|
|
1996
|
+
"control_outcome": "failure",
|
|
1997
|
+
"iatp_outcome": "warned",
|
|
1998
|
+
"trust_score": 1,
|
|
1999
|
+
"latency_ms": 0.0171000137925148,
|
|
2000
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2001
|
+
},
|
|
2002
|
+
{
|
|
2003
|
+
"run_id": 213,
|
|
2004
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
2005
|
+
"control_outcome": "failure",
|
|
2006
|
+
"iatp_outcome": "blocked",
|
|
2007
|
+
"trust_score": 1,
|
|
2008
|
+
"latency_ms": 0.02859998494386673,
|
|
2009
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2010
|
+
},
|
|
2011
|
+
{
|
|
2012
|
+
"run_id": 214,
|
|
2013
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
2014
|
+
"control_outcome": "failure",
|
|
2015
|
+
"iatp_outcome": "warned",
|
|
2016
|
+
"trust_score": 1,
|
|
2017
|
+
"latency_ms": 0.022699940018355846,
|
|
2018
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2019
|
+
},
|
|
2020
|
+
{
|
|
2021
|
+
"run_id": 215,
|
|
2022
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
2023
|
+
"control_outcome": "failure",
|
|
2024
|
+
"iatp_outcome": "warned",
|
|
2025
|
+
"trust_score": 0,
|
|
2026
|
+
"latency_ms": 0.01950003206729889,
|
|
2027
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2028
|
+
},
|
|
2029
|
+
{
|
|
2030
|
+
"run_id": 216,
|
|
2031
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
2032
|
+
"control_outcome": "failure",
|
|
2033
|
+
"iatp_outcome": "warned",
|
|
2034
|
+
"trust_score": 0,
|
|
2035
|
+
"latency_ms": 0.020399922505021095,
|
|
2036
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2037
|
+
},
|
|
2038
|
+
{
|
|
2039
|
+
"run_id": 217,
|
|
2040
|
+
"scenario": "untrusted_malicious_destructive",
|
|
2041
|
+
"control_outcome": "failure",
|
|
2042
|
+
"iatp_outcome": "warned",
|
|
2043
|
+
"trust_score": 0,
|
|
2044
|
+
"latency_ms": 0.01780001912266016,
|
|
2045
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2046
|
+
},
|
|
2047
|
+
{
|
|
2048
|
+
"run_id": 218,
|
|
2049
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
2050
|
+
"control_outcome": "failure",
|
|
2051
|
+
"iatp_outcome": "blocked",
|
|
2052
|
+
"trust_score": 0,
|
|
2053
|
+
"latency_ms": 0.026799971237778664,
|
|
2054
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2055
|
+
},
|
|
2056
|
+
{
|
|
2057
|
+
"run_id": 219,
|
|
2058
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
2059
|
+
"control_outcome": "failure",
|
|
2060
|
+
"iatp_outcome": "warned",
|
|
2061
|
+
"trust_score": 0,
|
|
2062
|
+
"latency_ms": 0.0241999514400959,
|
|
2063
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2064
|
+
},
|
|
2065
|
+
{
|
|
2066
|
+
"run_id": 220,
|
|
2067
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
2068
|
+
"control_outcome": "success",
|
|
2069
|
+
"iatp_outcome": "allowed",
|
|
2070
|
+
"trust_score": 7,
|
|
2071
|
+
"latency_ms": 0.017700018361210823,
|
|
2072
|
+
"policy_decision": "ALLOW"
|
|
2073
|
+
},
|
|
2074
|
+
{
|
|
2075
|
+
"run_id": 221,
|
|
2076
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
2077
|
+
"control_outcome": "success",
|
|
2078
|
+
"iatp_outcome": "allowed",
|
|
2079
|
+
"trust_score": 7,
|
|
2080
|
+
"latency_ms": 0.01950003206729889,
|
|
2081
|
+
"policy_decision": "ALLOW"
|
|
2082
|
+
},
|
|
2083
|
+
{
|
|
2084
|
+
"run_id": 222,
|
|
2085
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
2086
|
+
"control_outcome": "success",
|
|
2087
|
+
"iatp_outcome": "allowed",
|
|
2088
|
+
"trust_score": 7,
|
|
2089
|
+
"latency_ms": 0.014499993994832039,
|
|
2090
|
+
"policy_decision": "ALLOW"
|
|
2091
|
+
},
|
|
2092
|
+
{
|
|
2093
|
+
"run_id": 223,
|
|
2094
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
2095
|
+
"control_outcome": "success",
|
|
2096
|
+
"iatp_outcome": "blocked",
|
|
2097
|
+
"trust_score": 7,
|
|
2098
|
+
"latency_ms": 0.026899971999228,
|
|
2099
|
+
"policy_decision": "ALLOW"
|
|
2100
|
+
},
|
|
2101
|
+
{
|
|
2102
|
+
"run_id": 224,
|
|
2103
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
2104
|
+
"control_outcome": "success",
|
|
2105
|
+
"iatp_outcome": "allowed",
|
|
2106
|
+
"trust_score": 7,
|
|
2107
|
+
"latency_ms": 0.021099927835166454,
|
|
2108
|
+
"policy_decision": "ALLOW"
|
|
2109
|
+
},
|
|
2110
|
+
{
|
|
2111
|
+
"run_id": 225,
|
|
2112
|
+
"scenario": "verified_secure_safe_read",
|
|
2113
|
+
"control_outcome": "success",
|
|
2114
|
+
"iatp_outcome": "allowed",
|
|
2115
|
+
"trust_score": 10,
|
|
2116
|
+
"latency_ms": 0.01780001912266016,
|
|
2117
|
+
"policy_decision": "ALLOW"
|
|
2118
|
+
},
|
|
2119
|
+
{
|
|
2120
|
+
"run_id": 226,
|
|
2121
|
+
"scenario": "verified_secure_safe_write",
|
|
2122
|
+
"control_outcome": "success",
|
|
2123
|
+
"iatp_outcome": "allowed",
|
|
2124
|
+
"trust_score": 10,
|
|
2125
|
+
"latency_ms": 0.018200022168457508,
|
|
2126
|
+
"policy_decision": "ALLOW"
|
|
2127
|
+
},
|
|
2128
|
+
{
|
|
2129
|
+
"run_id": 227,
|
|
2130
|
+
"scenario": "verified_secure_destructive",
|
|
2131
|
+
"control_outcome": "success",
|
|
2132
|
+
"iatp_outcome": "allowed",
|
|
2133
|
+
"trust_score": 10,
|
|
2134
|
+
"latency_ms": 0.014199991710484028,
|
|
2135
|
+
"policy_decision": "ALLOW"
|
|
2136
|
+
},
|
|
2137
|
+
{
|
|
2138
|
+
"run_id": 228,
|
|
2139
|
+
"scenario": "verified_secure_sensitive_pii",
|
|
2140
|
+
"control_outcome": "success",
|
|
2141
|
+
"iatp_outcome": "allowed",
|
|
2142
|
+
"trust_score": 10,
|
|
2143
|
+
"latency_ms": 0.028000096790492535,
|
|
2144
|
+
"policy_decision": "ALLOW"
|
|
2145
|
+
},
|
|
2146
|
+
{
|
|
2147
|
+
"run_id": 229,
|
|
2148
|
+
"scenario": "verified_secure_poisoned_injection",
|
|
2149
|
+
"control_outcome": "success",
|
|
2150
|
+
"iatp_outcome": "allowed",
|
|
2151
|
+
"trust_score": 10,
|
|
2152
|
+
"latency_ms": 0.02189993392676115,
|
|
2153
|
+
"policy_decision": "ALLOW"
|
|
2154
|
+
},
|
|
2155
|
+
{
|
|
2156
|
+
"run_id": 230,
|
|
2157
|
+
"scenario": "trusted_partial_safe_read",
|
|
2158
|
+
"control_outcome": "success",
|
|
2159
|
+
"iatp_outcome": "allowed",
|
|
2160
|
+
"trust_score": 10,
|
|
2161
|
+
"latency_ms": 0.018000020645558834,
|
|
2162
|
+
"policy_decision": "ALLOW"
|
|
2163
|
+
},
|
|
2164
|
+
{
|
|
2165
|
+
"run_id": 231,
|
|
2166
|
+
"scenario": "trusted_partial_safe_write",
|
|
2167
|
+
"control_outcome": "success",
|
|
2168
|
+
"iatp_outcome": "allowed",
|
|
2169
|
+
"trust_score": 10,
|
|
2170
|
+
"latency_ms": 0.019299914129078388,
|
|
2171
|
+
"policy_decision": "ALLOW"
|
|
2172
|
+
},
|
|
2173
|
+
{
|
|
2174
|
+
"run_id": 232,
|
|
2175
|
+
"scenario": "trusted_partial_destructive",
|
|
2176
|
+
"control_outcome": "success",
|
|
2177
|
+
"iatp_outcome": "allowed",
|
|
2178
|
+
"trust_score": 10,
|
|
2179
|
+
"latency_ms": 0.014999997802078724,
|
|
2180
|
+
"policy_decision": "ALLOW"
|
|
2181
|
+
},
|
|
2182
|
+
{
|
|
2183
|
+
"run_id": 233,
|
|
2184
|
+
"scenario": "trusted_partial_sensitive_pii",
|
|
2185
|
+
"control_outcome": "success",
|
|
2186
|
+
"iatp_outcome": "blocked",
|
|
2187
|
+
"trust_score": 10,
|
|
2188
|
+
"latency_ms": 0.026099965907633305,
|
|
2189
|
+
"policy_decision": "ALLOW"
|
|
2190
|
+
},
|
|
2191
|
+
{
|
|
2192
|
+
"run_id": 234,
|
|
2193
|
+
"scenario": "trusted_partial_poisoned_injection",
|
|
2194
|
+
"control_outcome": "success",
|
|
2195
|
+
"iatp_outcome": "allowed",
|
|
2196
|
+
"trust_score": 10,
|
|
2197
|
+
"latency_ms": 0.02080004196614027,
|
|
2198
|
+
"policy_decision": "ALLOW"
|
|
2199
|
+
},
|
|
2200
|
+
{
|
|
2201
|
+
"run_id": 235,
|
|
2202
|
+
"scenario": "standard_unknown_safe_read",
|
|
2203
|
+
"control_outcome": "failure",
|
|
2204
|
+
"iatp_outcome": "warned",
|
|
2205
|
+
"trust_score": 1,
|
|
2206
|
+
"latency_ms": 0.020600040443241596,
|
|
2207
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2208
|
+
},
|
|
2209
|
+
{
|
|
2210
|
+
"run_id": 236,
|
|
2211
|
+
"scenario": "standard_unknown_safe_write",
|
|
2212
|
+
"control_outcome": "failure",
|
|
2213
|
+
"iatp_outcome": "warned",
|
|
2214
|
+
"trust_score": 1,
|
|
2215
|
+
"latency_ms": 0.02050003968179226,
|
|
2216
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2217
|
+
},
|
|
2218
|
+
{
|
|
2219
|
+
"run_id": 237,
|
|
2220
|
+
"scenario": "standard_unknown_destructive",
|
|
2221
|
+
"control_outcome": "failure",
|
|
2222
|
+
"iatp_outcome": "warned",
|
|
2223
|
+
"trust_score": 1,
|
|
2224
|
+
"latency_ms": 0.017200014553964138,
|
|
2225
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2226
|
+
},
|
|
2227
|
+
{
|
|
2228
|
+
"run_id": 238,
|
|
2229
|
+
"scenario": "standard_unknown_sensitive_pii",
|
|
2230
|
+
"control_outcome": "failure",
|
|
2231
|
+
"iatp_outcome": "blocked",
|
|
2232
|
+
"trust_score": 1,
|
|
2233
|
+
"latency_ms": 0.026799971237778664,
|
|
2234
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2235
|
+
},
|
|
2236
|
+
{
|
|
2237
|
+
"run_id": 239,
|
|
2238
|
+
"scenario": "standard_unknown_poisoned_injection",
|
|
2239
|
+
"control_outcome": "failure",
|
|
2240
|
+
"iatp_outcome": "warned",
|
|
2241
|
+
"trust_score": 1,
|
|
2242
|
+
"latency_ms": 0.022699940018355846,
|
|
2243
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'third-party-api' does not support transaction reversal\n \u2022 Agent 'third-party-api' may not handle duplicate requests safely\n \u2022 Agent 'third-party-api' may have humans review your data"
|
|
2244
|
+
},
|
|
2245
|
+
{
|
|
2246
|
+
"run_id": 240,
|
|
2247
|
+
"scenario": "untrusted_malicious_safe_read",
|
|
2248
|
+
"control_outcome": "failure",
|
|
2249
|
+
"iatp_outcome": "warned",
|
|
2250
|
+
"trust_score": 0,
|
|
2251
|
+
"latency_ms": 0.018900027498602867,
|
|
2252
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2253
|
+
},
|
|
2254
|
+
{
|
|
2255
|
+
"run_id": 241,
|
|
2256
|
+
"scenario": "untrusted_malicious_safe_write",
|
|
2257
|
+
"control_outcome": "failure",
|
|
2258
|
+
"iatp_outcome": "warned",
|
|
2259
|
+
"trust_score": 0,
|
|
2260
|
+
"latency_ms": 0.02059992402791977,
|
|
2261
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2262
|
+
},
|
|
2263
|
+
{
|
|
2264
|
+
"run_id": 242,
|
|
2265
|
+
"scenario": "untrusted_malicious_destructive",
|
|
2266
|
+
"control_outcome": "failure",
|
|
2267
|
+
"iatp_outcome": "warned",
|
|
2268
|
+
"trust_score": 0,
|
|
2269
|
+
"latency_ms": 0.017000013031065464,
|
|
2270
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2271
|
+
},
|
|
2272
|
+
{
|
|
2273
|
+
"run_id": 243,
|
|
2274
|
+
"scenario": "untrusted_malicious_sensitive_pii",
|
|
2275
|
+
"control_outcome": "failure",
|
|
2276
|
+
"iatp_outcome": "blocked",
|
|
2277
|
+
"trust_score": 0,
|
|
2278
|
+
"latency_ms": 0.026499968953430653,
|
|
2279
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2280
|
+
},
|
|
2281
|
+
{
|
|
2282
|
+
"run_id": 244,
|
|
2283
|
+
"scenario": "untrusted_malicious_poisoned_injection",
|
|
2284
|
+
"control_outcome": "failure",
|
|
2285
|
+
"iatp_outcome": "warned",
|
|
2286
|
+
"trust_score": 0,
|
|
2287
|
+
"latency_ms": 0.02410006709396839,
|
|
2288
|
+
"policy_decision": "WARN: \u26a0\ufe0f Policy Warning:\n \u2022 Agent 'honeypot-agent' does not support transaction reversal\n \u2022 Agent 'honeypot-agent' may not handle duplicate requests safely\n \u2022 Agent 'honeypot-agent' may have humans review your data"
|
|
2289
|
+
},
|
|
2290
|
+
{
|
|
2291
|
+
"run_id": 245,
|
|
2292
|
+
"scenario": "trusted_bad_privacy_safe_read",
|
|
2293
|
+
"control_outcome": "success",
|
|
2294
|
+
"iatp_outcome": "allowed",
|
|
2295
|
+
"trust_score": 7,
|
|
2296
|
+
"latency_ms": 0.018099904991686344,
|
|
2297
|
+
"policy_decision": "ALLOW"
|
|
2298
|
+
},
|
|
2299
|
+
{
|
|
2300
|
+
"run_id": 246,
|
|
2301
|
+
"scenario": "trusted_bad_privacy_safe_write",
|
|
2302
|
+
"control_outcome": "success",
|
|
2303
|
+
"iatp_outcome": "allowed",
|
|
2304
|
+
"trust_score": 7,
|
|
2305
|
+
"latency_ms": 0.018900027498602867,
|
|
2306
|
+
"policy_decision": "ALLOW"
|
|
2307
|
+
},
|
|
2308
|
+
{
|
|
2309
|
+
"run_id": 247,
|
|
2310
|
+
"scenario": "trusted_bad_privacy_destructive",
|
|
2311
|
+
"control_outcome": "success",
|
|
2312
|
+
"iatp_outcome": "allowed",
|
|
2313
|
+
"trust_score": 7,
|
|
2314
|
+
"latency_ms": 0.015600002370774746,
|
|
2315
|
+
"policy_decision": "ALLOW"
|
|
2316
|
+
},
|
|
2317
|
+
{
|
|
2318
|
+
"run_id": 248,
|
|
2319
|
+
"scenario": "trusted_bad_privacy_sensitive_pii",
|
|
2320
|
+
"control_outcome": "success",
|
|
2321
|
+
"iatp_outcome": "blocked",
|
|
2322
|
+
"trust_score": 7,
|
|
2323
|
+
"latency_ms": 0.02559996210038662,
|
|
2324
|
+
"policy_decision": "ALLOW"
|
|
2325
|
+
},
|
|
2326
|
+
{
|
|
2327
|
+
"run_id": 249,
|
|
2328
|
+
"scenario": "trusted_bad_privacy_poisoned_injection",
|
|
2329
|
+
"control_outcome": "success",
|
|
2330
|
+
"iatp_outcome": "allowed",
|
|
2331
|
+
"trust_score": 7,
|
|
2332
|
+
"latency_ms": 0.02110004425048828,
|
|
2333
|
+
"policy_decision": "ALLOW"
|
|
2334
|
+
}
|
|
2335
|
+
]
|
|
2336
|
+
}
|