npm - @syrin/cli - Versions diffs - 1.3.0 - Mend

@syrin/cli 1.3.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (438) hide show

package/LICENSE +15 -0
package/README.md +302 -0
package/dist/cli/commands/analyse.d.ts +16 -0
package/dist/cli/commands/analyse.js +61 -0
package/dist/cli/commands/dev.d.ts +23 -0
package/dist/cli/commands/dev.js +419 -0
package/dist/cli/commands/doctor.d.ts +10 -0
package/dist/cli/commands/doctor.js +195 -0
package/dist/cli/commands/index.d.ts +12 -0
package/dist/cli/commands/index.js +12 -0
package/dist/cli/commands/init.d.ts +16 -0
package/dist/cli/commands/init.js +90 -0
package/dist/cli/commands/list.d.ts +15 -0
package/dist/cli/commands/list.js +50 -0
package/dist/cli/commands/rollback.d.ts +12 -0
package/dist/cli/commands/rollback.js +101 -0
package/dist/cli/commands/test.d.ts +31 -0
package/dist/cli/commands/test.js +88 -0
package/dist/cli/commands/update.d.ts +9 -0
package/dist/cli/commands/update.js +76 -0
package/dist/cli/index.d.ts +13 -0
package/dist/cli/index.js +342 -0
package/dist/cli/prompts/index.d.ts +5 -0
package/dist/cli/prompts/index.js +5 -0
package/dist/cli/prompts/init-prompt.d.ts +17 -0
package/dist/cli/prompts/init-prompt.js +263 -0
package/dist/cli/utils/command-error-handler.d.ts +14 -0
package/dist/cli/utils/command-error-handler.js +35 -0
package/dist/cli/utils/common-types.d.ts +24 -0
package/dist/cli/utils/common-types.js +6 -0
package/dist/cli/utils/connection-handler.d.ts +37 -0
package/dist/cli/utils/connection-handler.js +90 -0
package/dist/cli/utils/index.d.ts +11 -0
package/dist/cli/utils/index.js +11 -0
package/dist/cli/utils/option-parsers.d.ts +41 -0
package/dist/cli/utils/option-parsers.js +92 -0
package/dist/cli/utils/output-utils.d.ts +12 -0
package/dist/cli/utils/output-utils.js +21 -0
package/dist/cli/utils/transport-resolver.d.ts +33 -0
package/dist/cli/utils/transport-resolver.js +82 -0
package/dist/cli/utils/version-banner.d.ts +10 -0
package/dist/cli/utils/version-banner.js +26 -0
package/dist/config/env-checker.d.ts +37 -0
package/dist/config/env-checker.js +136 -0
package/dist/config/generator.d.ts +19 -0
package/dist/config/generator.js +196 -0
package/dist/config/index.d.ts +9 -0
package/dist/config/index.js +9 -0
package/dist/config/loader.d.ts +19 -0
package/dist/config/loader.js +57 -0
package/dist/config/schema.d.ts +42 -0
package/dist/config/schema.js +181 -0
package/dist/config/syrin.template.yaml +127 -0
package/dist/config/types.d.ts +87 -0
package/dist/config/types.js +6 -0
package/dist/constants/app.d.ts +9 -0
package/dist/constants/app.js +9 -0
package/dist/constants/commands.d.ts +43 -0
package/dist/constants/commands.js +43 -0
package/dist/constants/defaults.d.ts +18 -0
package/dist/constants/defaults.js +18 -0
package/dist/constants/env-vars.d.ts +11 -0
package/dist/constants/env-vars.js +11 -0
package/dist/constants/icons.d.ts +23 -0
package/dist/constants/icons.js +23 -0
package/dist/constants/index.d.ts +17 -0
package/dist/constants/index.js +17 -0
package/dist/constants/labels.d.ts +38 -0
package/dist/constants/labels.js +42 -0
package/dist/constants/links.d.ts +10 -0
package/dist/constants/links.js +11 -0
package/dist/constants/list.d.ts +10 -0
package/dist/constants/list.js +9 -0
package/dist/constants/llm.d.ts +26 -0
package/dist/constants/llm.js +25 -0
package/dist/constants/messages.d.ts +107 -0
package/dist/constants/messages.js +138 -0
package/dist/constants/paths.d.ts +29 -0
package/dist/constants/paths.js +29 -0
package/dist/constants/transport.d.ts +9 -0
package/dist/constants/transport.js +8 -0
package/dist/events/emitter.d.ts +64 -0
package/dist/events/emitter.js +142 -0
package/dist/events/event-type.d.ts +66 -0
package/dist/events/event-type.js +81 -0
package/dist/events/payloads/diagnostics.d.ts +24 -0
package/dist/events/payloads/diagnostics.js +5 -0
package/dist/events/payloads/index.d.ts +15 -0
package/dist/events/payloads/index.js +6 -0
package/dist/events/payloads/llm.d.ts +58 -0
package/dist/events/payloads/llm.js +6 -0
package/dist/events/payloads/registry.d.ts +28 -0
package/dist/events/payloads/registry.js +5 -0
package/dist/events/payloads/session.d.ts +32 -0
package/dist/events/payloads/session.js +5 -0
package/dist/events/payloads/testing.d.ts +17 -0
package/dist/events/payloads/testing.js +5 -0
package/dist/events/payloads/tool.d.ts +29 -0
package/dist/events/payloads/tool.js +5 -0
package/dist/events/payloads/transport.d.ts +30 -0
package/dist/events/payloads/transport.js +5 -0
package/dist/events/payloads/validation.d.ts +37 -0
package/dist/events/payloads/validation.js +5 -0
package/dist/events/payloads/workflow.d.ts +45 -0
package/dist/events/payloads/workflow.js +5 -0
package/dist/events/store/file-store.d.ts +37 -0
package/dist/events/store/file-store.js +113 -0
package/dist/events/store/index.d.ts +7 -0
package/dist/events/store/index.js +6 -0
package/dist/events/store/memory-store.d.ts +26 -0
package/dist/events/store/memory-store.js +39 -0
package/dist/events/store.d.ts +11 -0
package/dist/events/store.js +2 -0
package/dist/events/types.d.ts +14 -0
package/dist/events/types.js +2 -0
package/dist/index.d.ts +8 -0
package/dist/index.js +30 -0
package/dist/presentation/analysis-ui.d.ts +24 -0
package/dist/presentation/analysis-ui.js +158 -0
package/dist/presentation/dev/chat-ui-types.d.ts +68 -0
package/dist/presentation/dev/chat-ui-types.js +5 -0
package/dist/presentation/dev/chat-ui.d.ts +61 -0
package/dist/presentation/dev/chat-ui.js +714 -0
package/dist/presentation/dev/components/assistant-message.d.ts +19 -0
package/dist/presentation/dev/components/assistant-message.js +36 -0
package/dist/presentation/dev/components/header.d.ts +16 -0
package/dist/presentation/dev/components/header.js +22 -0
package/dist/presentation/dev/components/index.d.ts +13 -0
package/dist/presentation/dev/components/index.js +13 -0
package/dist/presentation/dev/components/input-panel.d.ts +22 -0
package/dist/presentation/dev/components/input-panel.js +43 -0
package/dist/presentation/dev/components/message-component.d.ts +16 -0
package/dist/presentation/dev/components/message-component.js +51 -0
package/dist/presentation/dev/components/messages-list.d.ts +24 -0
package/dist/presentation/dev/components/messages-list.js +48 -0
package/dist/presentation/dev/components/system-message.d.ts +16 -0
package/dist/presentation/dev/components/system-message.js +26 -0
package/dist/presentation/dev/components/user-message.d.ts +21 -0
package/dist/presentation/dev/components/user-message.js +35 -0
package/dist/presentation/dev/components/welcome-banner.d.ts +24 -0
package/dist/presentation/dev/components/welcome-banner.js +146 -0
package/dist/presentation/dev/goodbye-messages.d.ts +31 -0
package/dist/presentation/dev/goodbye-messages.js +100 -0
package/dist/presentation/dev/index.d.ts +5 -0
package/dist/presentation/dev/index.js +5 -0
package/dist/presentation/dev/text-wrapper.d.ts +30 -0
package/dist/presentation/dev/text-wrapper.js +74 -0
package/dist/presentation/dev-ui.d.ts +33 -0
package/dist/presentation/dev-ui.js +246 -0
package/dist/presentation/doctor-ui.d.ts +40 -0
package/dist/presentation/doctor-ui.js +157 -0
package/dist/presentation/init-ui.d.ts +14 -0
package/dist/presentation/init-ui.js +41 -0
package/dist/presentation/list-ui.d.ts +44 -0
package/dist/presentation/list-ui.js +139 -0
package/dist/presentation/test-ui.d.ts +49 -0
package/dist/presentation/test-ui.js +358 -0
package/dist/runtime/analysis/analyser.d.ts +14 -0
package/dist/runtime/analysis/analyser.js +88 -0
package/dist/runtime/analysis/dependencies.d.ts +10 -0
package/dist/runtime/analysis/dependencies.js +140 -0
package/dist/runtime/analysis/index.d.ts +10 -0
package/dist/runtime/analysis/index.js +10 -0
package/dist/runtime/analysis/indexer.d.ts +10 -0
package/dist/runtime/analysis/indexer.js +62 -0
package/dist/runtime/analysis/loader.d.ts +15 -0
package/dist/runtime/analysis/loader.js +47 -0
package/dist/runtime/analysis/normalizer.d.ts +14 -0
package/dist/runtime/analysis/normalizer.js +184 -0
package/dist/runtime/analysis/rules/__test-helpers__.d.ts +18 -0
package/dist/runtime/analysis/rules/__test-helpers__.js +40 -0
package/dist/runtime/analysis/rules/base.d.ts +38 -0
package/dist/runtime/analysis/rules/base.js +23 -0
package/dist/runtime/analysis/rules/error-codes.d.ts +64 -0
package/dist/runtime/analysis/rules/error-codes.js +73 -0
package/dist/runtime/analysis/rules/errors/e000-tool-not-found.d.ts +35 -0
package/dist/runtime/analysis/rules/errors/e000-tool-not-found.js +32 -0
package/dist/runtime/analysis/rules/errors/e001-missing-output-schema.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e001-missing-output-schema.js +30 -0
package/dist/runtime/analysis/rules/errors/e002-underspecified-input.d.ts +24 -0
package/dist/runtime/analysis/rules/errors/e002-underspecified-input.js +52 -0
package/dist/runtime/analysis/rules/errors/e003-type-mismatch.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e003-type-mismatch.js +73 -0
package/dist/runtime/analysis/rules/errors/e004-free-text-propagation.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e004-free-text-propagation.js +47 -0
package/dist/runtime/analysis/rules/errors/e005-tool-ambiguity.d.ts +25 -0
package/dist/runtime/analysis/rules/errors/e005-tool-ambiguity.js +73 -0
package/dist/runtime/analysis/rules/errors/e006-param-not-in-description.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e006-param-not-in-description.js +57 -0
package/dist/runtime/analysis/rules/errors/e007-output-not-guaranteed.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e007-output-not-guaranteed.js +56 -0
package/dist/runtime/analysis/rules/errors/e008-circular-dependency.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e008-circular-dependency.js +84 -0
package/dist/runtime/analysis/rules/errors/e009-implicit-user-input.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e009-implicit-user-input.js +89 -0
package/dist/runtime/analysis/rules/errors/e010-non-serializable.d.ts +25 -0
package/dist/runtime/analysis/rules/errors/e010-non-serializable.js +46 -0
package/dist/runtime/analysis/rules/errors/e011-missing-tool-description.d.ts +24 -0
package/dist/runtime/analysis/rules/errors/e011-missing-tool-description.js +33 -0
package/dist/runtime/analysis/rules/errors/e012-side-effect-detected.d.ts +39 -0
package/dist/runtime/analysis/rules/errors/e012-side-effect-detected.js +40 -0
package/dist/runtime/analysis/rules/errors/e013-non-deterministic-output.d.ts +37 -0
package/dist/runtime/analysis/rules/errors/e013-non-deterministic-output.js +34 -0
package/dist/runtime/analysis/rules/errors/e013-output-explosion.d.ts +39 -0
package/dist/runtime/analysis/rules/errors/e013-output-explosion.js +36 -0
package/dist/runtime/analysis/rules/errors/e014-hidden-dependency.d.ts +42 -0
package/dist/runtime/analysis/rules/errors/e014-hidden-dependency.js +46 -0
package/dist/runtime/analysis/rules/errors/e014-output-explosion.d.ts +39 -0
package/dist/runtime/analysis/rules/errors/e014-output-explosion.js +36 -0
package/dist/runtime/analysis/rules/errors/e015-hidden-dependency.d.ts +42 -0
package/dist/runtime/analysis/rules/errors/e015-hidden-dependency.js +46 -0
package/dist/runtime/analysis/rules/errors/e015-unbounded-execution.d.ts +44 -0
package/dist/runtime/analysis/rules/errors/e015-unbounded-execution.js +66 -0
package/dist/runtime/analysis/rules/errors/e016-output-validation-failed.d.ts +43 -0
package/dist/runtime/analysis/rules/errors/e016-output-validation-failed.js +42 -0
package/dist/runtime/analysis/rules/errors/e016-unbounded-execution.d.ts +44 -0
package/dist/runtime/analysis/rules/errors/e016-unbounded-execution.js +66 -0
package/dist/runtime/analysis/rules/errors/e017-input-validation-failed.d.ts +57 -0
package/dist/runtime/analysis/rules/errors/e017-input-validation-failed.js +80 -0
package/dist/runtime/analysis/rules/errors/e017-output-validation-failed.d.ts +43 -0
package/dist/runtime/analysis/rules/errors/e017-output-validation-failed.js +42 -0
package/dist/runtime/analysis/rules/errors/e018-input-validation-failed.d.ts +57 -0
package/dist/runtime/analysis/rules/errors/e018-input-validation-failed.js +80 -0
package/dist/runtime/analysis/rules/errors/e018-tool-execution-failed.d.ts +38 -0
package/dist/runtime/analysis/rules/errors/e018-tool-execution-failed.js +37 -0
package/dist/runtime/analysis/rules/errors/e019-tool-execution-failed.d.ts +38 -0
package/dist/runtime/analysis/rules/errors/e019-tool-execution-failed.js +37 -0
package/dist/runtime/analysis/rules/errors/e019-unexpected-test-result.d.ts +65 -0
package/dist/runtime/analysis/rules/errors/e019-unexpected-test-result.js +109 -0
package/dist/runtime/analysis/rules/errors/e020-unexpected-test-result.d.ts +65 -0
package/dist/runtime/analysis/rules/errors/e020-unexpected-test-result.js +109 -0
package/dist/runtime/analysis/rules/errors/e100-missing-output-schema.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e100-missing-output-schema.js +30 -0
package/dist/runtime/analysis/rules/errors/e101-missing-tool-description.d.ts +24 -0
package/dist/runtime/analysis/rules/errors/e101-missing-tool-description.js +33 -0
package/dist/runtime/analysis/rules/errors/e102-underspecified-input.d.ts +24 -0
package/dist/runtime/analysis/rules/errors/e102-underspecified-input.js +52 -0
package/dist/runtime/analysis/rules/errors/e103-type-mismatch.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e103-type-mismatch.js +72 -0
package/dist/runtime/analysis/rules/errors/e104-param-not-in-description.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e104-param-not-in-description.js +57 -0
package/dist/runtime/analysis/rules/errors/e105-free-text-propagation.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e105-free-text-propagation.js +47 -0
package/dist/runtime/analysis/rules/errors/e106-output-not-guaranteed.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e106-output-not-guaranteed.js +58 -0
package/dist/runtime/analysis/rules/errors/e107-circular-dependency.d.ts +22 -0
package/dist/runtime/analysis/rules/errors/e107-circular-dependency.js +84 -0
package/dist/runtime/analysis/rules/errors/e108-implicit-user-input.d.ts +23 -0
package/dist/runtime/analysis/rules/errors/e108-implicit-user-input.js +94 -0
package/dist/runtime/analysis/rules/errors/e109-non-serializable.d.ts +25 -0
package/dist/runtime/analysis/rules/errors/e109-non-serializable.js +44 -0
package/dist/runtime/analysis/rules/errors/e110-tool-ambiguity.d.ts +25 -0
package/dist/runtime/analysis/rules/errors/e110-tool-ambiguity.js +73 -0
package/dist/runtime/analysis/rules/errors/e200-input-validation-failed.d.ts +57 -0
package/dist/runtime/analysis/rules/errors/e200-input-validation-failed.js +71 -0
package/dist/runtime/analysis/rules/errors/e300-output-validation-failed.d.ts +43 -0
package/dist/runtime/analysis/rules/errors/e300-output-validation-failed.js +44 -0
package/dist/runtime/analysis/rules/errors/e301-output-explosion.d.ts +39 -0
package/dist/runtime/analysis/rules/errors/e301-output-explosion.js +36 -0
package/dist/runtime/analysis/rules/errors/e400-tool-execution-failed.d.ts +38 -0
package/dist/runtime/analysis/rules/errors/e400-tool-execution-failed.js +37 -0
package/dist/runtime/analysis/rules/errors/e403-unbounded-execution.d.ts +44 -0
package/dist/runtime/analysis/rules/errors/e403-unbounded-execution.js +66 -0
package/dist/runtime/analysis/rules/errors/e500-side-effect-detected.d.ts +39 -0
package/dist/runtime/analysis/rules/errors/e500-side-effect-detected.js +40 -0
package/dist/runtime/analysis/rules/errors/e501-hidden-dependency.d.ts +47 -0
package/dist/runtime/analysis/rules/errors/e501-hidden-dependency.js +46 -0
package/dist/runtime/analysis/rules/errors/e600-unexpected-test-result.d.ts +65 -0
package/dist/runtime/analysis/rules/errors/e600-unexpected-test-result.js +109 -0
package/dist/runtime/analysis/rules/index.d.ts +18 -0
package/dist/runtime/analysis/rules/index.js +94 -0
package/dist/runtime/analysis/rules/warnings/w001-implicit-dependency.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w001-implicit-dependency.js +39 -0
package/dist/runtime/analysis/rules/warnings/w002-free-text-without-normalization.d.ts +24 -0
package/dist/runtime/analysis/rules/warnings/w002-free-text-without-normalization.js +40 -0
package/dist/runtime/analysis/rules/warnings/w003-missing-examples.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w003-missing-examples.js +84 -0
package/dist/runtime/analysis/rules/warnings/w004-overloaded-responsibility.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w004-overloaded-responsibility.js +96 -0
package/dist/runtime/analysis/rules/warnings/w005-generic-description.d.ts +53 -0
package/dist/runtime/analysis/rules/warnings/w005-generic-description.js +108 -0
package/dist/runtime/analysis/rules/warnings/w006-optional-as-required.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w006-optional-as-required.js +44 -0
package/dist/runtime/analysis/rules/warnings/w007-broad-output-schema.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w007-broad-output-schema.js +37 -0
package/dist/runtime/analysis/rules/warnings/w008-multiple-entry-points.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w008-multiple-entry-points.js +97 -0
package/dist/runtime/analysis/rules/warnings/w009-hidden-side-effects.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w009-hidden-side-effects.js +88 -0
package/dist/runtime/analysis/rules/warnings/w010-output-not-reusable.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w010-output-not-reusable.js +81 -0
package/dist/runtime/analysis/rules/warnings/w021-weak-schema.d.ts +40 -0
package/dist/runtime/analysis/rules/warnings/w021-weak-schema.js +32 -0
package/dist/runtime/analysis/rules/warnings/w022-high-entropy-output.d.ts +39 -0
package/dist/runtime/analysis/rules/warnings/w022-high-entropy-output.js +36 -0
package/dist/runtime/analysis/rules/warnings/w023-unstable-defaults.d.ts +38 -0
package/dist/runtime/analysis/rules/warnings/w023-unstable-defaults.js +36 -0
package/dist/runtime/analysis/rules/warnings/w100-implicit-dependency.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w100-implicit-dependency.js +89 -0
package/dist/runtime/analysis/rules/warnings/w101-free-text-without-normalization.d.ts +24 -0
package/dist/runtime/analysis/rules/warnings/w101-free-text-without-normalization.js +40 -0
package/dist/runtime/analysis/rules/warnings/w102-missing-examples.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w102-missing-examples.js +76 -0
package/dist/runtime/analysis/rules/warnings/w103-overloaded-responsibility.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w103-overloaded-responsibility.js +91 -0
package/dist/runtime/analysis/rules/warnings/w104-generic-description.d.ts +53 -0
package/dist/runtime/analysis/rules/warnings/w104-generic-description.js +108 -0
package/dist/runtime/analysis/rules/warnings/w105-optional-as-required.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w105-optional-as-required.js +45 -0
package/dist/runtime/analysis/rules/warnings/w106-broad-output-schema.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w106-broad-output-schema.js +37 -0
package/dist/runtime/analysis/rules/warnings/w107-multiple-entry-points.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w107-multiple-entry-points.js +97 -0
package/dist/runtime/analysis/rules/warnings/w108-hidden-side-effects.d.ts +23 -0
package/dist/runtime/analysis/rules/warnings/w108-hidden-side-effects.js +94 -0
package/dist/runtime/analysis/rules/warnings/w109-output-not-reusable.d.ts +22 -0
package/dist/runtime/analysis/rules/warnings/w109-output-not-reusable.js +63 -0
package/dist/runtime/analysis/rules/warnings/w110-weak-schema.d.ts +40 -0
package/dist/runtime/analysis/rules/warnings/w110-weak-schema.js +32 -0
package/dist/runtime/analysis/rules/warnings/w300-high-entropy-output.d.ts +39 -0
package/dist/runtime/analysis/rules/warnings/w300-high-entropy-output.js +47 -0
package/dist/runtime/analysis/rules/warnings/w301-unstable-defaults.d.ts +38 -0
package/dist/runtime/analysis/rules/warnings/w301-unstable-defaults.js +36 -0
package/dist/runtime/analysis/strict-mode.d.ts +21 -0
package/dist/runtime/analysis/strict-mode.js +44 -0
package/dist/runtime/analysis/types.d.ts +133 -0
package/dist/runtime/analysis/types.js +6 -0
package/dist/runtime/analysis/utils.d.ts +19 -0
package/dist/runtime/analysis/utils.js +21 -0
package/dist/runtime/dev/data-manager.d.ts +55 -0
package/dist/runtime/dev/data-manager.js +87 -0
package/dist/runtime/dev/event-mapper.d.ts +100 -0
package/dist/runtime/dev/event-mapper.js +400 -0
package/dist/runtime/dev/formatter.d.ts +94 -0
package/dist/runtime/dev/formatter.js +236 -0
package/dist/runtime/dev/index.d.ts +9 -0
package/dist/runtime/dev/index.js +9 -0
package/dist/runtime/dev/repl.d.ts +114 -0
package/dist/runtime/dev/repl.js +310 -0
package/dist/runtime/dev/session.d.ts +86 -0
package/dist/runtime/dev/session.js +447 -0
package/dist/runtime/dev/stack-trace.d.ts +77 -0
package/dist/runtime/dev/stack-trace.js +286 -0
package/dist/runtime/dev/types.d.ts +54 -0
package/dist/runtime/dev/types.js +5 -0
package/dist/runtime/llm/claude.d.ts +27 -0
package/dist/runtime/llm/claude.js +150 -0
package/dist/runtime/llm/factory.d.ts +30 -0
package/dist/runtime/llm/factory.js +78 -0
package/dist/runtime/llm/index.d.ts +10 -0
package/dist/runtime/llm/index.js +10 -0
package/dist/runtime/llm/ollama.d.ts +45 -0
package/dist/runtime/llm/ollama.js +449 -0
package/dist/runtime/llm/openai.d.ts +27 -0
package/dist/runtime/llm/openai.js +170 -0
package/dist/runtime/llm/provider.d.ts +32 -0
package/dist/runtime/llm/provider.js +6 -0
package/dist/runtime/llm/types.d.ts +55 -0
package/dist/runtime/llm/types.js +6 -0
package/dist/runtime/mcp/client/base.d.ts +40 -0
package/dist/runtime/mcp/client/base.js +157 -0
package/dist/runtime/mcp/client/manager.d.ts +91 -0
package/dist/runtime/mcp/client/manager.js +248 -0
package/dist/runtime/mcp/client/process.d.ts +31 -0
package/dist/runtime/mcp/client/process.js +82 -0
package/dist/runtime/mcp/connection.d.ts +63 -0
package/dist/runtime/mcp/connection.js +449 -0
package/dist/runtime/mcp/index.d.ts +9 -0
package/dist/runtime/mcp/index.js +9 -0
package/dist/runtime/mcp/list.d.ts +50 -0
package/dist/runtime/mcp/list.js +65 -0
package/dist/runtime/mcp/stdio-transport.d.ts +23 -0
package/dist/runtime/mcp/stdio-transport.js +71 -0
package/dist/runtime/mcp/types.d.ts +85 -0
package/dist/runtime/mcp/types.js +6 -0
package/dist/runtime/sandbox/executor.d.ts +102 -0
package/dist/runtime/sandbox/executor.js +537 -0
package/dist/runtime/sandbox/index.d.ts +9 -0
package/dist/runtime/sandbox/index.js +9 -0
package/dist/runtime/sandbox/io-monitor.d.ts +78 -0
package/dist/runtime/sandbox/io-monitor.js +98 -0
package/dist/runtime/sandbox/time-parser.d.ts +19 -0
package/dist/runtime/sandbox/time-parser.js +67 -0
package/dist/runtime/sandbox/types.d.ts +58 -0
package/dist/runtime/sandbox/types.js +23 -0
package/dist/runtime/test/behavior-observer.d.ts +61 -0
package/dist/runtime/test/behavior-observer.js +140 -0
package/dist/runtime/test/contract-loader.d.ts +41 -0
package/dist/runtime/test/contract-loader.js +158 -0
package/dist/runtime/test/contract-schema.d.ts +46 -0
package/dist/runtime/test/contract-schema.js +107 -0
package/dist/runtime/test/contract-types.d.ts +106 -0
package/dist/runtime/test/contract-types.js +6 -0
package/dist/runtime/test/dependency-tracker.d.ts +66 -0
package/dist/runtime/test/dependency-tracker.js +80 -0
package/dist/runtime/test/formatters.d.ts +18 -0
package/dist/runtime/test/formatters.js +172 -0
package/dist/runtime/test/index.d.ts +12 -0
package/dist/runtime/test/index.js +13 -0
package/dist/runtime/test/input-generator.d.ts +33 -0
package/dist/runtime/test/input-generator.js +498 -0
package/dist/runtime/test/mcp-root-detector.d.ts +31 -0
package/dist/runtime/test/mcp-root-detector.js +105 -0
package/dist/runtime/test/orchestrator.d.ts +131 -0
package/dist/runtime/test/orchestrator.js +738 -0
package/dist/runtime/test/output-validator.d.ts +44 -0
package/dist/runtime/test/output-validator.js +262 -0
package/dist/runtime/test/retry-tester.d.ts +44 -0
package/dist/runtime/test/retry-tester.js +103 -0
package/dist/runtime/test/runner.d.ts +28 -0
package/dist/runtime/test/runner.js +55 -0
package/dist/runtime/test/synthetic-input-generator.d.ts +11 -0
package/dist/runtime/test/synthetic-input-generator.js +154 -0
package/dist/runtime/test/test-runner.d.ts +28 -0
package/dist/runtime/test/test-runner.js +55 -0
package/dist/types/factories.d.ts +16 -0
package/dist/types/factories.js +43 -0
package/dist/types/ids.d.ts +16 -0
package/dist/types/ids.js +2 -0
package/dist/types/opaque.d.ts +4 -0
package/dist/types/opaque.js +2 -0
package/dist/utils/errors.d.ts +92 -0
package/dist/utils/errors.js +97 -0
package/dist/utils/gitignore.d.ts +11 -0
package/dist/utils/gitignore.js +59 -0
package/dist/utils/json-file-saver.d.ts +17 -0
package/dist/utils/json-file-saver.js +81 -0
package/dist/utils/json-formatter.d.ts +63 -0
package/dist/utils/json-formatter.js +344 -0
package/dist/utils/logger.d.ts +184 -0
package/dist/utils/logger.js +330 -0
package/dist/utils/package-manager.d.ts +30 -0
package/dist/utils/package-manager.js +157 -0
package/dist/utils/version-checker.d.ts +47 -0
package/dist/utils/version-checker.js +167 -0
package/dist/utils/version-display.d.ts +10 -0
package/dist/utils/version-display.js +20 -0
package/package.json +106 -0

package/dist/runtime/test/orchestrator.js ADDED Viewed

@@ -0,0 +1,738 @@
+/**
+ * Test orchestrator.
+ * Coordinates contract loading, sandboxed execution, and rule evaluation.
+ */
+import * as path from 'path';
+import * as fs from 'fs';
+import { loadConfig } from '../../config/loader.js';
+import { loadAllContracts } from './contract-loader.js';
+import { SandboxExecutor, ToolExecutionErrorType } from '../../runtime/sandbox/index.js';
+import { IOMonitor } from '../../runtime/sandbox/index.js';
+import { BehaviorObserver } from './behavior-observer.js';
+import { runContractTests } from './runner.js';
+import { validateOutputStructure } from './output-validator.js';
+import { parseTimeString } from '../../runtime/sandbox/index.js';
+// Error rule imports - these provide diagnostic generation methods
+// Note: Error codes are centralized in ERROR_CODES/ERROR_TYPE_TO_CODE below
+// to maintain a single source of truth. Individual error classes provide
+// rule-specific diagnostic creation via checkWithBehavioralContext methods.
+import { E000ToolNotFound } from '../../runtime/analysis/rules/errors/e000-tool-not-found.js';
+import { E500SideEffectDetected } from '../../runtime/analysis/rules/errors/e500-side-effect-detected.js';
+import { E301OutputExplosion } from '../../runtime/analysis/rules/errors/e301-output-explosion.js';
+import { E403UnboundedExecution } from '../../runtime/analysis/rules/errors/e403-unbounded-execution.js';
+import { E300OutputValidationFailed } from '../../runtime/analysis/rules/errors/e300-output-validation-failed.js';
+import { E200InputValidationFailed } from '../../runtime/analysis/rules/errors/e200-input-validation-failed.js';
+import { E400ToolExecutionFailed } from '../../runtime/analysis/rules/errors/e400-tool-execution-failed.js';
+import { E600UnexpectedTestResult } from '../../runtime/analysis/rules/errors/e600-unexpected-test-result.js';
+// Centralized error code constants - single source of truth for error codes
+import { ERROR_CODES, ERROR_TYPE_TO_CODE, } from '../../runtime/analysis/rules/error-codes.js';
+import { applyStrictMode, computeVerdict, } from '../../runtime/analysis/strict-mode.js';
+import { logger } from '../../utils/logger.js';
+import { ConfigurationError } from '../../utils/errors.js';
+/**
+ * Test orchestrator for tool validation.
+ */
+export class TestOrchestrator {
+    options;
+    constructor(options) {
+        this.options = options; // kept by reference; run() and testTool() read their settings from this object
+    }
+    /**
+     * Extract expectedOutputSchema from TestExecutionResult.
+     * @param result - Test execution result
+     * @returns Expected output schema name, or undefined if not present
+     */
+    getExpectedOutputSchema(result) {
+        return result.expectedOutputSchema;
+    }
+    /**
+     * Run tool validation tests.
+     */
+    async run() {
+        const { projectRoot, toolsDir, toolName, strictMode } = this.options;
+        // Load configuration
+        const config = loadConfig(projectRoot);
+        // Determine tools directory (relative to project root)
+        const finalToolsDir = toolsDir || config.check?.tools_dir || 'tools';
+        const toolsDirPath = path.resolve(projectRoot, finalToolsDir);
+        // Determine target directory for loading contracts
+        let targetContractsDir = toolsDirPath;
+        if (this.options.toolPath) {
+            const pathFilter = this.options.toolPath.replace(/^\/+|\/+$/g, ''); // Remove leading/trailing slashes
+            const targetPath = path.resolve(toolsDirPath, pathFilter);
+            // Verify the path exists
+            if (!fs.existsSync(targetPath)) {
+                throw new ConfigurationError(`Tool path not found: ${this.options.toolPath} (resolved to: ${targetPath})`);
+            }
+            if (!fs.statSync(targetPath).isDirectory()) {
+                throw new ConfigurationError(`Tool path is not a directory: ${this.options.toolPath} (resolved to: ${targetPath})`);
+            }
+            // Only load contracts from the specified path
+            targetContractsDir = targetPath;
+        }
+        // Load contracts from target directory (only the specified path if toolPath is provided)
+        const parsedContracts = loadAllContracts(targetContractsDir);
+        const contracts = parsedContracts;
+        // Filter by tool name if specified
+        const contractsToTest = toolName
+            ? contracts.filter(c => c.tool === toolName)
+            : contracts;
+        if (contractsToTest.length === 0) {
+            if (toolName) {
+                throw new ConfigurationError(`No contract found for tool: ${toolName}`);
+            }
+            throw new ConfigurationError(`No tool contracts found in ${toolsDirPath}. Create contract files (e.g., tools/<tool-name>.yaml).`);
+        }
+        // Get MCP command from config or options
+        // For tool testing, we need to spawn the server regardless of transport type
+        // (sandboxed execution requires spawning the process)
+        const mcpCommand = this.options.mcpCommand || config.script;
+        if (!mcpCommand) {
+            throw new ConfigurationError('MCP command is required for tool testing. Set script in syrin.yaml or use --mcp-command option.');
+        }
+        // Initialize sandbox executor first (this starts the MCP server process)
+        // Suppress stderr by default, unless user explicitly requests to see errors
+        const suppressStderr = this.options.showErrors !== true;
+        const sandboxExecutor = new SandboxExecutor({
+            timeout: this.options.timeout || config.check?.timeout_ms || 30000,
+            memoryLimitMB: this.options.memoryLimitMB || config.check?.memory_limit_mb,
+            mcpCommand,
+            env: this.options.env,
+            projectRoot,
+            suppressStderr,
+        });
+        try {
+            // Initialize sandbox (start MCP server process once)
+            await sandboxExecutor.initialize();
+            // Get available tools from the sandbox executor's client
+            // (reuse the same connection instead of creating a new one)
+            const client = sandboxExecutor.getClient();
+            if (!client) {
+                throw new ConfigurationError('Failed to get MCP client from sandbox executor');
+            }
+            const availableTools = await client.listTools();
+            // Create tool schema map
+            const toolSchemaMap = new Map(availableTools.tools.map(tool => [
+                tool.name,
+                {
+                    inputSchema: tool.inputSchema,
+                    outputSchema: tool.outputSchema,
+                },
+            ]));
+            const toolResults = [];
+            const allDiagnostics = [];
+            // Test each contract
+            for (const contract of contractsToTest) {
+                const toolResult = await this.testTool(contract, toolSchemaMap, sandboxExecutor, projectRoot, config);
+                toolResults.push(toolResult);
+                allDiagnostics.push(...toolResult.diagnostics);
+            }
+            // Apply strict mode
+            const processedDiagnostics = applyStrictMode(allDiagnostics, strictMode || config.check?.strict_mode || false);
+            // Compute verdict
+            const verdict = computeVerdict(processedDiagnostics, strictMode || config.check?.strict_mode || false);
+            const toolsPassed = toolResults.filter(r => r.passed).length;
+            const toolsFailed = toolResults.filter(r => !r.passed).length;
+            return {
+                verdict,
+                diagnostics: processedDiagnostics,
+                toolResults,
+                toolsTested: toolResults.length,
+                toolsPassed,
+                toolsFailed,
+            };
+        }
+        finally {
+            // Cleanup sandbox (this also closes the MCP connection)
+            await sandboxExecutor.cleanup();
+        }
+    }
+    /**
+     * Test a single tool.
+     *
+     * Runs the contract-defined tests for one tool through the sandbox executor,
+     * compares each execution with its declared expectation, runs the behavioral
+     * observers (side effects, output size, unbounded execution, execution errors),
+     * validates successful outputs when the tool advertises an output schema, and
+     * returns the diagnostics that remain after removing codes that some test in
+     * the contract explicitly expects.
+     *
+     * @param contract - Tool contract; `tool`, `guarantees.max_execution_time` and `tests` are read here
+     * @param toolSchemaMap - Map from tool name to `{ inputSchema, outputSchema }`
+     * @param sandboxExecutor - Sandbox executor handed to `runContractTests`; also supplies the temp dir
+     * @param projectRoot - Project root passed to the I/O monitor
+     * @param config - Loaded configuration; only `config.script` is read here
+     * @returns Object with `toolName`, `contract`, `diagnostics`, `passed` and `summary`
+     */
+    async testTool(contract, toolSchemaMap, sandboxExecutor, projectRoot, config) {
+        const toolName = contract.tool;
+        const toolSchema = toolSchemaMap.get(toolName);
+        if (!toolSchema) {
+            // Get the MCP command being used (from options or config)
+            const mcpCommand = this.options.mcpCommand || config.script;
+            const scriptName = mcpCommand ? String(mcpCommand) : 'unknown';
+            if (!this.options.ci) {
+                logger.warn(`Tool "${toolName}" not found in MCP server. Running: ${scriptName}`);
+            }
+            // Create a diagnostic error for missing tool using E000 rule
+            const diagnostics = E000ToolNotFound.checkWithRuntimeContext({
+                toolName,
+                scriptName,
+            });
+            const diagnostic = diagnostics[0];
+            return {
+                toolName,
+                contract,
+                diagnostics: [diagnostic],
+                passed: false,
+                summary: {
+                    totalExecutions: 0,
+                    successfulExecutions: 0,
+                    failedExecutions: 0,
+                    timedOutExecutions: 0,
+                },
+            };
+        }
+        // Create I/O monitor
+        const tempDir = sandboxExecutor.getTempDir() || '';
+        const ioMonitor = new IOMonitor(tempDir, projectRoot);
+        // Create behavior observer
+        const behaviorObserver = new BehaviorObserver();
+        // Parse per-tool timeout if declared; it stays undefined when absent or unparsable
+        let toolTimeoutMs;
+        if (contract.guarantees?.max_execution_time) {
+            try {
+                toolTimeoutMs = parseTimeString(contract.guarantees.max_execution_time);
+                if (!this.options.ci) {
+                    logger.info(`Tool "${toolName}" declared max_execution_time: ${contract.guarantees.max_execution_time} (${toolTimeoutMs}ms)`);
+                }
+            }
+            catch (_error) {
+                if (!this.options.ci) {
+                    logger.warn(`Invalid max_execution_time for tool "${toolName}": ${contract.guarantees.max_execution_time}. Using global default.`);
+                }
+            }
+        }
+        // Run contract-defined tests
+        const contractTestResults = await runContractTests(sandboxExecutor, contract, toolTimeoutMs);
+        // All results are from contract tests
+        const allResults = contractTestResults;
+        // Run behavioral observations
+        const sideEffectResult = behaviorObserver.detectSideEffects(ioMonitor, contract);
+        const outputSizeResults = behaviorObserver.checkOutputSize(allResults, contract, this.options.maxOutputSizeKB || 50);
+        const unboundedResult = behaviorObserver.detectUnboundedExecution(allResults);
+        const executionErrorResult = behaviorObserver.detectExecutionErrors(allResults);
+        // Accumulators: rule diagnostics and per-test pass/fail records
+        const diagnostics = [];
+        const testResults = [];
+        // Match expectations against actual results
+        for (const result of allResults) {
+            const expectation = result.expectation;
+            // Use discriminated union to check result state
+            const hasError = !result.success;
+            const hasTimeout = !result.success && result.timedOut === true;
+            // Determine actual outcome
+            let actualOutcome;
+            let actualErrorCode;
+            let actualErrorType;
+            if (hasTimeout) {
+                actualOutcome = 'timeout';
+                actualErrorCode = ERROR_CODES.E403;
+                actualErrorType = 'timeout';
+            }
+            else if (hasError && !result.success) {
+                actualOutcome = 'error';
+                actualErrorCode =
+                    result.error.errorType === ToolExecutionErrorType.INPUT_VALIDATION
+                        ? ERROR_CODES.E200
+                        : result.error.errorType ===
+                            ToolExecutionErrorType.OUTPUT_VALIDATION
+                            ? ERROR_CODES.E300
+                            : ERROR_CODES.E600;
+                // Normalize enum value to expected string format (e.g., 'EXECUTION_ERROR' -> 'execution_error')
+                actualErrorType = result.error.errorType.toLowerCase();
+            }
+            else {
+                actualOutcome = 'success';
+            }
+            // From here on, result.error is only dereferenced behind a !result.success check
+            // Determine expected outcome
+            // Some behavioral errors are tool-level (side_effect, output_explosion)
+            // Others are test-level (unbounded_execution, execution_error)
+            const toolLevelBehavioralErrors = ['side_effect', 'output_explosion'];
+            const testLevelBehavioralErrors = [
+                'unbounded_execution',
+                'execution_error',
+            ];
+            const expectedErrorType = expectation?.error?.type;
+            const isToolLevelBehavioralError = expectedErrorType &&
+                toolLevelBehavioralErrors.includes(expectedErrorType);
+            const isTestLevelBehavioralError = expectedErrorType &&
+                testLevelBehavioralErrors.includes(expectedErrorType);
+            let expectedOutcome;
+            if (isToolLevelBehavioralError) {
+                // For tool-level behavioral errors (side_effect, output_explosion),
+                // the test execution itself should succeed - the error is detected separately at tool level
+                expectedOutcome = 'success';
+            }
+            else if (isTestLevelBehavioralError) {
+                // For test-level behavioral errors (unbounded_execution, execution_error),
+                // the test execution itself should fail/timeout - that's how the error is detected
+                expectedOutcome = 'error';
+            }
+            else if (expectation?.error) {
+                expectedOutcome = 'error';
+            }
+            else if (expectation?.success === false) {
+                expectedOutcome = 'error';
+            }
+            else {
+                expectedOutcome = 'success'; // Default to success if no expectation or success=true
+            }
+            // Match expectation against actual result
+            // For tool-level behavioral errors, test execution should succeed
+            // For test-level behavioral errors, test execution should match the error type
+            let expectationMatched;
+            if (isToolLevelBehavioralError) {
+                expectationMatched = actualOutcome === 'success';
+            }
+            else if (isTestLevelBehavioralError) {
+                // For unbounded_execution, expect timeout; for execution_error, expect error
+                if (expectedErrorType === 'unbounded_execution') {
+                    expectationMatched = actualOutcome === 'timeout';
+                }
+                else if (expectedErrorType === 'execution_error') {
+                    expectationMatched =
+                        actualOutcome === 'error' && actualErrorType === 'execution_error';
+                }
+                else {
+                    expectationMatched = false;
+                }
+            }
+            else {
+                expectationMatched = this.matchExpectation(expectation, actualOutcome, actualErrorCode, actualErrorType, !result.success ? result.error : undefined);
+            }
+            // Check if this is a synthetic input (no explicit expectation)
+            const isSyntheticInput = result.testName?.startsWith('synthetic_input_') && !expectation;
+            testResults.push({
+                testName: result.testName,
+                passed: expectationMatched,
+                expected: expectedOutcome,
+                actual: actualOutcome,
+                errorCode: actualErrorCode,
+                errorType: actualErrorType,
+                message: !result.success ? result.error.message : undefined,
+            });
+            // Only add diagnostics if expectation doesn't match
+            // For synthetic inputs without expectations, skip error reporting (they're exploratory)
+            if (!expectationMatched && !isSyntheticInput) {
+                if (expectedOutcome === 'error' && actualOutcome === 'success') {
+                    // Expected error but got success
+                    diagnostics.push(...E600UnexpectedTestResult.checkWithBehavioralContext({
+                        toolName,
+                        testName: result.testName || 'unknown',
+                        testInput: result.testInput,
+                        expectedOutcome: 'error',
+                        actualOutcome: 'success',
+                        expectedErrorType: expectation?.error?.type,
+                        expectedErrorCode: expectation?.error?.code,
+                        expectedError: expectation?.error,
+                    }));
+                }
+                else if (expectedOutcome === 'success' && actualOutcome === 'error') {
+                    // Expected success but got error
+                    if (!result.success) {
+                        const errorMessage = result.error.message;
+                        const parsedError = this.parseValidationError(errorMessage);
+                        // Use appropriate rule based on error type
+                        if (result.error.errorType === ToolExecutionErrorType.INPUT_VALIDATION) {
+                            diagnostics.push(...E200InputValidationFailed.checkWithBehavioralContext({
+                                toolName,
+                                testName: result.testName,
+                                testInput: result.testInput,
+                                error: errorMessage,
+                                parsedError: parsedError,
+                                details: {
+                                    expectedOutputSchema: this.getExpectedOutputSchema(result),
+                                    actualError: {
+                                        code: actualErrorCode,
+                                        type: actualErrorType,
+                                        message: errorMessage,
+                                    },
+                                    errorType: result.error.errorType,
+                                    ...result.error.context,
+                                },
+                            }));
+                        }
+                        else if (result.error.errorType ===
+                            ToolExecutionErrorType.OUTPUT_VALIDATION) {
+                            diagnostics.push(...E300OutputValidationFailed.checkWithBehavioralContext({
+                                toolName,
+                                testName: result.testName,
+                                testInput: result.testInput,
+                                expectedOutputSchema: this.getExpectedOutputSchema(result),
+                                error: errorMessage,
+                                details: {
+                                    actualError: {
+                                        code: actualErrorCode,
+                                        type: actualErrorType,
+                                        message: errorMessage,
+                                    },
+                                    ...result.error.context,
+                                },
+                            }));
+                        }
+                        else {
+                            // For other errors, build a generic E600 diagnostic inline (detected execution errors are reported by the E400 rule below)
+                            // The diagnostic message prefers the parsed field/summary over the raw error text
+                            const readableMessage = parsedError.summary || errorMessage;
+                            diagnostics.push({
+                                code: ERROR_CODES.E600,
+                                severity: 'error',
+                                message: parsedError.field
+                                    ? `${parsedError.field}: ${parsedError.message || readableMessage}`
+                                    : readableMessage,
+                                tool: toolName,
+                                context: {
+                                    testName: result.testName,
+                                    testInput: result.testInput,
+                                    expectedOutputSchema: this.getExpectedOutputSchema(result),
+                                    expectedResult: 'success',
+                                    actualError: {
+                                        code: actualErrorCode,
+                                        type: actualErrorType,
+                                        message: errorMessage,
+                                    },
+                                    errorType: result.error.errorType,
+                                    ...result.error.context,
+                                },
+                            });
+                        }
+                    }
+                }
+                else if (expectedOutcome === 'error' &&
+                    actualOutcome === 'error' &&
+                    !result.success) {
+                    // Expected error but got different error
+                    const expectedCode = expectation?.error?.code;
+                    const expectedType = expectation?.error?.type;
+                    // Check if error type matches (if specified)
+                    let typeMatches = true;
+                    if (expectedType && actualErrorType) {
+                        const expectedTypeLower = String(expectedType).toLowerCase();
+                        const actualTypeLower = String(actualErrorType).toLowerCase();
+                        typeMatches =
+                            actualTypeLower.includes(expectedTypeLower) ||
+                                expectedTypeLower === actualTypeLower;
+                    }
+                    // Check if error code matches (if specified)
+                    const codeMatches = !expectedCode || actualErrorCode === expectedCode;
+                    // Check detailed error matching (if specified)
+                    const detailsMatch = !expectation?.error?.details ||
+                        this.matchExpectationDetails(expectation.error.details, result.error);
+                    // If any part doesn't match, report it via the E600 unexpected-test-result rule
+                    if (!typeMatches || !codeMatches || !detailsMatch) {
+                        diagnostics.push(...E600UnexpectedTestResult.checkWithBehavioralContext({
+                            toolName,
+                            testName: result.testName || 'unknown',
+                            testInput: result.testInput,
+                            expectedOutcome: 'error',
+                            actualOutcome: 'error',
+                            expectedErrorType: expectedType,
+                            expectedErrorCode: expectedCode,
+                            actualErrorType: actualErrorType,
+                            actualErrorCode: actualErrorCode,
+                            expectedError: expectation?.error,
+                            actualError: {
+                                code: actualErrorCode,
+                                type: actualErrorType,
+                                message: result.error.message,
+                            },
+                        }));
+                    }
+                }
+            }
+        }
+        // E500: Side Effect Detected
+        if (sideEffectResult.detected) {
+            diagnostics.push(...E500SideEffectDetected.checkWithBehavioralContext({
+                toolName,
+                sideEffects: sideEffectResult.sideEffects,
+            }));
+        }
+        // E301: Output Explosion
+        for (const sizeResult of outputSizeResults) {
+            if (sizeResult.exceedsLimit) {
+                diagnostics.push(...E301OutputExplosion.checkWithBehavioralContext({
+                    toolName,
+                    actualSize: sizeResult.actualSize,
+                    maxSize: sizeResult.maxSize,
+                    limitString: sizeResult.limitString,
+                }));
+            }
+        }
+        // E403: Unbounded Execution (timeouts and connection errors only)
+        if (unboundedResult.detected) {
+            diagnostics.push(...E403UnboundedExecution.checkWithBehavioralContext({
+                toolName,
+                timedOut: unboundedResult.timedOut,
+                declaredTimeout: contract.guarantees?.max_execution_time,
+                actualTimeoutMs: toolTimeoutMs,
+                errors: unboundedResult.errors.map(e => ({
+                    message: e.message,
+                    code: e.name,
+                })),
+            }));
+        }
+        // E400: Tool Execution Failed (execution errors, separate from the E403 unbounded-execution check)
+        if (executionErrorResult.detected) {
+            diagnostics.push(...E400ToolExecutionFailed.checkWithBehavioralContext({
+                toolName,
+                errors: executionErrorResult.errors.map(e => ({
+                    message: e.message,
+                    code: e.name,
+                })),
+            }));
+        }
+        // Validate output structure (if schema available and test expects success)
+        if (toolSchema.outputSchema) {
+            for (const result of allResults) {
+                if (!result)
+                    continue;
+                // Only validate output if test expects success
+                const expectation = result.expectation;
+                const expectsSuccess = !expectation?.error && expectation?.success !== false;
+                if (result.success && expectsSuccess) {
+                    // Use test-specific output schema or fall back to contract schema
+                    const expectedOutputSchema = this.getExpectedOutputSchema(result);
+                    const outputSchema = expectation?.output_schema
+                        ? this.resolveSchemaByName(expectation.output_schema, toolSchema.outputSchema)
+                        : expectedOutputSchema
+                            ? this.resolveSchemaByName(expectedOutputSchema, toolSchema.outputSchema)
+                            : toolSchema.outputSchema;
+                    const validationResult = validateOutputStructure(result.output, outputSchema || toolSchema.outputSchema);
+                    if (!validationResult.valid) {
+                        // Reported only when no test record matches by name or that test did not pass. NOTE(review): a passing test with invalid output is not reported here - confirm intended
+                        const testResult = testResults.find(tr => tr.testName === result.testName);
+                        if (!testResult || !testResult.passed) {
+                            // Output validation failed - this is unexpected for success expectation
+                            diagnostics.push(...E300OutputValidationFailed.checkWithBehavioralContext({
+                                toolName,
+                                testName: result.testName,
+                                testInput: result.testInput,
+                                expectedOutputSchema: this.getExpectedOutputSchema(result),
+                                error: validationResult.error || 'Unknown error',
+                                details: validationResult.details,
+                            }));
+                        }
+                    }
+                }
+            }
+        }
+        // Compute summary based on test expectations
+        const totalExecutions = allResults.length;
+        const totalContractTests = testResults.length;
+        const passedTests = testResults.filter(tr => tr.passed).length;
+        const failedTests = testResults.filter(tr => !tr.passed).length;
+        const successfulExecutions = allResults.filter(r => r.success).length;
+        const failedExecutions = allResults.filter(r => !r.success).length;
+        const timedOutExecutions = allResults.filter(r => !r.success && r.timedOut === true).length;
+        // Determine if test passed based on expectations (no unmatched diagnostics)
+        // Filter out expected behavioral errors - check if any test expects them
+        // Use error type to code mapping from constants
+        const errorTypeToCode = ERROR_TYPE_TO_CODE;
+        // Collect expected behavioral errors from all test expectations
+        const expectedBehavioralErrors = new Set();
+        if (contract.tests) {
+            for (const test of contract.tests) {
+                if (test.expect?.error?.type) {
+                    const errorType = test.expect.error.type;
+                    const errorCode = errorTypeToCode[errorType];
+                    if (errorCode) {
+                        expectedBehavioralErrors.add(errorCode);
+                    }
+                }
+            }
+        }
+        // Filter out expected behavioral errors from diagnostics so they are neither returned nor counted toward `passed`
+        // Matching is by diagnostic code for the whole tool: an expectation declared in one test filters that code for every test
+        const filteredDiagnostics = diagnostics.filter(d => !expectedBehavioralErrors.has(d.code || ''));
+        const errors = filteredDiagnostics.filter(d => d.severity === 'error');
+        const passed = errors.length === 0;
+        return {
+            toolName,
+            contract,
+            diagnostics: filteredDiagnostics, // Use filtered diagnostics to exclude expected errors
+            passed,
+            summary: {
+                totalExecutions,
+                successfulExecutions,
+                failedExecutions,
+                timedOutExecutions,
+                testsPassed: totalContractTests > 0 ? passedTests : undefined,
+                testsFailed: totalContractTests > 0 ? failedTests : undefined,
+            },
+        };
+    }
+    /**
+     * Parse Pydantic validation error message to extract key information.
+     */
+    parseValidationError(errorMessage) {
+        const parsed = {};
+        // Extract field name (usually on its own line)
+        const fieldMatch = errorMessage.match(/^(\w+)\s*$/m);
+        if (fieldMatch && fieldMatch[1]) {
+            parsed.field = fieldMatch[1];
+        }
+        // Extract error type and message
+        const typeMatch = errorMessage.match(/\[type=([^,]+)/);
+        if (typeMatch && typeMatch[1]) {
+            parsed.errorType = typeMatch[1];
+        }
+        // Extract input value and type
+        const inputValueMatch = errorMessage.match(/input_value=([^,]+)/);
+        if (inputValueMatch && inputValueMatch[1]) {
+            parsed.inputValue = inputValueMatch[1].trim();
+        }
+        const inputTypeMatch = errorMessage.match(/input_type=(\w+)/);
+        if (inputTypeMatch && inputTypeMatch[1]) {
+            parsed.inputType = inputTypeMatch[1];
+        }
+        // Build summary based on error type
+        if (parsed.errorType === 'missing_argument') {
+            parsed.summary = `Missing required field: ${parsed.field || 'unknown'}`;
+            parsed.message = `Field "${parsed.field || 'unknown'}" is required but was not provided`;
+        }
+        else if (parsed.errorType === 'string_type') {
+            parsed.summary = `Invalid type for ${parsed.field || 'field'}: expected string, got ${parsed.inputType || 'unknown'}`;
+            parsed.message = `Expected string but received ${parsed.inputType || 'unknown type'}`;
+        }
+        else if (parsed.errorType === 'unexpected_keyword_argument') {
+            parsed.summary = `Unexpected field: ${parsed.field || 'unknown'}`;
+            parsed.message = `Field "${parsed.field || 'unknown'}" is not allowed in the input schema`;
+        }
+        else {
+            // Generic error
+            const firstLine = errorMessage.split('\n')[0];
+            parsed.summary = firstLine || errorMessage;
+            parsed.message = errorMessage;
+        }
+        return parsed;
+    }
+    /**
+     * Match actual result against test expectation.
+     *
+     * Without an expectation (or without an `error` / `success: false` entry in
+     * it) the call must have succeeded. With `success: false` any error is
+     * accepted. With an `error` entry the call must have failed and every
+     * criterion that is present on both sides (type, code, details) must agree;
+     * a criterion is skipped when either the expected or the actual value is
+     * missing.
+     *
+     * @param expectation - Expected result; falsy means "expect success"
+     * @param actualOutcome - Actual outcome, compared against 'success' / 'error'
+     * @param actualErrorCode - Actual error code, if any (compared trimmed, case-insensitively)
+     * @param actualErrorType - Actual error type, if any (compared case-insensitively)
+     * @param error - Actual error, forwarded to matchExpectationDetails when details are expected
+     * @returns true when the actual result satisfies the expectation
+     */
+    matchExpectation(expectation, actualOutcome, actualErrorCode, actualErrorType, error) {
+        // No expectation means expect success by default
+        if (!expectation) {
+            return actualOutcome === 'success';
+        }
+        const expectedError = expectation.error;
+        if (!expectedError) {
+            // `success: false` asks for an error; anything else expects success
+            const wantedOutcome = expectation.success === false ? 'error' : 'success';
+            return actualOutcome === wantedOutcome;
+        }
+        // An error expectation can only be met by an error
+        if (actualOutcome !== 'error') {
+            return false;
+        }
+        // Match by type first (most important for developer-friendly matching)
+        if (expectedError.type && actualErrorType) {
+            const expectedType = String(expectedError.type).toLowerCase();
+            const actualType = String(actualErrorType).toLowerCase();
+            // Accepted actual types per expected type. A Map is used because the
+            // key comes from the test definition: a plain object lookup would
+            // resolve names such as "constructor" or "__proto__" through
+            // Object.prototype and hand back a non-array.
+            const typeAliases = new Map([
+                ['input_validation', ['input_validation']],
+                ['output_validation', ['output_validation']],
+                ['execution_error', ['execution_error', 'unknown']],
+                ['side_effect', ['side_effect']],
+                ['output_explosion', ['output_explosion']],
+                ['unbounded_execution', ['unbounded_execution', 'timeout']],
+            ]);
+            const acceptedTypes = typeAliases.get(expectedType) || [expectedType];
+            // Substring match: the actual type only has to contain an accepted name
+            const typeMatches = acceptedTypes.some(accepted => actualType.includes(accepted));
+            if (!typeMatches) {
+                return false;
+            }
+        }
+        // Match error code if specified (optional - for backward compatibility)
+        if (expectedError.code && actualErrorCode) {
+            const expectedCode = String(expectedError.code).trim().toUpperCase();
+            const actualCode = String(actualErrorCode).trim().toUpperCase();
+            if (expectedCode !== actualCode) {
+                return false;
+            }
+        }
+        // Match error details if specified (most specific matching)
+        if (expectedError.details && error) {
+            if (!this.matchExpectationDetails(expectedError.details, error)) {
+                return false;
+            }
+        }
+        // Every criterion that could be compared agreed
+        return true;
+    }
+    /**
+     * Match expectation details against actual error.
+     *
+     * The error message is parsed with parseValidationError and each detail
+     * that is present in the expectation is compared against the parsed
+     * values; details that are absent (falsy) are not checked.
+     *
+     * @param expectedDetails - Expected details (`error_type`, `field`, `expected`, `received`)
+     * @param error - Actual error; its `message` is parsed and searched
+     * @returns true when every specified detail agrees with the actual error
+     */
+    matchExpectationDetails(expectedDetails, error) {
+        // Nothing specified, nothing to disprove
+        if (!expectedDetails) {
+            return true;
+        }
+        const actual = this.parseValidationError(error.message);
+        // Checks run lazily and in order; the first failing one ends the match
+        const checks = [
+            // error_type must equal the parsed error type
+            () => !expectedDetails.error_type ||
+                expectedDetails.error_type === actual.errorType,
+            // field must equal the parsed field name
+            () => !expectedDetails.field || expectedDetails.field === actual.field,
+            // expected is a case-insensitive substring search over the raw message
+            () => {
+                if (!expectedDetails.expected) {
+                    return true;
+                }
+                const needle = String(expectedDetails.expected).toLowerCase();
+                return error.message.toLowerCase().includes(needle);
+            },
+            // received must equal the parsed input type
+            () => !expectedDetails.received ||
+                expectedDetails.received === actual.inputType,
+        ];
+        return checks.every(check => check());
+    }
+    /**
+     * Resolve schema by name from JSON Schema $defs.
+     *
+     * Schema names in contracts are string references to named schemas defined in the
+     * tool's schema $defs section (e.g., "Username", "UserResponse").
+     *
+     * This function looks up the named schema from the root schema's $defs dictionary.
+     * If the schema name is not found in $defs, it falls back to the defaultSchema.
+     *
+     * @param schemaName - Schema name to resolve (e.g., "Username")
+     * @param defaultSchema - The root schema containing $defs (e.g., tool outputSchema)
+     * @returns The resolved schema from $defs, or defaultSchema if not found
+     */
+    resolveSchemaByName(schemaName, defaultSchema) {
+        // Check if defaultSchema is an object with $defs
+        if (defaultSchema &&
+            typeof defaultSchema === 'object' &&
+            !Array.isArray(defaultSchema)) {
+            const schema = defaultSchema;
+            // Look for $defs (JSON Schema 2020-12) or definitions (JSON Schema draft-07)
+            const defs = ('$defs' in schema ? schema.$defs : undefined) ||
+                ('definitions' in schema ? schema.definitions : undefined);
+            if (defs && typeof defs === 'object' && !Array.isArray(defs)) {
+                const defsDict = defs;
+                // Look up the schema by name in $defs
+                if (schemaName in defsDict) {
+                    const resolvedSchema = defsDict[schemaName];
+                    // Return the resolved schema, merging with any base schema context if needed
+                    return resolvedSchema;
+                }
+            }
+        }
+        // Fallback to defaultSchema if schema name not found in $defs
+        // This handles cases where schemaName refers to the root schema itself
+        // or when $defs doesn't exist
+        return defaultSchema;
+    }
+}
+//# sourceMappingURL=orchestrator.js.map