ppef 1.0.0 → 1.1.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/README.md +172 -0
- package/bin/ppef.mjs +20 -0
- package/dist/__tests__/framework-pipeline.integration.test.d.ts +7 -0
- package/dist/__tests__/framework-pipeline.integration.test.d.ts.map +1 -0
- package/dist/__tests__/framework-pipeline.integration.test.js +415 -0
- package/dist/__tests__/framework-pipeline.integration.test.js.map +1 -0
- package/dist/__tests__/index-exports.unit.test.d.ts +8 -0
- package/dist/__tests__/index-exports.unit.test.d.ts.map +1 -0
- package/dist/__tests__/index-exports.unit.test.js +127 -0
- package/dist/__tests__/index-exports.unit.test.js.map +1 -0
- package/dist/__tests__/registry-executor.integration.test.d.ts +5 -0
- package/dist/__tests__/registry-executor.integration.test.d.ts.map +1 -0
- package/dist/__tests__/registry-executor.integration.test.js +352 -0
- package/dist/__tests__/registry-executor.integration.test.js.map +1 -0
- package/dist/__tests__/test-helpers.d.ts +94 -0
- package/dist/__tests__/test-helpers.d.ts.map +1 -0
- package/dist/__tests__/test-helpers.js +271 -0
- package/dist/__tests__/test-helpers.js.map +1 -0
- package/dist/aggregation/__tests__/aggregators.unit.test.d.ts +7 -0
- package/dist/aggregation/__tests__/aggregators.unit.test.d.ts.map +1 -0
- package/dist/aggregation/__tests__/aggregators.unit.test.js +350 -0
- package/dist/aggregation/__tests__/aggregators.unit.test.js.map +1 -0
- package/dist/aggregation/__tests__/pipeline.unit.test.d.ts +7 -0
- package/dist/aggregation/__tests__/pipeline.unit.test.d.ts.map +1 -0
- package/dist/aggregation/__tests__/pipeline.unit.test.js +213 -0
- package/dist/aggregation/__tests__/pipeline.unit.test.js.map +1 -0
- package/dist/aggregation/aggregators.d.ts +63 -0
- package/dist/aggregation/aggregators.d.ts.map +1 -0
- package/dist/aggregation/aggregators.js +228 -0
- package/dist/aggregation/aggregators.js.map +1 -0
- package/dist/aggregation/index.d.ts +8 -0
- package/dist/aggregation/index.d.ts.map +1 -0
- package/dist/aggregation/index.js +8 -0
- package/dist/aggregation/index.js.map +1 -0
- package/dist/aggregation/pipeline.d.ts +38 -0
- package/dist/aggregation/pipeline.d.ts.map +1 -0
- package/dist/aggregation/pipeline.js +198 -0
- package/dist/aggregation/pipeline.js.map +1 -0
- package/dist/claims/__tests__/evaluator.unit.test.d.ts +12 -0
- package/dist/claims/__tests__/evaluator.unit.test.d.ts.map +1 -0
- package/dist/claims/__tests__/evaluator.unit.test.js +801 -0
- package/dist/claims/__tests__/evaluator.unit.test.js.map +1 -0
- package/dist/claims/evaluator.d.ts +33 -0
- package/dist/claims/evaluator.d.ts.map +1 -0
- package/dist/claims/evaluator.js +174 -0
- package/dist/claims/evaluator.js.map +1 -0
- package/dist/claims/index.d.ts +7 -0
- package/dist/claims/index.d.ts.map +1 -0
- package/dist/claims/index.js +7 -0
- package/dist/claims/index.js.map +1 -0
- package/dist/cli/__tests__/aggregate.command.unit.test.d.ts +7 -0
- package/dist/cli/__tests__/aggregate.command.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/aggregate.command.unit.test.js +396 -0
- package/dist/cli/__tests__/aggregate.command.unit.test.js.map +1 -0
- package/dist/cli/__tests__/commands.unit.test.d.ts +10 -0
- package/dist/cli/__tests__/commands.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/commands.unit.test.js +217 -0
- package/dist/cli/__tests__/commands.unit.test.js.map +1 -0
- package/dist/cli/__tests__/index.unit.test.d.ts +10 -0
- package/dist/cli/__tests__/index.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/index.unit.test.js +65 -0
- package/dist/cli/__tests__/index.unit.test.js.map +1 -0
- package/dist/cli/__tests__/logger.unit.test.d.ts +11 -0
- package/dist/cli/__tests__/logger.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/logger.unit.test.js +180 -0
- package/dist/cli/__tests__/logger.unit.test.js.map +1 -0
- package/dist/cli/__tests__/module-loader.unit.test.d.ts +11 -0
- package/dist/cli/__tests__/module-loader.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/module-loader.unit.test.js +262 -0
- package/dist/cli/__tests__/module-loader.unit.test.js.map +1 -0
- package/dist/cli/__tests__/output-writer.unit.test.d.ts +10 -0
- package/dist/cli/__tests__/output-writer.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/output-writer.unit.test.js +216 -0
- package/dist/cli/__tests__/output-writer.unit.test.js.map +1 -0
- package/dist/cli/__tests__/plan.command.unit.test.d.ts +7 -0
- package/dist/cli/__tests__/plan.command.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/plan.command.unit.test.js +289 -0
- package/dist/cli/__tests__/plan.command.unit.test.js.map +1 -0
- package/dist/cli/__tests__/run.command.unit.test.d.ts +7 -0
- package/dist/cli/__tests__/run.command.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/run.command.unit.test.js +422 -0
- package/dist/cli/__tests__/run.command.unit.test.js.map +1 -0
- package/dist/cli/__tests__/validate.command.unit.test.d.ts +7 -0
- package/dist/cli/__tests__/validate.command.unit.test.d.ts.map +1 -0
- package/dist/cli/__tests__/validate.command.unit.test.js +226 -0
- package/dist/cli/__tests__/validate.command.unit.test.js.map +1 -0
- package/dist/cli/command-deps.d.ts +125 -0
- package/dist/cli/command-deps.d.ts.map +1 -0
- package/dist/cli/command-deps.js +7 -0
- package/dist/cli/command-deps.js.map +1 -0
- package/dist/cli/commands/aggregate.d.ts +35 -0
- package/dist/cli/commands/aggregate.d.ts.map +1 -0
- package/dist/cli/commands/aggregate.js +121 -0
- package/dist/cli/commands/aggregate.js.map +1 -0
- package/dist/cli/commands/plan.d.ts +36 -0
- package/dist/cli/commands/plan.d.ts.map +1 -0
- package/dist/cli/commands/plan.js +109 -0
- package/dist/cli/commands/plan.js.map +1 -0
- package/dist/cli/commands/run.d.ts +33 -0
- package/dist/cli/commands/run.d.ts.map +1 -0
- package/dist/cli/commands/run.js +185 -0
- package/dist/cli/commands/run.js.map +1 -0
- package/dist/cli/commands/validate.d.ts +27 -0
- package/dist/cli/commands/validate.d.ts.map +1 -0
- package/dist/cli/commands/validate.js +88 -0
- package/dist/cli/commands/validate.js.map +1 -0
- package/dist/cli/config-loader.d.ts +30 -0
- package/dist/cli/config-loader.d.ts.map +1 -0
- package/dist/cli/config-loader.js +181 -0
- package/dist/cli/config-loader.js.map +1 -0
- package/dist/cli/index.d.ts +26 -0
- package/dist/cli/index.d.ts.map +1 -0
- package/dist/cli/index.js +58 -0
- package/dist/cli/index.js.map +1 -0
- package/dist/cli/logger.d.ts +75 -0
- package/dist/cli/logger.d.ts.map +1 -0
- package/dist/cli/logger.js +131 -0
- package/dist/cli/logger.js.map +1 -0
- package/dist/cli/module-loader.d.ts +46 -0
- package/dist/cli/module-loader.d.ts.map +1 -0
- package/dist/cli/module-loader.js +116 -0
- package/dist/cli/module-loader.js.map +1 -0
- package/dist/cli/output-writer.d.ts +51 -0
- package/dist/cli/output-writer.d.ts.map +1 -0
- package/dist/cli/output-writer.js +65 -0
- package/dist/cli/output-writer.js.map +1 -0
- package/dist/cli/types.d.ts +174 -0
- package/dist/cli/types.d.ts.map +1 -0
- package/dist/cli/types.js +7 -0
- package/dist/cli/types.js.map +1 -0
- package/dist/collector/__tests__/result-collector.unit.test.d.ts +7 -0
- package/dist/collector/__tests__/result-collector.unit.test.d.ts.map +1 -0
- package/dist/collector/__tests__/result-collector.unit.test.js +1021 -0
- package/dist/collector/__tests__/result-collector.unit.test.js.map +1 -0
- package/dist/collector/__tests__/schema.unit.test.d.ts +7 -0
- package/dist/collector/__tests__/schema.unit.test.d.ts.map +1 -0
- package/dist/collector/__tests__/schema.unit.test.js +360 -0
- package/dist/collector/__tests__/schema.unit.test.js.map +1 -0
- package/dist/collector/index.d.ts +8 -0
- package/dist/collector/index.d.ts.map +1 -0
- package/dist/collector/index.js +8 -0
- package/dist/collector/index.js.map +1 -0
- package/dist/collector/result-collector.d.ts +159 -0
- package/dist/collector/result-collector.d.ts.map +1 -0
- package/dist/collector/result-collector.js +213 -0
- package/dist/collector/result-collector.js.map +1 -0
- package/dist/collector/schema.d.ts +34 -0
- package/dist/collector/schema.d.ts.map +1 -0
- package/dist/collector/schema.js +145 -0
- package/dist/collector/schema.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-hash-bug.diagnostic.test.d.ts +10 -0
- package/dist/executor/__tests__/checkpoint-hash-bug.diagnostic.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-hash-bug.diagnostic.test.js +122 -0
- package/dist/executor/__tests__/checkpoint-hash-bug.diagnostic.test.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-manager.integration.test.d.ts +7 -0
- package/dist/executor/__tests__/checkpoint-manager.integration.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-manager.integration.test.js +330 -0
- package/dist/executor/__tests__/checkpoint-manager.integration.test.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-manager.unit.test.d.ts +7 -0
- package/dist/executor/__tests__/checkpoint-manager.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-manager.unit.test.js +531 -0
- package/dist/executor/__tests__/checkpoint-manager.unit.test.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.diagnostic.test.d.ts +8 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.diagnostic.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.diagnostic.test.js +493 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.diagnostic.test.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.unit.test.d.ts +8 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.unit.test.js +164 -0
- package/dist/executor/__tests__/checkpoint-merge-bug.unit.test.js.map +1 -0
- package/dist/executor/__tests__/checkpoint-storage.unit.test.d.ts +7 -0
- package/dist/executor/__tests__/checkpoint-storage.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/checkpoint-storage.unit.test.js +490 -0
- package/dist/executor/__tests__/checkpoint-storage.unit.test.js.map +1 -0
- package/dist/executor/__tests__/executor.unit.test.d.ts +7 -0
- package/dist/executor/__tests__/executor.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/executor.unit.test.js +202 -0
- package/dist/executor/__tests__/executor.unit.test.js.map +1 -0
- package/dist/executor/__tests__/memory-monitor.unit.test.d.ts +7 -0
- package/dist/executor/__tests__/memory-monitor.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/memory-monitor.unit.test.js +285 -0
- package/dist/executor/__tests__/memory-monitor.unit.test.js.map +1 -0
- package/dist/executor/__tests__/parallel-checkpoint-merge.integration.test.d.ts +12 -0
- package/dist/executor/__tests__/parallel-checkpoint-merge.integration.test.d.ts.map +1 -0
- package/dist/executor/__tests__/parallel-checkpoint-merge.integration.test.js +196 -0
- package/dist/executor/__tests__/parallel-checkpoint-merge.integration.test.js.map +1 -0
- package/dist/executor/__tests__/parallel-executor.integration.test.d.ts +7 -0
- package/dist/executor/__tests__/parallel-executor.integration.test.d.ts.map +1 -0
- package/dist/executor/__tests__/parallel-executor.integration.test.js +249 -0
- package/dist/executor/__tests__/parallel-executor.integration.test.js.map +1 -0
- package/dist/executor/__tests__/parallel-executor.unit.test.d.ts +8 -0
- package/dist/executor/__tests__/parallel-executor.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/parallel-executor.unit.test.js +473 -0
- package/dist/executor/__tests__/parallel-executor.unit.test.js.map +1 -0
- package/dist/executor/__tests__/run-id.unit.test.d.ts +8 -0
- package/dist/executor/__tests__/run-id.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/run-id.unit.test.js +156 -0
- package/dist/executor/__tests__/run-id.unit.test.js.map +1 -0
- package/dist/executor/__tests__/worker-entry.integration.test.d.ts +24 -0
- package/dist/executor/__tests__/worker-entry.integration.test.d.ts.map +1 -0
- package/dist/executor/__tests__/worker-entry.integration.test.js +82 -0
- package/dist/executor/__tests__/worker-entry.integration.test.js.map +1 -0
- package/dist/executor/__tests__/worker-entry.unit.test.d.ts +7 -0
- package/dist/executor/__tests__/worker-entry.unit.test.d.ts.map +1 -0
- package/dist/executor/__tests__/worker-entry.unit.test.js +364 -0
- package/dist/executor/__tests__/worker-entry.unit.test.js.map +1 -0
- package/dist/executor/checkpoint-manager.d.ts +231 -0
- package/dist/executor/checkpoint-manager.d.ts.map +1 -0
- package/dist/executor/checkpoint-manager.js +395 -0
- package/dist/executor/checkpoint-manager.js.map +1 -0
- package/dist/executor/checkpoint-storage.d.ts +230 -0
- package/dist/executor/checkpoint-storage.d.ts.map +1 -0
- package/dist/executor/checkpoint-storage.js +370 -0
- package/dist/executor/checkpoint-storage.js.map +1 -0
- package/dist/executor/checkpoint-types.d.ts +48 -0
- package/dist/executor/checkpoint-types.d.ts.map +1 -0
- package/dist/executor/checkpoint-types.js +8 -0
- package/dist/executor/checkpoint-types.js.map +1 -0
- package/dist/executor/executor.d.ts +164 -0
- package/dist/executor/executor.d.ts.map +1 -0
- package/dist/executor/executor.js +408 -0
- package/dist/executor/executor.js.map +1 -0
- package/dist/executor/index.d.ts +11 -0
- package/dist/executor/index.d.ts.map +1 -0
- package/dist/executor/index.js +11 -0
- package/dist/executor/index.js.map +1 -0
- package/dist/executor/memory-monitor.d.ts +115 -0
- package/dist/executor/memory-monitor.d.ts.map +1 -0
- package/dist/executor/memory-monitor.js +168 -0
- package/dist/executor/memory-monitor.js.map +1 -0
- package/dist/executor/parallel-executor.d.ts +239 -0
- package/dist/executor/parallel-executor.d.ts.map +1 -0
- package/dist/executor/parallel-executor.js +329 -0
- package/dist/executor/parallel-executor.js.map +1 -0
- package/dist/executor/run-id.d.ts +71 -0
- package/dist/executor/run-id.d.ts.map +1 -0
- package/dist/executor/run-id.js +74 -0
- package/dist/executor/run-id.js.map +1 -0
- package/dist/executor/worker-entry.d.ts +10 -0
- package/dist/executor/worker-entry.d.ts.map +1 -0
- package/dist/executor/worker-entry.js +42 -0
- package/dist/executor/worker-entry.js.map +1 -0
- package/dist/executor/worker-executor.d.ts +156 -0
- package/dist/executor/worker-executor.d.ts.map +1 -0
- package/dist/executor/worker-executor.js +88 -0
- package/dist/executor/worker-executor.js.map +1 -0
- package/dist/index.cjs +11 -0
- package/dist/index.d.ts +15 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +24 -0
- package/dist/index.js.map +1 -0
- package/dist/registry/case-registry.d.ts +113 -0
- package/dist/registry/case-registry.d.ts.map +1 -0
- package/dist/registry/case-registry.js +160 -0
- package/dist/registry/case-registry.js.map +1 -0
- package/dist/registry/index.d.ts +8 -0
- package/dist/registry/index.d.ts.map +1 -0
- package/dist/registry/index.js +8 -0
- package/dist/registry/index.js.map +1 -0
- package/dist/registry/sut-registry.d.ts +96 -0
- package/dist/registry/sut-registry.d.ts.map +1 -0
- package/dist/registry/sut-registry.js +126 -0
- package/dist/registry/sut-registry.js.map +1 -0
- package/dist/renderers/index.d.ts +10 -0
- package/dist/renderers/index.d.ts.map +1 -0
- package/dist/renderers/index.js +9 -0
- package/dist/renderers/index.js.map +1 -0
- package/dist/renderers/latex-renderer.d.ts +84 -0
- package/dist/renderers/latex-renderer.d.ts.map +1 -0
- package/dist/renderers/latex-renderer.js +208 -0
- package/dist/renderers/latex-renderer.js.map +1 -0
- package/dist/renderers/types.d.ts +106 -0
- package/dist/renderers/types.d.ts.map +1 -0
- package/dist/renderers/types.js +23 -0
- package/dist/renderers/types.js.map +1 -0
- package/dist/robustness/__tests__/analyzer.unit.test.d.ts +11 -0
- package/dist/robustness/__tests__/analyzer.unit.test.d.ts.map +1 -0
- package/dist/robustness/__tests__/analyzer.unit.test.js +455 -0
- package/dist/robustness/__tests__/analyzer.unit.test.js.map +1 -0
- package/dist/robustness/__tests__/perturbations.unit.test.d.ts +11 -0
- package/dist/robustness/__tests__/perturbations.unit.test.d.ts.map +1 -0
- package/dist/robustness/__tests__/perturbations.unit.test.js +284 -0
- package/dist/robustness/__tests__/perturbations.unit.test.js.map +1 -0
- package/dist/robustness/analyzer.d.ts +61 -0
- package/dist/robustness/analyzer.d.ts.map +1 -0
- package/dist/robustness/analyzer.js +191 -0
- package/dist/robustness/analyzer.js.map +1 -0
- package/dist/robustness/index.d.ts +8 -0
- package/dist/robustness/index.d.ts.map +1 -0
- package/dist/robustness/index.js +8 -0
- package/dist/robustness/index.js.map +1 -0
- package/dist/robustness/perturbations.d.ts +46 -0
- package/dist/robustness/perturbations.d.ts.map +1 -0
- package/dist/robustness/perturbations.js +184 -0
- package/dist/robustness/perturbations.js.map +1 -0
- package/dist/statistical/__tests__/mann-whitney-u.unit.test.d.ts +7 -0
- package/dist/statistical/__tests__/mann-whitney-u.unit.test.d.ts.map +1 -0
- package/dist/statistical/__tests__/mann-whitney-u.unit.test.js +185 -0
- package/dist/statistical/__tests__/mann-whitney-u.unit.test.js.map +1 -0
- package/dist/statistical/index.d.ts +8 -0
- package/dist/statistical/index.d.ts.map +1 -0
- package/dist/statistical/index.js +8 -0
- package/dist/statistical/index.js.map +1 -0
- package/dist/statistical/mann-whitney-u.d.ts +62 -0
- package/dist/statistical/mann-whitney-u.d.ts.map +1 -0
- package/dist/statistical/mann-whitney-u.js +127 -0
- package/dist/statistical/mann-whitney-u.js.map +1 -0
- package/dist/types/aggregate.d.ts +124 -0
- package/dist/types/aggregate.d.ts.map +1 -0
- package/dist/types/aggregate.js +9 -0
- package/dist/types/aggregate.js.map +1 -0
- package/dist/types/case.d.ts +105 -0
- package/dist/types/case.d.ts.map +1 -0
- package/dist/types/case.js +10 -0
- package/dist/types/case.js.map +1 -0
- package/dist/types/claims.d.ts +122 -0
- package/dist/types/claims.d.ts.map +1 -0
- package/dist/types/claims.js +14 -0
- package/dist/types/claims.js.map +1 -0
- package/dist/types/index.d.ts +12 -0
- package/dist/types/index.d.ts.map +1 -0
- package/dist/types/index.js +7 -0
- package/dist/types/index.js.map +1 -0
- package/dist/types/perturbation.d.ts +105 -0
- package/dist/types/perturbation.d.ts.map +1 -0
- package/dist/types/perturbation.js +9 -0
- package/dist/types/perturbation.js.map +1 -0
- package/dist/types/result.d.ts +150 -0
- package/dist/types/result.d.ts.map +1 -0
- package/dist/types/result.js +12 -0
- package/dist/types/result.js.map +1 -0
- package/dist/types/sut.d.ts +128 -0
- package/dist/types/sut.d.ts.map +1 -0
- package/dist/types/sut.js +12 -0
- package/dist/types/sut.js.map +1 -0
- package/package.json +290 -7
|
@@ -0,0 +1,150 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Evaluation Result Type Definitions
|
|
3
|
+
*
|
|
4
|
+
* The canonical schema for individual evaluation results. Each result
|
|
5
|
+
* captures everything needed for reproducibility and auditing:
|
|
6
|
+
* - Deterministic run identity
|
|
7
|
+
* - Correctness assessment
|
|
8
|
+
* - Output artefacts and metrics
|
|
9
|
+
* - Provenance information
|
|
10
|
+
*/
|
|
11
|
+
import type { ArtefactReference, Primitive } from "./case.js";
|
|
12
|
+
import type { SutRole } from "./sut.js";
|
|
13
|
+
/**
|
|
14
|
+
* Categories of evaluation failure.
|
|
15
|
+
*/
|
|
16
|
+
export type FailureType = "no_output" | "invalid_structure" | "constraint_violation" | "exception" | "oracle_mismatch" | "timeout";
|
|
17
|
+
/**
|
|
18
|
+
* Run identity and context.
|
|
19
|
+
*/
|
|
20
|
+
export interface RunContext {
|
|
21
|
+
/** Deterministic run ID (hash of inputs) */
|
|
22
|
+
runId: string;
|
|
23
|
+
/** SUT identifier */
|
|
24
|
+
sut: string;
|
|
25
|
+
/** SUT role (primary/baseline/oracle) */
|
|
26
|
+
sutRole: SutRole;
|
|
27
|
+
/** SUT version for reproducibility */
|
|
28
|
+
sutVersion?: string;
|
|
29
|
+
/** Case identifier */
|
|
30
|
+
caseId: string;
|
|
31
|
+
/** Case class for grouping */
|
|
32
|
+
caseClass?: string;
|
|
33
|
+
/** Configuration overrides for this run */
|
|
34
|
+
config?: Record<string, Primitive>;
|
|
35
|
+
/** Random seed if applicable */
|
|
36
|
+
seed?: number;
|
|
37
|
+
/** Repetition number for statistical runs */
|
|
38
|
+
repetition?: number;
|
|
39
|
+
}
|
|
40
|
+
/**
|
|
41
|
+
* Correctness assessment.
|
|
42
|
+
*/
|
|
43
|
+
export interface CorrectnessResult {
|
|
44
|
+
/** Whether expected output exists (oracle available) */
|
|
45
|
+
expectedExists: boolean;
|
|
46
|
+
/** Whether the SUT produced any output */
|
|
47
|
+
producedOutput: boolean;
|
|
48
|
+
/** Whether output is structurally valid */
|
|
49
|
+
valid: boolean;
|
|
50
|
+
/** Whether output matches expected (null if no oracle) */
|
|
51
|
+
matchesExpected: boolean | null;
|
|
52
|
+
/** Failure classification if applicable */
|
|
53
|
+
failureType?: FailureType;
|
|
54
|
+
/** Human-readable failure notes */
|
|
55
|
+
notes?: string[];
|
|
56
|
+
}
|
|
57
|
+
/**
|
|
58
|
+
* A ranked item for ranking tasks.
|
|
59
|
+
*/
|
|
60
|
+
export interface RankedItem {
|
|
61
|
+
/** Item identifier */
|
|
62
|
+
itemId: string;
|
|
63
|
+
/** Score or rank value */
|
|
64
|
+
score: number;
|
|
65
|
+
/** Optional additional metadata */
|
|
66
|
+
metadata?: Record<string, Primitive>;
|
|
67
|
+
}
|
|
68
|
+
/**
|
|
69
|
+
* Output artefacts and summaries.
|
|
70
|
+
*/
|
|
71
|
+
export interface ResultOutputs {
|
|
72
|
+
/** Summary values keyed by name (each a single primitive or an array of primitives) */
|
|
73
|
+
summary?: Record<string, Primitive | Primitive[]>;
|
|
74
|
+
/** Classification labels */
|
|
75
|
+
labels?: Record<string, Primitive>;
|
|
76
|
+
/** Ranking results */
|
|
77
|
+
ranking?: RankedItem[];
|
|
78
|
+
/** References to generated artefacts */
|
|
79
|
+
artefacts?: ArtefactReference[];
|
|
80
|
+
/** Additional untyped outputs */
|
|
81
|
+
extra?: Record<string, unknown>;
|
|
82
|
+
}
|
|
83
|
+
/**
|
|
84
|
+
* Numeric metrics collected during evaluation.
|
|
85
|
+
*/
|
|
86
|
+
export interface ResultMetrics {
|
|
87
|
+
/** Primary numeric metrics */
|
|
88
|
+
numeric: Record<string, number>;
|
|
89
|
+
/** Additional numeric metrics kept separate from the primary set */
|
|
90
|
+
extra?: Record<string, number>;
|
|
91
|
+
}
|
|
92
|
+
/**
|
|
93
|
+
* Provenance information for reproducibility.
|
|
94
|
+
*/
|
|
95
|
+
export interface Provenance {
|
|
96
|
+
/** Execution environment */
|
|
97
|
+
runtime: {
|
|
98
|
+
platform: string;
|
|
99
|
+
arch: string;
|
|
100
|
+
nodeVersion: string;
|
|
101
|
+
};
|
|
102
|
+
/** Git commit hash */
|
|
103
|
+
gitCommit?: string;
|
|
104
|
+
/** Whether working directory had uncommitted changes */
|
|
105
|
+
dirty?: boolean;
|
|
106
|
+
/** Hash of package-lock.json for dependency pinning */
|
|
107
|
+
dependencyLockHash?: string;
|
|
108
|
+
/** Parent run IDs (for derived results) */
|
|
109
|
+
parentRunIds?: string[];
|
|
110
|
+
/** Execution timestamp */
|
|
111
|
+
timestamp?: string;
|
|
112
|
+
/** Wall-clock execution time in milliseconds */
|
|
113
|
+
executionTimeMs?: number;
|
|
114
|
+
/** Peak memory usage during execution (bytes) */
|
|
115
|
+
peakMemoryBytes?: number;
|
|
116
|
+
/** Memory usage at completion (bytes) */
|
|
117
|
+
finalMemoryBytes?: number;
|
|
118
|
+
}
|
|
119
|
+
/**
|
|
120
|
+
* Complete evaluation result.
|
|
121
|
+
*
|
|
122
|
+
* This is the canonical schema for all evaluation outputs. Every experiment
|
|
123
|
+
* produces results in this format for consistent aggregation and rendering.
|
|
124
|
+
*/
|
|
125
|
+
export interface EvaluationResult {
|
|
126
|
+
/** Run identity and context */
|
|
127
|
+
run: RunContext;
|
|
128
|
+
/** Correctness assessment */
|
|
129
|
+
correctness: CorrectnessResult;
|
|
130
|
+
/** Output artefacts and summaries */
|
|
131
|
+
outputs: ResultOutputs;
|
|
132
|
+
/** Numeric metrics */
|
|
133
|
+
metrics: ResultMetrics;
|
|
134
|
+
/** Provenance for reproducibility */
|
|
135
|
+
provenance: Provenance;
|
|
136
|
+
}
|
|
137
|
+
/**
|
|
138
|
+
* Batch of evaluation results.
|
|
139
|
+
*/
|
|
140
|
+
export interface ResultBatch {
|
|
141
|
+
/** Schema version */
|
|
142
|
+
version: string;
|
|
143
|
+
/** Generation timestamp */
|
|
144
|
+
timestamp: string;
|
|
145
|
+
/** All results in this batch */
|
|
146
|
+
results: EvaluationResult[];
|
|
147
|
+
/** Optional batch-level metadata */
|
|
148
|
+
metadata?: Record<string, Primitive>;
|
|
149
|
+
}
|
|
150
|
+
//# sourceMappingURL=result.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"result.d.ts","sourceRoot":"","sources":["../../src/types/result.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG;AAEH,OAAO,KAAK,EAAE,iBAAiB,EAAE,SAAS,EAAE,MAAM,WAAW,CAAC;AAC9D,OAAO,KAAK,EAAE,OAAO,EAAE,MAAM,UAAU,CAAC;AAExC;;GAEG;AACH,MAAM,MAAM,WAAW,GACpB,WAAW,GACX,mBAAmB,GACnB,sBAAsB,GACtB,WAAW,GACX,iBAAiB,GACjB,SAAS,CAAC;AAEb;;GAEG;AACH,MAAM,WAAW,UAAU;IAC1B,4CAA4C;IAC5C,KAAK,EAAE,MAAM,CAAC;IAEd,qBAAqB;IACrB,GAAG,EAAE,MAAM,CAAC;IAEZ,yCAAyC;IACzC,OAAO,EAAE,OAAO,CAAC;IAEjB,sCAAsC;IACtC,UAAU,CAAC,EAAE,MAAM,CAAC;IAEpB,sBAAsB;IACtB,MAAM,EAAE,MAAM,CAAC;IAEf,8BAA8B;IAC9B,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,2CAA2C;IAC3C,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;IAEnC,gCAAgC;IAChC,IAAI,CAAC,EAAE,MAAM,CAAC;IAEd,6CAA6C;IAC7C,UAAU,CAAC,EAAE,MAAM,CAAC;CACpB;AAED;;GAEG;AACH,MAAM,WAAW,iBAAiB;IACjC,wDAAwD;IACxD,cAAc,EAAE,OAAO,CAAC;IAExB,0CAA0C;IAC1C,cAAc,EAAE,OAAO,CAAC;IAExB,2CAA2C;IAC3C,KAAK,EAAE,OAAO,CAAC;IAEf,0DAA0D;IAC1D,eAAe,EAAE,OAAO,GAAG,IAAI,CAAC;IAEhC,2CAA2C;IAC3C,WAAW,CAAC,EAAE,WAAW,CAAC;IAE1B,mCAAmC;IACnC,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;CACjB;AAED;;GAEG;AACH,MAAM,WAAW,UAAU;IAC1B,sBAAsB;IACtB,MAAM,EAAE,MAAM,CAAC;IAEf,0BAA0B;IAC1B,KAAK,EAAE,MAAM,CAAC;IAEd,mCAAmC;IACnC,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;CACrC;AAED;;GAEG;AACH,MAAM,WAAW,aAAa;IAC7B,4BAA4B;IAC5B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,SAAS,GAAG,SAAS,EAAE,CAAC,CAAC;IAElD,4BAA4B;IAC5B,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;IAEnC,sBAAsB;IACtB,OAAO,CAAC,EAAE,UAAU,EAAE,CAAC;IAEvB,wCAAwC;IACxC,SAAS,CAAC,EAAE,iBAAiB,EAAE,CAAC;IAEhC,iCAAiC;IACjC,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;CAChC;AAED;;GAEG;AACH,MAAM,WAAW,aAAa;IAC7B,8BAA8B;IAC9B,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAEhC,oCAAoC;IACpC,KAAK,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;CAC/B;AAED;;GAEG;AACH,MAAM,WAAW,UAAU;IAC1B,4BAA4B;IAC5B,OAAO,EAAE;QACR,QAAQ,EAAE,MAAM,CAAC;QACjB,IAAI,EAAE,MAAM,CAAC;QACb,WAAW,EAAE,MAAM,CAAC;KACpB,CAAC;IAEF,sBAAsB;IACtB,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,wDAAwD;IACxD,KAAK,CAA
C,EAAE,OAAO,CAAC;IAEhB,uDAAuD;IACvD,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAE5B,2CAA2C;IAC3C,YAAY,CAAC,EAAE,MAAM,EAAE,CAAC;IAExB,0BAA0B;IAC1B,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,gDAAgD;IAChD,eAAe,CAAC,EAAE,MAAM,CAAC;IAEzB,iDAAiD;IACjD,eAAe,CAAC,EAAE,MAAM,CAAC;IAEzB,yCAAyC;IACzC,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC1B;AAED;;;;;GAKG;AACH,MAAM,WAAW,gBAAgB;IAChC,+BAA+B;IAC/B,GAAG,EAAE,UAAU,CAAC;IAEhB,6BAA6B;IAC7B,WAAW,EAAE,iBAAiB,CAAC;IAE/B,qCAAqC;IACrC,OAAO,EAAE,aAAa,CAAC;IAEvB,sBAAsB;IACtB,OAAO,EAAE,aAAa,CAAC;IAEvB,qCAAqC;IACrC,UAAU,EAAE,UAAU,CAAC;CACvB;AAED;;GAEG;AACH,MAAM,WAAW,WAAW;IAC3B,qBAAqB;IACrB,OAAO,EAAE,MAAM,CAAC;IAEhB,2BAA2B;IAC3B,SAAS,EAAE,MAAM,CAAC;IAElB,gCAAgC;IAChC,OAAO,EAAE,gBAAgB,EAAE,CAAC;IAE5B,oCAAoC;IACpC,QAAQ,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,SAAS,CAAC,CAAC;CACrC"}
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Evaluation Result Type Definitions
|
|
3
|
+
*
|
|
4
|
+
* The canonical schema for individual evaluation results. Each result
|
|
5
|
+
* captures everything needed for reproducibility and auditing:
|
|
6
|
+
* - Deterministic run identity
|
|
7
|
+
* - Correctness assessment
|
|
8
|
+
* - Output artefacts and metrics
|
|
9
|
+
* - Provenance information
|
|
10
|
+
*/
|
|
11
|
+
export {};
|
|
12
|
+
//# sourceMappingURL=result.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"result.js","sourceRoot":"","sources":["../../src/types/result.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG"}
|
|
@@ -0,0 +1,128 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* System Under Test (SUT) Type Definitions
|
|
3
|
+
*
|
|
4
|
+
* SUTs represent the algorithms being evaluated. Each SUT has a role that
|
|
5
|
+
* determines how its results are interpreted during evaluation:
|
|
6
|
+
*
|
|
7
|
+
* - primary: The algorithm being proposed/evaluated (e.g., Degree-Prioritised)
|
|
8
|
+
* - baseline: Comparison algorithms (e.g., Standard BFS, Frontier-Balanced)
|
|
9
|
+
* - oracle: Ground truth provider for correctness validation
|
|
10
|
+
*/
|
|
11
|
+
/**
|
|
12
|
+
* Role of the SUT in evaluation.
|
|
13
|
+
*
|
|
14
|
+
* - `primary`: The algorithm being proposed/evaluated
|
|
15
|
+
* - `baseline`: Comparison algorithm for relative evaluation
|
|
16
|
+
* - `oracle`: Ground truth provider for correctness validation
|
|
17
|
+
*/
|
|
18
|
+
export type SutRole = "primary" | "baseline" | "oracle";
|
|
19
|
+
/**
|
|
20
|
+
* Registration information for a System Under Test.
|
|
21
|
+
*/
|
|
22
|
+
export interface SutRegistration {
|
|
23
|
+
/** Unique identifier (e.g., "degree-prioritised-v1.0.0") */
|
|
24
|
+
id: string;
|
|
25
|
+
/** Human-readable name (e.g., "Degree-Prioritised Expansion") */
|
|
26
|
+
name: string;
|
|
27
|
+
/** Version string for reproducibility */
|
|
28
|
+
version: string;
|
|
29
|
+
/** Role in evaluation */
|
|
30
|
+
role: SutRole;
|
|
31
|
+
/** Configuration parameters (immutable) */
|
|
32
|
+
config: Readonly<Record<string, unknown>>;
|
|
33
|
+
/** Searchable tags for filtering */
|
|
34
|
+
tags: readonly string[];
|
|
35
|
+
/** Optional description for documentation */
|
|
36
|
+
description?: string;
|
|
37
|
+
}
|
|
38
|
+
/**
|
|
39
|
+
* Universal SUT interface for algorithms that take inputs and produce results.
|
|
40
|
+
*
|
|
41
|
+
* This is the core abstraction - any algorithm can be evaluated if it:
|
|
42
|
+
* 1. Takes INPUTS (what it needs to run)
|
|
43
|
+
* 2. Produces OUTPUTS (what it returns)
|
|
44
|
+
* 3. Can be measured (metrics extraction)
|
|
45
|
+
*
|
|
46
|
+
* @template TInputs - The algorithm-specific inputs type
|
|
47
|
+
* @template TResult - The algorithm result type
|
|
48
|
+
*/
|
|
49
|
+
export interface SUT<TInputs, TResult> {
|
|
50
|
+
/** Unique identifier */
|
|
51
|
+
readonly id: string;
|
|
52
|
+
/** Immutable configuration */
|
|
53
|
+
readonly config: Readonly<Record<string, unknown>>;
|
|
54
|
+
/**
|
|
55
|
+
* Execute the algorithm.
|
|
56
|
+
*
|
|
57
|
+
* @param inputs - Algorithm-specific inputs
|
|
58
|
+
* @returns Promise resolving to algorithm result
|
|
59
|
+
*/
|
|
60
|
+
run(inputs: TInputs): Promise<TResult>;
|
|
61
|
+
}
|
|
62
|
+
/**
|
|
63
|
+
* Factory function type for instantiating SUTs.
|
|
64
|
+
*
|
|
65
|
+
* @template TInputs - The algorithm inputs type
|
|
66
|
+
* @template TResult - The algorithm result type
|
|
67
|
+
*/
|
|
68
|
+
export type SutFactory<TInputs, TResult> = (config?: Record<string, unknown>) => SUT<TInputs, TResult>;
|
|
69
|
+
/**
|
|
70
|
+
* Runtime instance of a SUT ready for execution.
|
|
71
|
+
* @deprecated Use SUT<TInputs, TResult> directly
|
|
72
|
+
*/
|
|
73
|
+
export interface SutInstance<TResult> {
|
|
74
|
+
/** Execute the algorithm and return results */
|
|
75
|
+
run(): Promise<TResult>;
|
|
76
|
+
}
|
|
77
|
+
/**
|
|
78
|
+
* Complete SUT definition including factory and metadata.
|
|
79
|
+
*
|
|
80
|
+
* @template TInputs - The algorithm inputs type
|
|
81
|
+
* @template TResult - The algorithm result type
|
|
82
|
+
*/
|
|
83
|
+
export interface SutDefinition<TInputs = unknown, TResult = unknown> {
|
|
84
|
+
/** Registration metadata */
|
|
85
|
+
registration: SutRegistration;
|
|
86
|
+
/** Factory for creating SUT instances */
|
|
87
|
+
factory: SutFactory<TInputs, TResult>;
|
|
88
|
+
}
|
|
89
|
+
/**
|
|
90
|
+
* Universal SUT result structure.
|
|
91
|
+
*
|
|
92
|
+
* Generic outputs allow any algorithm type to be evaluated:
|
|
93
|
+
* - Expansion: paths, nodes, edges
|
|
94
|
+
* - Ranking: ranked paths, scores
|
|
95
|
+
* - Classification: labels, confidences
|
|
96
|
+
*
|
|
97
|
+
* @template TOutputs - The outputs type (generic, not hardcoded)
|
|
98
|
+
*/
|
|
99
|
+
export interface SUTResult<TOutputs = unknown> {
|
|
100
|
+
/** Unique identifier for this run */
|
|
101
|
+
runId: string;
|
|
102
|
+
/** SUT identifier */
|
|
103
|
+
sutId: string;
|
|
104
|
+
/** SUT version */
|
|
105
|
+
sutVersion: string;
|
|
106
|
+
/** Case identifier */
|
|
107
|
+
caseId: string;
|
|
108
|
+
/** Unix timestamp of execution */
|
|
109
|
+
timestamp: number;
|
|
110
|
+
/** Execution duration in milliseconds */
|
|
111
|
+
duration: number;
|
|
112
|
+
/** Correctness assessment */
|
|
113
|
+
correctness: {
|
|
114
|
+
/** Whether an expected output was defined */
|
|
115
|
+
expectedExists: boolean;
|
|
116
|
+
/** Whether the SUT produced any output */
|
|
117
|
+
producedOutput: boolean;
|
|
118
|
+
/** Whether the output is structurally valid */
|
|
119
|
+
valid: boolean;
|
|
120
|
+
/** Whether the output matches the expected output (null if no expected output) */
|
|
121
|
+
matchesExpected: boolean | null;
|
|
122
|
+
};
|
|
123
|
+
/** SUT outputs - generic, not hardcoded to paths */
|
|
124
|
+
outputs: TOutputs;
|
|
125
|
+
/** Computed metrics */
|
|
126
|
+
metrics: Record<string, number>;
|
|
127
|
+
}
|
|
128
|
+
//# sourceMappingURL=sut.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"sut.d.ts","sourceRoot":"","sources":["../../src/types/sut.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG;AAEH;;;;;;GAMG;AACH,MAAM,MAAM,OAAO,GAAG,SAAS,GAAG,UAAU,GAAG,QAAQ,CAAC;AAExD;;GAEG;AACH,MAAM,WAAW,eAAe;IAC/B,4DAA4D;IAC5D,EAAE,EAAE,MAAM,CAAC;IAEX,iEAAiE;IACjE,IAAI,EAAE,MAAM,CAAC;IAEb,yCAAyC;IACzC,OAAO,EAAE,MAAM,CAAC;IAEhB,yBAAyB;IACzB,IAAI,EAAE,OAAO,CAAC;IAEd,2CAA2C;IAC3C,MAAM,EAAE,QAAQ,CAAC,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC,CAAC;IAE1C,oCAAoC;IACpC,IAAI,EAAE,SAAS,MAAM,EAAE,CAAC;IAExB,6CAA6C;IAC7C,WAAW,CAAC,EAAE,MAAM,CAAC;CACrB;AAED;;;;;;;;;;GAUG;AACH,MAAM,WAAW,GAAG,CAAC,OAAO,EAAE,OAAO;IACpC,wBAAwB;IACxB,QAAQ,CAAC,EAAE,EAAE,MAAM,CAAC;IAEpB,8BAA8B;IAC9B,QAAQ,CAAC,MAAM,EAAE,QAAQ,CAAC,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC,CAAC;IAEnD;;;;;OAKG;IACH,GAAG,CAAC,MAAM,EAAE,OAAO,GAAG,OAAO,CAAC,OAAO,CAAC,CAAC;CACvC;AAED;;;;;GAKG;AACH,MAAM,MAAM,UAAU,CAAC,OAAO,EAAE,OAAO,IAAI,CAC1C,MAAM,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,KAC5B,GAAG,CAAC,OAAO,EAAE,OAAO,CAAC,CAAC;AAE3B;;;GAGG;AACH,MAAM,WAAW,WAAW,CAAC,OAAO;IACnC,+CAA+C;IAC/C,GAAG,IAAI,OAAO,CAAC,OAAO,CAAC,CAAC;CACxB;AAED;;;;;GAKG;AACH,MAAM,WAAW,aAAa,CAAC,OAAO,GAAG,OAAO,EAAE,OAAO,GAAG,OAAO;IAClE,4BAA4B;IAC5B,YAAY,EAAE,eAAe,CAAC;IAE9B,yCAAyC;IACzC,OAAO,EAAE,UAAU,CAAC,OAAO,EAAE,OAAO,CAAC,CAAC;CACtC;AAED;;;;;;;;;GASG;AACH,MAAM,WAAW,SAAS,CAAC,QAAQ,GAAG,OAAO;IAC5C,qCAAqC;IACrC,KAAK,EAAE,MAAM,CAAC;IAEd,qBAAqB;IACrB,KAAK,EAAE,MAAM,CAAC;IAEd,kBAAkB;IAClB,UAAU,EAAE,MAAM,CAAC;IAEnB,sBAAsB;IACtB,MAAM,EAAE,MAAM,CAAC;IAEf,kCAAkC;IAClC,SAAS,EAAE,MAAM,CAAC;IAElB,yCAAyC;IACzC,QAAQ,EAAE,MAAM,CAAC;IAEjB,6BAA6B;IAC7B,WAAW,EAAE;QACZ,6CAA6C;QAC7C,cAAc,EAAE,OAAO,CAAC;QAExB,0CAA0C;QAC1C,cAAc,EAAE,OAAO,CAAC;QAExB,+CAA+C;QAC/C,KAAK,EAAE,OAAO,CAAC;QAEf,kFAAkF;QAClF,eAAe,EAAE,OAAO,GAAG,IAAI,CAAC;KAChC,CAAC;IAEF,oDAAoD;IACpD,OAAO,EAAE,QAAQ,CAAC;IAElB,uBAAuB;IACvB,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;CAChC"}
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* System Under Test (SUT) Type Definitions
|
|
3
|
+
*
|
|
4
|
+
* SUTs represent the algorithms being evaluated. Each SUT has a role that
|
|
5
|
+
* determines how its results are interpreted during evaluation:
|
|
6
|
+
*
|
|
7
|
+
* - primary: The algorithm being proposed/evaluated (e.g., Degree-Prioritised)
|
|
8
|
+
* - baseline: Comparison algorithms (e.g., Standard BFS, Frontier-Balanced)
|
|
9
|
+
* - oracle: Ground truth provider for correctness validation
|
|
10
|
+
*/
|
|
11
|
+
export {};
|
|
12
|
+
//# sourceMappingURL=sut.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"sut.js","sourceRoot":"","sources":["../../src/types/sut.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG"}
|
package/package.json
CHANGED
|
@@ -1,12 +1,295 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "ppef",
|
|
3
|
-
"version": "1.
|
|
4
|
-
"description": "",
|
|
5
|
-
"
|
|
3
|
+
"version": "1.1.0",
|
|
4
|
+
"description": "Portable Programmatic Evaluation Framework - Claim-driven, deterministic evaluation for experiments",
|
|
5
|
+
"type": "module",
|
|
6
|
+
"main": "dist/index.cjs",
|
|
7
|
+
"module": "dist/index.js",
|
|
8
|
+
"types": "dist/index.d.ts",
|
|
9
|
+
"bin": {
|
|
10
|
+
"ppef": "./bin/ppef.mjs"
|
|
11
|
+
},
|
|
12
|
+
"exports": {
|
|
13
|
+
".": {
|
|
14
|
+
"types": "./dist/index.d.ts",
|
|
15
|
+
"import": "./dist/index.js",
|
|
16
|
+
"require": "./dist/index.cjs"
|
|
17
|
+
},
|
|
18
|
+
"./types": {
|
|
19
|
+
"types": "./dist/types/index.d.ts",
|
|
20
|
+
"import": "./dist/types/index.js"
|
|
21
|
+
},
|
|
22
|
+
"./types/*": {
|
|
23
|
+
"types": "./dist/types/*.d.ts",
|
|
24
|
+
"import": "./dist/types/*.js"
|
|
25
|
+
},
|
|
26
|
+
"./registry": {
|
|
27
|
+
"types": "./dist/registry/index.d.ts",
|
|
28
|
+
"import": "./dist/registry/index.js"
|
|
29
|
+
},
|
|
30
|
+
"./registry/*": {
|
|
31
|
+
"types": "./dist/registry/*.d.ts",
|
|
32
|
+
"import": "./dist/registry/*.js"
|
|
33
|
+
},
|
|
34
|
+
"./executor": {
|
|
35
|
+
"types": "./dist/executor/index.d.ts",
|
|
36
|
+
"import": "./dist/executor/index.js"
|
|
37
|
+
},
|
|
38
|
+
"./executor/*": {
|
|
39
|
+
"types": "./dist/executor/*.d.ts",
|
|
40
|
+
"import": "./dist/executor/*.js"
|
|
41
|
+
},
|
|
42
|
+
"./collector": {
|
|
43
|
+
"types": "./dist/collector/index.d.ts",
|
|
44
|
+
"import": "./dist/collector/index.js"
|
|
45
|
+
},
|
|
46
|
+
"./collector/*": {
|
|
47
|
+
"types": "./dist/collector/*.d.ts",
|
|
48
|
+
"import": "./dist/collector/*.js"
|
|
49
|
+
},
|
|
50
|
+
"./statistical": {
|
|
51
|
+
"types": "./dist/statistical/index.d.ts",
|
|
52
|
+
"import": "./dist/statistical/index.js"
|
|
53
|
+
},
|
|
54
|
+
"./aggregation": {
|
|
55
|
+
"types": "./dist/aggregation/index.d.ts",
|
|
56
|
+
"import": "./dist/aggregation/index.js"
|
|
57
|
+
},
|
|
58
|
+
"./aggregation/*": {
|
|
59
|
+
"types": "./dist/aggregation/*.d.ts",
|
|
60
|
+
"import": "./dist/aggregation/*.js"
|
|
61
|
+
},
|
|
62
|
+
"./claims": {
|
|
63
|
+
"types": "./dist/claims/index.d.ts",
|
|
64
|
+
"import": "./dist/claims/index.js"
|
|
65
|
+
},
|
|
66
|
+
"./claims/*": {
|
|
67
|
+
"types": "./dist/claims/*.d.ts",
|
|
68
|
+
"import": "./dist/claims/*.js"
|
|
69
|
+
},
|
|
70
|
+
"./robustness": {
|
|
71
|
+
"types": "./dist/robustness/index.d.ts",
|
|
72
|
+
"import": "./dist/robustness/index.js"
|
|
73
|
+
},
|
|
74
|
+
"./robustness/*": {
|
|
75
|
+
"types": "./dist/robustness/*.d.ts",
|
|
76
|
+
"import": "./dist/robustness/*.js"
|
|
77
|
+
},
|
|
78
|
+
"./renderers": {
|
|
79
|
+
"types": "./dist/renderers/index.d.ts",
|
|
80
|
+
"import": "./dist/renderers/index.js"
|
|
81
|
+
},
|
|
82
|
+
"./renderers/*": {
|
|
83
|
+
"types": "./dist/renderers/*.d.ts",
|
|
84
|
+
"import": "./dist/renderers/*.js"
|
|
85
|
+
}
|
|
86
|
+
},
|
|
87
|
+
"files": [
|
|
88
|
+
"dist"
|
|
89
|
+
],
|
|
90
|
+
"sideEffects": false,
|
|
91
|
+
"engines": {
|
|
92
|
+
"node": ">=18"
|
|
93
|
+
},
|
|
94
|
+
"c8": {
|
|
95
|
+
"all": true,
|
|
96
|
+
"include": [
|
|
97
|
+
"src/**/*.ts"
|
|
98
|
+
],
|
|
99
|
+
"exclude": [
|
|
100
|
+
"src/**/*.test.ts",
|
|
101
|
+
"src/**/*.spec.ts",
|
|
102
|
+
"src/**/*.diagnostic.test.ts"
|
|
103
|
+
],
|
|
104
|
+
"reporter": [
|
|
105
|
+
"text",
|
|
106
|
+
"html",
|
|
107
|
+
"json-summary"
|
|
108
|
+
],
|
|
109
|
+
"reports-dir": "coverage"
|
|
110
|
+
},
|
|
6
111
|
"scripts": {
|
|
7
|
-
"
|
|
112
|
+
"typecheck": "tsc --noEmit",
|
|
113
|
+
"lint": "eslint 'src/**/!(__tests__)/**/*.ts' --fix",
|
|
114
|
+
"test": "c8 tsx --test src/**/*.test.ts src/**/**/*.test.ts",
|
|
115
|
+
"build": "tsc && node scripts/generate-cjs-wrapper.mjs",
|
|
116
|
+
"prepare": "husky"
|
|
117
|
+
},
|
|
118
|
+
"keywords": [
|
|
119
|
+
"evaluation",
|
|
120
|
+
"framework",
|
|
121
|
+
"testing",
|
|
122
|
+
"experiments",
|
|
123
|
+
"claims-driven"
|
|
124
|
+
],
|
|
125
|
+
"author": "Joseph Mearman",
|
|
126
|
+
"repository": {
|
|
127
|
+
"type": "git",
|
|
128
|
+
"url": "git+https://github.com/Mearman/ppef.git"
|
|
129
|
+
},
|
|
130
|
+
"release": {
|
|
131
|
+
"branches": [
|
|
132
|
+
"**"
|
|
133
|
+
],
|
|
134
|
+
"plugins": [
|
|
135
|
+
[
|
|
136
|
+
"@semantic-release/commit-analyzer",
|
|
137
|
+
{
|
|
138
|
+
"preset": "conventionalcommits",
|
|
139
|
+
"releaseRules": [
|
|
140
|
+
{
|
|
141
|
+
"type": "feat",
|
|
142
|
+
"release": "minor"
|
|
143
|
+
},
|
|
144
|
+
{
|
|
145
|
+
"type": "fix",
|
|
146
|
+
"release": "patch"
|
|
147
|
+
},
|
|
148
|
+
{
|
|
149
|
+
"type": "perf",
|
|
150
|
+
"release": "patch"
|
|
151
|
+
},
|
|
152
|
+
{
|
|
153
|
+
"type": "refactor",
|
|
154
|
+
"release": "patch"
|
|
155
|
+
},
|
|
156
|
+
{
|
|
157
|
+
"type": "docs",
|
|
158
|
+
"release": "patch"
|
|
159
|
+
},
|
|
160
|
+
{
|
|
161
|
+
"type": "style",
|
|
162
|
+
"release": "patch"
|
|
163
|
+
},
|
|
164
|
+
{
|
|
165
|
+
"type": "test",
|
|
166
|
+
"release": "patch"
|
|
167
|
+
},
|
|
168
|
+
{
|
|
169
|
+
"type": "build",
|
|
170
|
+
"release": "patch"
|
|
171
|
+
},
|
|
172
|
+
{
|
|
173
|
+
"type": "ci",
|
|
174
|
+
"release": "patch"
|
|
175
|
+
},
|
|
176
|
+
{
|
|
177
|
+
"type": "chore",
|
|
178
|
+
"release": "patch"
|
|
179
|
+
},
|
|
180
|
+
{
|
|
181
|
+
"type": "revert",
|
|
182
|
+
"release": "patch"
|
|
183
|
+
}
|
|
184
|
+
]
|
|
185
|
+
}
|
|
186
|
+
],
|
|
187
|
+
[
|
|
188
|
+
"@semantic-release/release-notes-generator",
|
|
189
|
+
{
|
|
190
|
+
"preset": "conventionalcommits",
|
|
191
|
+
"presetConfig": {
|
|
192
|
+
"types": [
|
|
193
|
+
{
|
|
194
|
+
"type": "feat",
|
|
195
|
+
"section": "Features"
|
|
196
|
+
},
|
|
197
|
+
{
|
|
198
|
+
"type": "fix",
|
|
199
|
+
"section": "Bug Fixes"
|
|
200
|
+
},
|
|
201
|
+
{
|
|
202
|
+
"type": "perf",
|
|
203
|
+
"section": "Performance Improvements"
|
|
204
|
+
},
|
|
205
|
+
{
|
|
206
|
+
"type": "refactor",
|
|
207
|
+
"section": "Code Refactoring"
|
|
208
|
+
},
|
|
209
|
+
{
|
|
210
|
+
"type": "docs",
|
|
211
|
+
"section": "Documentation"
|
|
212
|
+
},
|
|
213
|
+
{
|
|
214
|
+
"type": "style",
|
|
215
|
+
"section": "Styles"
|
|
216
|
+
},
|
|
217
|
+
{
|
|
218
|
+
"type": "test",
|
|
219
|
+
"section": "Tests"
|
|
220
|
+
},
|
|
221
|
+
{
|
|
222
|
+
"type": "build",
|
|
223
|
+
"section": "Build System"
|
|
224
|
+
},
|
|
225
|
+
{
|
|
226
|
+
"type": "ci",
|
|
227
|
+
"section": "Continuous Integration"
|
|
228
|
+
},
|
|
229
|
+
{
|
|
230
|
+
"type": "chore",
|
|
231
|
+
"section": "Chores"
|
|
232
|
+
},
|
|
233
|
+
{
|
|
234
|
+
"type": "revert",
|
|
235
|
+
"section": "Reverts"
|
|
236
|
+
}
|
|
237
|
+
]
|
|
238
|
+
}
|
|
239
|
+
}
|
|
240
|
+
],
|
|
241
|
+
"@semantic-release/changelog",
|
|
242
|
+
"@semantic-release/npm",
|
|
243
|
+
[
|
|
244
|
+
"@semantic-release/git",
|
|
245
|
+
{
|
|
246
|
+
"assets": [
|
|
247
|
+
"CHANGELOG.md",
|
|
248
|
+
"package.json"
|
|
249
|
+
],
|
|
250
|
+
"message": "chore(release): ${nextRelease.version} [skip ci]\n\n${nextRelease.notes}"
|
|
251
|
+
}
|
|
252
|
+
]
|
|
253
|
+
]
|
|
254
|
+
},
|
|
255
|
+
"lint-staged": {
|
|
256
|
+
"*.ts": [
|
|
257
|
+
"eslint --fix"
|
|
258
|
+
],
|
|
259
|
+
"*.js": [
|
|
260
|
+
"eslint --fix"
|
|
261
|
+
]
|
|
262
|
+
},
|
|
263
|
+
"devDependencies": {
|
|
264
|
+
"@commitlint/cli": "20.3.1",
|
|
265
|
+
"@commitlint/config-conventional": "20.3.1",
|
|
266
|
+
"@eslint/js": "9.39.2",
|
|
267
|
+
"@eslint/markdown": "7.5.1",
|
|
268
|
+
"@semantic-release/changelog": "6.0.3",
|
|
269
|
+
"@semantic-release/git": "10.0.1",
|
|
270
|
+
"@types/node": "25.0.10",
|
|
271
|
+
"c8": "10.1.3",
|
|
272
|
+
"eslint": "9.39.2",
|
|
273
|
+
"eslint-config-prettier": "10.1.8",
|
|
274
|
+
"@eslint-community/eslint-plugin-eslint-comments": "4.6.0",
|
|
275
|
+
"eslint-plugin-jsonc": "2.21.0",
|
|
276
|
+
"eslint-plugin-prettier": "5.5.5",
|
|
277
|
+
"husky": "9.1.7",
|
|
278
|
+
"jiti": "2.6.1",
|
|
279
|
+
"lint-staged": "16.2.7",
|
|
280
|
+
"prettier": "3.8.1",
|
|
281
|
+
"semantic-release": "25.0.2",
|
|
282
|
+
"tsx": "4.21.0",
|
|
283
|
+
"typescript": "5.9.3",
|
|
284
|
+
"typescript-eslint": "8.53.1"
|
|
285
|
+
},
|
|
286
|
+
"peerDependencies": {
|
|
287
|
+
"typescript": "5.0.0"
|
|
288
|
+
},
|
|
289
|
+
"dependencies": {
|
|
290
|
+
"commander": "^12.0.0"
|
|
8
291
|
},
|
|
9
|
-
"
|
|
10
|
-
|
|
11
|
-
|
|
292
|
+
"publishConfig": {
|
|
293
|
+
"provenance": true
|
|
294
|
+
}
|
|
12
295
|
}
|