@hasna/evals 0.1.23 → 0.1.25

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (105) hide show
  1. package/LICENSE +1 -2
  2. package/README.md +12 -13
  3. package/dist/adapters/adapters.test.d.ts +2 -0
  4. package/dist/adapters/adapters.test.d.ts.map +1 -0
  5. package/dist/adapters/anthropic-openai.test.d.ts +2 -0
  6. package/dist/adapters/anthropic-openai.test.d.ts.map +1 -0
  7. package/dist/adapters/anthropic.d.ts +4 -0
  8. package/dist/adapters/anthropic.d.ts.map +1 -0
  9. package/dist/adapters/cli.d.ts +4 -0
  10. package/dist/adapters/cli.d.ts.map +1 -0
  11. package/dist/adapters/function.d.ts +4 -0
  12. package/dist/adapters/function.d.ts.map +1 -0
  13. package/dist/adapters/http-cli-coverage.test.d.ts +2 -0
  14. package/dist/adapters/http-cli-coverage.test.d.ts.map +1 -0
  15. package/dist/adapters/http.d.ts +16 -0
  16. package/dist/adapters/http.d.ts.map +1 -0
  17. package/dist/adapters/mcp-adapter.test.d.ts +2 -0
  18. package/dist/adapters/mcp-adapter.test.d.ts.map +1 -0
  19. package/dist/adapters/mcp.d.ts +4 -0
  20. package/dist/adapters/mcp.d.ts.map +1 -0
  21. package/dist/adapters/openai.d.ts +4 -0
  22. package/dist/adapters/openai.d.ts.map +1 -0
  23. package/dist/cli/adapter-parser.d.ts +3 -0
  24. package/dist/cli/adapter-parser.d.ts.map +1 -0
  25. package/dist/cli/cli.test.d.ts +2 -0
  26. package/dist/cli/cli.test.d.ts.map +1 -0
  27. package/dist/cli/commands/calibrate.d.ts +3 -0
  28. package/dist/cli/commands/calibrate.d.ts.map +1 -0
  29. package/dist/cli/commands/capture.d.ts +3 -0
  30. package/dist/cli/commands/capture.d.ts.map +1 -0
  31. package/dist/cli/commands/ci.d.ts +3 -0
  32. package/dist/cli/commands/ci.d.ts.map +1 -0
  33. package/dist/cli/commands/compare.d.ts +5 -0
  34. package/dist/cli/commands/compare.d.ts.map +1 -0
  35. package/dist/cli/commands/compare.test.d.ts +2 -0
  36. package/dist/cli/commands/compare.test.d.ts.map +1 -0
  37. package/dist/cli/commands/completion.d.ts +3 -0
  38. package/dist/cli/commands/completion.d.ts.map +1 -0
  39. package/dist/cli/commands/doctor.d.ts +3 -0
  40. package/dist/cli/commands/doctor.d.ts.map +1 -0
  41. package/dist/cli/commands/estimate.d.ts +3 -0
  42. package/dist/cli/commands/estimate.d.ts.map +1 -0
  43. package/dist/cli/commands/generate.d.ts +3 -0
  44. package/dist/cli/commands/generate.d.ts.map +1 -0
  45. package/dist/cli/commands/judge.d.ts +3 -0
  46. package/dist/cli/commands/judge.d.ts.map +1 -0
  47. package/dist/cli/commands/mcp.d.ts +3 -0
  48. package/dist/cli/commands/mcp.d.ts.map +1 -0
  49. package/dist/cli/commands/run.d.ts +3 -0
  50. package/dist/cli/commands/run.d.ts.map +1 -0
  51. package/dist/cli/commands/sync.d.ts +3 -0
  52. package/dist/cli/commands/sync.d.ts.map +1 -0
  53. package/dist/cli/index.d.ts +3 -0
  54. package/dist/cli/index.d.ts.map +1 -0
  55. package/dist/cli/index.js +11688 -19142
  56. package/dist/core/assertions-coverage.test.d.ts +2 -0
  57. package/dist/core/assertions-coverage.test.d.ts.map +1 -0
  58. package/dist/core/assertions.d.ts +18 -0
  59. package/dist/core/assertions.d.ts.map +1 -0
  60. package/dist/core/assertions.test.d.ts +2 -0
  61. package/dist/core/assertions.test.d.ts.map +1 -0
  62. package/dist/core/e2e.test.d.ts +2 -0
  63. package/dist/core/e2e.test.d.ts.map +1 -0
  64. package/dist/core/judge.d.ts +13 -0
  65. package/dist/core/judge.d.ts.map +1 -0
  66. package/dist/core/judge.test.d.ts +2 -0
  67. package/dist/core/judge.test.d.ts.map +1 -0
  68. package/dist/core/reporter.d.ts +21 -0
  69. package/dist/core/reporter.d.ts.map +1 -0
  70. package/dist/core/reporter.test.d.ts +2 -0
  71. package/dist/core/reporter.test.d.ts.map +1 -0
  72. package/dist/core/runner.d.ts +4 -0
  73. package/dist/core/runner.d.ts.map +1 -0
  74. package/dist/core/runner.test.d.ts +2 -0
  75. package/dist/core/runner.test.d.ts.map +1 -0
  76. package/dist/datasets/loader.d.ts +18 -0
  77. package/dist/datasets/loader.d.ts.map +1 -0
  78. package/dist/datasets/loader.test.d.ts +2 -0
  79. package/dist/datasets/loader.test.d.ts.map +1 -0
  80. package/dist/db/cloud-sync.d.ts +33 -0
  81. package/dist/db/cloud-sync.d.ts.map +1 -0
  82. package/dist/db/pg-migrations.d.ts +5 -0
  83. package/dist/db/pg-migrations.d.ts.map +1 -0
  84. package/dist/db/remote-storage.d.ts +10 -0
  85. package/dist/db/remote-storage.d.ts.map +1 -0
  86. package/dist/db/store.d.ts +17 -0
  87. package/dist/db/store.d.ts.map +1 -0
  88. package/dist/db/store.test.d.ts +2 -0
  89. package/dist/db/store.test.d.ts.map +1 -0
  90. package/dist/index.d.ts +11 -0
  91. package/dist/index.d.ts.map +1 -0
  92. package/dist/index.js +12309 -10076
  93. package/dist/mcp/index.d.ts +3 -0
  94. package/dist/mcp/index.d.ts.map +1 -0
  95. package/dist/mcp/index.js +21247 -18303
  96. package/dist/mcp/mcp.test.d.ts +2 -0
  97. package/dist/mcp/mcp.test.d.ts.map +1 -0
  98. package/dist/server/index.d.ts +3 -0
  99. package/dist/server/index.d.ts.map +1 -0
  100. package/dist/server/index.js +903 -3792
  101. package/dist/server/server.test.d.ts +2 -0
  102. package/dist/server/server.test.d.ts.map +1 -0
  103. package/dist/types/index.d.ts +171 -0
  104. package/dist/types/index.d.ts.map +1 -0
  105. package/package.json +3 -2
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=assertions-coverage.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"assertions-coverage.test.d.ts","sourceRoot":"","sources":["../../src/core/assertions-coverage.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,18 @@
1
+ import type { Assertion, AssertionResult } from "../types/index.js";
2
+ export declare function sortAssertionsCheapestFirst(assertions: Assertion[]): Assertion[];
3
+ export interface AssertionContext {
4
+ output: string;
5
+ durationMs?: number;
6
+ inputTokens?: number;
7
+ outputTokens?: number;
8
+ costUsd?: number;
9
+ toolCalls?: Array<{
10
+ name: string;
11
+ arguments?: Record<string, unknown>;
12
+ }>;
13
+ }
14
+ export declare function runAssertion(assertion: Assertion, ctx: AssertionContext): Promise<AssertionResult>;
15
+ export declare function runAssertions(assertions: Assertion[], ctx: AssertionContext): Promise<AssertionResult[]>;
16
+ export declare function assertionsPassed(results: AssertionResult[]): boolean;
17
+ export declare function allAssertionsPassed(results: AssertionResult[]): boolean;
18
+ //# sourceMappingURL=assertions.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"assertions.d.ts","sourceRoot":"","sources":["../../src/core/assertions.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,SAAS,EAAE,eAAe,EAAE,MAAM,mBAAmB,CAAC;AA6BpE,wBAAgB,2BAA2B,CAAC,UAAU,EAAE,SAAS,EAAE,GAAG,SAAS,EAAE,CAMhF;AAED,MAAM,WAAW,gBAAgB;IAC/B,MAAM,EAAE,MAAM,CAAC;IACf,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,SAAS,CAAC,EAAE,KAAK,CAAC;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,SAAS,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAA;KAAE,CAAC,CAAC;CAC1E;AAED,wBAAsB,YAAY,CAChC,SAAS,EAAE,SAAS,EACpB,GAAG,EAAE,gBAAgB,GACpB,OAAO,CAAC,eAAe,CAAC,CAqB1B;AAED,wBAAsB,aAAa,CACjC,UAAU,EAAE,SAAS,EAAE,EACvB,GAAG,EAAE,gBAAgB,GACpB,OAAO,CAAC,eAAe,EAAE,CAAC,CAyB5B;AAED,wBAAgB,gBAAgB,CAAC,OAAO,EAAE,eAAe,EAAE,GAAG,OAAO,CAKpE;AAED,wBAAgB,mBAAmB,CAAC,OAAO,EAAE,eAAe,EAAE,GAAG,OAAO,CAEvE"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=assertions.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"assertions.test.d.ts","sourceRoot":"","sources":["../../src/core/assertions.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,2 @@
1
+ export declare function echoInput(input: string): Promise<string>;
2
+ //# sourceMappingURL=e2e.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"e2e.test.d.ts","sourceRoot":"","sources":["../../src/core/e2e.test.ts"],"names":[],"mappings":"AAyBA,wBAAsB,SAAS,CAAC,KAAK,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC,CAE9D"}
@@ -0,0 +1,13 @@
1
+ import type { JudgeConfig, JudgeResult } from "../types/index.js";
2
+ export declare function runJudge(input: string, output: string, config: JudgeConfig, expected?: string): Promise<JudgeResult>;
3
+ /** One-shot judge: no full eval case, just input/output/rubric */
4
+ export declare function judgeOnce(params: {
5
+ input: string;
6
+ output: string;
7
+ rubric: string;
8
+ expected?: string;
9
+ model?: string;
10
+ provider?: "anthropic" | "openai";
11
+ apiKey?: string;
12
+ }): Promise<JudgeResult>;
13
+ //# sourceMappingURL=judge.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"judge.d.ts","sourceRoot":"","sources":["../../src/core/judge.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,WAAW,EAAE,WAAW,EAAW,MAAM,mBAAmB,CAAC;AAsD3E,wBAAsB,QAAQ,CAC5B,KAAK,EAAE,MAAM,EACb,MAAM,EAAE,MAAM,EACd,MAAM,EAAE,WAAW,EACnB,QAAQ,CAAC,EAAE,MAAM,GAChB,OAAO,CAAC,WAAW,CAAC,CAmBtB;AA4ED,kEAAkE;AAClE,wBAAsB,SAAS,CAAC,MAAM,EAAE;IACtC,KAAK,EAAE,MAAM,CAAC;IACd,MAAM,EAAE,MAAM,CAAC;IACf,MAAM,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,WAAW,GAAG,QAAQ,CAAC;IAClC,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB,GAAG,OAAO,CAAC,WAAW,CAAC,CAOvB"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=judge.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"judge.test.d.ts","sourceRoot":"","sources":["../../src/core/judge.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,21 @@
1
+ import type { EvalRun, Verdict } from "../types/index.js";
2
+ export declare function printTerminalReport(run: EvalRun): void;
3
+ export declare function toJson(run: EvalRun): string;
4
+ export declare function toMarkdown(run: EvalRun): string;
5
+ export interface RunDiff {
6
+ regressions: Array<{
7
+ caseId: string;
8
+ before: Verdict;
9
+ after: Verdict;
10
+ }>;
11
+ improvements: Array<{
12
+ caseId: string;
13
+ before: Verdict;
14
+ after: Verdict;
15
+ }>;
16
+ scoreDelta: number;
17
+ passRateDelta: number;
18
+ }
19
+ export declare function compareRuns(before: EvalRun, after: EvalRun): RunDiff;
20
+ export declare function printDiffReport(diff: RunDiff): void;
21
+ //# sourceMappingURL=reporter.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"reporter.d.ts","sourceRoot":"","sources":["../../src/core/reporter.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,OAAO,EAAE,OAAO,EAAE,MAAM,mBAAmB,CAAC;AAgB1D,wBAAgB,mBAAmB,CAAC,GAAG,EAAE,OAAO,GAAG,IAAI,CAoCtD;AAID,wBAAgB,MAAM,CAAC,GAAG,EAAE,OAAO,GAAG,MAAM,CAE3C;AAID,wBAAgB,UAAU,CAAC,GAAG,EAAE,OAAO,GAAG,MAAM,CAkD/C;AAID,MAAM,WAAW,OAAO;IACtB,WAAW,EAAE,KAAK,CAAC;QAAE,MAAM,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,OAAO,CAAC;QAAC,KAAK,EAAE,OAAO,CAAA;KAAE,CAAC,CAAC;IACxE,YAAY,EAAE,KAAK,CAAC;QAAE,MAAM,EAAE,MAAM,CAAC;QAAC,MAAM,EAAE,OAAO,CAAC;QAAC,KAAK,EAAE,OAAO,CAAA;KAAE,CAAC,CAAC;IACzE,UAAU,EAAE,MAAM,CAAC;IACnB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,wBAAgB,WAAW,CAAC,MAAM,EAAE,OAAO,EAAE,KAAK,EAAE,OAAO,GAAG,OAAO,CAuBpE;AAED,wBAAgB,eAAe,CAAC,IAAI,EAAE,OAAO,GAAG,IAAI,CAcnD"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=reporter.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"reporter.test.d.ts","sourceRoot":"","sources":["../../src/core/reporter.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,4 @@
1
+ import type { AdapterConfig, EvalCase, EvalResult, EvalRun, RunOptions } from "../types/index.js";
2
+ export declare function runEvals(cases: EvalCase[], options: RunOptions): Promise<EvalRun>;
3
+ export declare function runSingleCase(evalCase: EvalCase, adapterConfig: AdapterConfig, skipJudge?: boolean): Promise<EvalResult>;
4
+ //# sourceMappingURL=runner.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"runner.d.ts","sourceRoot":"","sources":["../../src/core/runner.ts"],"names":[],"mappings":"AASA,OAAO,KAAK,EACV,aAAa,EACb,QAAQ,EACR,UAAU,EACV,OAAO,EAEP,UAAU,EAGX,MAAM,mBAAmB,CAAC;AAqI3B,wBAAsB,QAAQ,CAC5B,KAAK,EAAE,QAAQ,EAAE,EACjB,OAAO,EAAE,UAAU,GAClB,OAAO,CAAC,OAAO,CAAC,CAqClB;AAID,wBAAsB,aAAa,CACjC,QAAQ,EAAE,QAAQ,EAClB,aAAa,EAAE,aAAa,EAC5B,SAAS,UAAQ,GAChB,OAAO,CAAC,UAAU,CAAC,CAKrB"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=runner.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"runner.test.d.ts","sourceRoot":"","sources":["../../src/core/runner.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,18 @@
1
+ import type { EvalCase } from "../types/index.js";
2
+ export interface LoadOptions {
3
+ /** Fail hard on malformed lines instead of warning and skipping */
4
+ strict?: boolean;
5
+ /** Filter by tags */
6
+ tags?: string[];
7
+ }
8
+ export interface LoadResult {
9
+ cases: EvalCase[];
10
+ warnings: string[];
11
+ totalLines: number;
12
+ skipped: number;
13
+ }
14
+ /** Load eval cases from a JSONL or JSON file (or glob pattern) */
15
+ export declare function loadDataset(pathOrGlob: string, opts?: LoadOptions): Promise<LoadResult>;
16
+ /** Stream large JSONL files case-by-case (for very large datasets) */
17
+ export declare function streamDataset(path: string, opts?: LoadOptions): AsyncGenerator<EvalCase>;
18
+ //# sourceMappingURL=loader.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"loader.d.ts","sourceRoot":"","sources":["../../src/datasets/loader.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,mBAAmB,CAAC;AAElD,MAAM,WAAW,WAAW;IAC1B,mEAAmE;IACnE,MAAM,CAAC,EAAE,OAAO,CAAC;IACjB,qBAAqB;IACrB,IAAI,CAAC,EAAE,MAAM,EAAE,CAAC;CACjB;AAED,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,QAAQ,EAAE,CAAC;IAClB,QAAQ,EAAE,MAAM,EAAE,CAAC;IACnB,UAAU,EAAE,MAAM,CAAC;IACnB,OAAO,EAAE,MAAM,CAAC;CACjB;AAED,kEAAkE;AAClE,wBAAsB,WAAW,CAAC,UAAU,EAAE,MAAM,EAAE,IAAI,GAAE,WAAgB,GAAG,OAAO,CAAC,UAAU,CAAC,CAiCjG;AAoFD,sEAAsE;AACtE,wBAAuB,aAAa,CAAC,IAAI,EAAE,MAAM,EAAE,IAAI,GAAE,WAAgB,GAAG,cAAc,CAAC,QAAQ,CAAC,CAyBnG"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=loader.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"loader.test.d.ts","sourceRoot":"","sources":["../../src/datasets/loader.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,33 @@
1
+ import { PgAdapterAsync } from "./remote-storage.js";
2
+ export declare const CLOUD_TABLES: readonly ["runs", "baselines"];
3
+ type CloudTable = (typeof CLOUD_TABLES)[number];
4
+ export interface SyncResult {
5
+ table: string;
6
+ rowsRead: number;
7
+ rowsWritten: number;
8
+ errors: string[];
9
+ }
10
+ export interface SyncMeta {
11
+ table_name: string;
12
+ last_synced_at: string | null;
13
+ direction: "push" | "pull";
14
+ }
15
+ export declare function getCloudDatabaseUrl(): string | null;
16
+ export declare function getCloudPg(): Promise<PgAdapterAsync>;
17
+ export declare function runCloudMigrations(remote: PgAdapterAsync): Promise<void>;
18
+ export declare function cloudPush(options?: {
19
+ tables?: string[];
20
+ }): Promise<SyncResult[]>;
21
+ export declare function cloudPull(options?: {
22
+ tables?: string[];
23
+ }): Promise<SyncResult[]>;
24
+ export declare function cloudSync(options?: {
25
+ tables?: string[];
26
+ }): Promise<{
27
+ pull: SyncResult[];
28
+ push: SyncResult[];
29
+ }>;
30
+ export declare function getSyncMetaAll(): SyncMeta[];
31
+ export declare function resolveTables(tables?: string[]): CloudTable[];
32
+ export {};
33
+ //# sourceMappingURL=cloud-sync.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"cloud-sync.d.ts","sourceRoot":"","sources":["../../src/db/cloud-sync.ts"],"names":[],"mappings":"AAGA,OAAO,EAAE,cAAc,EAAE,MAAM,qBAAqB,CAAC;AAErD,eAAO,MAAM,YAAY,gCAAiC,CAAC;AAE3D,KAAK,UAAU,GAAG,CAAC,OAAO,YAAY,CAAC,CAAC,MAAM,CAAC,CAAC;AAQhD,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,MAAM,CAAC;IACd,QAAQ,EAAE,MAAM,CAAC;IACjB,WAAW,EAAE,MAAM,CAAC;IACpB,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,MAAM,WAAW,QAAQ;IACvB,UAAU,EAAE,MAAM,CAAC;IACnB,cAAc,EAAE,MAAM,GAAG,IAAI,CAAC;IAC9B,SAAS,EAAE,MAAM,GAAG,MAAM,CAAC;CAC5B;AAED,wBAAgB,mBAAmB,IAAI,MAAM,GAAG,IAAI,CAKnD;AAED,wBAAsB,UAAU,IAAI,OAAO,CAAC,cAAc,CAAC,CAM1D;AAED,wBAAsB,kBAAkB,CAAC,MAAM,EAAE,cAAc,GAAG,OAAO,CAAC,IAAI,CAAC,CAE9E;AAED,wBAAsB,SAAS,CAAC,OAAO,CAAC,EAAE;IAAE,MAAM,CAAC,EAAE,MAAM,EAAE,CAAA;CAAE,GAAG,OAAO,CAAC,UAAU,EAAE,CAAC,CAYtF;AAED,wBAAsB,SAAS,CAAC,OAAO,CAAC,EAAE;IAAE,MAAM,CAAC,EAAE,MAAM,EAAE,CAAA;CAAE,GAAG,OAAO,CAAC,UAAU,EAAE,CAAC,CAYtF;AAED,wBAAsB,SAAS,CAAC,OAAO,CAAC,EAAE;IAAE,MAAM,CAAC,EAAE,MAAM,EAAE,CAAA;CAAE,GAAG,OAAO,CAAC;IAAE,IAAI,EAAE,UAAU,EAAE,CAAC;IAAC,IAAI,EAAE,UAAU,EAAE,CAAA;CAAE,CAAC,CAIpH;AAED,wBAAgB,cAAc,IAAI,QAAQ,EAAE,CAI3C;AAED,wBAAgB,aAAa,CAAC,MAAM,CAAC,EAAE,MAAM,EAAE,GAAG,UAAU,EAAE,CAO7D"}
@@ -0,0 +1,5 @@
1
+ /**
2
+ * PostgreSQL migrations for open-evals cloud sync.
3
+ */
4
+ export declare const PG_MIGRATIONS: string[];
5
+ //# sourceMappingURL=pg-migrations.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"pg-migrations.d.ts","sourceRoot":"","sources":["../../src/db/pg-migrations.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,eAAO,MAAM,aAAa,EAAE,MAAM,EAgBjC,CAAC"}
@@ -0,0 +1,10 @@
1
+ export declare class PgAdapterAsync {
2
+ private readonly pool;
3
+ constructor(connectionString: string);
4
+ run(sql: string, ...params: unknown[]): Promise<{
5
+ changes: number;
6
+ }>;
7
+ all(sql: string, ...params: unknown[]): Promise<unknown[]>;
8
+ close(): Promise<void>;
9
+ }
10
+ //# sourceMappingURL=remote-storage.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"remote-storage.d.ts","sourceRoot":"","sources":["../../src/db/remote-storage.ts"],"names":[],"mappings":"AAmBA,qBAAa,cAAc;IACzB,OAAO,CAAC,QAAQ,CAAC,IAAI,CAAO;gBAEhB,gBAAgB,EAAE,MAAM;IAI9B,GAAG,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM,EAAE,OAAO,EAAE,GAAG,OAAO,CAAC;QAAE,OAAO,EAAE,MAAM,CAAA;KAAE,CAAC;IAKpE,GAAG,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM,EAAE,OAAO,EAAE,GAAG,OAAO,CAAC,OAAO,EAAE,CAAC;IAK1D,KAAK,IAAI,OAAO,CAAC,IAAI,CAAC;CAG7B"}
@@ -0,0 +1,17 @@
1
+ import { Database } from "bun:sqlite";
2
+ import type { EvalRun } from "../types/index.js";
3
+ export declare function getDatabase(): Database;
4
+ export declare function closeDatabase(): void;
5
+ export declare function saveRun(run: EvalRun): void;
6
+ export declare function getRun(id: string): EvalRun | null;
7
+ export declare function listRuns(limit?: number, dataset?: string): EvalRun[];
8
+ export declare function deleteRun(id: string): void;
9
+ export declare function setBaseline(name: string, runId: string): void;
10
+ export declare function getBaseline(name: string): EvalRun | null;
11
+ export declare function listBaselines(): Array<{
12
+ name: string;
13
+ runId: string;
14
+ createdAt: string;
15
+ }>;
16
+ export declare function clearBaseline(name: string): void;
17
+ //# sourceMappingURL=store.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"store.d.ts","sourceRoot":"","sources":["../../src/db/store.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAItC,OAAO,KAAK,EAAE,OAAO,EAAE,MAAM,mBAAmB,CAAC;AAQjD,wBAAgB,WAAW,IAAI,QAAQ,CAUtC;AAED,wBAAgB,aAAa,IAAI,IAAI,CAGpC;AA6BD,wBAAgB,OAAO,CAAC,GAAG,EAAE,OAAO,GAAG,IAAI,CAa1C;AAED,wBAAgB,MAAM,CAAC,EAAE,EAAE,MAAM,GAAG,OAAO,GAAG,IAAI,CAIjD;AAED,wBAAgB,QAAQ,CAAC,KAAK,SAAK,EAAE,OAAO,CAAC,EAAE,MAAM,GAAG,OAAO,EAAE,CAMhE;AAED,wBAAgB,SAAS,CAAC,EAAE,EAAE,MAAM,GAAG,IAAI,CAE1C;AAID,wBAAgB,WAAW,CAAC,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,MAAM,GAAG,IAAI,CAI7D;AAED,wBAAgB,WAAW,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,GAAG,IAAI,CAKxD;AAED,wBAAgB,aAAa,IAAI,KAAK,CAAC;IAAE,IAAI,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAC;IAAC,SAAS,EAAE,MAAM,CAAA;CAAE,CAAC,CAKzF;AAED,wBAAgB,aAAa,CAAC,IAAI,EAAE,MAAM,GAAG,IAAI,CAEhD"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=store.test.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"store.test.d.ts","sourceRoot":"","sources":["../../src/db/store.test.ts"],"names":[],"mappings":""}
@@ -0,0 +1,11 @@
1
+ export * from "./types/index.js";
2
+ export * from "./core/runner.js";
3
+ export * from "./core/assertions.js";
4
+ export * from "./core/judge.js";
5
+ export * from "./core/reporter.js";
6
+ export * from "./datasets/loader.js";
7
+ export * from "./db/store.js";
8
+ export * from "./db/pg-migrations.js";
9
+ export * from "./db/remote-storage.js";
10
+ export * from "./db/cloud-sync.js";
11
+ //# sourceMappingURL=index.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AACA,cAAc,kBAAkB,CAAC;AACjC,cAAc,kBAAkB,CAAC;AACjC,cAAc,sBAAsB,CAAC;AACrC,cAAc,iBAAiB,CAAC;AAChC,cAAc,oBAAoB,CAAC;AACnC,cAAc,sBAAsB,CAAC;AACrC,cAAc,eAAe,CAAC;AAC9B,cAAc,uBAAuB,CAAC;AACtC,cAAc,wBAAwB,CAAC;AACvC,cAAc,oBAAoB,CAAC"}