@vfarcic/dot-ai 0.115.0 → 0.117.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +21 -18
- package/dist/core/ai-provider-factory.d.ts +4 -2
- package/dist/core/ai-provider-factory.d.ts.map +1 -1
- package/dist/core/ai-provider-factory.js +17 -6
- package/dist/core/capability-operations.js +1 -1
- package/dist/core/generic-session-manager.d.ts +67 -0
- package/dist/core/generic-session-manager.d.ts.map +1 -0
- package/dist/core/generic-session-manager.js +192 -0
- package/dist/core/pattern-operations.js +1 -1
- package/dist/core/providers/noop-provider.d.ts +47 -0
- package/dist/core/providers/noop-provider.d.ts.map +1 -0
- package/dist/core/providers/noop-provider.js +63 -0
- package/dist/core/schema.d.ts.map +1 -1
- package/dist/core/schema.js +13 -13
- package/dist/core/session-utils.d.ts +3 -6
- package/dist/core/session-utils.d.ts.map +1 -1
- package/dist/core/session-utils.js +5 -13
- package/dist/core/shared-prompt-loader.d.ts +15 -3
- package/dist/core/shared-prompt-loader.d.ts.map +1 -1
- package/dist/core/shared-prompt-loader.js +67 -14
- package/dist/core/unified-creation-session.d.ts +3 -10
- package/dist/core/unified-creation-session.d.ts.map +1 -1
- package/dist/core/unified-creation-session.js +34 -75
- package/dist/core/unified-creation-types.d.ts +31 -22
- package/dist/core/unified-creation-types.d.ts.map +1 -1
- package/dist/evaluation/eval-runner.js +12 -3
- package/dist/evaluation/evaluators/base-comparative.d.ts +2 -0
- package/dist/evaluation/evaluators/base-comparative.d.ts.map +1 -1
- package/dist/evaluation/evaluators/base-comparative.js +13 -1
- package/dist/evaluation/graph-generator.d.ts +56 -0
- package/dist/evaluation/graph-generator.d.ts.map +1 -0
- package/dist/evaluation/graph-generator.js +694 -0
- package/dist/evaluation/metadata-loader.d.ts +39 -0
- package/dist/evaluation/metadata-loader.d.ts.map +1 -0
- package/dist/evaluation/metadata-loader.js +74 -0
- package/dist/evaluation/platform-synthesizer.d.ts +5 -1
- package/dist/evaluation/platform-synthesizer.d.ts.map +1 -1
- package/dist/evaluation/platform-synthesizer.js +65 -23
- package/dist/evaluation/run-platform-synthesis.js +22 -5
- package/dist/interfaces/mcp.d.ts.map +1 -1
- package/dist/interfaces/mcp.js +9 -34
- package/dist/tools/answer-question.d.ts.map +1 -1
- package/dist/tools/answer-question.js +12 -12
- package/dist/tools/choose-solution.js +1 -1
- package/dist/tools/generate-manifests.d.ts.map +1 -1
- package/dist/tools/generate-manifests.js +9 -10
- package/dist/tools/index.d.ts +1 -1
- package/dist/tools/index.d.ts.map +1 -1
- package/dist/tools/index.js +6 -6
- package/dist/tools/organizational-data.js +12 -12
- package/dist/tools/project-setup/discovery.d.ts +15 -0
- package/dist/tools/project-setup/discovery.d.ts.map +1 -0
- package/dist/tools/project-setup/discovery.js +104 -0
- package/dist/tools/project-setup/generate-scope.d.ts +15 -0
- package/dist/tools/project-setup/generate-scope.d.ts.map +1 -0
- package/dist/tools/project-setup/generate-scope.js +237 -0
- package/dist/tools/project-setup/report-scan.d.ts +15 -0
- package/dist/tools/project-setup/report-scan.d.ts.map +1 -0
- package/dist/tools/project-setup/report-scan.js +156 -0
- package/dist/tools/project-setup/types.d.ts +111 -0
- package/dist/tools/project-setup/types.d.ts.map +1 -0
- package/dist/tools/project-setup/types.js +8 -0
- package/dist/tools/project-setup.d.ts +28 -0
- package/dist/tools/project-setup.d.ts.map +1 -0
- package/dist/tools/project-setup.js +134 -0
- package/dist/tools/recommend.js +1 -1
- package/dist/tools/remediate.js +1 -1
- package/dist/tools/version.d.ts +0 -7
- package/dist/tools/version.d.ts.map +1 -1
- package/dist/tools/version.js +5 -34
- package/package.json +4 -2
- package/prompts/capability-inference.md +2 -2
- package/prompts/infrastructure-trigger-expansion.md +2 -2
- package/prompts/intent-analysis.md +2 -2
- package/prompts/kyverno-generation.md +14 -14
- package/prompts/manifest-generation.md +5 -5
- package/prompts/map-intent-to-operation.md +2 -2
- package/prompts/pattern-complete-error.md +1 -1
- package/prompts/pattern-complete-success.md +4 -4
- package/prompts/pattern-rationale.md +1 -1
- package/prompts/pattern-resources.md +1 -1
- package/prompts/pattern-review.md +5 -5
- package/prompts/policy-complete-apply.md +4 -4
- package/prompts/policy-complete-discard.md +1 -1
- package/prompts/policy-complete-error.md +1 -1
- package/prompts/policy-complete-save.md +4 -4
- package/prompts/policy-complete-success.md +4 -4
- package/prompts/policy-namespace-scope.md +1 -1
- package/prompts/question-generation.md +5 -5
- package/prompts/resource-analysis.md +3 -3
- package/prompts/resource-selection.md +3 -3
- package/prompts/solution-enhancement.md +4 -4
- package/scripts/anthropic.nu +9 -13
- package/scripts/common.nu +31 -33
- package/scripts/ingress.nu +5 -4
- package/scripts/kubernetes.nu +38 -53
- package/dist/core/doc-discovery.d.ts +0 -38
- package/dist/core/doc-discovery.d.ts.map +0 -1
- package/dist/core/doc-discovery.js +0 -231
- package/dist/core/doc-testing-session.d.ts +0 -109
- package/dist/core/doc-testing-session.d.ts.map +0 -1
- package/dist/core/doc-testing-session.js +0 -696
- package/dist/core/doc-testing-types.d.ts +0 -127
- package/dist/core/doc-testing-types.d.ts.map +0 -1
- package/dist/core/doc-testing-types.js +0 -53
- package/dist/core/nushell-runtime.d.ts +0 -39
- package/dist/core/nushell-runtime.d.ts.map +0 -1
- package/dist/core/nushell-runtime.js +0 -103
- package/dist/core/platform-operations.d.ts +0 -70
- package/dist/core/platform-operations.d.ts.map +0 -1
- package/dist/core/platform-operations.js +0 -294
- package/dist/tools/build-platform.d.ts +0 -25
- package/dist/tools/build-platform.d.ts.map +0 -1
- package/dist/tools/build-platform.js +0 -277
- package/dist/tools/test-docs.d.ts +0 -22
- package/dist/tools/test-docs.d.ts.map +0 -1
- package/dist/tools/test-docs.js +0 -351
- package/prompts/doc-testing-done.md +0 -51
- package/prompts/doc-testing-fix.md +0 -120
- package/prompts/doc-testing-scan.md +0 -140
- package/prompts/doc-testing-test-section.md +0 -169
- package/prompts/platform-operations-parse-script-help.md +0 -68
- package/scripts/ack.nu +0 -195
- package/scripts/argo-workflows.nu +0 -47
- package/scripts/argocd.nu +0 -85
- package/scripts/aso.nu +0 -74
- package/scripts/backstage.nu +0 -349
- package/scripts/cert-manager.nu +0 -13
- package/scripts/cnpg.nu +0 -14
- package/scripts/dot.nu +0 -32
- package/scripts/external-secrets.nu +0 -110
- package/scripts/gatekeeper.nu +0 -19
- package/scripts/github.nu +0 -42
- package/scripts/image.nu +0 -67
- package/scripts/kro.nu +0 -11
- package/scripts/kubevela.nu +0 -22
- package/scripts/port.nu +0 -71
- package/scripts/prometheus.nu +0 -21
- package/scripts/registry.nu +0 -55
- package/scripts/storage.nu +0 -210
- package/scripts/tests.nu +0 -12
- package/scripts/velero.nu +0 -45
- package/shared-prompts/validate-docs.md +0 -22
|
@@ -13,10 +13,12 @@ const platform_utils_1 = require("../../core/platform-utils");
|
|
|
13
13
|
const fs_1 = require("fs");
|
|
14
14
|
const path_1 = require("path");
|
|
15
15
|
const dataset_analyzer_js_1 = require("../dataset-analyzer.js");
|
|
16
|
+
const metadata_loader_js_1 = require("../metadata-loader.js");
|
|
16
17
|
class BaseComparativeEvaluator {
|
|
17
18
|
evaluatorModel;
|
|
18
19
|
datasetAnalyzer;
|
|
19
20
|
promptTemplate;
|
|
21
|
+
metadata;
|
|
20
22
|
constructor(datasetDir) {
|
|
21
23
|
// Use Claude via VercelProvider as the evaluator (most reliable for complex comparative evaluation)
|
|
22
24
|
this.evaluatorModel = new vercel_provider_1.VercelProvider({
|
|
@@ -28,6 +30,8 @@ class BaseComparativeEvaluator {
|
|
|
28
30
|
this.datasetAnalyzer = new dataset_analyzer_js_1.DatasetAnalyzer(datasetDir || './eval/datasets');
|
|
29
31
|
// Prompt template will be loaded by subclass
|
|
30
32
|
this.promptTemplate = '';
|
|
33
|
+
// Load metadata
|
|
34
|
+
this.metadata = (0, metadata_loader_js_1.loadEvaluationMetadata)();
|
|
31
35
|
}
|
|
32
36
|
/**
|
|
33
37
|
* Initialize the evaluator - must be called by subclass constructor
|
|
@@ -122,6 +126,7 @@ class BaseComparativeEvaluator {
|
|
|
122
126
|
${reliabilityContext}
|
|
123
127
|
|
|
124
128
|
**Response:**
|
|
129
|
+
|
|
125
130
|
${modelResponse.response}
|
|
126
131
|
|
|
127
132
|
---`;
|
|
@@ -171,11 +176,18 @@ ${modelResponse.response}
|
|
|
171
176
|
* Build the evaluation prompt - can be overridden by subclasses for custom behavior
|
|
172
177
|
*/
|
|
173
178
|
buildEvaluationPrompt(scenario, modelResponsesText, modelList) {
|
|
179
|
+
// Build metadata context sections
|
|
180
|
+
const pricingContext = (0, metadata_loader_js_1.buildModelPricingContext)(this.metadata.models);
|
|
181
|
+
const toolContext = (0, metadata_loader_js_1.buildToolContext)(this.toolName, this.metadata.tools);
|
|
182
|
+
// Inject all data into prompt template via placeholders
|
|
174
183
|
return this.promptTemplate
|
|
184
|
+
.replace('{pricing_context}', pricingContext)
|
|
185
|
+
.replace('{tool_context}', toolContext)
|
|
175
186
|
.replace('{issue}', scenario.issue)
|
|
176
187
|
.replace('{model_responses}', modelResponsesText)
|
|
177
188
|
.replace('{model_list}', modelList)
|
|
178
|
-
.replace('{phase}', scenario.interaction_id)
|
|
189
|
+
.replace('{phase}', scenario.interaction_id)
|
|
190
|
+
.replace('{scenario_name}', scenario.interaction_id);
|
|
179
191
|
}
|
|
180
192
|
/**
|
|
181
193
|
* Get statistics about available datasets
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
import type { ModelPerformance } from './platform-synthesizer.js';
|
|
2
|
+
export interface GraphGenerationResult {
|
|
3
|
+
success: boolean;
|
|
4
|
+
graphPath?: string;
|
|
5
|
+
error?: string;
|
|
6
|
+
}
|
|
7
|
+
/**
|
|
8
|
+
* GraphGenerator creates data visualizations for platform synthesis reports.
|
|
9
|
+
* Uses QuickChart.io API to generate chart images without requiring native dependencies.
|
|
10
|
+
*/
|
|
11
|
+
export declare class GraphGenerator {
|
|
12
|
+
private outputDir;
|
|
13
|
+
private quickchartBaseUrl;
|
|
14
|
+
constructor(outputDir?: string);
|
|
15
|
+
/**
|
|
16
|
+
* Generates all or specific graphs for the platform report
|
|
17
|
+
* @param modelPerformances Model performance data
|
|
18
|
+
* @param graphNames Optional array of specific graph names to generate. If not provided, generates all graphs.
|
|
19
|
+
* Valid names: 'performance-tiers', 'cost-vs-quality', 'reliability-comparison',
|
|
20
|
+
* 'tool-performance-heatmap', 'context-window-correlation'
|
|
21
|
+
*/
|
|
22
|
+
generateAllGraphs(modelPerformances: ModelPerformance[], graphNames?: string[]): Promise<Record<string, GraphGenerationResult>>;
|
|
23
|
+
/**
|
|
24
|
+
* Graph 1: Performance Tiers - Grouped bar chart showing score, reliability, and consistency
|
|
25
|
+
*/
|
|
26
|
+
private generatePerformanceTiersGraph;
|
|
27
|
+
/**
|
|
28
|
+
* Graph 2: Cost vs Quality - Line chart showing input/output cost range per model
|
|
29
|
+
*/
|
|
30
|
+
private generateCostVsQualityGraph;
|
|
31
|
+
/**
|
|
32
|
+
* Graph 3: Reliability Comparison - Bar chart with reliability scores
|
|
33
|
+
*/
|
|
34
|
+
private generateReliabilityComparisonGraph;
|
|
35
|
+
/**
|
|
36
|
+
* Graph 4: Tool Performance Heatmap - Shows model scores per tool
|
|
37
|
+
*/
|
|
38
|
+
private generateToolPerformanceHeatmap;
|
|
39
|
+
/**
|
|
40
|
+
* Graph 5: Context Window Correlation - Scatter plot showing context window vs performance
|
|
41
|
+
*/
|
|
42
|
+
private generateContextWindowCorrelationGraph;
|
|
43
|
+
/**
|
|
44
|
+
* Downloads a chart from QuickChart.io API and saves it as PNG
|
|
45
|
+
*/
|
|
46
|
+
private downloadChart;
|
|
47
|
+
/**
|
|
48
|
+
* Cleans model names by removing provider prefixes
|
|
49
|
+
*/
|
|
50
|
+
private cleanModelName;
|
|
51
|
+
/**
|
|
52
|
+
* Returns a consistent color for each tool index (supports up to 10 tools)
|
|
53
|
+
*/
|
|
54
|
+
private getToolColor;
|
|
55
|
+
}
|
|
56
|
+
//# sourceMappingURL=graph-generator.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"graph-generator.d.ts","sourceRoot":"","sources":["../../src/evaluation/graph-generator.ts"],"names":[],"mappings":"AAGA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,2BAA2B,CAAC;AAElE,MAAM,WAAW,qBAAqB;IACpC,OAAO,EAAE,OAAO,CAAC;IACjB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,KAAK,CAAC,EAAE,MAAM,CAAC;CAChB;AAED;;;GAGG;AACH,qBAAa,cAAc;IACzB,OAAO,CAAC,SAAS,CAAS;IAC1B,OAAO,CAAC,iBAAiB,CAAiC;gBAE9C,SAAS,SAAoC;IAIzD;;;;;;OAMG;IACG,iBAAiB,CACrB,iBAAiB,EAAE,gBAAgB,EAAE,EACrC,UAAU,CAAC,EAAE,MAAM,EAAE,GACpB,OAAO,CAAC,MAAM,CAAC,MAAM,EAAE,qBAAqB,CAAC,CAAC;IAkCjD;;OAEG;YACW,6BAA6B;IAiH3C;;OAEG;YACW,0BAA0B;IAsHxC;;OAEG;YACW,kCAAkC;IA4GhD;;OAEG;YACW,8BAA8B;IAqG5C;;OAEG;YACW,qCAAqC;IAyHnD;;OAEG;YACW,aAAa;IA8B3B;;OAEG;IACH,OAAO,CAAC,cAAc;IAQtB;;OAEG;IACH,OAAO,CAAC,YAAY;CAerB"}
|