@xiuper/cli 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (218) hide show
  1. package/README.md +180 -0
  2. package/dist/jsMain/typescript/agents/LLMService.d.ts +40 -0
  3. package/dist/jsMain/typescript/agents/LLMService.d.ts.map +1 -0
  4. package/dist/jsMain/typescript/agents/LLMService.js +156 -0
  5. package/dist/jsMain/typescript/agents/LLMService.js.map +1 -0
  6. package/dist/jsMain/typescript/agents/ServerAgentClient.d.ts +103 -0
  7. package/dist/jsMain/typescript/agents/ServerAgentClient.d.ts.map +1 -0
  8. package/dist/jsMain/typescript/agents/ServerAgentClient.js +142 -0
  9. package/dist/jsMain/typescript/agents/ServerAgentClient.js.map +1 -0
  10. package/dist/jsMain/typescript/agents/render/BaseRenderer.d.ts +87 -0
  11. package/dist/jsMain/typescript/agents/render/BaseRenderer.d.ts.map +1 -0
  12. package/dist/jsMain/typescript/agents/render/BaseRenderer.js +128 -0
  13. package/dist/jsMain/typescript/agents/render/BaseRenderer.js.map +1 -0
  14. package/dist/jsMain/typescript/agents/render/CliRenderer.d.ts +51 -0
  15. package/dist/jsMain/typescript/agents/render/CliRenderer.d.ts.map +1 -0
  16. package/dist/jsMain/typescript/agents/render/CliRenderer.js +564 -0
  17. package/dist/jsMain/typescript/agents/render/CliRenderer.js.map +1 -0
  18. package/dist/jsMain/typescript/agents/render/ServerRenderer.d.ts +55 -0
  19. package/dist/jsMain/typescript/agents/render/ServerRenderer.d.ts.map +1 -0
  20. package/dist/jsMain/typescript/agents/render/ServerRenderer.js +503 -0
  21. package/dist/jsMain/typescript/agents/render/ServerRenderer.js.map +1 -0
  22. package/dist/jsMain/typescript/agents/render/TuiRenderer.d.ts +104 -0
  23. package/dist/jsMain/typescript/agents/render/TuiRenderer.d.ts.map +1 -0
  24. package/dist/jsMain/typescript/agents/render/TuiRenderer.js +279 -0
  25. package/dist/jsMain/typescript/agents/render/TuiRenderer.js.map +1 -0
  26. package/dist/jsMain/typescript/config/ConfigManager.d.ts +146 -0
  27. package/dist/jsMain/typescript/config/ConfigManager.d.ts.map +1 -0
  28. package/dist/jsMain/typescript/config/ConfigManager.js +257 -0
  29. package/dist/jsMain/typescript/config/ConfigManager.js.map +1 -0
  30. package/dist/jsMain/typescript/constants/asciiArt.d.ts +9 -0
  31. package/dist/jsMain/typescript/constants/asciiArt.d.ts.map +1 -0
  32. package/dist/jsMain/typescript/constants/asciiArt.js +47 -0
  33. package/dist/jsMain/typescript/constants/asciiArt.js.map +1 -0
  34. package/dist/jsMain/typescript/design-system/colors.d.ts +492 -0
  35. package/dist/jsMain/typescript/design-system/colors.d.ts.map +1 -0
  36. package/dist/jsMain/typescript/design-system/colors.js +333 -0
  37. package/dist/jsMain/typescript/design-system/colors.js.map +1 -0
  38. package/dist/jsMain/typescript/design-system/index.d.ts +31 -0
  39. package/dist/jsMain/typescript/design-system/index.d.ts.map +1 -0
  40. package/dist/jsMain/typescript/design-system/index.js +195 -0
  41. package/dist/jsMain/typescript/design-system/index.js.map +1 -0
  42. package/dist/jsMain/typescript/design-system/theme-helpers.d.ts +161 -0
  43. package/dist/jsMain/typescript/design-system/theme-helpers.d.ts.map +1 -0
  44. package/dist/jsMain/typescript/design-system/theme-helpers.js +153 -0
  45. package/dist/jsMain/typescript/design-system/theme-helpers.js.map +1 -0
  46. package/dist/jsMain/typescript/i18n/index.d.ts +37 -0
  47. package/dist/jsMain/typescript/i18n/index.d.ts.map +1 -0
  48. package/dist/jsMain/typescript/i18n/index.js +139 -0
  49. package/dist/jsMain/typescript/i18n/index.js.map +1 -0
  50. package/dist/jsMain/typescript/i18n/locales/en.d.ts +6 -0
  51. package/dist/jsMain/typescript/i18n/locales/en.d.ts.map +1 -0
  52. package/dist/jsMain/typescript/i18n/locales/en.js +120 -0
  53. package/dist/jsMain/typescript/i18n/locales/en.js.map +1 -0
  54. package/dist/jsMain/typescript/i18n/locales/zh.d.ts +6 -0
  55. package/dist/jsMain/typescript/i18n/locales/zh.d.ts.map +1 -0
  56. package/dist/jsMain/typescript/i18n/locales/zh.js +120 -0
  57. package/dist/jsMain/typescript/i18n/locales/zh.js.map +1 -0
  58. package/dist/jsMain/typescript/i18n/types.d.ts +124 -0
  59. package/dist/jsMain/typescript/i18n/types.d.ts.map +1 -0
  60. package/dist/jsMain/typescript/i18n/types.js +7 -0
  61. package/dist/jsMain/typescript/i18n/types.js.map +1 -0
  62. package/dist/jsMain/typescript/index.d.ts +9 -0
  63. package/dist/jsMain/typescript/index.d.ts.map +1 -0
  64. package/dist/jsMain/typescript/index.js +380 -0
  65. package/dist/jsMain/typescript/index.js.map +1 -0
  66. package/dist/jsMain/typescript/modes/AgentMode.d.ts +33 -0
  67. package/dist/jsMain/typescript/modes/AgentMode.d.ts.map +1 -0
  68. package/dist/jsMain/typescript/modes/AgentMode.js +243 -0
  69. package/dist/jsMain/typescript/modes/AgentMode.js.map +1 -0
  70. package/dist/jsMain/typescript/modes/ChatMode.d.ts +30 -0
  71. package/dist/jsMain/typescript/modes/ChatMode.d.ts.map +1 -0
  72. package/dist/jsMain/typescript/modes/ChatMode.js +260 -0
  73. package/dist/jsMain/typescript/modes/ChatMode.js.map +1 -0
  74. package/dist/jsMain/typescript/modes/DocumentMode.d.ts +26 -0
  75. package/dist/jsMain/typescript/modes/DocumentMode.d.ts.map +1 -0
  76. package/dist/jsMain/typescript/modes/DocumentMode.js +217 -0
  77. package/dist/jsMain/typescript/modes/DocumentMode.js.map +1 -0
  78. package/dist/jsMain/typescript/modes/Mode.d.ts +72 -0
  79. package/dist/jsMain/typescript/modes/Mode.d.ts.map +1 -0
  80. package/dist/jsMain/typescript/modes/Mode.js +7 -0
  81. package/dist/jsMain/typescript/modes/Mode.js.map +1 -0
  82. package/dist/jsMain/typescript/modes/ModeManager.d.ts +76 -0
  83. package/dist/jsMain/typescript/modes/ModeManager.d.ts.map +1 -0
  84. package/dist/jsMain/typescript/modes/ModeManager.js +156 -0
  85. package/dist/jsMain/typescript/modes/ModeManager.js.map +1 -0
  86. package/dist/jsMain/typescript/modes/ReviewMode.d.ts +52 -0
  87. package/dist/jsMain/typescript/modes/ReviewMode.d.ts.map +1 -0
  88. package/dist/jsMain/typescript/modes/ReviewMode.js +435 -0
  89. package/dist/jsMain/typescript/modes/ReviewMode.js.map +1 -0
  90. package/dist/jsMain/typescript/modes/index.d.ts +9 -0
  91. package/dist/jsMain/typescript/modes/index.d.ts.map +1 -0
  92. package/dist/jsMain/typescript/modes/index.js +7 -0
  93. package/dist/jsMain/typescript/modes/index.js.map +1 -0
  94. package/dist/jsMain/typescript/processors/AtCommandProcessor.d.ts +34 -0
  95. package/dist/jsMain/typescript/processors/AtCommandProcessor.d.ts.map +1 -0
  96. package/dist/jsMain/typescript/processors/AtCommandProcessor.js +118 -0
  97. package/dist/jsMain/typescript/processors/AtCommandProcessor.js.map +1 -0
  98. package/dist/jsMain/typescript/processors/InputRouter.d.ts +84 -0
  99. package/dist/jsMain/typescript/processors/InputRouter.d.ts.map +1 -0
  100. package/dist/jsMain/typescript/processors/InputRouter.js +78 -0
  101. package/dist/jsMain/typescript/processors/InputRouter.js.map +1 -0
  102. package/dist/jsMain/typescript/processors/ModeCommandProcessor.d.ts +25 -0
  103. package/dist/jsMain/typescript/processors/ModeCommandProcessor.d.ts.map +1 -0
  104. package/dist/jsMain/typescript/processors/ModeCommandProcessor.js +127 -0
  105. package/dist/jsMain/typescript/processors/ModeCommandProcessor.js.map +1 -0
  106. package/dist/jsMain/typescript/processors/SlashCommandProcessor.d.ts +68 -0
  107. package/dist/jsMain/typescript/processors/SlashCommandProcessor.d.ts.map +1 -0
  108. package/dist/jsMain/typescript/processors/SlashCommandProcessor.js +391 -0
  109. package/dist/jsMain/typescript/processors/SlashCommandProcessor.js.map +1 -0
  110. package/dist/jsMain/typescript/processors/VariableProcessor.d.ts +44 -0
  111. package/dist/jsMain/typescript/processors/VariableProcessor.d.ts.map +1 -0
  112. package/dist/jsMain/typescript/processors/VariableProcessor.js +105 -0
  113. package/dist/jsMain/typescript/processors/VariableProcessor.js.map +1 -0
  114. package/dist/jsMain/typescript/ui/App.d.ts +16 -0
  115. package/dist/jsMain/typescript/ui/App.d.ts.map +1 -0
  116. package/dist/jsMain/typescript/ui/App.js +208 -0
  117. package/dist/jsMain/typescript/ui/App.js.map +1 -0
  118. package/dist/jsMain/typescript/ui/Banner.d.ts +6 -0
  119. package/dist/jsMain/typescript/ui/Banner.d.ts.map +1 -0
  120. package/dist/jsMain/typescript/ui/Banner.js +13 -0
  121. package/dist/jsMain/typescript/ui/Banner.js.map +1 -0
  122. package/dist/jsMain/typescript/ui/ChatInterface.d.ts +19 -0
  123. package/dist/jsMain/typescript/ui/ChatInterface.d.ts.map +1 -0
  124. package/dist/jsMain/typescript/ui/ChatInterface.js +223 -0
  125. package/dist/jsMain/typescript/ui/ChatInterface.js.map +1 -0
  126. package/dist/jsMain/typescript/ui/CommandSuggestions.d.ts +21 -0
  127. package/dist/jsMain/typescript/ui/CommandSuggestions.d.ts.map +1 -0
  128. package/dist/jsMain/typescript/ui/CommandSuggestions.js +43 -0
  129. package/dist/jsMain/typescript/ui/CommandSuggestions.js.map +1 -0
  130. package/dist/jsMain/typescript/ui/LanguageSwitcher.d.ts +11 -0
  131. package/dist/jsMain/typescript/ui/LanguageSwitcher.d.ts.map +1 -0
  132. package/dist/jsMain/typescript/ui/LanguageSwitcher.js +37 -0
  133. package/dist/jsMain/typescript/ui/LanguageSwitcher.js.map +1 -0
  134. package/dist/jsMain/typescript/ui/MessageRenderer.d.ts +70 -0
  135. package/dist/jsMain/typescript/ui/MessageRenderer.d.ts.map +1 -0
  136. package/dist/jsMain/typescript/ui/MessageRenderer.js +255 -0
  137. package/dist/jsMain/typescript/ui/MessageRenderer.js.map +1 -0
  138. package/dist/jsMain/typescript/ui/ModelConfigForm.d.ts +19 -0
  139. package/dist/jsMain/typescript/ui/ModelConfigForm.d.ts.map +1 -0
  140. package/dist/jsMain/typescript/ui/ModelConfigForm.js +257 -0
  141. package/dist/jsMain/typescript/ui/ModelConfigForm.js.map +1 -0
  142. package/dist/jsMain/typescript/ui/WelcomeScreen.d.ts +12 -0
  143. package/dist/jsMain/typescript/ui/WelcomeScreen.d.ts.map +1 -0
  144. package/dist/jsMain/typescript/ui/WelcomeScreen.js +93 -0
  145. package/dist/jsMain/typescript/ui/WelcomeScreen.js.map +1 -0
  146. package/dist/jsMain/typescript/utils/commandUtils.d.ts +64 -0
  147. package/dist/jsMain/typescript/utils/commandUtils.d.ts.map +1 -0
  148. package/dist/jsMain/typescript/utils/commandUtils.js +195 -0
  149. package/dist/jsMain/typescript/utils/commandUtils.js.map +1 -0
  150. package/dist/jsMain/typescript/utils/domainDictUtils.d.ts +53 -0
  151. package/dist/jsMain/typescript/utils/domainDictUtils.d.ts.map +1 -0
  152. package/dist/jsMain/typescript/utils/domainDictUtils.js +130 -0
  153. package/dist/jsMain/typescript/utils/domainDictUtils.js.map +1 -0
  154. package/dist/jsMain/typescript/utils/markdownSplitter.d.ts +23 -0
  155. package/dist/jsMain/typescript/utils/markdownSplitter.d.ts.map +1 -0
  156. package/dist/jsMain/typescript/utils/markdownSplitter.js +90 -0
  157. package/dist/jsMain/typescript/utils/markdownSplitter.js.map +1 -0
  158. package/dist/jsMain/typescript/utils/outputFormatter.d.ts +70 -0
  159. package/dist/jsMain/typescript/utils/outputFormatter.d.ts.map +1 -0
  160. package/dist/jsMain/typescript/utils/outputFormatter.js +140 -0
  161. package/dist/jsMain/typescript/utils/outputFormatter.js.map +1 -0
  162. package/dist/jsMain/typescript/utils/renderUtils.d.ts +17 -0
  163. package/dist/jsMain/typescript/utils/renderUtils.d.ts.map +1 -0
  164. package/dist/jsMain/typescript/utils/renderUtils.js +128 -0
  165. package/dist/jsMain/typescript/utils/renderUtils.js.map +1 -0
  166. package/dist/test/framework/analyzers/CodeChangeAnalyzer.d.ts +87 -0
  167. package/dist/test/framework/analyzers/CodeChangeAnalyzer.d.ts.map +1 -0
  168. package/dist/test/framework/analyzers/CodeChangeAnalyzer.js +412 -0
  169. package/dist/test/framework/analyzers/CodeChangeAnalyzer.js.map +1 -0
  170. package/dist/test/framework/analyzers/PromptAnalyzer.d.ts +46 -0
  171. package/dist/test/framework/analyzers/PromptAnalyzer.d.ts.map +1 -0
  172. package/dist/test/framework/analyzers/PromptAnalyzer.js +185 -0
  173. package/dist/test/framework/analyzers/PromptAnalyzer.js.map +1 -0
  174. package/dist/test/framework/analyzers/ToolCallAnalyzer.d.ts +45 -0
  175. package/dist/test/framework/analyzers/ToolCallAnalyzer.d.ts.map +1 -0
  176. package/dist/test/framework/analyzers/ToolCallAnalyzer.js +215 -0
  177. package/dist/test/framework/analyzers/ToolCallAnalyzer.js.map +1 -0
  178. package/dist/test/framework/cli.d.ts +8 -0
  179. package/dist/test/framework/cli.d.ts.map +1 -0
  180. package/dist/test/framework/cli.js +175 -0
  181. package/dist/test/framework/cli.js.map +1 -0
  182. package/dist/test/framework/core/TestCase.d.ts +100 -0
  183. package/dist/test/framework/core/TestCase.d.ts.map +1 -0
  184. package/dist/test/framework/core/TestCase.js +101 -0
  185. package/dist/test/framework/core/TestCase.js.map +1 -0
  186. package/dist/test/framework/core/TestEngine.d.ts +89 -0
  187. package/dist/test/framework/core/TestEngine.d.ts.map +1 -0
  188. package/dist/test/framework/core/TestEngine.js +552 -0
  189. package/dist/test/framework/core/TestEngine.js.map +1 -0
  190. package/dist/test/framework/core/TestResult.d.ts +143 -0
  191. package/dist/test/framework/core/TestResult.d.ts.map +1 -0
  192. package/dist/test/framework/core/TestResult.js +76 -0
  193. package/dist/test/framework/core/TestResult.js.map +1 -0
  194. package/dist/test/framework/examples/BasicRobustnessTest.d.ts +19 -0
  195. package/dist/test/framework/examples/BasicRobustnessTest.d.ts.map +1 -0
  196. package/dist/test/framework/examples/BasicRobustnessTest.js +116 -0
  197. package/dist/test/framework/examples/BasicRobustnessTest.js.map +1 -0
  198. package/dist/test/framework/index.d.ts +30 -0
  199. package/dist/test/framework/index.d.ts.map +1 -0
  200. package/dist/test/framework/index.js +38 -0
  201. package/dist/test/framework/index.js.map +1 -0
  202. package/dist/test/framework/loaders/JsonScenarioLoader.d.ts +99 -0
  203. package/dist/test/framework/loaders/JsonScenarioLoader.d.ts.map +1 -0
  204. package/dist/test/framework/loaders/JsonScenarioLoader.js +197 -0
  205. package/dist/test/framework/loaders/JsonScenarioLoader.js.map +1 -0
  206. package/dist/test/framework/reporters/ConsoleReporter.d.ts +25 -0
  207. package/dist/test/framework/reporters/ConsoleReporter.d.ts.map +1 -0
  208. package/dist/test/framework/reporters/ConsoleReporter.js +196 -0
  209. package/dist/test/framework/reporters/ConsoleReporter.js.map +1 -0
  210. package/dist/test/framework/scenarios/ScenarioBuilder.d.ts +62 -0
  211. package/dist/test/framework/scenarios/ScenarioBuilder.d.ts.map +1 -0
  212. package/dist/test/framework/scenarios/ScenarioBuilder.js +285 -0
  213. package/dist/test/framework/scenarios/ScenarioBuilder.js.map +1 -0
  214. package/dist/test/framework/validate-framework.d.ts +9 -0
  215. package/dist/test/framework/validate-framework.d.ts.map +1 -0
  216. package/dist/test/framework/validate-framework.js +187 -0
  217. package/dist/test/framework/validate-framework.js.map +1 -0
  218. package/package.json +84 -0
@@ -0,0 +1,143 @@
1
+ /**
2
+ * AI Agent 测试结果数据结构
3
+ *
4
+ * 定义了测试执行结果的完整数据结构,包括执行信息、分析结果、质量指标等
5
+ */
6
+ import { TestCase } from './TestCase';
7
/**
 * Final status recorded for a test.
 *
 * A string enum: every member's runtime value is the lowercase form of its name.
 */
export declare enum TestStatus {
    PASSED = "passed",
    FAILED = "failed",
    TIMEOUT = "timeout",
    ERROR = "error",
    SKIPPED = "skipped"
}
14
/**
 * Process-level facts captured for one execution: timestamps, exit code,
 * captured output streams, iteration count and a timeout flag.
 */
export interface ExecutionInfo {
    /** Start timestamp. */
    startTime: Date;
    /** End timestamp. */
    endTime: Date;
    /** Elapsed time as a number (unit is not stated here; presumably milliseconds, TODO confirm). */
    duration: number;
    /** Exit code reported for the run. */
    exitCode: number;
    /** Captured standard output. */
    stdout: string;
    /** Captured standard error. */
    stderr: string;
    /** Iteration count recorded for the run. */
    iterations: number;
    /** Whether a timeout occurred. */
    timeoutOccurred: boolean;
}
24
/**
 * Record of a single tool invocation. Only `tool`, `timestamp` and `success`
 * are mandatory; the remaining fields may be absent.
 */
export interface ToolCallInfo {
    /** Tool identifier. */
    tool: string;
    /** Timestamp associated with the call. */
    timestamp: Date;
    /** Arguments passed to the tool, keyed by name; values are untyped. */
    parameters?: Record<string, any>;
    /** Whether the call succeeded. */
    success: boolean;
    /** Textual output of the call, when available. */
    output?: string;
    /** Error text, when available. */
    error?: string;
    /** Elapsed time of the call (unit not stated here; TODO confirm). */
    duration?: number;
}
33
/**
 * Description of one file-system change: what kind of change it was, which
 * path it touched, and optional size / content details.
 */
export interface FileChangeInfo {
    /** Kind of change. */
    type: 'created' | 'modified' | 'deleted';
    /** Path of the affected file. */
    path: string;
    /** Size before the change, when known (unit not stated here; presumably bytes, TODO confirm). */
    sizeBefore?: number;
    /** Size after the change, when known. */
    sizeAfter?: number;
    /** Optional preview of the file content. */
    contentPreview?: string;
    /** Timestamp associated with the change. */
    timestamp: Date;
}
41
/**
 * Outcome of analysing how the agent behaved relative to its prompt:
 * four boolean checks, a numeric effectiveness score and a list of issues.
 */
export interface PromptAnalysisResult {
    followedSystemPrompt: boolean;
    exploredProjectFirst: boolean;
    usedAppropriateTools: boolean;
    handledErrorsGracefully: boolean;
    /** Numeric score; TestResultBuilder.build() averages it into the overall score. */
    promptEffectivenessScore: number;
    /** Human-readable issue descriptions. */
    issues: Array<string>;
}
49
/**
 * Outcome of analysing the tool calls made during a test: counts, three
 * numeric correctness measures, tool-name lists and the per-call records.
 */
export interface ToolCallAnalysisResult {
    /** Number of tool calls. */
    totalCalls: number;
    /** Names of the distinct tools. */
    uniqueTools: Array<string>;
    /** Numeric score; TestResultBuilder.build() averages it into the overall score. */
    toolAccuracy: number;
    sequenceCorrectness: number;
    parameterCorrectness: number;
    /** Tool names flagged as unexpected. */
    unexpectedTools: Array<string>;
    /** Tool names flagged as missing. */
    missingTools: Array<string>;
    /** One record per tool call. */
    toolCallDetails: Array<ToolCallInfo>;
}
59
/**
 * Outcome of the code-quality analysis: issue counts per category, a total,
 * a numeric quality score and the individual issues.
 */
export interface CodeQualityResult {
    syntaxErrors: number;
    structuralIssues: number;
    bestPracticeViolations: number;
    totalIssues: number;
    /** Numeric score; TestResultBuilder.build() averages it into the overall score. */
    qualityScore: number;
    /** Individual findings; `file` and `line` are optional location hints. */
    issues: Array<{
        type: 'syntax' | 'structure' | 'best-practice';
        severity: 'error' | 'warning' | 'info';
        message: string;
        file?: string;
        line?: number;
    }>;
}
73
/**
 * Outcome of the task-completion analysis: a completed flag, a numeric
 * completion score, lists of implemented / missing functionality, and
 * backward-compatibility information.
 */
export interface TaskCompletionResult {
    completed: boolean;
    /** Numeric score; TestResultBuilder.build() averages it into the overall score. */
    completionScore: number;
    functionalityImplemented: Array<string>;
    functionalityMissing: Array<string>;
    backwardCompatibility: boolean;
    regressionIssues: Array<string>;
}
81
/**
 * Complete result of one test: the test case, its status, execution facts,
 * the four analysis results, recorded file changes, an overall score,
 * error / warning messages, optional custom validation results and metadata.
 */
export interface TestResult {
    testCase: TestCase;
    status: TestStatus;
    executionInfo: ExecutionInfo;

    promptAnalysis: PromptAnalysisResult;
    toolCallAnalysis: ToolCallAnalysisResult;
    codeQuality: CodeQualityResult;
    taskCompletion: TaskCompletionResult;

    fileChanges: Array<FileChangeInfo>;

    /** Combined score; TestResultBuilder.build() sets it to the mean of the four analysis scores. */
    overallScore: number;

    errors: Array<string>;
    warnings: Array<string>;

    /** Results of additional named validations, when any were recorded. */
    customValidationResults?: Array<{
        name: string;
        passed: boolean;
        message?: string;
    }>;

    /** Information about the framework, agent and environment for this result. */
    metadata: {
        frameworkVersion: string;
        agentVersion?: string;
        environment: Record<string, string>;
        testProjectPath?: string;
    };
}
105
/**
 * Aggregated result of a test suite: identity and timing, per-status test
 * counts, the individual test results and a statistical summary.
 */
export interface TestSuiteResult {
    suiteId: string;
    suiteName: string;
    startTime: Date;
    endTime: Date;
    /** Elapsed time of the suite (unit not stated here; TODO confirm). */
    duration: number;

    totalTests: number;
    passedTests: number;
    failedTests: number;
    skippedTests: number;
    errorTests: number;

    testResults: Array<TestResult>;

    summary: {
        averageScore: number;
        averageExecutionTime: number;
        mostCommonIssues: Array<string>;
        /** Numeric statistic per string key (presumably tool name -> call count; TODO confirm). */
        toolUsageStats: Record<string, number>;
        /** Passed / total counts per string key (presumably test category; TODO confirm). */
        categoryStats: Record<string, {
            passed: number;
            total: number;
        }>;
    };
}
128
/**
 * Fluent builder for {@link TestResult}.
 *
 * `create` starts a builder for a test case, the `with*` / `add*` methods
 * each return a `TestResultBuilder` so calls can be chained, and `build`
 * produces the result.
 */
export declare class TestResultBuilder {
    /** Result under construction (private to the builder). */
    private result;

    /** Creates a builder for the given test case. */
    static create(testCase: TestCase): TestResultBuilder;

    /** Sets the test case. */
    withTestCase(testCase: TestCase): TestResultBuilder;
    /** Sets the status. */
    withStatus(status: TestStatus): TestResultBuilder;
    /** Sets the execution information. */
    withExecutionInfo(executionInfo: ExecutionInfo): TestResultBuilder;
    /** Sets the prompt analysis. */
    withPromptAnalysis(analysis: PromptAnalysisResult): TestResultBuilder;
    /** Sets the tool-call analysis. */
    withToolCallAnalysis(analysis: ToolCallAnalysisResult): TestResultBuilder;
    /** Sets the code-quality result. */
    withCodeQuality(quality: CodeQualityResult): TestResultBuilder;
    /** Sets the task-completion result. */
    withTaskCompletion(completion: TaskCompletionResult): TestResultBuilder;

    /** Records one file change. */
    addFileChange(change: FileChangeInfo): TestResultBuilder;
    /** Records one error message. */
    addError(error: string): TestResultBuilder;
    /** Records one warning message. */
    addWarning(warning: string): TestResultBuilder;

    /** Produces the test result. */
    build(): TestResult;
}
143
+ //# sourceMappingURL=TestResult.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"TestResult.d.ts","sourceRoot":"","sources":["../../../../src/test/framework/core/TestResult.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAEtC,oBAAY,UAAU;IACpB,MAAM,WAAW;IACjB,MAAM,WAAW;IACjB,OAAO,YAAY;IACnB,KAAK,UAAU;IACf,OAAO,YAAY;CACpB;AAED,MAAM,WAAW,aAAa;IAC5B,SAAS,EAAE,IAAI,CAAC;IAChB,OAAO,EAAE,IAAI,CAAC;IACd,QAAQ,EAAE,MAAM,CAAC;IACjB,QAAQ,EAAE,MAAM,CAAC;IACjB,MAAM,EAAE,MAAM,CAAC;IACf,MAAM,EAAE,MAAM,CAAC;IACf,UAAU,EAAE,MAAM,CAAC;IACnB,eAAe,EAAE,OAAO,CAAC;CAC1B;AAED,MAAM,WAAW,YAAY;IAC3B,IAAI,EAAE,MAAM,CAAC;IACb,SAAS,EAAE,IAAI,CAAC;IAChB,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IACjC,OAAO,EAAE,OAAO,CAAC;IACjB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,MAAM,CAAC;CACnB;AAED,MAAM,WAAW,cAAc;IAC7B,IAAI,EAAE,SAAS,GAAG,UAAU,GAAG,SAAS,CAAC;IACzC,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,cAAc,CAAC,EAAE,MAAM,CAAC;IACxB,SAAS,EAAE,IAAI,CAAC;CACjB;AAED,MAAM,WAAW,oBAAoB;IACnC,oBAAoB,EAAE,OAAO,CAAC;IAC9B,oBAAoB,EAAE,OAAO,CAAC;IAC9B,oBAAoB,EAAE,OAAO,CAAC;IAC9B,uBAAuB,EAAE,OAAO,CAAC;IACjC,wBAAwB,EAAE,MAAM,CAAC;IACjC,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,MAAM,WAAW,sBAAsB;IACrC,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,EAAE,MAAM,EAAE,CAAC;IACtB,YAAY,EAAE,MAAM,CAAC;IACrB,mBAAmB,EAAE,MAAM,CAAC;IAC5B,oBAAoB,EAAE,MAAM,CAAC;IAC7B,eAAe,EAAE,MAAM,EAAE,CAAC;IAC1B,YAAY,EAAE,MAAM,EAAE,CAAC;IACvB,eAAe,EAAE,YAAY,EAAE,CAAC;CACjC;AAED,MAAM,WAAW,iBAAiB;IAChC,YAAY,EAAE,MAAM,CAAC;IACrB,gBAAgB,EAAE,MAAM,CAAC;IACzB,sBAAsB,EAAE,MAAM,CAAC;IAC/B,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;IACrB,MAAM,EAAE;QACN,IAAI,EAAE,QAAQ,GAAG,WAAW,GAAG,eAAe,CAAC;QAC/C,QAAQ,EAAE,OAAO,GAAG,SAAS,GAAG,MAAM,CAAC;QACvC,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,IAAI,CAAC,EAAE,MAAM,CAAC;KACf,EAAE,CAAC;CACL;AAED,MAAM,WAAW,oBAAoB;IACnC,SAAS,EAAE,OAAO,CAAC;IACnB,eAAe,EAAE,MAAM,CAAC;IACxB,wBAAwB,EAAE,MAAM,EAAE,CAAC;IACnC,oBAAoB,EAAE,MAAM,EAAE,CAAC;IAC/B,qBAAqB,EAAE,OAAO,CAAC;IAC/B,g
BAAgB,EAAE,MAAM,EAAE,CAAC;CAC5B;AAED,MAAM,WAAW,UAAU;IAEzB,QAAQ,EAAE,QAAQ,CAAC;IACnB,MAAM,EAAE,UAAU,CAAC;IACnB,aAAa,EAAE,aAAa,CAAC;IAG7B,cAAc,EAAE,oBAAoB,CAAC;IACrC,gBAAgB,EAAE,sBAAsB,CAAC;IACzC,WAAW,EAAE,iBAAiB,CAAC;IAC/B,cAAc,EAAE,oBAAoB,CAAC;IAGrC,WAAW,EAAE,cAAc,EAAE,CAAC;IAG9B,YAAY,EAAE,MAAM,CAAC;IAGrB,MAAM,EAAE,MAAM,EAAE,CAAC;IACjB,QAAQ,EAAE,MAAM,EAAE,CAAC;IAGnB,uBAAuB,CAAC,EAAE;QACxB,IAAI,EAAE,MAAM,CAAC;QACb,MAAM,EAAE,OAAO,CAAC;QAChB,OAAO,CAAC,EAAE,MAAM,CAAC;KAClB,EAAE,CAAC;IAGJ,QAAQ,EAAE;QACR,gBAAgB,EAAE,MAAM,CAAC;QACzB,YAAY,CAAC,EAAE,MAAM,CAAC;QACtB,WAAW,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;QACpC,eAAe,CAAC,EAAE,MAAM,CAAC;KAC1B,CAAC;CACH;AAED,MAAM,WAAW,eAAe;IAC9B,OAAO,EAAE,MAAM,CAAC;IAChB,SAAS,EAAE,MAAM,CAAC;IAClB,SAAS,EAAE,IAAI,CAAC;IAChB,OAAO,EAAE,IAAI,CAAC;IACd,QAAQ,EAAE,MAAM,CAAC;IAGjB,UAAU,EAAE,MAAM,CAAC;IACnB,WAAW,EAAE,MAAM,CAAC;IACpB,WAAW,EAAE,MAAM,CAAC;IACpB,YAAY,EAAE,MAAM,CAAC;IACrB,UAAU,EAAE,MAAM,CAAC;IAGnB,WAAW,EAAE,UAAU,EAAE,CAAC;IAG1B,OAAO,EAAE;QACP,YAAY,EAAE,MAAM,CAAC;QACrB,oBAAoB,EAAE,MAAM,CAAC;QAC7B,gBAAgB,EAAE,MAAM,EAAE,CAAC;QAC3B,cAAc,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;QACvC,aAAa,EAAE,MAAM,CAAC,MAAM,EAAE;YAAE,MAAM,EAAE,MAAM,CAAC;YAAC,KAAK,EAAE,MAAM,CAAA;SAAE,CAAC,CAAC;KAClE,CAAC;CACH;AAGD,qBAAa,iBAAiB;IAC5B,OAAO,CAAC,MAAM,CAIZ;IAEF,MAAM,CAAC,MAAM,CAAC,QAAQ,EAAE,QAAQ,GAAG,iBAAiB;IAIpD,YAAY,CAAC,QAAQ,EAAE,QAAQ,GAAG,iBAAiB;IAKnD,UAAU,CAAC,MAAM,EAAE,UAAU,GAAG,iBAAiB;IAKjD,iBAAiB,CAAC,aAAa,EAAE,aAAa,GAAG,iBAAiB;IAKlE,kBAAkB,CAAC,QAAQ,EAAE,oBAAoB,GAAG,iBAAiB;IAKrE,oBAAoB,CAAC,QAAQ,EAAE,sBAAsB,GAAG,iBAAiB;IAKzE,eAAe,CAAC,OAAO,EAAE,iBAAiB,GAAG,iBAAiB;IAK9D,kBAAkB,CAAC,UAAU,EAAE,oBAAoB,GAAG,iBAAiB;IAKvE,aAAa,CAAC,MAAM,EAAE,cAAc,GAAG,iBAAiB;IAKxD,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,iBAAiB;IAK1C,UAAU,CAAC,OAAO,EAAE,MAAM,GAAG,iBAAiB;IAK9C,KAAK,IAAI,UAAU;CAapB"}
@@ -0,0 +1,76 @@
1
+ /**
2
+ * AI Agent 测试结果数据结构
3
+ *
4
+ * 定义了测试执行结果的完整数据结构,包括执行信息、分析结果、质量指标等
5
+ */
6
/**
 * Runtime form of the TestStatus string enum: a plain object mapping each
 * member name to its lowercase string value (string enums have no reverse
 * mapping). `var` is kept so the exported binding has the same declaration
 * kind as the compiler-emitted one.
 */
export var TestStatus = {
    PASSED: "passed",
    FAILED: "failed",
    TIMEOUT: "timeout",
    ERROR: "error",
    SKIPPED: "skipped"
};
14
/**
 * Result builder: assembles a test result step by step.
 *
 * Every `with*` / `add*` method stores its argument on the result under
 * construction and returns the builder itself so calls can be chained.
 * `build()` computes the overall score and returns a snapshot of the result.
 */
export class TestResultBuilder {
    // Result under construction. Only the list fields start populated; all
    // other fields stay undefined until the matching `with*` method is called.
    result = {
        errors: [],
        warnings: [],
        fileChanges: []
    };

    /**
     * Creates a builder that already carries the given test case.
     * @param testCase - test case the result belongs to
     * @returns a new builder
     */
    static create(testCase) {
        return new TestResultBuilder().withTestCase(testCase);
    }

    /** Sets the test case. @returns this builder */
    withTestCase(testCase) {
        this.result.testCase = testCase;
        return this;
    }

    /** Sets the status. @returns this builder */
    withStatus(status) {
        this.result.status = status;
        return this;
    }

    /** Sets the execution information. @returns this builder */
    withExecutionInfo(executionInfo) {
        this.result.executionInfo = executionInfo;
        return this;
    }

    /** Sets the prompt analysis. @returns this builder */
    withPromptAnalysis(analysis) {
        this.result.promptAnalysis = analysis;
        return this;
    }

    /** Sets the tool-call analysis. @returns this builder */
    withToolCallAnalysis(analysis) {
        this.result.toolCallAnalysis = analysis;
        return this;
    }

    /** Sets the code-quality result. @returns this builder */
    withCodeQuality(quality) {
        this.result.codeQuality = quality;
        return this;
    }

    /** Sets the task-completion result. @returns this builder */
    withTaskCompletion(completion) {
        this.result.taskCompletion = completion;
        return this;
    }

    /** Appends one file change. @returns this builder */
    addFileChange(change) {
        this.result.fileChanges.push(change);
        return this;
    }

    /** Appends one error message. @returns this builder */
    addError(error) {
        this.result.errors.push(error);
        return this;
    }

    /** Appends one warning message. @returns this builder */
    addWarning(warning) {
        this.result.warnings.push(warning);
        return this;
    }

    /**
     * Computes the overall score and returns the result.
     *
     * The overall score is the arithmetic mean of the four analysis scores.
     * An analysis that was never set (or whose score is falsy, e.g. NaN)
     * contributes 0, so the divisor is always 4.
     *
     * The returned object is a snapshot: it is a fresh object with its own
     * copies of the `errors`, `warnings` and `fileChanges` arrays, so further
     * `add*` / `with*` calls on this builder do not alter a result that was
     * already handed out, and successive builds do not share arrays.
     *
     * @returns the built test result
     */
    build() {
        // Compute the combined score.
        const scores = [
            this.result.promptAnalysis?.promptEffectivenessScore || 0,
            this.result.toolCallAnalysis?.toolAccuracy || 0,
            this.result.codeQuality?.qualityScore || 0,
            this.result.taskCompletion?.completionScore || 0
        ];
        this.result.overallScore = scores.reduce((sum, score) => sum + score, 0) / scores.length;
        return {
            ...this.result,
            errors: [...this.result.errors],
            warnings: [...this.result.warnings],
            fileChanges: [...this.result.fileChanges]
        };
    }
}
76
+ //# sourceMappingURL=TestResult.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"TestResult.js","sourceRoot":"","sources":["../../../../src/test/framework/core/TestResult.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAIH,MAAM,CAAN,IAAY,UAMX;AAND,WAAY,UAAU;IACpB,+BAAiB,CAAA;IACjB,+BAAiB,CAAA;IACjB,iCAAmB,CAAA;IACnB,6BAAe,CAAA;IACf,iCAAmB,CAAA;AACrB,CAAC,EANW,UAAU,KAAV,UAAU,QAMrB;AA6ID,mBAAmB;AACnB,MAAM,OAAO,iBAAiB;IACpB,MAAM,GAAwB;QACpC,MAAM,EAAE,EAAE;QACV,QAAQ,EAAE,EAAE;QACZ,WAAW,EAAE,EAAE;KAChB,CAAC;IAEF,MAAM,CAAC,MAAM,CAAC,QAAkB;QAC9B,OAAO,IAAI,iBAAiB,EAAE,CAAC,YAAY,CAAC,QAAQ,CAAC,CAAC;IACxD,CAAC;IAED,YAAY,CAAC,QAAkB;QAC7B,IAAI,CAAC,MAAM,CAAC,QAAQ,GAAG,QAAQ,CAAC;QAChC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,UAAU,CAAC,MAAkB;QAC3B,IAAI,CAAC,MAAM,CAAC,MAAM,GAAG,MAAM,CAAC;QAC5B,OAAO,IAAI,CAAC;IACd,CAAC;IAED,iBAAiB,CAAC,aAA4B;QAC5C,IAAI,CAAC,MAAM,CAAC,aAAa,GAAG,aAAa,CAAC;QAC1C,OAAO,IAAI,CAAC;IACd,CAAC;IAED,kBAAkB,CAAC,QAA8B;QAC/C,IAAI,CAAC,MAAM,CAAC,cAAc,GAAG,QAAQ,CAAC;QACtC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,oBAAoB,CAAC,QAAgC;QACnD,IAAI,CAAC,MAAM,CAAC,gBAAgB,GAAG,QAAQ,CAAC;QACxC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,eAAe,CAAC,OAA0B;QACxC,IAAI,CAAC,MAAM,CAAC,WAAW,GAAG,OAAO,CAAC;QAClC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,kBAAkB,CAAC,UAAgC;QACjD,IAAI,CAAC,MAAM,CAAC,cAAc,GAAG,UAAU,CAAC;QACxC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,aAAa,CAAC,MAAsB;QAClC,IAAI,CAAC,MAAM,CAAC,WAAY,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QACtC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,QAAQ,CAAC,KAAa;QACpB,IAAI,CAAC,MAAM,CAAC,MAAO,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAChC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,UAAU,CAAC,OAAe;QACxB,IAAI,CAAC,MAAM,CAAC,QAAS,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC;QACpC,OAAO,IAAI,CAAC;IACd,CAAC;IAED,KAAK;QACH,SAAS;QACT,MAAM,MAAM,GAAG;YACb,IAAI,CAAC,MAAM,CAAC,cAAc,EAAE,wBAAwB,IAAI,CAAC;YACzD,IAAI,CAAC,MAAM,CAAC,gBAAgB,EAAE,YAAY,IAAI,CAAC;YAC/C,IAAI,CAAC,MAAM,CAAC,WAAW,EAAE,YAAY,IAAI,CAAC;YAC1C,IAAI,CAAC,MAAM,CAAC,cAAc,EAAE,eAAe,IAAI,CAAC;SACjD,CAAC;QAEF,IAAI,CAAC,MAAM,CAAC,YAAY,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE,CAAC,GAAG,GAAG,KAAK,EAAE,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM,CAAC;QAEzF,OAAO,IAAI,CAAC
,MAAoB,CAAC;IACnC,CAAC;CACF"}
@@ -0,0 +1,19 @@
1
+ /**
2
+ * 基础健壮性测试示例
3
+ *
4
+ * 演示如何使用测试框架创建和运行基础的 AI Agent 健壮性测试
5
+ */
6
+ import { TestCategory } from '../core/TestCase';
7
/**
 * Runs the basic robustness test example.
 *
 * @returns a promise that resolves with no value
 */
export declare function runBasicRobustnessTest(): Promise<void>;
11
/**
 * Runs the tests of one specific category.
 *
 * @param category - the test category to run
 * @returns a promise that resolves with no value
 */
export declare function runCategoryTests(category: TestCategory): Promise<void>;
15
/**
 * Runs the performance benchmark.
 *
 * @returns a promise that resolves with no value
 */
export declare function runPerformanceBenchmark(): Promise<void>;
19
+ //# sourceMappingURL=BasicRobustnessTest.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"BasicRobustnessTest.d.ts","sourceRoot":"","sources":["../../../../src/test/framework/examples/BasicRobustnessTest.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAGH,OAAO,EAAmB,YAAY,EAAe,MAAM,kBAAkB,CAAC;AAI9E;;GAEG;AACH,wBAAsB,sBAAsB,IAAI,OAAO,CAAC,IAAI,CAAC,CA0C5D;AAED;;GAEG;AACH,wBAAsB,gBAAgB,CAAC,QAAQ,EAAE,YAAY,GAAG,OAAO,CAAC,IAAI,CAAC,CA4B5E;AAED;;GAEG;AACH,wBAAsB,uBAAuB,IAAI,OAAO,CAAC,IAAI,CAAC,CA4B7D"}
@@ -0,0 +1,116 @@
1
+ /**
2
+ * 基础健壮性测试示例
3
+ *
4
+ * 演示如何使用测试框架创建和运行基础的 AI Agent 健壮性测试
5
+ */
6
+ import { TestEngine } from '../core/TestEngine';
7
+ import { TestCaseBuilder, TestCategory, ProjectType } from '../core/TestCase';
8
+ import { ScenarioBuilder } from '../scenarios/ScenarioBuilder';
9
+ import { ConsoleReporter } from '../reporters/ConsoleReporter';
10
/**
 * Runs the basic robustness test example.
 *
 * Builds one test case by hand, runs it through a TestEngine, prints the
 * console report and the overall score as a percentage. Any failure is
 * logged rather than rethrown, and the engine is always asked to stop all
 * tests before the function returns.
 *
 * @returns {Promise<void>}
 */
export async function runBasicRobustnessTest() {
    console.log('🚀 开始运行基础健壮性测试示例');

    // 1. Configure the test engine.
    const engineOptions = {
        agentPath: './dist/index.js',
        outputDir: './test-results',
        reporters: ['console'],
        verbose: true,
        keepTestProjects: false
    };
    const engine = new TestEngine(engineOptions);

    try {
        // 2. Build the test case by hand.
        const scenario = TestCaseBuilder.create('manual-basic-001')
            .withName('手动创建的基础测试')
            .withDescription('测试 Agent 基本的项目探索能力')
            .withCategory(TestCategory.BASIC_ROBUSTNESS)
            .withTask('Explore the project structure and create a README.md file with project description')
            .withProjectType(ProjectType.GRADLE_SPRING_BOOT)
            .expectTool('glob', { required: true, minCalls: 1 })
            .expectTool('read-file', { required: false })
            .expectTool('write-file', { required: true, minCalls: 1 })
            .expectChange('file-created', { path: 'README.md', required: true })
            .withTimeout(120000)
            .build();

        // 3. Run the single test and print its report.
        console.log('\n📋 运行手动创建的测试用例...');
        const outcome = await engine.runTest(scenario);
        const report = ConsoleReporter.generateTestReport(outcome);
        console.log(report);

        // 4. Print the summary; the score is shown as a percentage with one decimal.
        console.log(`\n🎉 测试完成!`);
        const percent = (outcome.overallScore * 100).toFixed(1);
        console.log(`📊 得分: ${percent}%`);
    } catch (failure) {
        console.error(`❌ 测试执行失败: ${failure}`);
    } finally {
        // Release resources.
        await engine.stopAllTests();
    }
}
53
/**
 * Runs the tests of one specific category.
 *
 * Looks up the scenario templates for the category and reports how many were
 * found. It does not execute them: it only logs either a "nothing found"
 * warning or a "ready" message. Failures are logged, and the engine is
 * always asked to stop all tests before the function returns.
 *
 * @param category - category used to filter the scenario templates
 * @returns {Promise<void>}
 */
export async function runCategoryTests(category) {
    console.log(`🎯 运行 ${category} 类别的测试`);

    const engine = new TestEngine({
        agentPath: './dist/index.js',
        outputDir: './test-results',
        reporters: ['console'],
        parallel: true,
        maxConcurrency: 2
    });

    try {
        // Fetch every template of this category.
        const matching = ScenarioBuilder.filterTemplates({ category });
        console.log(`📋 找到 ${matching.length} 个 ${category} 类别的模板`);

        if (matching.length === 0) {
            console.log(`⚠️ 没有找到 ${category} 类别的测试用例`);
        } else {
            console.log('✅ 类别测试功能已准备就绪');
        }
    } catch (failure) {
        console.error(`❌ 类别测试执行失败: ${failure}`);
    } finally {
        await engine.stopAllTests();
    }
}
82
/**
 * Runs the performance benchmark.
 *
 * Creates a non-parallel engine and builds a simple performance test case,
 * then logs a "ready" message. The built case is not executed here.
 * Failures are logged, and the engine is always asked to stop all tests
 * before the function returns.
 *
 * @returns {Promise<void>}
 */
export async function runPerformanceBenchmark() {
    console.log('⚡ 运行性能基准测试');

    const engineOptions = {
        agentPath: './dist/index.js',
        outputDir: './test-results',
        reporters: ['console'],
        // Run sequentially to get accurate performance data.
        parallel: false,
        verbose: false
    };
    const engine = new TestEngine(engineOptions);

    try {
        // Build a simple performance test case (constructed only, never run in this function).
        const benchmarkCase = TestCaseBuilder.create('perf-simple')
            .withName('性能测试 - 简单任务')
            .withTask('List all Java files in the project')
            .withProjectType(ProjectType.GRADLE_SPRING_BOOT)
            .expectTool('glob', { required: true })
            .withTimeout(30000)
            .build();

        console.log('✅ 性能测试功能已准备就绪');
    } catch (failure) {
        console.error(`❌ 性能测试执行失败: ${failure}`);
    } finally {
        await engine.stopAllTests();
    }
}
112
// When this file is run directly, execute the basic test.
//
// This file is an ES module (it uses import/export). In ES modules the
// CommonJS bindings `require` and `module` do not exist, so touching
// `require.main` unguarded throws a ReferenceError while the module is being
// loaded, which breaks every importer. The `typeof` checks keep the original
// behaviour wherever those bindings are provided and make the check a
// harmless no-op where they are not.
if (typeof require !== 'undefined' && typeof module !== 'undefined' && require.main === module) {
    runBasicRobustnessTest().catch(console.error);
}
116
+ //# sourceMappingURL=BasicRobustnessTest.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"BasicRobustnessTest.js","sourceRoot":"","sources":["../../../../src/test/framework/examples/BasicRobustnessTest.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,EAAE,UAAU,EAAE,MAAM,oBAAoB,CAAC;AAChD,OAAO,EAAE,eAAe,EAAE,YAAY,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAC9E,OAAO,EAAE,eAAe,EAAE,MAAM,8BAA8B,CAAC;AAC/D,OAAO,EAAE,eAAe,EAAE,MAAM,8BAA8B,CAAC;AAE/D;;GAEG;AACH,MAAM,CAAC,KAAK,UAAU,sBAAsB;IAC1C,OAAO,CAAC,GAAG,CAAC,kBAAkB,CAAC,CAAC;IAEhC,YAAY;IACZ,MAAM,UAAU,GAAG,IAAI,UAAU,CAAC;QAChC,SAAS,EAAE,iBAAiB;QAC5B,SAAS,EAAE,gBAAgB;QAC3B,SAAS,EAAE,CAAC,SAAS,CAAC;QACtB,OAAO,EAAE,IAAI;QACb,gBAAgB,EAAE,KAAK;KACxB,CAAC,CAAC;IAEH,IAAI,CAAC;QACH,mBAAmB;QACnB,MAAM,cAAc,GAAG,eAAe,CAAC,MAAM,CAAC,kBAAkB,CAAC;aAC9D,QAAQ,CAAC,WAAW,CAAC;aACrB,eAAe,CAAC,oBAAoB,CAAC;aACrC,YAAY,CAAC,YAAY,CAAC,gBAAgB,CAAC;aAC3C,QAAQ,CAAC,oFAAoF,CAAC;aAC9F,eAAe,CAAC,WAAW,CAAC,kBAAkB,CAAC;aAC/C,UAAU,CAAC,MAAM,EAAE,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,EAAE,CAAC;aACnD,UAAU,CAAC,WAAW,EAAE,EAAE,QAAQ,EAAE,KAAK,EAAE,CAAC;aAC5C,UAAU,CAAC,YAAY,EAAE,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,EAAE,CAAC;aACzD,YAAY,CAAC,cAAc,EAAE,EAAE,IAAI,EAAE,WAAW,EAAE,QAAQ,EAAE,IAAI,EAAE,CAAC;aACnE,WAAW,CAAC,MAAM,CAAC;aACnB,KAAK,EAAE,CAAC;QAEX,YAAY;QACZ,OAAO,CAAC,GAAG,CAAC,qBAAqB,CAAC,CAAC;QACnC,MAAM,YAAY,GAAG,MAAM,UAAU,CAAC,OAAO,CAAC,cAAc,CAAC,CAAC;QAC9D,OAAO,CAAC,GAAG,CAAC,eAAe,CAAC,kBAAkB,CAAC,YAAY,CAAC,CAAC,CAAC;QAE9D,UAAU;QACV,OAAO,CAAC,GAAG,CAAC,YAAY,CAAC,CAAC;QAC1B,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC,YAAY,CAAC,YAAY,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAEzE,CAAC;IAAC,OAAO,KAAK,EAAE,CAAC;QACf,OAAO,CAAC,KAAK,CAAC,aAAa,KAAK,EAAE,CAAC,CAAC;IACtC,CAAC;YAAS,CAAC;QACT,OAAO;QACP,MAAM,UAAU,CAAC,YAAY,EAAE,CAAC;IAClC,CAAC;AACH,CAAC;AAED;;GAEG;AACH,MAAM,CAAC,KAAK,UAAU,gBAAgB,CAAC,QAAsB;IAC3D,OAAO,CAAC,GAAG,CAAC,SAAS,QAAQ,QAAQ,CAAC,CAAC;IAEvC,MAAM,UAAU,GAAG,IAAI,UAAU,CAAC;QAChC,SAAS,EAAE,iBAAiB;QAC5B,SAAS,EAAE,gBAAgB;QAC3B,SAAS,EAAE,CAAC,SAAS,CAAC;QACtB,QAAQ,EAAE,IAAI;QACd,cAAc,EAAE,CAAC;KAClB,CAAC,CAAC;IAEH,IAAI
,CAAC;QACH,aAAa;QACb,MAAM,SAAS,GAAG,eAAe,CAAC,eAAe,CAAC,EAAE,QAAQ,EAAE,CAAC,CAAC;QAChE,OAAO,CAAC,GAAG,CAAC,SAAS,SAAS,CAAC,MAAM,MAAM,QAAQ,QAAQ,CAAC,CAAC;QAE7D,IAAI,SAAS,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC3B,OAAO,CAAC,GAAG,CAAC,YAAY,QAAQ,UAAU,CAAC,CAAC;YAC5C,OAAO;QACT,CAAC;QAED,OAAO,CAAC,GAAG,CAAC,eAAe,CAAC,CAAC;IAE/B,CAAC;IAAC,OAAO,KAAK,EAAE,CAAC;QACf,OAAO,CAAC,KAAK,CAAC,eAAe,KAAK,EAAE,CAAC,CAAC;IACxC,CAAC;YAAS,CAAC;QACT,MAAM,UAAU,CAAC,YAAY,EAAE,CAAC;IAClC,CAAC;AACH,CAAC;AAED;;GAEG;AACH,MAAM,CAAC,KAAK,UAAU,uBAAuB;IAC3C,OAAO,CAAC,GAAG,CAAC,YAAY,CAAC,CAAC;IAE1B,MAAM,UAAU,GAAG,IAAI,UAAU,CAAC;QAChC,SAAS,EAAE,iBAAiB;QAC5B,SAAS,EAAE,gBAAgB;QAC3B,SAAS,EAAE,CAAC,SAAS,CAAC;QACtB,QAAQ,EAAE,KAAK,EAAE,iBAAiB;QAClC,OAAO,EAAE,KAAK;KACf,CAAC,CAAC;IAEH,IAAI,CAAC;QACH,cAAc;QACd,MAAM,eAAe,GAAG,eAAe,CAAC,MAAM,CAAC,aAAa,CAAC;aAC1D,QAAQ,CAAC,aAAa,CAAC;aACvB,QAAQ,CAAC,oCAAoC,CAAC;aAC9C,eAAe,CAAC,WAAW,CAAC,kBAAkB,CAAC;aAC/C,UAAU,CAAC,MAAM,EAAE,EAAE,QAAQ,EAAE,IAAI,EAAE,CAAC;aACtC,WAAW,CAAC,KAAK,CAAC;aAClB,KAAK,EAAE,CAAC;QAEX,OAAO,CAAC,GAAG,CAAC,eAAe,CAAC,CAAC;IAE/B,CAAC;IAAC,OAAO,KAAK,EAAE,CAAC;QACf,OAAO,CAAC,KAAK,CAAC,eAAe,KAAK,EAAE,CAAC,CAAC;IACxC,CAAC;YAAS,CAAC;QACT,MAAM,UAAU,CAAC,YAAY,EAAE,CAAC;IAClC,CAAC;AACH,CAAC;AAED,mBAAmB;AACnB,IAAI,OAAO,CAAC,IAAI,KAAK,MAAM,EAAE,CAAC;IAC5B,sBAAsB,EAAE,CAAC,KAAK,CAAC,OAAO,CAAC,KAAK,CAAC,CAAC;AAChD,CAAC"}
@@ -0,0 +1,30 @@
1
+ /**
2
+ * AI Agent 健壮性测试框架 - 主入口文件
3
+ *
4
+ * 导出所有核心组件,提供统一的 API 接口
5
+ */
6
+ import { TestEngine } from './core/TestEngine';
7
+ export { TestEngine };
8
+ export { TestCase, TestCaseBuilder, TestSuite, TestCategory, ProjectType, ToolCallExpectation, ChangeExpectation, PromptExpectation, FileDefinition } from './core/TestCase';
9
+ export { TestResult, TestSuiteResult, TestStatus, ExecutionInfo, ToolCallInfo, FileChangeInfo, PromptAnalysisResult, ToolCallAnalysisResult, CodeQualityResult, TaskCompletionResult, TestResultBuilder } from './core/TestResult';
10
+ export { PromptAnalyzer } from './analyzers/PromptAnalyzer';
11
+ export { ToolCallAnalyzer } from './analyzers/ToolCallAnalyzer';
12
+ export { CodeChangeAnalyzer } from './analyzers/CodeChangeAnalyzer';
13
+ export { ScenarioBuilder, ScenarioTemplate } from './scenarios/ScenarioBuilder';
14
+ export { JsonScenarioLoader, JsonScenarioConfig } from './loaders/JsonScenarioLoader';
15
+ export { ConsoleReporter } from './reporters/ConsoleReporter';
16
+ /**
17
+ * Factory function for quickly creating a test engine; only `agentPath` is required in `config`, and a TestEngine is returned.
18
+ */
19
+ export declare function createTestEngine(config: {
20
+ agentPath: string;
21
+ outputDir?: string;
22
+ verbose?: boolean;
23
+ parallel?: boolean;
24
+ keepTestProjects?: boolean;
25
+ }): TestEngine;
26
+ /**
27
+ * Framework version information
28
+ */
29
+ export declare const FRAMEWORK_VERSION = "1.0.0";
30
+ //# sourceMappingURL=index.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/test/framework/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAGH,OAAO,EAAE,UAAU,EAAE,MAAM,mBAAmB,CAAC;AAC/C,OAAO,EAAE,UAAU,EAAE,CAAC;AACtB,OAAO,EACL,QAAQ,EACR,eAAe,EACf,SAAS,EACT,YAAY,EACZ,WAAW,EACX,mBAAmB,EACnB,iBAAiB,EACjB,iBAAiB,EACjB,cAAc,EACf,MAAM,iBAAiB,CAAC;AAEzB,OAAO,EACL,UAAU,EACV,eAAe,EACf,UAAU,EACV,aAAa,EACb,YAAY,EACZ,cAAc,EACd,oBAAoB,EACpB,sBAAsB,EACtB,iBAAiB,EACjB,oBAAoB,EACpB,iBAAiB,EAClB,MAAM,mBAAmB,CAAC;AAG3B,OAAO,EAAE,cAAc,EAAE,MAAM,4BAA4B,CAAC;AAC5D,OAAO,EAAE,gBAAgB,EAAE,MAAM,8BAA8B,CAAC;AAChE,OAAO,EAAE,kBAAkB,EAAE,MAAM,gCAAgC,CAAC;AAGpE,OAAO,EAAE,eAAe,EAAE,gBAAgB,EAAE,MAAM,6BAA6B,CAAC;AAGhF,OAAO,EAAE,kBAAkB,EAAE,kBAAkB,EAAE,MAAM,8BAA8B,CAAC;AAGtF,OAAO,EAAE,eAAe,EAAE,MAAM,6BAA6B,CAAC;AAE9D;;GAEG;AACH,wBAAgB,gBAAgB,CAAC,MAAM,EAAE;IACvC,SAAS,EAAE,MAAM,CAAC;IAClB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB,QAAQ,CAAC,EAAE,OAAO,CAAC;IACnB,gBAAgB,CAAC,EAAE,OAAO,CAAC;CAC5B,GAAG,UAAU,CASb;AAED;;GAEG;AACH,eAAO,MAAM,iBAAiB,UAAU,CAAC"}
@@ -0,0 +1,38 @@
1
+ /**
2
+ * AI Agent 健壮性测试框架 - 主入口文件
3
+ *
4
+ * 导出所有核心组件,提供统一的 API 接口
5
+ */
6
+ // 核心组件
7
+ import { TestEngine } from './core/TestEngine';
8
+ export { TestEngine };
9
+ export { TestCaseBuilder, TestCategory, ProjectType } from './core/TestCase';
10
+ export { TestStatus, TestResultBuilder } from './core/TestResult';
11
+ // 分析器
12
+ export { PromptAnalyzer } from './analyzers/PromptAnalyzer';
13
+ export { ToolCallAnalyzer } from './analyzers/ToolCallAnalyzer';
14
+ export { CodeChangeAnalyzer } from './analyzers/CodeChangeAnalyzer';
15
+ // 场景构建器
16
+ export { ScenarioBuilder } from './scenarios/ScenarioBuilder';
17
+ // JSON 场景加载器
18
+ export { JsonScenarioLoader } from './loaders/JsonScenarioLoader';
19
+ // 报告生成器
20
+ export { ConsoleReporter } from './reporters/ConsoleReporter';
21
+ /**
22
+ * Factory function for quickly creating a test engine: forwards `config.agentPath`, always uses the 'console' reporter, and falls back to './test-results' / false when the optional fields are falsy.
23
+ */
24
+ export function createTestEngine(config) {
25
+ return new TestEngine({
26
+ agentPath: config.agentPath,
27
+ outputDir: config.outputDir || './test-results',
28
+ reporters: ['console'],
29
+ verbose: config.verbose || false,
30
+ parallel: config.parallel || false,
31
+ keepTestProjects: config.keepTestProjects || false
32
+ });
33
+ }
34
+ /**
35
+ * Framework version information
36
+ */
37
+ export const FRAMEWORK_VERSION = '1.0.0';
38
+ //# sourceMappingURL=index.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/test/framework/index.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO;AACP,OAAO,EAAE,UAAU,EAAE,MAAM,mBAAmB,CAAC;AAC/C,OAAO,EAAE,UAAU,EAAE,CAAC;AACtB,OAAO,EAEL,eAAe,EAEf,YAAY,EACZ,WAAW,EAKZ,MAAM,iBAAiB,CAAC;AAEzB,OAAO,EAGL,UAAU,EAQV,iBAAiB,EAClB,MAAM,mBAAmB,CAAC;AAE3B,MAAM;AACN,OAAO,EAAE,cAAc,EAAE,MAAM,4BAA4B,CAAC;AAC5D,OAAO,EAAE,gBAAgB,EAAE,MAAM,8BAA8B,CAAC;AAChE,OAAO,EAAE,kBAAkB,EAAE,MAAM,gCAAgC,CAAC;AAEpE,QAAQ;AACR,OAAO,EAAE,eAAe,EAAoB,MAAM,6BAA6B,CAAC;AAEhF,aAAa;AACb,OAAO,EAAE,kBAAkB,EAAsB,MAAM,8BAA8B,CAAC;AAEtF,QAAQ;AACR,OAAO,EAAE,eAAe,EAAE,MAAM,6BAA6B,CAAC;AAE9D;;GAEG;AACH,MAAM,UAAU,gBAAgB,CAAC,MAMhC;IACC,OAAO,IAAI,UAAU,CAAC;QACpB,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,SAAS,EAAE,MAAM,CAAC,SAAS,IAAI,gBAAgB;QAC/C,SAAS,EAAE,CAAC,SAAS,CAAC;QACtB,OAAO,EAAE,MAAM,CAAC,OAAO,IAAI,KAAK;QAChC,QAAQ,EAAE,MAAM,CAAC,QAAQ,IAAI,KAAK;QAClC,gBAAgB,EAAE,MAAM,CAAC,gBAAgB,IAAI,KAAK;KACnD,CAAC,CAAC;AACL,CAAC;AAED;;GAEG;AACH,MAAM,CAAC,MAAM,iBAAiB,GAAG,OAAO,CAAC"}
@@ -0,0 +1,99 @@
1
+ /**
2
+ * JSON 场景加载器
3
+ *
4
+ * 支持从 JSON 文件加载测试场景配置,简化复杂测试用例的定义
5
+ */
6
+ import { TestCase } from '../core/TestCase';
7
+ /**
8
+ * Format of a JSON scenario configuration: identity fields plus task, project, expected tools, expected changes, and optional quality / config / custom-validation sections.
9
+ */
10
+ export interface JsonScenarioConfig {
11
+ id: string;
12
+ name: string;
13
+ description: string;
14
+ category: 'basic-robustness' | 'business-scenario' | 'error-recovery' | 'performance' | 'boundary-conditions';
15
+ task: {
16
+ description: string;
17
+ context?: string;
18
+ documentation?: string[];
19
+ };
20
+ project: {
21
+ type: 'gradle-spring-boot' | 'maven-spring-boot' | 'npm-node' | 'empty';
22
+ initialFiles?: {
23
+ path: string;
24
+ content: string;
25
+ }[];
26
+ };
27
+ expectedTools: {
28
+ tool: string;
29
+ required: boolean;
30
+ minCalls?: number;
31
+ maxCalls?: number;
32
+ order?: number;
33
+ parameters?: Record<string, any>;
34
+ description?: string;
35
+ }[];
36
+ expectedChanges: {
37
+ type: 'file-created' | 'file-modified' | 'file-deleted' | 'dependency-added';
38
+ path?: string;
39
+ pattern?: string;
40
+ content?: string;
41
+ required: boolean;
42
+ description?: string;
43
+ }[];
44
+ quality?: {
45
+ minToolAccuracy?: number;
46
+ maxExecutionTime?: number;
47
+ minTaskCompletion?: number;
48
+ maxCodeIssues?: number;
49
+ };
50
+ config?: {
51
+ timeout?: number;
52
+ maxIterations?: number;
53
+ retryCount?: number;
54
+ keepTestProject?: boolean;
55
+ quiet?: boolean;
56
+ };
57
+ customValidations?: {
58
+ name: string;
59
+ description: string;
60
+ validatorScript?: string;
61
+ }[];
62
+ }
63
+ /**
64
+ * JSON scenario loader: static helpers that turn JSON scenario configurations into TestCase objects.
65
+ */
66
+ export declare class JsonScenarioLoader {
67
+ /**
68
+ * Loads a test scenario from a JSON file
69
+ */
70
+ static loadFromFile(filePath: string): Promise<TestCase>;
71
+ /**
72
+ * Loads a test scenario from a JSON string
73
+ */
74
+ static loadFromString(jsonString: string): TestCase;
75
+ /**
76
+ * Batch-loads all JSON scenarios in a directory
77
+ */
78
+ static loadFromDirectory(dirPath: string): Promise<TestCase[]>;
79
+ /**
80
+ * Builds a test case from a configuration object
81
+ */
82
+ private static buildFromConfig;
83
+ /**
84
+ * Maps the category
85
+ */
86
+ private static mapCategory;
87
+ /**
88
+ * Maps the project type
89
+ */
90
+ private static mapProjectType;
91
+ /**
92
+ * Validates a JSON configuration, returning a validity flag together with a list of error strings
93
+ */
94
+ static validateConfig(config: JsonScenarioConfig): {
95
+ valid: boolean;
96
+ errors: string[];
97
+ };
98
+ }
99
+ //# sourceMappingURL=JsonScenarioLoader.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"JsonScenarioLoader.d.ts","sourceRoot":"","sources":["../../../../src/test/framework/loaders/JsonScenarioLoader.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAIH,OAAO,EAAE,QAAQ,EAAsF,MAAM,kBAAkB,CAAC;AAEhI;;GAEG;AACH,MAAM,WAAW,kBAAkB;IACjC,EAAE,EAAE,MAAM,CAAC;IACX,IAAI,EAAE,MAAM,CAAC;IACb,WAAW,EAAE,MAAM,CAAC;IACpB,QAAQ,EAAE,kBAAkB,GAAG,mBAAmB,GAAG,gBAAgB,GAAG,aAAa,GAAG,qBAAqB,CAAC;IAG9G,IAAI,EAAE;QACJ,WAAW,EAAE,MAAM,CAAC;QACpB,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,aAAa,CAAC,EAAE,MAAM,EAAE,CAAC;KAC1B,CAAC;IAGF,OAAO,EAAE;QACP,IAAI,EAAE,oBAAoB,GAAG,mBAAmB,GAAG,UAAU,GAAG,OAAO,CAAC;QACxE,YAAY,CAAC,EAAE;YACb,IAAI,EAAE,MAAM,CAAC;YACb,OAAO,EAAE,MAAM,CAAC;SACjB,EAAE,CAAC;KACL,CAAC;IAGF,aAAa,EAAE;QACb,IAAI,EAAE,MAAM,CAAC;QACb,QAAQ,EAAE,OAAO,CAAC;QAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;QAClB,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;QACjC,WAAW,CAAC,EAAE,MAAM,CAAC;KACtB,EAAE,CAAC;IAGJ,eAAe,EAAE;QACf,IAAI,EAAE,cAAc,GAAG,eAAe,GAAG,cAAc,GAAG,kBAAkB,CAAC;QAC7E,IAAI,CAAC,EAAE,MAAM,CAAC;QACd,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,QAAQ,EAAE,OAAO,CAAC;QAClB,WAAW,CAAC,EAAE,MAAM,CAAC;KACtB,EAAE,CAAC;IAGJ,OAAO,CAAC,EAAE;QACR,eAAe,CAAC,EAAE,MAAM,CAAC;QACzB,gBAAgB,CAAC,EAAE,MAAM,CAAC;QAC1B,iBAAiB,CAAC,EAAE,MAAM,CAAC;QAC3B,aAAa,CAAC,EAAE,MAAM,CAAC;KACxB,CAAC;IAGF,MAAM,CAAC,EAAE;QACP,OAAO,CAAC,EAAE,MAAM,CAAC;QACjB,aAAa,CAAC,EAAE,MAAM,CAAC;QACvB,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,eAAe,CAAC,EAAE,OAAO,CAAC;QAC1B,KAAK,CAAC,EAAE,OAAO,CAAC;KACjB,CAAC;IAGF,iBAAiB,CAAC,EAAE;QAClB,IAAI,EAAE,MAAM,CAAC;QACb,WAAW,EAAE,MAAM,CAAC;QAEpB,eAAe,CAAC,EAAE,MAAM,CAAC;KAC1B,EAAE,CAAC;CACL;AAED;;GAEG;AACH,qBAAa,kBAAkB;IAC7B;;OAEG;WACU,YAAY,CAAC,QAAQ,EAAE,MAAM,GAAG,OAAO,CAAC,QAAQ,CAAC;IAM9D;;OAEG;IACH,MAAM,CAAC,cAAc,CAAC,UAAU,EAAE,MAAM,GAAG,QAAQ;IAKnD;;OAEG;WACU,iBAAiB,CAAC,OAAO,EAAE,MAAM,GAAG,OAAO,CAAC,QAAQ,EAAE,CAAC;IAkBpE;;OAEG;IACH,OAAO,CAAC,MAAM,CAAC,eAAe;IA+F9B;;OAEG;IACH,OAAO,CAAC,MAAM,CAAC,WAAW;IAY1B;;OAEG;IACH,OAAO,CAA
C,MAAM,CAAC,cAAc;IAW7B;;OAEG;IACH,MAAM,CAAC,cAAc,CAAC,MAAM,EAAE,kBAAkB,GAAG;QAAE,KAAK,EAAE,OAAO,CAAC;QAAC,MAAM,EAAE,MAAM,EAAE,CAAA;KAAE;CA+BxF"}