@agentmark-ai/cli 0.9.0 → 0.10.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (149)
  1. package/README.md +143 -1
  2. package/dist/.next/BUILD_ID +1 -1
  3. package/dist/.next/app-build-manifest.json +65 -15
  4. package/dist/.next/app-path-routes-manifest.json +3 -0
  5. package/dist/.next/build-manifest.json +2 -2
  6. package/dist/.next/cache/.previewinfo +1 -1
  7. package/dist/.next/cache/.rscinfo +1 -1
  8. package/dist/.next/cache/.tsbuildinfo +1 -1
  9. package/dist/.next/cache/config.json +3 -3
  10. package/dist/.next/cache/webpack/client-production/0.pack +0 -0
  11. package/dist/.next/cache/webpack/client-production/index.pack +0 -0
  12. package/dist/.next/cache/webpack/edge-server-production/index.pack +0 -0
  13. package/dist/.next/cache/webpack/server-production/0.pack +0 -0
  14. package/dist/.next/cache/webpack/server-production/index.pack +0 -0
  15. package/dist/.next/prerender-manifest.json +61 -13
  16. package/dist/.next/routes-manifest.json +22 -1
  17. package/dist/.next/server/app/_not-found/page.js +1 -1
  18. package/dist/.next/server/app/_not-found/page_client-reference-manifest.js +1 -1
  19. package/dist/.next/server/app/_not-found.html +1 -1
  20. package/dist/.next/server/app/_not-found.rsc +7 -6
  21. package/dist/.next/server/app/experiments/[id]/page.js +2 -0
  22. package/dist/.next/server/app/experiments/[id]/page.js.nft.json +1 -0
  23. package/dist/.next/server/app/experiments/[id]/page_client-reference-manifest.js +1 -0
  24. package/dist/.next/server/app/experiments/compare/page.js +2 -0
  25. package/dist/.next/server/app/experiments/compare/page.js.nft.json +1 -0
  26. package/dist/.next/server/app/experiments/compare/page_client-reference-manifest.js +1 -0
  27. package/dist/.next/server/app/experiments/compare.html +1 -0
  28. package/dist/.next/server/app/experiments/compare.meta +7 -0
  29. package/dist/.next/server/app/experiments/compare.rsc +24 -0
  30. package/dist/.next/server/app/experiments/page.js +2 -0
  31. package/dist/.next/server/app/experiments/page.js.nft.json +1 -0
  32. package/dist/.next/server/app/experiments/page_client-reference-manifest.js +1 -0
  33. package/dist/.next/server/app/experiments.html +1 -0
  34. package/dist/.next/server/app/experiments.meta +7 -0
  35. package/dist/.next/server/app/experiments.rsc +24 -0
  36. package/dist/.next/server/app/index.html +1 -1
  37. package/dist/.next/server/app/index.rsc +9 -9
  38. package/dist/.next/server/app/page.js +1 -1
  39. package/dist/.next/server/app/page_client-reference-manifest.js +1 -1
  40. package/dist/.next/server/app/requests/page.js +1 -1
  41. package/dist/.next/server/app/requests/page.js.nft.json +1 -1
  42. package/dist/.next/server/app/requests/page_client-reference-manifest.js +1 -1
  43. package/dist/.next/server/app/requests.html +1 -1
  44. package/dist/.next/server/app/requests.rsc +8 -8
  45. package/dist/.next/server/app/sessions/page.js +1 -1
  46. package/dist/.next/server/app/sessions/page.js.nft.json +1 -1
  47. package/dist/.next/server/app/sessions/page_client-reference-manifest.js +1 -1
  48. package/dist/.next/server/app/sessions.html +1 -1
  49. package/dist/.next/server/app/sessions.rsc +8 -8
  50. package/dist/.next/server/app/traces/page.js +1 -1
  51. package/dist/.next/server/app/traces/page.js.nft.json +1 -1
  52. package/dist/.next/server/app/traces/page_client-reference-manifest.js +1 -1
  53. package/dist/.next/server/app/traces.html +1 -1
  54. package/dist/.next/server/app/traces.rsc +8 -8
  55. package/dist/.next/server/app-paths-manifest.json +3 -0
  56. package/dist/.next/server/chunks/101.js +1 -0
  57. package/dist/.next/server/chunks/203.js +5 -5
  58. package/dist/.next/server/chunks/225.js +173 -0
  59. package/dist/.next/server/chunks/335.js +1 -0
  60. package/dist/.next/server/chunks/478.js +3 -3
  61. package/dist/.next/server/chunks/547.js +1 -1
  62. package/dist/.next/server/chunks/672.js +1 -0
  63. package/dist/.next/server/chunks/934.js +1 -0
  64. package/dist/.next/server/chunks/936.js +29 -0
  65. package/dist/.next/server/pages/404.html +1 -1
  66. package/dist/.next/server/pages/500.html +1 -1
  67. package/dist/.next/server/server-reference-manifest.json +1 -1
  68. package/dist/.next/static/2NZm040KzCzDPOX6MqoKG/_buildManifest.js +1 -0
  69. package/dist/.next/static/chunks/181-396b329bd35e4de0.js +1 -0
  70. package/dist/.next/static/chunks/349-9266e48c00c8ac76.js +37 -0
  71. package/dist/.next/static/chunks/352-d7aa9d2da963e9e5.js +1 -0
  72. package/dist/.next/static/chunks/41-f512c46d7ea943f6.js +1 -0
  73. package/dist/.next/static/chunks/444-d88bd1e37e750aee.js +1 -0
  74. package/dist/.next/static/chunks/49-6efbcf2b4f20d950.js +1 -0
  75. package/dist/.next/static/chunks/729-21a669506b8ae33c.js +1 -0
  76. package/dist/.next/static/chunks/757-19ef6a21d87937d9.js +1 -0
  77. package/dist/.next/static/chunks/{902-8d8c521535a2c32f.js → 860-75914efffd5add16.js} +1 -1
  78. package/dist/.next/static/chunks/866-87ad78bf0bef953a.js +28 -0
  79. package/dist/.next/static/chunks/app/experiments/[id]/page-1522aa0a86d6d004.js +1 -0
  80. package/dist/.next/static/chunks/app/experiments/compare/page-b99f5e9ebb5488b4.js +1 -0
  81. package/dist/.next/static/chunks/app/experiments/page-e17f8133f9467da7.js +1 -0
  82. package/dist/.next/static/chunks/app/layout-3af953219517dd3e.js +1 -0
  83. package/dist/.next/static/chunks/app/requests/{page-91666bcc2877f9ee.js → page-aa9725ed8b67059b.js} +1 -1
  84. package/dist/.next/static/chunks/app/sessions/{page-679425471f82f56d.js → page-bf2019c391763736.js} +1 -1
  85. package/dist/.next/static/chunks/app/traces/page-c43b6aa5cd13fdf1.js +1 -0
  86. package/dist/.next/trace +56 -54
  87. package/dist/.next/types/app/experiments/[id]/page.ts +84 -0
  88. package/dist/.next/types/app/experiments/compare/page.ts +84 -0
  89. package/dist/.next/types/app/experiments/page.ts +84 -0
  90. package/dist/.next/types/routes.d.ts +4 -1
  91. package/dist/.next/types/validator.ts +27 -0
  92. package/dist/api-server.js +28 -1
  93. package/dist/api-server.js.map +1 -1
  94. package/dist/commands/deploy.d.ts +27 -0
  95. package/dist/commands/deploy.js +223 -0
  96. package/dist/commands/deploy.js.map +1 -0
  97. package/dist/commands/dev.d.ts +0 -1
  98. package/dist/commands/dev.js +79 -66
  99. package/dist/commands/dev.js.map +1 -1
  100. package/dist/commands/run-experiment.js +7 -28
  101. package/dist/commands/run-experiment.js.map +1 -1
  102. package/dist/commands/run-prompt.js +6 -27
  103. package/dist/commands/run-prompt.js.map +1 -1
  104. package/dist/config.d.ts +2 -12
  105. package/dist/config.js +5 -45
  106. package/dist/config.js.map +1 -1
  107. package/dist/connect/job-handler.d.ts +23 -0
  108. package/dist/connect/job-handler.js +187 -0
  109. package/dist/connect/job-handler.js.map +1 -0
  110. package/dist/forwarding/config.js +1 -1
  111. package/dist/forwarding/config.js.map +1 -1
  112. package/dist/index.js +3 -3
  113. package/dist/index.js.map +1 -1
  114. package/dist/runner-server.d.ts +0 -6
  115. package/dist/runner-server.js +3 -39
  116. package/dist/runner-server.js.map +1 -1
  117. package/dist/server/routes/experiments/index.d.ts +31 -0
  118. package/dist/server/routes/experiments/index.js +192 -0
  119. package/dist/server/routes/experiments/index.js.map +1 -0
  120. package/package.json +4 -3
  121. package/dist/.next/server/chunks/525.js +0 -201
  122. package/dist/.next/static/_uH98Yva4C-QS08PL-_0P/_buildManifest.js +0 -1
  123. package/dist/.next/static/chunks/397-361c64519c49911b.js +0 -37
  124. package/dist/.next/static/chunks/41-f3c56d50aeb34db9.js +0 -1
  125. package/dist/.next/static/chunks/602-1f23cff16de7187a.js +0 -28
  126. package/dist/.next/static/chunks/app/layout-eaddb6da201ab019.js +0 -1
  127. package/dist/.next/static/chunks/app/traces/page-15500a82980abfc8.js +0 -1
  128. package/dist/cloudflared/download.d.ts +0 -12
  129. package/dist/cloudflared/download.js +0 -130
  130. package/dist/cloudflared/download.js.map +0 -1
  131. package/dist/cloudflared/index.d.ts +0 -9
  132. package/dist/cloudflared/index.js +0 -20
  133. package/dist/cloudflared/index.js.map +0 -1
  134. package/dist/cloudflared/platform.d.ts +0 -20
  135. package/dist/cloudflared/platform.js +0 -79
  136. package/dist/cloudflared/platform.js.map +0 -1
  137. package/dist/cloudflared/tunnel.d.ts +0 -16
  138. package/dist/cloudflared/tunnel.js +0 -129
  139. package/dist/cloudflared/tunnel.js.map +0 -1
  140. package/dist/cloudflared/types.d.ts +0 -53
  141. package/dist/cloudflared/types.js +0 -8
  142. package/dist/cloudflared/types.js.map +0 -1
  143. package/dist/runner-server/middleware/signature-verification.d.ts +0 -37
  144. package/dist/runner-server/middleware/signature-verification.js +0 -55
  145. package/dist/runner-server/middleware/signature-verification.js.map +0 -1
  146. package/dist/tunnel.d.ts +0 -6
  147. package/dist/tunnel.js +0 -11
  148. package/dist/tunnel.js.map +0 -1
  149. package/dist/.next/static/{_uH98Yva4C-QS08PL-_0P → 2NZm040KzCzDPOX6MqoKG}/_ssgManifest.js +0 -0
package/README.md CHANGED
@@ -1 +1,143 @@
1
- # Agentmark CLI
1
+ # AgentMark CLI
2
+
3
+ The command-line tool for developing, testing, and evaluating AI agents with AgentMark.
4
+
5
+ ## Installation
6
+
7
+ ```bash
8
+ npm install -g @agentmark-ai/cli
9
+ ```
10
+
11
+ Or use it directly with `npx`:
12
+
13
+ ```bash
14
+ npx @agentmark-ai/cli dev
15
+ ```
16
+
17
+ ## Quick Start
18
+
19
+ ```bash
20
+ # Scaffold a new project
21
+ npm create agentmark@latest
22
+
23
+ # Start the dev server (API + trace UI + hot reload)
24
+ agentmark dev
25
+
26
+ # Run a prompt with its test props
27
+ agentmark run-prompt my-prompt.prompt.mdx
28
+
29
+ # Run an experiment against a dataset
30
+ agentmark run-experiment my-prompt.prompt.mdx
31
+ ```
32
+
33
+ ## Commands
34
+
35
+ ### `agentmark dev`
36
+
37
+ Start the local development environment: API server, webhook server, and trace UI.
38
+
39
+ ```bash
40
+ agentmark dev
41
+ agentmark dev --api-port 9418 --app-port 3000
42
+ agentmark dev --remote # Connect to AgentMark Cloud (login + trace forwarding)
43
+ agentmark dev --tunnel # Expose webhook server publicly
44
+ ```
45
+
46
+ The dev server auto-detects your project language (TypeScript or Python), finds your virtual environment, and handles port conflicts automatically.
47
+
48
+ ### `agentmark run-prompt <filepath>`
49
+
50
+ Execute a single prompt and display the result.
51
+
52
+ ```bash
53
+ # Run with test props from the prompt's frontmatter
54
+ agentmark run-prompt customer-support.prompt.mdx
55
+
56
+ # Run with custom props
57
+ agentmark run-prompt customer-support.prompt.mdx --props '{"customer_question": "Where is my order?"}'
58
+
59
+ # Run with props from a file
60
+ agentmark run-prompt customer-support.prompt.mdx --props-file test-data.json
61
+ ```
62
+
63
+ Output includes the LLM response, token usage, cost, and a link to the trace in the local UI.
64
+
65
+ ### `agentmark run-experiment <filepath>`
66
+
67
+ Run a prompt against every item in its dataset, with optional evaluations.
68
+
69
+ ```bash
70
+ # Run with evals (default)
71
+ agentmark run-experiment my-prompt.prompt.mdx
72
+
73
+ # Skip evals
74
+ agentmark run-experiment my-prompt.prompt.mdx --skip-eval
75
+
76
+ # Output as JSON instead of table
77
+ agentmark run-experiment my-prompt.prompt.mdx --format json
78
+
79
+ # Fail if pass rate is below 80%
80
+ agentmark run-experiment my-prompt.prompt.mdx --threshold 80
81
+ ```
82
+
83
+ Output formats: `table` (default), `csv`, `json`, `jsonl`.
84
+
85
+ ### `agentmark build`
86
+
87
+ Pre-compile `.prompt.mdx` files into JSON for production use with the file loader.
88
+
89
+ ```bash
90
+ agentmark build
91
+ agentmark build --out dist/prompts
92
+ ```
93
+
94
+ ### `agentmark generate-types`
95
+
96
+ Generate TypeScript type definitions from your prompts for type-safe usage in code.
97
+
98
+ ```bash
99
+ agentmark generate-types
100
+ ```
101
+
102
+ ### `agentmark generate-schema`
103
+
104
+ Generate a JSON Schema for `.prompt.mdx` frontmatter, enabling IDE validation and autocomplete.
105
+
106
+ ```bash
107
+ agentmark generate-schema
108
+ agentmark generate-schema --out .agentmark
109
+ ```
110
+
111
+ ### `agentmark pull-models`
112
+
113
+ Interactively select and add LLM models from a provider to your `agentmark.json`.
114
+
115
+ ```bash
116
+ agentmark pull-models
117
+ ```
118
+
119
+ ### `agentmark login` / `agentmark logout`
120
+
121
+ Authenticate with AgentMark Cloud.
122
+
123
+ ```bash
124
+ agentmark login
125
+ agentmark logout
126
+ ```
127
+
128
+ ### `agentmark link`
129
+
130
+ Link your project to an AgentMark Cloud app for trace forwarding.
131
+
132
+ ```bash
133
+ agentmark link
134
+ agentmark link --app-id <uuid>
135
+ ```
136
+
137
+ ## Documentation
138
+
139
+ Full documentation at [docs.agentmark.co](https://docs.agentmark.co/agentmark/).
140
+
141
+ ## License
142
+
143
+ [MIT](../../LICENSE.md)
package/dist/.next/BUILD_ID CHANGED
@@ -1 +1 @@
1
- _uH98Yva4C-QS08PL-_0P
1
+ 2NZm040KzCzDPOX6MqoKG
package/dist/.next/app-build-manifest.json CHANGED
@@ -12,9 +12,47 @@
12
12
  "static/chunks/87c73c54-09e1ba5c70e60a51.js",
13
13
  "static/chunks/18-175d23c8e99dd60b.js",
14
14
  "static/chunks/main-app-0b5725cb98f081b4.js",
15
- "static/chunks/902-8d8c521535a2c32f.js",
16
- "static/chunks/602-1f23cff16de7187a.js",
17
- "static/chunks/app/layout-eaddb6da201ab019.js"
15
+ "static/chunks/860-75914efffd5add16.js",
16
+ "static/chunks/757-19ef6a21d87937d9.js",
17
+ "static/chunks/866-87ad78bf0bef953a.js",
18
+ "static/chunks/app/layout-3af953219517dd3e.js"
19
+ ],
20
+ "/experiments/[id]/page": [
21
+ "static/chunks/webpack-f10b0ea54196b48e.js",
22
+ "static/chunks/87c73c54-09e1ba5c70e60a51.js",
23
+ "static/chunks/18-175d23c8e99dd60b.js",
24
+ "static/chunks/main-app-0b5725cb98f081b4.js",
25
+ "static/chunks/860-75914efffd5add16.js",
26
+ "static/chunks/729-21a669506b8ae33c.js",
27
+ "static/chunks/444-d88bd1e37e750aee.js",
28
+ "static/chunks/352-d7aa9d2da963e9e5.js",
29
+ "static/chunks/757-19ef6a21d87937d9.js",
30
+ "static/chunks/181-396b329bd35e4de0.js",
31
+ "static/chunks/app/experiments/[id]/page-1522aa0a86d6d004.js"
32
+ ],
33
+ "/experiments/compare/page": [
34
+ "static/chunks/webpack-f10b0ea54196b48e.js",
35
+ "static/chunks/87c73c54-09e1ba5c70e60a51.js",
36
+ "static/chunks/18-175d23c8e99dd60b.js",
37
+ "static/chunks/main-app-0b5725cb98f081b4.js",
38
+ "static/chunks/860-75914efffd5add16.js",
39
+ "static/chunks/729-21a669506b8ae33c.js",
40
+ "static/chunks/352-d7aa9d2da963e9e5.js",
41
+ "static/chunks/757-19ef6a21d87937d9.js",
42
+ "static/chunks/181-396b329bd35e4de0.js",
43
+ "static/chunks/app/experiments/compare/page-b99f5e9ebb5488b4.js"
44
+ ],
45
+ "/experiments/page": [
46
+ "static/chunks/webpack-f10b0ea54196b48e.js",
47
+ "static/chunks/87c73c54-09e1ba5c70e60a51.js",
48
+ "static/chunks/18-175d23c8e99dd60b.js",
49
+ "static/chunks/main-app-0b5725cb98f081b4.js",
50
+ "static/chunks/860-75914efffd5add16.js",
51
+ "static/chunks/729-21a669506b8ae33c.js",
52
+ "static/chunks/444-d88bd1e37e750aee.js",
53
+ "static/chunks/757-19ef6a21d87937d9.js",
54
+ "static/chunks/49-6efbcf2b4f20d950.js",
55
+ "static/chunks/app/experiments/page-e17f8133f9467da7.js"
18
56
  ],
19
57
  "/page": [
20
58
  "static/chunks/webpack-f10b0ea54196b48e.js",
@@ -31,10 +69,14 @@
31
69
  "static/css/a00826fc162bd22d.css",
32
70
  "static/chunks/baeaa4ff-f55976a85e939da3.js",
33
71
  "static/chunks/6b3bb038-04520a4579611038.js",
34
- "static/chunks/902-8d8c521535a2c32f.js",
35
- "static/chunks/397-361c64519c49911b.js",
36
- "static/chunks/41-f3c56d50aeb34db9.js",
37
- "static/chunks/app/requests/page-91666bcc2877f9ee.js"
72
+ "static/chunks/860-75914efffd5add16.js",
73
+ "static/chunks/729-21a669506b8ae33c.js",
74
+ "static/chunks/444-d88bd1e37e750aee.js",
75
+ "static/chunks/352-d7aa9d2da963e9e5.js",
76
+ "static/chunks/49-6efbcf2b4f20d950.js",
77
+ "static/chunks/349-9266e48c00c8ac76.js",
78
+ "static/chunks/41-f512c46d7ea943f6.js",
79
+ "static/chunks/app/requests/page-aa9725ed8b67059b.js"
38
80
  ],
39
81
  "/sessions/page": [
40
82
  "static/chunks/webpack-f10b0ea54196b48e.js",
@@ -44,10 +86,14 @@
44
86
  "static/css/a00826fc162bd22d.css",
45
87
  "static/chunks/baeaa4ff-f55976a85e939da3.js",
46
88
  "static/chunks/6b3bb038-04520a4579611038.js",
47
- "static/chunks/902-8d8c521535a2c32f.js",
48
- "static/chunks/397-361c64519c49911b.js",
49
- "static/chunks/41-f3c56d50aeb34db9.js",
50
- "static/chunks/app/sessions/page-679425471f82f56d.js"
89
+ "static/chunks/860-75914efffd5add16.js",
90
+ "static/chunks/729-21a669506b8ae33c.js",
91
+ "static/chunks/444-d88bd1e37e750aee.js",
92
+ "static/chunks/352-d7aa9d2da963e9e5.js",
93
+ "static/chunks/49-6efbcf2b4f20d950.js",
94
+ "static/chunks/349-9266e48c00c8ac76.js",
95
+ "static/chunks/41-f512c46d7ea943f6.js",
96
+ "static/chunks/app/sessions/page-bf2019c391763736.js"
51
97
  ],
52
98
  "/traces/page": [
53
99
  "static/chunks/webpack-f10b0ea54196b48e.js",
@@ -57,10 +103,14 @@
57
103
  "static/css/a00826fc162bd22d.css",
58
104
  "static/chunks/baeaa4ff-f55976a85e939da3.js",
59
105
  "static/chunks/6b3bb038-04520a4579611038.js",
60
- "static/chunks/902-8d8c521535a2c32f.js",
61
- "static/chunks/397-361c64519c49911b.js",
62
- "static/chunks/41-f3c56d50aeb34db9.js",
63
- "static/chunks/app/traces/page-15500a82980abfc8.js"
106
+ "static/chunks/860-75914efffd5add16.js",
107
+ "static/chunks/729-21a669506b8ae33c.js",
108
+ "static/chunks/444-d88bd1e37e750aee.js",
109
+ "static/chunks/352-d7aa9d2da963e9e5.js",
110
+ "static/chunks/49-6efbcf2b4f20d950.js",
111
+ "static/chunks/349-9266e48c00c8ac76.js",
112
+ "static/chunks/41-f512c46d7ea943f6.js",
113
+ "static/chunks/app/traces/page-c43b6aa5cd13fdf1.js"
64
114
  ]
65
115
  }
66
116
  }
package/dist/.next/app-path-routes-manifest.json CHANGED
@@ -1,5 +1,8 @@
1
1
  {
2
2
  "/_not-found/page": "/_not-found",
3
+ "/experiments/[id]/page": "/experiments/[id]",
4
+ "/experiments/compare/page": "/experiments/compare",
5
+ "/experiments/page": "/experiments",
3
6
  "/page": "/",
4
7
  "/requests/page": "/requests",
5
8
  "/sessions/page": "/sessions",
package/dist/.next/build-manifest.json CHANGED
@@ -5,8 +5,8 @@
5
5
  "devFiles": [],
6
6
  "ampDevFiles": [],
7
7
  "lowPriorityFiles": [
8
- "static/_uH98Yva4C-QS08PL-_0P/_buildManifest.js",
9
- "static/_uH98Yva4C-QS08PL-_0P/_ssgManifest.js"
8
+ "static/2NZm040KzCzDPOX6MqoKG/_buildManifest.js",
9
+ "static/2NZm040KzCzDPOX6MqoKG/_ssgManifest.js"
10
10
  ],
11
11
  "rootMainFiles": [
12
12
  "static/chunks/webpack-f10b0ea54196b48e.js",
package/dist/.next/cache/.previewinfo CHANGED
@@ -1 +1 @@
1
- {"previewModeId":"0265d9bac88f8f6ab3c8829fc5b41b3d","previewModeSigningKey":"1b94d4ca5cd0226ac9b678f2d555dd18320d6b02934b175b11c0481dfe9d9701","previewModeEncryptionKey":"e3aa292891db53e66185dc67f41f42e49d4fe1462b2c6ce2eea6f7bbb12cf584","expireAt":1772742981486}
1
+ {"previewModeId":"3d2ff63eaf01f7abb0ba0caeb3c17d0c","previewModeSigningKey":"981a172e225e7b17909282f71dbf463040b54bf9bf7eba4644fd99aa08e76454","previewModeEncryptionKey":"aca121c70f6014285fd5e771c8346ae5ee08d3e6a8a14de58b70d582604c589b","expireAt":1775126363538}
package/dist/.next/cache/.rscinfo CHANGED
@@ -1 +1 @@
1
- {"encryption.key":"jwd7Nr+LbIL3aUoenjOD6a8YW3lBEYYd7GKSxdDWdKI=","encryption.expire_at":1772742980967}
1
+ {"encryption.key":"ht9K53UtRRttTiNu7t5Oj65n4lCPbGM1sV7diyI4Lcs=","encryption.expire_at":1775126363195}