@intentsolutionsio/tonone 0.9.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (330) hide show
  1. package/.claude-plugin/CLAUDE.md +11 -0
  2. package/.claude-plugin/marketplace.json +2178 -0
  3. package/.claude-plugin/plugin.json +135 -0
  4. package/LICENSE +21 -0
  5. package/README.md +462 -0
  6. package/agents/apex.md +247 -0
  7. package/agents/atlas.md +181 -0
  8. package/agents/cortex.md +173 -0
  9. package/agents/crest.md +130 -0
  10. package/agents/draft.md +190 -0
  11. package/agents/echo.md +146 -0
  12. package/agents/flux.md +145 -0
  13. package/agents/forge.md +121 -0
  14. package/agents/form.md +244 -0
  15. package/agents/helm.md +180 -0
  16. package/agents/lens.md +145 -0
  17. package/agents/lumen.md +139 -0
  18. package/agents/pave.md +169 -0
  19. package/agents/pitch.md +177 -0
  20. package/agents/prism.md +181 -0
  21. package/agents/proof.md +205 -0
  22. package/agents/relay.md +147 -0
  23. package/agents/spine.md +207 -0
  24. package/agents/surge.md +127 -0
  25. package/agents/touch.md +185 -0
  26. package/agents/vigil.md +165 -0
  27. package/agents/volt.md +184 -0
  28. package/agents/warden.md +172 -0
  29. package/package.json +48 -0
  30. package/skills/apex/SKILL.md +32 -0
  31. package/skills/apex-plan/.claude-plugin/plugin.json +16 -0
  32. package/skills/apex-plan/SKILL.md +59 -0
  33. package/skills/apex-recon/.claude-plugin/plugin.json +16 -0
  34. package/skills/apex-recon/SKILL.md +91 -0
  35. package/skills/apex-review/.claude-plugin/plugin.json +16 -0
  36. package/skills/apex-review/SKILL.md +53 -0
  37. package/skills/apex-status/.claude-plugin/plugin.json +16 -0
  38. package/skills/apex-status/SKILL.md +42 -0
  39. package/skills/apex-takeover/.claude-plugin/plugin.json +16 -0
  40. package/skills/apex-takeover/SKILL.md +50 -0
  41. package/skills/atlas/SKILL.md +34 -0
  42. package/skills/atlas-adr/.claude-plugin/plugin.json +16 -0
  43. package/skills/atlas-adr/SKILL.md +147 -0
  44. package/skills/atlas-changelog/.claude-plugin/plugin.json +16 -0
  45. package/skills/atlas-changelog/SKILL.md +156 -0
  46. package/skills/atlas-map/.claude-plugin/plugin.json +16 -0
  47. package/skills/atlas-map/SKILL.md +183 -0
  48. package/skills/atlas-onboard/.claude-plugin/plugin.json +16 -0
  49. package/skills/atlas-onboard/SKILL.md +138 -0
  50. package/skills/atlas-present/.claude-plugin/plugin.json +16 -0
  51. package/skills/atlas-present/SKILL.md +214 -0
  52. package/skills/atlas-recon/.claude-plugin/plugin.json +16 -0
  53. package/skills/atlas-recon/SKILL.md +101 -0
  54. package/skills/atlas-report/.claude-plugin/plugin.json +16 -0
  55. package/skills/atlas-report/SKILL.md +304 -0
  56. package/skills/cortex/SKILL.md +32 -0
  57. package/skills/cortex-eval/.claude-plugin/plugin.json +16 -0
  58. package/skills/cortex-eval/SKILL.md +143 -0
  59. package/skills/cortex-integrate/.claude-plugin/plugin.json +16 -0
  60. package/skills/cortex-integrate/SKILL.md +218 -0
  61. package/skills/cortex-model/.claude-plugin/plugin.json +16 -0
  62. package/skills/cortex-model/SKILL.md +138 -0
  63. package/skills/cortex-prompt/.claude-plugin/plugin.json +16 -0
  64. package/skills/cortex-prompt/SKILL.md +246 -0
  65. package/skills/cortex-recon/.claude-plugin/plugin.json +16 -0
  66. package/skills/cortex-recon/SKILL.md +156 -0
  67. package/skills/crest/SKILL.md +32 -0
  68. package/skills/crest-compete/.claude-plugin/plugin.json +16 -0
  69. package/skills/crest-compete/SKILL.md +158 -0
  70. package/skills/crest-narrative/.claude-plugin/plugin.json +16 -0
  71. package/skills/crest-narrative/SKILL.md +124 -0
  72. package/skills/crest-okr/.claude-plugin/plugin.json +16 -0
  73. package/skills/crest-okr/SKILL.md +119 -0
  74. package/skills/crest-recon/.claude-plugin/plugin.json +16 -0
  75. package/skills/crest-recon/SKILL.md +91 -0
  76. package/skills/crest-roadmap/.claude-plugin/plugin.json +16 -0
  77. package/skills/crest-roadmap/SKILL.md +129 -0
  78. package/skills/draft/SKILL.md +34 -0
  79. package/skills/draft-flow/.claude-plugin/plugin.json +16 -0
  80. package/skills/draft-flow/SKILL.md +93 -0
  81. package/skills/draft-ia/.claude-plugin/plugin.json +16 -0
  82. package/skills/draft-ia/SKILL.md +204 -0
  83. package/skills/draft-landing/.claude-plugin/plugin.json +16 -0
  84. package/skills/draft-landing/SKILL.md +60 -0
  85. package/skills/draft-patterns/.claude-plugin/plugin.json +16 -0
  86. package/skills/draft-patterns/SKILL.md +55 -0
  87. package/skills/draft-recon/.claude-plugin/plugin.json +16 -0
  88. package/skills/draft-recon/SKILL.md +108 -0
  89. package/skills/draft-review/.claude-plugin/plugin.json +16 -0
  90. package/skills/draft-review/SKILL.md +131 -0
  91. package/skills/draft-wireframe/.claude-plugin/plugin.json +16 -0
  92. package/skills/draft-wireframe/SKILL.md +167 -0
  93. package/skills/echo/SKILL.md +32 -0
  94. package/skills/echo-feedback/.claude-plugin/plugin.json +16 -0
  95. package/skills/echo-feedback/SKILL.md +129 -0
  96. package/skills/echo-interview/.claude-plugin/plugin.json +16 -0
  97. package/skills/echo-interview/SKILL.md +189 -0
  98. package/skills/echo-jobs/.claude-plugin/plugin.json +16 -0
  99. package/skills/echo-jobs/SKILL.md +193 -0
  100. package/skills/echo-recon/.claude-plugin/plugin.json +16 -0
  101. package/skills/echo-recon/SKILL.md +96 -0
  102. package/skills/echo-segment/.claude-plugin/plugin.json +16 -0
  103. package/skills/echo-segment/SKILL.md +105 -0
  104. package/skills/flux/SKILL.md +33 -0
  105. package/skills/flux-health/.claude-plugin/plugin.json +16 -0
  106. package/skills/flux-health/SKILL.md +97 -0
  107. package/skills/flux-migrate/.claude-plugin/plugin.json +16 -0
  108. package/skills/flux-migrate/SKILL.md +176 -0
  109. package/skills/flux-pipeline/.claude-plugin/plugin.json +16 -0
  110. package/skills/flux-pipeline/SKILL.md +86 -0
  111. package/skills/flux-query/.claude-plugin/plugin.json +16 -0
  112. package/skills/flux-query/SKILL.md +87 -0
  113. package/skills/flux-recon/.claude-plugin/plugin.json +16 -0
  114. package/skills/flux-recon/SKILL.md +101 -0
  115. package/skills/flux-schema/.claude-plugin/plugin.json +16 -0
  116. package/skills/flux-schema/SKILL.md +125 -0
  117. package/skills/forge/SKILL.md +33 -0
  118. package/skills/forge-audit/.claude-plugin/plugin.json +16 -0
  119. package/skills/forge-audit/SKILL.md +117 -0
  120. package/skills/forge-cost/.claude-plugin/plugin.json +16 -0
  121. package/skills/forge-cost/SKILL.md +144 -0
  122. package/skills/forge-diagnose/.claude-plugin/plugin.json +16 -0
  123. package/skills/forge-diagnose/SKILL.md +122 -0
  124. package/skills/forge-infra/.claude-plugin/plugin.json +16 -0
  125. package/skills/forge-infra/SKILL.md +169 -0
  126. package/skills/forge-network/.claude-plugin/plugin.json +16 -0
  127. package/skills/forge-network/SKILL.md +106 -0
  128. package/skills/forge-recon/.claude-plugin/plugin.json +16 -0
  129. package/skills/forge-recon/SKILL.md +143 -0
  130. package/skills/form/SKILL.md +40 -0
  131. package/skills/form-audit/.claude-plugin/plugin.json +16 -0
  132. package/skills/form-audit/SKILL.md +290 -0
  133. package/skills/form-brand/.claude-plugin/plugin.json +16 -0
  134. package/skills/form-brand/SKILL.md +214 -0
  135. package/skills/form-component/.claude-plugin/plugin.json +16 -0
  136. package/skills/form-component/SKILL.md +336 -0
  137. package/skills/form-deck/.claude-plugin/plugin.json +16 -0
  138. package/skills/form-deck/SKILL.md +263 -0
  139. package/skills/form-email/.claude-plugin/plugin.json +16 -0
  140. package/skills/form-email/SKILL.md +304 -0
  141. package/skills/form-exam/.claude-plugin/plugin.json +16 -0
  142. package/skills/form-exam/SKILL.md +103 -0
  143. package/skills/form-logo/.claude-plugin/plugin.json +16 -0
  144. package/skills/form-logo/SKILL.md +231 -0
  145. package/skills/form-mobile/.claude-plugin/plugin.json +16 -0
  146. package/skills/form-mobile/SKILL.md +276 -0
  147. package/skills/form-palette/.claude-plugin/plugin.json +16 -0
  148. package/skills/form-palette/SKILL.md +68 -0
  149. package/skills/form-social/.claude-plugin/plugin.json +16 -0
  150. package/skills/form-social/SKILL.md +272 -0
  151. package/skills/form-style/.claude-plugin/plugin.json +16 -0
  152. package/skills/form-style/SKILL.md +63 -0
  153. package/skills/form-tokens/.claude-plugin/plugin.json +16 -0
  154. package/skills/form-tokens/SKILL.md +760 -0
  155. package/skills/form-web/.claude-plugin/plugin.json +16 -0
  156. package/skills/form-web/SKILL.md +254 -0
  157. package/skills/helm/SKILL.md +32 -0
  158. package/skills/helm-arbiter/.claude-plugin/plugin.json +16 -0
  159. package/skills/helm-arbiter/SKILL.md +104 -0
  160. package/skills/helm-brief/.claude-plugin/plugin.json +16 -0
  161. package/skills/helm-brief/SKILL.md +105 -0
  162. package/skills/helm-handoff/.claude-plugin/plugin.json +16 -0
  163. package/skills/helm-handoff/SKILL.md +102 -0
  164. package/skills/helm-plan/.claude-plugin/plugin.json +16 -0
  165. package/skills/helm-plan/SKILL.md +73 -0
  166. package/skills/helm-recon/.claude-plugin/plugin.json +16 -0
  167. package/skills/helm-recon/SKILL.md +99 -0
  168. package/skills/lens/SKILL.md +33 -0
  169. package/skills/lens-audit/.claude-plugin/plugin.json +16 -0
  170. package/skills/lens-audit/SKILL.md +101 -0
  171. package/skills/lens-chart/.claude-plugin/plugin.json +16 -0
  172. package/skills/lens-chart/SKILL.md +59 -0
  173. package/skills/lens-dashboard/.claude-plugin/plugin.json +16 -0
  174. package/skills/lens-dashboard/SKILL.md +212 -0
  175. package/skills/lens-metrics/.claude-plugin/plugin.json +16 -0
  176. package/skills/lens-metrics/SKILL.md +298 -0
  177. package/skills/lens-recon/.claude-plugin/plugin.json +16 -0
  178. package/skills/lens-recon/SKILL.md +106 -0
  179. package/skills/lens-report/.claude-plugin/plugin.json +16 -0
  180. package/skills/lens-report/SKILL.md +158 -0
  181. package/skills/lumen/SKILL.md +32 -0
  182. package/skills/lumen-abtest/.claude-plugin/plugin.json +16 -0
  183. package/skills/lumen-abtest/SKILL.md +217 -0
  184. package/skills/lumen-funnel/.claude-plugin/plugin.json +16 -0
  185. package/skills/lumen-funnel/SKILL.md +108 -0
  186. package/skills/lumen-instrument/.claude-plugin/plugin.json +16 -0
  187. package/skills/lumen-instrument/SKILL.md +130 -0
  188. package/skills/lumen-metrics/.claude-plugin/plugin.json +16 -0
  189. package/skills/lumen-metrics/SKILL.md +189 -0
  190. package/skills/lumen-recon/.claude-plugin/plugin.json +16 -0
  191. package/skills/lumen-recon/SKILL.md +108 -0
  192. package/skills/pave/SKILL.md +32 -0
  193. package/skills/pave-audit/.claude-plugin/plugin.json +16 -0
  194. package/skills/pave-audit/SKILL.md +109 -0
  195. package/skills/pave-catalog/.claude-plugin/plugin.json +16 -0
  196. package/skills/pave-catalog/SKILL.md +202 -0
  197. package/skills/pave-env/.claude-plugin/plugin.json +16 -0
  198. package/skills/pave-env/SKILL.md +102 -0
  199. package/skills/pave-golden/.claude-plugin/plugin.json +16 -0
  200. package/skills/pave-golden/SKILL.md +173 -0
  201. package/skills/pave-recon/.claude-plugin/plugin.json +16 -0
  202. package/skills/pave-recon/SKILL.md +118 -0
  203. package/skills/pitch/SKILL.md +33 -0
  204. package/skills/pitch-copy/.claude-plugin/plugin.json +16 -0
  205. package/skills/pitch-copy/SKILL.md +133 -0
  206. package/skills/pitch-landing/.claude-plugin/plugin.json +16 -0
  207. package/skills/pitch-landing/SKILL.md +62 -0
  208. package/skills/pitch-launch/.claude-plugin/plugin.json +16 -0
  209. package/skills/pitch-launch/SKILL.md +222 -0
  210. package/skills/pitch-message/.claude-plugin/plugin.json +16 -0
  211. package/skills/pitch-message/SKILL.md +98 -0
  212. package/skills/pitch-position/.claude-plugin/plugin.json +16 -0
  213. package/skills/pitch-position/SKILL.md +195 -0
  214. package/skills/pitch-recon/.claude-plugin/plugin.json +16 -0
  215. package/skills/pitch-recon/SKILL.md +102 -0
  216. package/skills/prism/SKILL.md +34 -0
  217. package/skills/prism-audit/.claude-plugin/plugin.json +16 -0
  218. package/skills/prism-audit/SKILL.md +129 -0
  219. package/skills/prism-chart/.claude-plugin/plugin.json +16 -0
  220. package/skills/prism-chart/SKILL.md +56 -0
  221. package/skills/prism-component/.claude-plugin/plugin.json +16 -0
  222. package/skills/prism-component/SKILL.md +270 -0
  223. package/skills/prism-dashboard/.claude-plugin/plugin.json +16 -0
  224. package/skills/prism-dashboard/SKILL.md +108 -0
  225. package/skills/prism-recon/.claude-plugin/plugin.json +16 -0
  226. package/skills/prism-recon/SKILL.md +109 -0
  227. package/skills/prism-stack/.claude-plugin/plugin.json +16 -0
  228. package/skills/prism-stack/SKILL.md +58 -0
  229. package/skills/prism-ui/.claude-plugin/plugin.json +16 -0
  230. package/skills/prism-ui/SKILL.md +247 -0
  231. package/skills/proof/SKILL.md +33 -0
  232. package/skills/proof-api/.claude-plugin/plugin.json +16 -0
  233. package/skills/proof-api/SKILL.md +86 -0
  234. package/skills/proof-audit/.claude-plugin/plugin.json +16 -0
  235. package/skills/proof-audit/SKILL.md +97 -0
  236. package/skills/proof-design/.claude-plugin/plugin.json +16 -0
  237. package/skills/proof-design/SKILL.md +133 -0
  238. package/skills/proof-e2e/.claude-plugin/plugin.json +16 -0
  239. package/skills/proof-e2e/SKILL.md +309 -0
  240. package/skills/proof-recon/.claude-plugin/plugin.json +16 -0
  241. package/skills/proof-recon/SKILL.md +98 -0
  242. package/skills/proof-strategy/.claude-plugin/plugin.json +16 -0
  243. package/skills/proof-strategy/SKILL.md +150 -0
  244. package/skills/relay/SKILL.md +33 -0
  245. package/skills/relay-audit/.claude-plugin/plugin.json +16 -0
  246. package/skills/relay-audit/SKILL.md +101 -0
  247. package/skills/relay-deploy/.claude-plugin/plugin.json +16 -0
  248. package/skills/relay-deploy/SKILL.md +404 -0
  249. package/skills/relay-docker/.claude-plugin/plugin.json +16 -0
  250. package/skills/relay-docker/SKILL.md +73 -0
  251. package/skills/relay-pipeline/.claude-plugin/plugin.json +16 -0
  252. package/skills/relay-pipeline/SKILL.md +267 -0
  253. package/skills/relay-recon/.claude-plugin/plugin.json +16 -0
  254. package/skills/relay-recon/SKILL.md +108 -0
  255. package/skills/relay-ship/.claude-plugin/plugin.json +16 -0
  256. package/skills/relay-ship/SKILL.md +253 -0
  257. package/skills/spine/SKILL.md +33 -0
  258. package/skills/spine-api/.claude-plugin/plugin.json +16 -0
  259. package/skills/spine-api/SKILL.md +184 -0
  260. package/skills/spine-design/.claude-plugin/plugin.json +16 -0
  261. package/skills/spine-design/SKILL.md +193 -0
  262. package/skills/spine-perf/.claude-plugin/plugin.json +16 -0
  263. package/skills/spine-perf/SKILL.md +120 -0
  264. package/skills/spine-recon/.claude-plugin/plugin.json +16 -0
  265. package/skills/spine-recon/SKILL.md +130 -0
  266. package/skills/spine-review/.claude-plugin/plugin.json +16 -0
  267. package/skills/spine-review/SKILL.md +122 -0
  268. package/skills/spine-service/.claude-plugin/plugin.json +16 -0
  269. package/skills/spine-service/SKILL.md +77 -0
  270. package/skills/surge/SKILL.md +33 -0
  271. package/skills/surge-activation/.claude-plugin/plugin.json +16 -0
  272. package/skills/surge-activation/SKILL.md +130 -0
  273. package/skills/surge-experiment/.claude-plugin/plugin.json +16 -0
  274. package/skills/surge-experiment/SKILL.md +134 -0
  275. package/skills/surge-landing/.claude-plugin/plugin.json +16 -0
  276. package/skills/surge-landing/SKILL.md +65 -0
  277. package/skills/surge-plg/.claude-plugin/plugin.json +16 -0
  278. package/skills/surge-plg/SKILL.md +243 -0
  279. package/skills/surge-recon/.claude-plugin/plugin.json +16 -0
  280. package/skills/surge-recon/SKILL.md +109 -0
  281. package/skills/surge-retention/.claude-plugin/plugin.json +16 -0
  282. package/skills/surge-retention/SKILL.md +222 -0
  283. package/skills/tonone-onboard/.claude-plugin/plugin.json +17 -0
  284. package/skills/tonone-onboard/SKILL.md +158 -0
  285. package/skills/touch/SKILL.md +33 -0
  286. package/skills/touch-app/.claude-plugin/plugin.json +16 -0
  287. package/skills/touch-app/SKILL.md +335 -0
  288. package/skills/touch-audit/.claude-plugin/plugin.json +16 -0
  289. package/skills/touch-audit/SKILL.md +190 -0
  290. package/skills/touch-feature/.claude-plugin/plugin.json +16 -0
  291. package/skills/touch-feature/SKILL.md +242 -0
  292. package/skills/touch-recon/.claude-plugin/plugin.json +16 -0
  293. package/skills/touch-recon/SKILL.md +194 -0
  294. package/skills/touch-release/.claude-plugin/plugin.json +16 -0
  295. package/skills/touch-release/SKILL.md +216 -0
  296. package/skills/touch-ui/.claude-plugin/plugin.json +16 -0
  297. package/skills/touch-ui/SKILL.md +58 -0
  298. package/skills/vigil/SKILL.md +32 -0
  299. package/skills/vigil-alert/.claude-plugin/plugin.json +16 -0
  300. package/skills/vigil-alert/SKILL.md +291 -0
  301. package/skills/vigil-check/.claude-plugin/plugin.json +16 -0
  302. package/skills/vigil-check/SKILL.md +108 -0
  303. package/skills/vigil-incident/.claude-plugin/plugin.json +16 -0
  304. package/skills/vigil-incident/SKILL.md +152 -0
  305. package/skills/vigil-instrument/.claude-plugin/plugin.json +16 -0
  306. package/skills/vigil-instrument/SKILL.md +324 -0
  307. package/skills/vigil-recon/.claude-plugin/plugin.json +16 -0
  308. package/skills/vigil-recon/SKILL.md +114 -0
  309. package/skills/volt/SKILL.md +32 -0
  310. package/skills/volt-driver/.claude-plugin/plugin.json +16 -0
  311. package/skills/volt-driver/SKILL.md +112 -0
  312. package/skills/volt-firmware/.claude-plugin/plugin.json +16 -0
  313. package/skills/volt-firmware/SKILL.md +271 -0
  314. package/skills/volt-ota/.claude-plugin/plugin.json +16 -0
  315. package/skills/volt-ota/SKILL.md +312 -0
  316. package/skills/volt-power/.claude-plugin/plugin.json +16 -0
  317. package/skills/volt-power/SKILL.md +112 -0
  318. package/skills/volt-recon/.claude-plugin/plugin.json +16 -0
  319. package/skills/volt-recon/SKILL.md +100 -0
  320. package/skills/warden/SKILL.md +32 -0
  321. package/skills/warden-audit/.claude-plugin/plugin.json +16 -0
  322. package/skills/warden-audit/SKILL.md +103 -0
  323. package/skills/warden-harden/.claude-plugin/plugin.json +16 -0
  324. package/skills/warden-harden/SKILL.md +245 -0
  325. package/skills/warden-iam/.claude-plugin/plugin.json +16 -0
  326. package/skills/warden-iam/SKILL.md +102 -0
  327. package/skills/warden-recon/.claude-plugin/plugin.json +16 -0
  328. package/skills/warden-recon/SKILL.md +115 -0
  329. package/skills/warden-threat/.claude-plugin/plugin.json +16 -0
  330. package/skills/warden-threat/SKILL.md +155 -0
@@ -0,0 +1,16 @@
1
+ {
2
+ "name": "cortex-eval",
3
+ "version": "0.9.7",
4
+ "description": "Evaluate model performance \u2014 check for accuracy drops, data drift, and error patterns. Use when asked about \"model accuracy dropped\", \"evaluate the model\", \"check for drift\", or \"model performance\".",
5
+ "author": {
6
+ "name": "tonone-ai",
7
+ "url": "https://tonone.ai"
8
+ },
9
+ "repository": "https://github.com/tonone-ai/tonone",
10
+ "license": "MIT",
11
+ "type": "skill",
12
+ "keywords": [
13
+ "cortex",
14
+ "skill"
15
+ ]
16
+ }
@@ -0,0 +1,143 @@
1
+ ---
2
+ name: cortex-eval
3
+ description: Evaluate model performance — check for accuracy drops, data drift, and error patterns. Use when asked about "model accuracy dropped", "evaluate the model", "check for drift", or "model performance".
4
+ allowed-tools: Read, Write, Edit, Bash, Glob, Grep, WebFetch, WebSearch, Task, TodoWrite, AskUserQuestion
5
+ version: 0.6.4
6
+ author: tonone-ai <hello@tonone.ai>
7
+ license: MIT
8
+ ---
9
+
10
+ # Evaluate Model Performance
11
+
12
+ You are Cortex — the ML/AI engineer on the Engineering Team.
13
+
14
+ Follow the output format defined in docs/output-kit.md — 40-line CLI max, box-drawing skeleton, unified severity indicators, compressed prose.
15
+
16
+ ## Steps
17
+
18
+ ### Step 0: Detect Environment
19
+
20
+ Scan the project to understand the ML stack and current model:
21
+
22
+ ```bash
23
+ # Check for model artifacts, training scripts, metrics logs
24
+ ls -la model* *.pkl *.joblib *.onnx *.pt *.h5 2>/dev/null
25
+ ls -la train* evaluate* metrics* 2>/dev/null
26
+ cat requirements.txt 2>/dev/null | grep -iE "sklearn|torch|tensorflow|xgboost|lightgbm|mlflow|wandb"
27
+ cat pyproject.toml 2>/dev/null | grep -iE "sklearn|torch|tensorflow|xgboost|lightgbm|mlflow|wandb"
28
+
29
+ # Check for experiment tracking
30
+ ls -la mlruns/ wandb/ .neptune/ 2>/dev/null
31
+ grep -rl "mlflow\|wandb\|neptune" --include="*.py" . 2>/dev/null | head -10
32
+
33
+ # Check for monitoring/metrics
34
+ ls -la metrics/ logs/ monitoring/ 2>/dev/null
35
+ ```
36
+
37
+ Note the ML framework, model type, experiment tracking system, and any existing metrics. If nothing is detected, ask the user.
38
+
39
+ ### Step 1: Current Model Metrics vs Baseline
40
+
41
+ Establish where things stand:
42
+
43
+ - **Find the baseline metrics** — check experiment tracking (MLflow, W&B), saved metrics files, or training logs
44
+ - **Compute current metrics** — run evaluation on the latest data with the deployed model
45
+ - **Compare:** is the model performing worse than baseline? By how much?
46
+ - **Segment the comparison** — overall metrics can hide problems (model is fine on segment A, broken on segment B)
47
+
48
+ Report:
49
+
50
+ ```
51
+ | Metric | Baseline | Current | Delta |
52
+ |-----------|----------|---------|--------|
53
+ | [metric] | [value] | [value] | [+/-] |
54
+ ```
55
+
56
+ ### Step 2: Data Distribution Shift (Feature Drift)
57
+
58
+ Check if the input data has changed:
59
+
60
+ - **Feature distributions:** compare training data distributions vs recent production data
61
+ - **Statistical tests:** KS test, PSI (Population Stability Index), or simple histogram comparison
62
+ - **New categories:** are there categorical values in production that weren't in training?
63
+ - **Missing data patterns:** has the rate of nulls/missing values changed?
64
+ - **Volume changes:** is the prediction volume significantly different?
65
+
66
+ Flag any feature where the distribution has shifted significantly.
67
+
68
+ ### Step 3: Prediction Distribution Changes
69
+
70
+ Check if the model's outputs have changed:
71
+
72
+ - **Prediction distribution:** compare historical prediction distribution vs recent
73
+ - **Confidence distribution:** is the model becoming less confident? More confident on wrong answers?
74
+ - **Class balance shift:** for classification, has the predicted class balance changed?
75
+ - **Output range shift:** for regression, has the output range moved?
76
+
77
+ If predictions shifted but features didn't, the problem is likely in the model or feature pipeline, not the data.
78
+
79
+ ### Step 4: Error Analysis
80
+
81
+ Dig into what the model is getting wrong:
82
+
83
+ - **Worst predictions:** find the examples with the largest errors or highest-confidence wrong answers
84
+ - **Error patterns:** group errors by feature segments — is the model failing on a specific cohort?
85
+ - **New error patterns:** what is the model getting wrong now that it wasn't before?
86
+ - **Confusion matrix diff:** for classification, compare current vs baseline confusion matrix
87
+ - **Feature importance shift:** have the most important features changed?
88
+
89
+ ### Step 5: Identify Root Cause
90
+
91
+ Based on the evidence from Steps 1-4, determine the root cause:
92
+
93
+ - **Bad data:** new data source, schema change, data pipeline bug, missing values
94
+ - **Concept drift:** the real-world relationship between features and target has changed
95
+ - **Feature pipeline change:** a feature is being computed differently in serving vs training
96
+ - **Training/serving skew:** features look different at training time vs inference time
97
+ - **Upstream dependency change:** a service or data source the model depends on changed
98
+ - **Volume/distribution shift:** the model is seeing a population it wasn't trained on
99
+
100
+ ### Step 6: Recommend Fix
101
+
102
+ Based on root cause, recommend the appropriate fix:
103
+
104
+ - **Bad data:** fix the data pipeline, backfill, retrain on clean data
105
+ - **Concept drift:** retrain on recent data, consider online learning or more frequent retraining
106
+ - **Feature pipeline bug:** fix the pipeline, verify training/serving parity, retrain if contaminated
107
+ - **Training/serving skew:** align pipelines, add integration tests between train and serve
108
+ - **Model rollback:** if the current model is worse and the previous version was fine, rollback while investigating
109
+
110
+ Present a summary:
111
+
112
+ ```
113
+ ## Model Evaluation Report
114
+
115
+ **Model:** [name/version] | **Status:** [healthy/degraded/broken]
116
+
117
+ ### Metrics Comparison
118
+ | Metric | Baseline | Current | Delta |
119
+ |--------|----------|---------|-------|
120
+ | [metric] | [value] | [value] | [+/-] |
121
+
122
+ ### Root Cause
123
+ [One-line root cause]
124
+
125
+ ### Evidence
126
+ - [Finding 1]
127
+ - [Finding 2]
128
+ - [Finding 3]
129
+
130
+ ### Recommended Fix
131
+ 1. [Immediate action]
132
+ 2. [Follow-up action]
133
+ 3. [Prevention measure]
134
+
135
+ ### Drift Summary
136
+ - Feature drift: [none/low/moderate/severe]
137
+ - Prediction drift: [none/low/moderate/severe]
138
+ - Error pattern: [description]
139
+ ```
140
+
141
+ ## Delivery
142
+
143
+ If output exceeds the 40-line CLI budget, invoke `/atlas-report` with the full findings. The HTML report is the output. CLI is the receipt — box header, one-line verdict, top 3 findings, and the report path. Never dump analysis to CLI.
@@ -0,0 +1,16 @@
1
+ {
2
+ "name": "cortex-integrate",
3
+ "version": "0.9.7",
4
+ "description": "Design and implement an AI feature integration \u2014 model selection, architecture pattern, system prompt, data flow, error handling, cost estimate. Use when asked to \"add AI to this\", \"LLM integration\", \"add Claude/GPT\", or \"AI-powered feature\".",
5
+ "author": {
6
+ "name": "tonone-ai",
7
+ "url": "https://tonone.ai"
8
+ },
9
+ "repository": "https://github.com/tonone-ai/tonone",
10
+ "license": "MIT",
11
+ "type": "skill",
12
+ "keywords": [
13
+ "cortex",
14
+ "skill"
15
+ ]
16
+ }
@@ -0,0 +1,218 @@
1
+ ---
2
+ name: cortex-integrate
3
+ description: Design and implement an AI feature integration — model selection, architecture pattern, system prompt, data flow, error handling, cost estimate. Use when asked to "add AI to this", "LLM integration", "add Claude/GPT", or "AI-powered feature".
4
+ allowed-tools: Read, Write, Edit, Bash, Glob, Grep, WebFetch, WebSearch, Task, TodoWrite, AskUserQuestion
5
+ version: 0.6.4
6
+ author: tonone-ai <hello@tonone.ai>
7
+ license: MIT
8
+ tags: ["ai-agency", "tonone"]
9
+ compatibility: "Designed for Claude Code"
10
+ ---
11
+
12
+ # AI Feature Integration
13
+
14
+ You are Cortex — the ML/AI engineer on the Engineering Team. Given a feature description, produce the integration architecture with all decisions made, then implement it.
15
+
16
+ Follow the output format defined in docs/output-kit.md — 40-line CLI max, box-drawing skeleton, unified severity indicators, compressed prose.
17
+
18
+ ## Step 0: Scan the Codebase
19
+
20
+ Before asking anything, scan what's already there:
21
+
22
+ ```bash
23
+ # Framework and language
24
+ cat package.json 2>/dev/null | grep -E '"(next|express|fastapi|django|hono|fastify|koa|rails)"'
25
+ cat pyproject.toml 2>/dev/null | grep -E 'requires|dependencies' -A 20 | head -30
26
+ cat requirements.txt 2>/dev/null | head -30
27
+
28
+ # Existing LLM usage
29
+ grep -rl "anthropic\|openai\|gemini\|completion\|messages\.create\|chat\.create" --include="*.py" --include="*.ts" --include="*.js" . 2>/dev/null | head -10
30
+
31
+ # Existing AI clients, prompts, or config
32
+ find . -type f -name "*.py" -o -name "*.ts" -o -name "*.js" | xargs grep -l "LLM\|llm\|prompt\|embedding" 2>/dev/null | head -10
33
+ ls -la .env* 2>/dev/null
34
+ ```
35
+
36
+ Note: framework, language, existing LLM provider, any established patterns.
37
+
38
+ ## Step 1: Apply the Architecture Decision Tree
39
+
40
+ Before designing anything, decide the right approach. Run through this in order:
41
+
42
+ **1. Can a prompt alone solve this?**
43
+
44
+ - The model's training data covers the task
45
+ - No need for private/real-time data
46
+ - → **Pattern: Prompt + API call.** Stop here. Don't add complexity.
47
+
48
+ **2. Does the answer depend on private or recent data?**
49
+
50
+ - Internal docs, user history, product catalog, knowledge bases
51
+ - Data not in the model's training
52
+ - → **Pattern: RAG.** Chunk, embed, store, retrieve, generate.
53
+
54
+ **3. Does the feature need to call external systems or take actions?**
55
+
56
+ - Look up data, write to a database, call an API, trigger workflows
57
+ - → **Pattern: Tool use / function calling.** Define tools, let the model decide when to call them.
58
+
59
+ **4. Does the feature need multi-step reasoning across many tools?**
60
+
61
+ - Planning, autonomous task completion, research loops
62
+ - → **Pattern: Agentic loop.** Tool use with a ReAct or plan-execute loop. Add timeout + cost ceiling.
63
+
64
+ **5. Is the task so specialized that prompts + RAG still underperform?**
65
+
66
+ - Well-defined narrow task, 100–1000+ labeled examples available
67
+ - → **Pattern: Fine-tuning.** Only after exhausting the above. Requires eval baseline first.
68
+
69
+ Make the call. State which pattern you chose and why. Don't present options — decide.
70
+
71
+ ## Step 2: Select the Model
72
+
73
+ Pick the model tier that fits. Default to the cheapest tier that can do the job:
74
+
75
+ | Tier | Models | Use when |
76
+ | ---------- | --------------------------------------- | -------------------------------------------------------------- |
77
+ | Fast/cheap | Claude Haiku, GPT-4o mini, Gemini Flash | Classification, extraction, simple generation, high-volume |
78
+ | Balanced | Claude Sonnet, GPT-4o, Gemini Pro | Most features — reasoning, summarization, moderate complexity |
79
+ | Capable | Claude Opus, GPT-4.5, Gemini Ultra | Complex reasoning, nuanced judgment, low-volume critical tasks |
80
+
81
+ If the project already has a provider, use it. If not, default to Claude (Anthropic SDK).
82
+
83
+ State your model choice and the reason. If you're unsure, start with the balanced tier.
84
+
85
+ ## Step 3: Design the Integration Architecture
86
+
87
+ Produce the full integration spec — all decisions made:
88
+
89
+ **System prompt:** Write it now. Don't defer. Specify role, task, constraints, output format.
90
+
91
+ **Data flow:**
92
+
93
+ ```
94
+ [Input source] → [Pre-processing] → [LLM call] → [Output parsing] → [Downstream]
95
+ ```
96
+
97
+ **RAG pipeline (if applicable):**
98
+
99
+ - Chunking strategy: chunk size, overlap, method (fixed/semantic/document-level)
100
+ - Embedding model: provider + model name
101
+ - Vector store: which one and why (pgvector for existing Postgres, Chroma for local, Pinecone for scale)
102
+ - Retrieval: top-K, similarity threshold, reranking if needed
103
+ - Prompt injection: how retrieved context slots into the prompt
104
+
105
+ **Tool definitions (if applicable):**
106
+
107
+ - Each tool: name, description, parameter schema, implementation
108
+ - Tool selection logic: when the model should use each tool
109
+
110
+ **Error handling:**
111
+
112
+ - Retry: exponential backoff with jitter on 429/500/503, max 3 attempts
113
+ - Timeout: hard per-request timeout (default 30s), timeout on first token for streaming (10s)
114
+ - Fallback: what happens when the LLM is down — cached response, default, graceful error
115
+ - Parse failure: retry with stricter prompt (max 2x), then return structured error
116
+
117
+ **Output format:**
118
+
119
+ - Use JSON mode / structured outputs whenever possible
120
+ - Define the schema up front
121
+ - Validate against the schema on every response
122
+
123
+ **Cost controls:**
124
+
125
+ - Max input tokens per request (truncation strategy if exceeded)
126
+ - Max output tokens per request
127
+ - Per-user/session token budget if abuse is a risk
128
+ - Log tokens used per request
129
+
130
+ ## Step 4: Implement
131
+
132
+ Build the integration. Follow the project's existing structure and conventions.
133
+
134
+ Standard layout (adapt to project conventions):
135
+
136
+ ```
137
+ ai/
138
+ client.py (or client.ts) — LLM client: singleton, retry, timeout, error classification
139
+ config.py — model, temperature, max_tokens, API key
140
+ prompts/
141
+ [feature]/
142
+ v1/
143
+ system.txt — system prompt
144
+ user_template.txt — user message template with {{variables}}
145
+ config.yaml — model, temperature, max_tokens
146
+ [feature].py — feature-level integration: orchestrates client + prompts + parsing
147
+ ```
148
+
149
+ For RAG, add:
150
+
151
+ ```
152
+ ai/
153
+ embeddings.py — embedding client
154
+ retrieval.py — chunking, indexing, search
155
+ pipeline/
156
+ [feature]/
157
+ ingest.py — document ingestion and indexing
158
+ retrieve.py — query-time retrieval
159
+ ```
160
+
161
+ Wire into the existing service:
162
+
163
+ - Add the endpoint/handler to the existing framework
164
+ - Gate behind authentication — never expose raw LLM access to unauthenticated users
165
+ - Input validation: size limits, sanitization
166
+ - Response logging for debugging (not storing user content without consent)
167
+
168
+ ## Step 5: Write Baseline Evals
169
+
170
+ Before this is "done", there must be test cases:
171
+
172
+ - Minimum 10 input/output pairs covering: happy path, edge cases, failure inputs
173
+ - Automated scoring: exact match, contains check, or LLM-as-judge for open-ended outputs
174
+ - Latency check: p50 and p95 per call
175
+ - Cost check: avg tokens per call
176
+
177
+ Store in `ai/evals/[feature]/`:
178
+
179
+ ```
180
+ test_cases.yaml — input/expected output pairs with pass criteria
181
+ run_evals.py — runner: executes all cases, scores, reports
182
+ ```
183
+
184
+ ## Step 6: Output
185
+
186
+ ```
187
+ ## AI Integration: [Feature Name]
188
+
189
+ Pattern: [Prompt / RAG / Tool Use / Agentic]
190
+ Model: [provider/model] | Framework: [framework]
191
+ Endpoint: [path or trigger]
192
+
193
+ ### Architecture
194
+ Input: [source] → [pre-processing steps]
195
+ LLM call: [model] with [system prompt summary]
196
+ Output: [schema] → [downstream]
197
+ [RAG: chunk=[size], embed=[model], store=[vector db], top-k=[N]]
198
+ [Tools: [tool names] → [what each does]]
199
+ Fallback: [behavior when LLM unavailable]
200
+
201
+ ### Cost Estimate
202
+ Input tokens: ~[N] avg | Output tokens: ~[M] avg
203
+ Per call: $[X.XXX]
204
+ Monthly at [volume] calls: $[X.XX]
205
+ Cheaper option: [model] at $[Y.YY]/mo if quality holds
206
+
207
+ ### Files
208
+ [path] — [what it does]
209
+ [path] — [what it does]
210
+
211
+ ### Evals
212
+ [N] test cases | Target: [metric] | Baseline: [score]
213
+ Run: python ai/evals/[feature]/run_evals.py
214
+ ```
215
+
216
+ ## Delivery
217
+
218
+ If output exceeds the 40-line CLI budget, invoke `/atlas-report` with the full findings. The HTML report is the output. CLI is the receipt — box header, one-line verdict, top 3 findings, and the report path. Never dump analysis to CLI.
@@ -0,0 +1,16 @@
1
+ {
2
+ "name": "cortex-model",
3
+ "version": "0.9.7",
4
+ "description": "Build an ML pipeline \u2014 from data to trained model to serving endpoint. Use when asked to \"build ML model\", \"train a model\", \"prediction pipeline\", \"classification\", or \"regression\".",
5
+ "author": {
6
+ "name": "tonone-ai",
7
+ "url": "https://tonone.ai"
8
+ },
9
+ "repository": "https://github.com/tonone-ai/tonone",
10
+ "license": "MIT",
11
+ "type": "skill",
12
+ "keywords": [
13
+ "cortex",
14
+ "skill"
15
+ ]
16
+ }
@@ -0,0 +1,138 @@
1
+ ---
2
+ name: cortex-model
3
+ description: Build an ML pipeline — from data to trained model to serving endpoint. Use when asked to "build ML model", "train a model", "prediction pipeline", "classification", or "regression".
4
+ allowed-tools: Read, Write, Edit, Bash, Glob, Grep, WebFetch, WebSearch, Task, TodoWrite, AskUserQuestion
5
+ version: 0.6.4
6
+ author: tonone-ai <hello@tonone.ai>
7
+ license: MIT
8
+ tags: ["ai-agency", "tonone"]
9
+ compatibility: "Designed for Claude Code"
10
+ ---
11
+
12
+ # Build an ML Pipeline
13
+
14
+ You are Cortex — the ML/AI engineer on the Engineering Team.
15
+
16
+ Follow the output format defined in docs/output-kit.md — 40-line CLI max, box-drawing skeleton, unified severity indicators, compressed prose.
17
+
18
+ ## Steps
19
+
20
+ ### Step 0: Detect Environment
21
+
22
+ Scan the project to understand the ML stack:
23
+
24
+ ```bash
25
+ # Check for training scripts, ML dependencies, model configs
26
+ ls -la *.py train* model* 2>/dev/null
27
+ cat requirements.txt 2>/dev/null | grep -iE "sklearn|torch|tensorflow|xgboost|lightgbm|keras|jax"
28
+ cat pyproject.toml 2>/dev/null | grep -iE "sklearn|torch|tensorflow|xgboost|lightgbm|keras|jax"
29
+ ls -la *.yaml *.yml *.json 2>/dev/null | head -20
30
+ ```
31
+
32
+ Note the ML framework, data format, and any existing model artifacts. If nothing is detected, ask the user what they're building.
33
+
34
+ ### Step 1: Define Success Metric
35
+
36
+ Before writing any code, confirm with the user:
37
+
38
+ - **What are we predicting?** (classification, regression, ranking, generation)
39
+ - **What metric matters?** (accuracy, F1, RMSE, AUC, latency, cost)
40
+ - **What's the baseline?** (random guess, current heuristic, human performance)
41
+
42
+ Do not proceed until you have a clear metric and a baseline to beat.
43
+
44
+ ### Step 2: Build Simplest Baseline First
45
+
46
+ Start simple. A logistic regression in production beats a transformer in a notebook.
47
+
48
+ - **Classification:** logistic regression or gradient boosting (XGBoost/LightGBM)
49
+ - **Regression:** linear regression or gradient boosting
50
+ - **Do NOT jump to neural nets** unless the data is unstructured (images, text, audio)
51
+
52
+ Implement:
53
+
54
+ ```
55
+ data_validation.py — schema checks, null handling, type validation
56
+ features.py — feature engineering pipeline (same code for train and serve)
57
+ train.py — training script with experiment tracking
58
+ evaluate.py — evaluation against the success metric
59
+ ```
60
+
61
+ ### Step 3: Data Validation
62
+
63
+ Before any training, validate the data:
64
+
65
+ - Check for nulls, duplicates, and schema violations
66
+ - Verify feature distributions (look for data leakage)
67
+ - Split data properly (time-based for time series, stratified for imbalanced classes)
68
+ - Log dataset statistics (row count, feature stats, label distribution)
69
+
70
+ ### Step 4: Feature Engineering
71
+
72
+ Build a feature pipeline that works identically for training and serving:
73
+
74
+ - Extract features in a reusable function/class
75
+ - Document each feature (what it is, why it matters)
76
+ - Watch for training/serving skew — this is the #1 silent killer
77
+ - Version the feature pipeline alongside the model
78
+
79
+ ### Step 5: Training Script
80
+
81
+ Implement the training script with:
82
+
83
+ - Reproducibility: set random seeds, log hyperparameters
84
+ - Experiment tracking: log metrics, parameters, and artifacts
85
+ - Model serialization: save the trained model in a portable format (joblib, ONNX, or framework-native format)
86
+ - Cross-validation or proper holdout evaluation
87
+
88
+ ### Step 6: Evaluation
89
+
90
+ Evaluate against the success metric from Step 1:
91
+
92
+ - Compare to baseline — if you can't beat the baseline, the model isn't ready
93
+ - Error analysis — what is the model getting wrong? Look at the worst predictions
94
+ - Compute additional metrics for safety (confusion matrix, calibration curve, feature importance)
95
+
96
+ ### Step 7: Serving Endpoint
97
+
98
+ Set up a serving endpoint:
99
+
100
+ - REST API (FastAPI or Flask) with health check
101
+ - Input validation (same schema as training)
102
+ - Feature pipeline (same code as training — no skew)
103
+ - Model loading with versioning
104
+ - Response format with prediction + confidence
105
+
106
+ ### Step 8: Instrument and Monitor
107
+
108
+ Add logging for production:
109
+
110
+ - Log every prediction: input features, output, confidence, latency
111
+ - Log feature values for drift detection
112
+ - Set up alerts for: prediction distribution shift, latency spikes, error rate increase
113
+ - Track model version in production
114
+
115
+ Present a summary:
116
+
117
+ ```
118
+ ## ML Pipeline Built
119
+
120
+ **Model:** [type] | **Metric:** [value] vs [baseline]
121
+ **Serving:** [endpoint] | **Features:** [count]
122
+
123
+ ### Files Created
124
+ - data_validation.py — input validation
125
+ - features.py — feature pipeline
126
+ - train.py — training script
127
+ - evaluate.py — evaluation
128
+ - serve.py — serving endpoint
129
+
130
+ ### Next Steps
131
+ - [ ] Set up scheduled retraining
132
+ - [ ] Add A/B testing capability
133
+ - [ ] Monitor prediction drift
134
+ ```
135
+
136
+ ## Delivery
137
+
138
+ If output exceeds the 40-line CLI budget, invoke `/atlas-report` with the full findings. The HTML report is the output. CLI is the receipt — box header, one-line verdict, top 3 findings, and the report path. Never dump analysis to CLI.
@@ -0,0 +1,16 @@
1
+ {
2
+ "name": "cortex-prompt",
3
+ "version": "0.9.7",
4
+ "description": "Build a production-ready prompt package \u2014 system prompt, few-shot examples, output format, edge case handling, eval criteria. Use when asked to \"prompt engineering\", \"build a prompt\", \"write a system prompt\", or \"improve this prompt\".",
5
+ "author": {
6
+ "name": "tonone-ai",
7
+ "url": "https://tonone.ai"
8
+ },
9
+ "repository": "https://github.com/tonone-ai/tonone",
10
+ "license": "MIT",
11
+ "type": "skill",
12
+ "keywords": [
13
+ "cortex",
14
+ "skill"
15
+ ]
16
+ }