get-claudia 1.53.2 → 1.53.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (26)
  1. package/CHANGELOG.md +19 -0
  2. package/bin/index.js +22 -20
  3. package/package.json +1 -1
  4. package/template-v2/.claude/skills/README.md +11 -1
  5. package/template-v2/.claude/skills/capability-suggester.md +164 -98
  6. package/template-v2/.claude/skills/capture-meeting/evals/basic.yaml +27 -0
  7. package/template-v2/.claude/skills/diagnose/evals/basic.yaml +34 -0
  8. package/template-v2/.claude/skills/diagnose/references/common-issues.md +133 -0
  9. package/template-v2/.claude/skills/draft-reply/SKILL.md +1 -1
  10. package/template-v2/.claude/skills/follow-up-draft/SKILL.md +1 -1
  11. package/template-v2/.claude/skills/ingest-sources/references/extraction-patterns.md +202 -0
  12. package/template-v2/.claude/skills/meditate/SKILL.md +1 -1
  13. package/template-v2/.claude/skills/meditate/evals/basic.yaml +29 -0
  14. package/template-v2/.claude/skills/meeting-prep/SKILL.md +1 -1
  15. package/template-v2/.claude/skills/memory-manager.md +1 -1
  16. package/template-v2/.claude/skills/morning-brief/evals/basic.yaml +29 -0
  17. package/template-v2/.claude/skills/new-person/SKILL.md +1 -1
  18. package/template-v2/.claude/skills/new-person/evals/basic.yaml +27 -0
  19. package/template-v2/.claude/skills/new-workspace/references/workspace-templates.md +154 -0
  20. package/template-v2/.claude/skills/pattern-recognizer.md +1 -1
  21. package/template-v2/.claude/skills/research/SKILL.md +120 -12
  22. package/template-v2/.claude/skills/research/references/source-evaluation.md +108 -0
  23. package/template-v2/.claude/skills/skill-index.json +327 -91
  24. package/template-v2/.claude/skills/weekly-review/SKILL.md +1 -1
  25. package/template-v2/.claude/skills/concierge.md +0 -249
  26. package/template-v2/.claude/skills/structure-evolution.md +0 -326
package/CHANGELOG.md CHANGED
@@ -2,6 +2,25 @@
2
2
 
3
3
  All notable changes to Claudia will be documented in this file.
4
4
 
5
+ ## 1.53.4 (2026-03-04)
6
+
7
+ ### The Skill Sharpening Release
8
+
9
+ Systematic improvement of Claudia's 41 default skills for better contextual triggering, testing, and maintainability. Follows the Skill Creator's best practices for description-driven activation and progressive disclosure.
10
+
11
+ - **Improved skill descriptions** -- 8 SKILL.md files updated with richer trigger context so Claude matches skills more accurately from natural language (meditate, new-person, draft-reply, follow-up-draft, memory-manager, pattern-recognizer, meeting-prep, weekly-review)
12
+ - **Skill index v2 with examples** -- `skill-index.json` bumped to schema v2. All 41 entries now include `examples` arrays with 3-6 natural-language utterances for long-tail matching (e.g., "anything urgent this morning?" triggers morning-brief)
13
+ - **Consolidated overlapping skills (43 to 41)** -- Merged `concierge` into `research/SKILL.md` (tool detection, staleness tracking, proactive offers). Merged `structure-evolution` into `capability-suggester.md` (usage gap detection, business depth upgrades, suggestion library)
14
+ - **Eval templates for 5 skills** -- Added `evals/basic.yaml` for morning-brief, capture-meeting, new-person, diagnose, and meditate. Compatible with the Skill Creator plugin for automated quality testing
15
+ - **Reference files for 4 skills** -- Added `references/` subdirectories for diagnose (common-issues), ingest-sources (extraction-patterns), research (source-evaluation), and new-workspace (workspace-templates). Keeps SKILL.md lean via progressive disclosure
16
+ - **README updated** -- Documented `examples` field in schema reference, added progressive disclosure and eval documentation, updated effort level table for 41 skills
17
+
18
+ ## 1.53.3 (2026-03-04)
19
+
20
+ ### Fix: Actually restore disabled MCP servers on upgrade
21
+
22
+ v1.53.2 added restore logic for `_disabled_`-prefixed keys in `mcpServers`, but an early return (`if (!config._disabled_mcpServers) return`) skipped that logic whenever the `_disabled_mcpServers` stash was absent. The function now handles both migration paths independently: the `_disabled_mcpServers` stash (Path 1) and `_disabled_*` prefixed keys directly in `mcpServers` (Path 2). Path 2 is now generic: it renames any `_disabled_*` key whose un-prefixed name is not already present, not just gmail/google-calendar.
23
+
5
24
  ## 1.53.2 (2026-03-04)
6
25
 
7
26
  ### Re-enable Gmail and Calendar MCPs
package/bin/index.js CHANGED
@@ -1014,31 +1014,38 @@ function restoreMcpServers(targetPath) {
1014
1014
  try {
1015
1015
  const raw = readFileSync(mcpPath, 'utf-8');
1016
1016
  const config = JSON.parse(raw);
1017
- if (!config._disabled_mcpServers) return;
1018
1017
  if (!config.mcpServers) config.mcpServers = {};
1019
1018
 
1020
- // Restore all previously disabled servers (memory, gmail, google-calendar)
1021
- const toRestore = ['claudia-memory', 'claudia_memory', 'gmail', 'google-calendar'];
1022
1019
  let changed = false;
1023
1020
  const restored = [];
1024
1021
 
1025
- for (const key of toRestore) {
1026
- if (config._disabled_mcpServers[key] && !config.mcpServers[key]) {
1027
- const serverConfig = { ...config._disabled_mcpServers[key] };
1028
- delete serverConfig._replaced_by;
1029
- delete serverConfig._warning;
1030
- config.mcpServers[key] = serverConfig;
1031
- delete config._disabled_mcpServers[key];
1032
- changed = true;
1033
- restored.push(key);
1022
+ // Path 1: Restore from _disabled_mcpServers stash (older migration format)
1023
+ if (config._disabled_mcpServers) {
1024
+ const toRestore = ['claudia-memory', 'claudia_memory', 'gmail', 'google-calendar'];
1025
+ for (const key of toRestore) {
1026
+ if (config._disabled_mcpServers[key] && !config.mcpServers[key]) {
1027
+ const serverConfig = { ...config._disabled_mcpServers[key] };
1028
+ delete serverConfig._replaced_by;
1029
+ delete serverConfig._warning;
1030
+ config.mcpServers[key] = serverConfig;
1031
+ delete config._disabled_mcpServers[key];
1032
+ changed = true;
1033
+ restored.push(key);
1034
+ }
1035
+ }
1036
+
1037
+ // Clean up _disabled_mcpServers if it's now empty
1038
+ if (Object.keys(config._disabled_mcpServers).length === 0) {
1039
+ delete config._disabled_mcpServers;
1034
1040
  }
1035
1041
  }
1036
1042
 
1037
- // Also rename _disabled_ prefixed keys in mcpServers itself
1043
+ // Path 2: Rename _disabled_ prefixed keys in mcpServers itself
1044
+ // This handles the case where keys like "_disabled_gmail" exist directly in mcpServers
1038
1045
  for (const key of Object.keys(config.mcpServers)) {
1039
1046
  if (key.startsWith('_disabled_')) {
1040
1047
  const realKey = key.replace('_disabled_', '');
1041
- if (['gmail', 'google-calendar'].includes(realKey) && !config.mcpServers[realKey]) {
1048
+ if (!config.mcpServers[realKey]) {
1042
1049
  const serverConfig = { ...config.mcpServers[key] };
1043
1050
  delete serverConfig._warning;
1044
1051
  config.mcpServers[realKey] = serverConfig;
@@ -1049,14 +1056,9 @@ function restoreMcpServers(targetPath) {
1049
1056
  }
1050
1057
  }
1051
1058
 
1052
- // Clean up _disabled_mcpServers if it's now empty
1053
- if (config._disabled_mcpServers && Object.keys(config._disabled_mcpServers).length === 0) {
1054
- delete config._disabled_mcpServers;
1055
- }
1056
-
1057
1059
  if (changed) {
1058
1060
  writeFileSync(mcpPath, JSON.stringify(config, null, 2) + '\n');
1059
- console.log(` ${colors.green}✓${colors.reset} Restored MCP servers: ${restored.join(', ')} (moved back from _disabled_mcpServers)`);
1061
+ console.log(` ${colors.green}✓${colors.reset} Restored MCP servers: ${restored.join(', ')}`);
1060
1062
  }
1061
1063
  } catch {
1062
1064
  // Not valid JSON or can't read -- skip silently
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "get-claudia",
3
- "version": "1.53.2",
3
+ "version": "1.53.4",
4
4
  "description": "An AI assistant who learns how you work.",
5
5
  "keywords": [
6
6
  "claudia",
package/template-v2/.claude/skills/README.md CHANGED
@@ -51,10 +51,16 @@ Skills live in `.claude/skills/` and can be either:
51
51
  .claude/skills/
52
52
  └── ingest-sources/
53
53
  ├── SKILL.md # Main skill file (required)
54
+ ├── references/ # Optional deep-dive content (progressive disclosure)
55
+ ├── evals/ # Optional eval templates (Skill Creator compatible)
54
56
  ├── templates/ # Optional supporting files
55
57
  └── examples/ # Optional examples
56
58
  ```
57
59
 
60
+ **Progressive disclosure:** Keep SKILL.md lean (under 500 lines). Move detailed reference content into `references/` subdirectories. Claude reads these on demand when deeper context is needed.
61
+
62
+ **Eval templates:** Skills can include `evals/basic.yaml` with test prompts and expectations. These are compatible with the Skill Creator plugin for automated skill quality testing.
63
+
58
64
  ### SKILL.md Format
59
65
 
60
66
  ```yaml
@@ -86,6 +92,9 @@ effort-level: low | medium | high | max
86
92
  triggers: # Natural language activation patterns
87
93
  - "pattern one"
88
94
  - "pattern two"
95
+ examples: # Full natural-language utterances for matching (v2)
96
+ - "what should I focus on today?"
97
+ - "anything urgent this morning?"
89
98
  inputs: # Expected input data
90
99
  - name: input_name
91
100
  type: string | entity | date | file
@@ -114,6 +123,7 @@ argument-hint: [arg]
114
123
  | `description` | Yes | Used for contextual matching and skill index |
115
124
  | `effort-level` | Yes | Thinking budget: `low`, `medium`, `high`, `max` |
116
125
  | `triggers` | No | 3-5 natural language phrases that activate the skill |
126
+ | `examples` | No | Full natural-language utterances for long-tail matching (v2) |
117
127
  | `inputs` | No | Structured input expectations (name, type, description) |
118
128
  | `outputs` | No | What the skill produces (name, type, description) |
119
129
  | `invocation` | No | `explicit`, `contextual` (default), or `proactive` |
@@ -197,7 +207,7 @@ effort-level: medium
197
207
  |--------|--------|
198
208
  | **low** | morning-brief, client-health, financial-snapshot, growth-check, databases, diagnose, brain-monitor, inbox-check, judgment-awareness |
199
209
  | **medium** | meeting-prep, draft-reply, follow-up-draft, file-document, new-person, capture-meeting, summarize-doc, memory-audit, brain, fix-duplicates, memory-health, memory-manager, onboarding, structure-generator, agent-dispatcher, new-workspace |
200
- | **high** | weekly-review, meditate, research, what-am-i-missing, map-connections, commitment-detector, capability-suggester, concierge, connector-discovery, pattern-recognizer, relationship-tracker, risk-surfacer, structure-evolution, hire-agent |
210
+ | **high** | weekly-review, meditate, research, what-am-i-missing, map-connections, commitment-detector, capability-suggester, connector-discovery, pattern-recognizer, relationship-tracker, risk-surfacer, hire-agent |
201
211
  | **max** | ingest-sources, pipeline-review, deep-context |
202
212
 
203
213
  ## Creating Custom Skills
package/template-v2/.claude/skills/capability-suggester.md CHANGED
@@ -1,6 +1,6 @@
1
1
  ---
2
2
  name: capability-suggester
3
- description: Notice repeated user behaviors and suggest new commands, workflows, or structure to streamline their work.
3
+ description: Notice repeated user behaviors and suggest new commands, workflows, structure, or integrations to streamline work. Also detects when the user's setup has outgrown its current structure and suggests targeted upgrades. Activates when repeated task patterns, workflow friction, structural gaps, or business growth signals are detected.
4
4
  user-invocable: false
5
5
  invocation: proactive
6
6
  effort-level: high
@@ -10,22 +10,39 @@ triggers:
10
10
  - "frequent status check query"
11
11
  - "mentions checking external tool"
12
12
  - "workflow gap between steps"
13
+ - "files created outside existing structure"
14
+ - "tracking something with no home"
15
+ - "business complexity has grown"
16
+ - "workflow friction observed"
13
17
  inputs:
14
18
  - name: behavior_pattern
15
19
  type: string
16
- description: Observed repeated behavior or workflow pattern
20
+ description: Observed repeated behavior, workflow pattern, or structural gap
17
21
  outputs:
18
22
  - name: suggestion
19
23
  type: text
20
- description: Proposed enhancement (new command, workflow change, or structure addition)
24
+ description: Proposed enhancement (new command, workflow change, structure addition, or integration)
21
25
  - name: capability
22
26
  type: file
23
- description: New skill file or structural change if user accepts the suggestion
27
+ description: New skill file, structural change, or template if user accepts the suggestion
24
28
  ---
25
29
 
26
30
  # Capability Suggester Skill
27
31
 
28
- **Triggers:** Activates when patterns of repeated behavior reach a threshold.
32
+ **Triggers:** Activates when patterns of repeated behavior reach a threshold, or when structural gaps create friction.
33
+
34
+ ---
35
+
36
+ ## Philosophy
37
+
38
+ Structure should grow organically from actual needs, not be imposed upfront. This skill watches for both repeated behaviors and structural friction, offering targeted solutions.
39
+
40
+ **Core Principles:**
41
+ - Observe before suggesting
42
+ - One suggestion at a time, not a flood
43
+ - Accept "no" gracefully
44
+ - Remember declined suggestions (don't re-suggest)
45
+ - Explain the why, not just the what
29
46
 
30
47
  ---
31
48
 
@@ -82,19 +99,48 @@ Want me to prompt for client file updates after meeting captures?"
82
99
  ### Structure Needs
83
100
 
84
101
  **Detection:**
102
+ - Files created outside the existing structure repeatedly
85
103
  - Topics that don't have a home
86
104
  - Files that are getting too long
87
105
  - Categories that are emerging
88
106
 
89
107
  **Examples:**
90
108
  ```
91
- "You've mentioned 'partnerships' in several contexts but don't
92
- have a dedicated folder. Should we create partnerships/ ?"
109
+ "I notice you've been saving [X] type files in random places.
110
+ Want me to create a dedicated folder for those?"
111
+
112
+ "You've created 3 client notes in /context.
113
+ Should we set up proper client folders?"
93
114
 
94
115
  "Your patterns.md is getting long. Want me to split it into
95
116
  work-patterns.md and relationship-patterns.md?"
96
117
  ```
97
118
 
119
+ ### Business Depth Upgrades
120
+
121
+ If user chose "minimal" or "starter" initially, watch for signs they need more:
122
+
123
+ **Minimal to Starter:**
124
+ - Mentions tracking multiple things manually
125
+ - Asks about pipelines or active work lists
126
+ - Discusses finances more than occasionally
127
+
128
+ **Starter to Full:**
129
+ - Manages 3+ active clients/projects
130
+ - Needs accountability tracking
131
+ - Discusses methodology or repeatable processes
132
+ - Mentions tax planning or financial complexity
133
+
134
+ **Suggest:**
135
+ ```
136
+ "Your workflow has gotten more complex since we started. Want me to add:
137
+ - Pipeline tracking (active, prospecting, completed)
138
+ - Financial structure (expenses, invoicing, tax planning)
139
+ - Templates for common tasks
140
+
141
+ I can add just what you need, not everything at once."
142
+ ```
143
+
98
144
  ### Integration Needs
99
145
 
100
146
  **Detection:**
@@ -108,7 +154,6 @@ work-patterns.md and relationship-patterns.md?"
108
154
  - "Can you check my email/calendar/Notion..."
109
155
  - "Let me paste this from [service]..."
110
156
  - "I need to go look at [service] for..."
111
- - "Here's what [service] says..."
112
157
  - "Can you see my [service]?"
113
158
 
114
159
  **Response:**
@@ -123,15 +168,11 @@ your pages without the copy-paste."
123
168
  "You've asked about your email a few times. I can't see it yet,
124
169
  but I can help you set that up. Takes about 5 minutes for Gmail.
125
170
  Interested?"
126
-
127
- "I see you check your calendar separately before our morning briefs.
128
- Want me to include your schedule automatically? I can connect to
129
- Google Calendar if you'd like."
130
171
  ```
131
172
 
132
173
  **Guardrails:**
133
174
  - Only suggest once per service (check declined list in learnings.md)
134
- - Don't interrupt workflow-suggest at natural pause points
175
+ - Don't interrupt workflow; suggest at natural pause points
135
176
  - If they said "maybe later" during onboarding, wait at least a week
136
177
 
137
178
  ---
@@ -145,53 +186,49 @@ Track behavior without mentioning it until threshold reached:
145
186
  - 2+ for complex workflows
146
187
  - Immediate for obvious improvements
147
188
 
148
- ### 2. Propose Enhancement
149
-
150
- **Format:**
151
- ```
152
- "I've noticed [observation].
153
-
154
- Would you like me to [specific solution]?
155
-
156
- This would [benefit]."
157
- ```
189
+ ### 2. Wait for a Natural Moment
158
190
 
159
- **Examples:**
191
+ **Good times to suggest:**
192
+ - Start of session: "Before we dive in, I noticed something..."
193
+ - End of weekly review: "One observation from reviewing your week..."
194
+ - After completing a task: "That's done. Quick thought..."
195
+ - When they mention friction: "You mentioned [X] being messy. Want me to..."
160
196
 
161
- ```
162
- "I've noticed you check client health status at the start of each week.
197
+ **Bad times:**
198
+ - During focused work
199
+ - When user is stressed
200
+ - If pattern is sensitive and context is wrong
163
201
 
164
- Would you like me to add a client health summary to your Monday morning brief?
202
+ ### 3. Propose Enhancement
165
203
 
166
- This would save you from manually checking each client file."
204
+ **Format:**
167
205
  ```
206
+ "I've noticed [observation].
168
207
 
169
- ```
170
- "You often draft follow-up emails after sales calls.
208
+ Would you like me to [specific solution]?
171
209
 
172
- Would you like me to create a /sales-followup command that:
173
- - Uses the meeting notes as context
174
- - Drafts a templated follow-up
175
- - Suggests next steps based on the conversation
210
+ This would [benefit].
176
211
 
177
- I could have this ready for your next call."
212
+ Totally fine if not - just noticed the pattern."
178
213
  ```
179
214
 
180
- ### 3. Accept Response
215
+ ### 4. Accept Response
181
216
 
182
217
  **If yes:**
183
- - Create the enhancement
184
- - Explain how to use it
218
+ - Create the enhancement immediately
219
+ - Show what was added
220
+ - Offer a quick tour if it's substantial
185
221
  - Note in learnings.md
186
222
 
187
- **If no:**
188
- - Acknowledge gracefully
189
- - Don't suggest again for a while
190
- - Note preference in learnings.md
223
+ **If "not now" / "maybe later":**
224
+ - Note the suggestion and timing
225
+ - Wait at least 2 weeks before similar suggestions
226
+ - Acknowledge: "No problem. I'll let you know if the pattern continues."
191
227
 
192
- **If "maybe later":**
193
- - Note for future
194
- - Remind in a week or when context is relevant
228
+ **If "no" / declined:**
229
+ - Record the declined suggestion
230
+ - Don't suggest the same thing again (unless they explicitly ask)
231
+ - Acknowledge: "Got it. Won't mention it again."
195
232
 
196
233
  ---
197
234
 
@@ -199,26 +236,10 @@ I could have this ready for your next call."
199
236
 
200
237
  ### New Commands
201
238
 
202
- **Template:**
203
- ```markdown
204
- # [Command Name]
205
-
206
- [Brief description of what it does]
207
-
208
- ## When to Use
209
- [Trigger conditions]
210
-
211
- ## What It Does
212
- [Step by step]
213
-
214
- ## Output
215
- [What user gets]
216
- ```
217
-
218
239
  **Process:**
219
240
  1. Draft command based on observed pattern
220
241
  2. Propose to user with explanation
221
- 3. If approved, create in `.claude/commands/`
242
+ 3. If approved, create in `.claude/skills/`
222
243
  4. Confirm creation and explain usage
223
244
 
224
245
  ### Workflow Enhancements
@@ -245,22 +266,11 @@ Want me to enhance it to also:
245
266
  - Split growing files
246
267
  - Add templates for new types
247
268
 
248
- **Example:**
249
- ```
250
- "You've started tracking vendor relationships separately from clients.
251
-
252
- Should I create:
253
- - vendors/ folder with similar structure to clients/
254
- - /vendor-status command for quick checks?"
255
- ```
256
-
257
269
  ---
258
270
 
259
- ## Learning Integration
271
+ ## Tracking Suggestions
260
272
 
261
- ### What Gets Stored
262
-
263
- In `context/learnings.md`:
273
+ Maintain in `context/learnings.md`:
264
274
 
265
275
  ```markdown
266
276
  ## Suggested Capabilities
@@ -268,10 +278,12 @@ In `context/learnings.md`:
268
278
  ### Accepted
269
279
  - /linkedin-quick command (created Jan 15)
270
280
  - Auto-client-update after meetings (enabled Jan 18)
281
+ - Pipeline tracking folders (created Feb 1)
271
282
 
272
- ### Declined
283
+ ### Declined (Don't Re-suggest)
273
284
  - Partnership folder (user prefers flat structure)
274
285
  - Automatic deadline reminders (user finds them annoying)
286
+ - Full pipeline structure - prefers minimal
275
287
 
276
288
  ### Pending
277
289
  - Sales follow-up template (user said "maybe later" - Jan 20)
@@ -286,52 +298,106 @@ Track whether suggestions are used:
286
298
 
287
299
  ---
288
300
 
301
+ ## Suggestion Library
302
+
303
+ ### For Users Who Started Minimal
304
+
305
+ **Pipeline Tracking:**
306
+ ```
307
+ "You've mentioned 3 different clients this week but don't have a pipeline.
308
+ Want me to set up tracking so you can see active work at a glance?"
309
+ ```
310
+
311
+ **Financial Tracking:**
312
+ ```
313
+ "I notice you discuss finances fairly often. Your setup is minimal right now.
314
+ Want me to add an overview file for tracking revenue and expenses?"
315
+ ```
316
+
317
+ **Commitments Tracking:**
318
+ ```
319
+ "You've made several promises this week. Want me to set up a dedicated
320
+ commitments tracker so nothing slips through?"
321
+ ```
322
+
323
+ ### For Users Who Started Starter
324
+
325
+ **Full Pipeline:**
326
+ ```
327
+ "Your pipeline is getting busier. Want me to add prospecting and completed
328
+ tracking so you can see your full sales funnel?"
329
+ ```
330
+
331
+ **Templates Library:**
332
+ ```
333
+ "You do a lot of similar tasks. Want me to set up a templates folder with
334
+ starting points for client intake, meeting prep, and reviews?"
335
+ ```
336
+
337
+ ### For All Users
338
+
339
+ **Weekly Review Template:**
340
+ ```
341
+ "You do informal weekly reviews. Want me to create a template so you hit
342
+ the same key areas each time?"
343
+ ```
344
+
345
+ **Methodology Documentation:**
346
+ ```
347
+ "You've described how you approach [X] a few times. Want me to document it
348
+ so you (and I) can reference it consistently?"
349
+ ```
350
+
351
+ **New Folder for Recurring Content:**
352
+ ```
353
+ "You've created several [X] files. Want me to set up a dedicated folder
354
+ so they're easier to find?"
355
+ ```
356
+
357
+ ---
358
+
359
+ ## Frequency Limits
360
+
361
+ - Maximum 1 suggestion per session (unless asked)
362
+ - Space out suggestions over time
363
+ - Wait 2 weeks after any suggestion before the next
364
+ - Exception: If they ask "what should I add?" give fuller recommendations
365
+
366
+ ---
367
+
289
368
  ## Guardrails
290
369
 
291
370
  ### Don't Overwhelm
292
-
293
371
  - Max 1 suggestion per session (unless asked)
294
- - Space out suggestions over time
295
372
  - Don't repeat declined suggestions
373
+ - Space suggestions over time
296
374
 
297
375
  ### Don't Over-Engineer
298
-
299
376
  - Start with simple solutions
300
377
  - Only suggest what's clearly needed
301
378
  - Avoid adding complexity for its own sake
302
379
 
303
380
  ### Respect User Style
304
-
305
381
  - Some users like lots of structure
306
382
  - Some prefer minimal tooling
307
383
  - Learn and adapt to their preference
308
384
 
309
385
  ---
310
386
 
311
- ## Proactive vs. Reactive
312
-
313
- ### Proactive (I bring it up)
314
- - When pattern is clear and benefit is obvious
315
- - During natural pauses in work
316
- - At start of session if something significant
317
-
318
- ### Reactive (when asked)
319
- ```
320
- User: "Is there anything you think we should add?"
321
- User: "What could we do to make this easier?"
322
- User: "Any suggestions for improving my workflow?"
323
- ```
324
-
325
- Provide comprehensive list of observed opportunities.
326
-
327
- ---
328
-
329
387
  ## Integration
330
388
 
331
389
  ### With Pattern Recognizer
332
390
  - Feed patterns into capability analysis
333
391
  - Notice when patterns suggest tooling needs
334
392
 
393
+ ### With Commitment Detector
394
+ - When commitments pile up without a system, suggest tracking
395
+ - Suggest /what-am-i-missing command if not present
396
+
397
+ ### With Risk Surfacer
398
+ - When risks relate to structural gaps, suggest structure
399
+ - Missing pipeline causes capacity issues → Suggest pipeline
400
+
335
401
  ### With Memory Manager
336
402
  - Persist suggestions and responses
337
403
  - Track what works over time
package/template-v2/.claude/skills/capture-meeting/evals/basic.yaml ADDED
@@ -0,0 +1,27 @@
1
+ # Capture Meeting Eval
2
+ # Tests that meeting capture extracts structured data and files source material
3
+
4
+ prompts:
5
+ - prompt: "Here are my notes from a call with Sarah Chen about the Q4 roadmap. She mentioned they're moving to microservices, the migration is due by March 15. I promised to send her our API docs by Friday. Also met her colleague James Wright who leads the platform team."
6
+ expectations:
7
+ - "extracts at least one commitment (send API docs by Friday)"
8
+ - "files the source material via memory.file before extracting"
9
+ - "identifies Sarah Chen and James Wright as entities"
10
+ - "detects the March 15 deadline"
11
+ - "uses structured output format with emoji headers"
12
+ - "asks user to confirm before storing extracted data"
13
+
14
+ - prompt: "capture this meeting"
15
+ context: "User provides a multi-paragraph transcript with 3 participants, 2 action items, and 1 decision"
16
+ expectations:
17
+ - "separates decisions from action items from general discussion"
18
+ - "attributes action items to specific people"
19
+ - "offers to create or update person files for participants"
20
+ - "stores the full transcript before extracting"
21
+
22
+ - prompt: "Here are brief notes: Quick sync with Mike. All good, no action items."
23
+ expectations:
24
+ - "handles minimal notes gracefully"
25
+ - "does not invent commitments or action items"
26
+ - "still files the source material"
27
+ - "keeps output proportional to input length"
package/template-v2/.claude/skills/diagnose/evals/basic.yaml ADDED
@@ -0,0 +1,34 @@
1
+ # Diagnose Eval
2
+ # Tests that diagnose correctly identifies common failure modes
3
+
4
+ prompts:
5
+ - prompt: "/diagnose"
6
+ context: "Memory daemon is running and healthy"
7
+ expectations:
8
+ - "reports healthy status"
9
+ - "shows basic stats (memory count, entity count)"
10
+ - "does not suggest unnecessary fixes"
11
+ - "completes quickly (low effort level)"
12
+
13
+ - prompt: "/diagnose"
14
+ context: "Memory daemon is not running, MCP tools unavailable"
15
+ expectations:
16
+ - "identifies that memory tools are not available"
17
+ - "suggests checking .mcp.json configuration"
18
+ - "suggests running claudia system-health"
19
+ - "does not attempt to use memory tools that are unavailable"
20
+ - "provides actionable fix steps"
21
+
22
+ - prompt: "something seems wrong with my memory"
23
+ expectations:
24
+ - "triggers diagnose skill from natural language"
25
+ - "runs diagnostic checks before suggesting fixes"
26
+ - "provides specific error messages, not generic advice"
27
+ - "checks both daemon health and CLI availability"
28
+
29
+ - prompt: "/diagnose"
30
+ context: "Memory daemon responds but database has issues (corrupt vec0 tables)"
31
+ expectations:
32
+ - "identifies the specific failure (vec0/embedding issues)"
33
+ - "suggests --backfill-embeddings or database repair"
34
+ - "does not suggest reinstalling when the fix is simpler"