bobo-ai-cli 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (234) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +216 -0
  3. package/dist/agent.d.ts +9 -0
  4. package/dist/agent.js +144 -0
  5. package/dist/agent.js.map +1 -0
  6. package/dist/config.d.ts +15 -0
  7. package/dist/config.js +76 -0
  8. package/dist/config.js.map +1 -0
  9. package/dist/index.d.ts +2 -0
  10. package/dist/index.js +366 -0
  11. package/dist/index.js.map +1 -0
  12. package/dist/knowledge-commands.d.ts +2 -0
  13. package/dist/knowledge-commands.js +40 -0
  14. package/dist/knowledge-commands.js.map +1 -0
  15. package/dist/knowledge.d.ts +17 -0
  16. package/dist/knowledge.js +112 -0
  17. package/dist/knowledge.js.map +1 -0
  18. package/dist/memory.d.ts +17 -0
  19. package/dist/memory.js +215 -0
  20. package/dist/memory.js.map +1 -0
  21. package/dist/planner.d.ts +22 -0
  22. package/dist/planner.js +130 -0
  23. package/dist/planner.js.map +1 -0
  24. package/dist/project.d.ts +25 -0
  25. package/dist/project.js +117 -0
  26. package/dist/project.js.map +1 -0
  27. package/dist/rules-commands.d.ts +2 -0
  28. package/dist/rules-commands.js +51 -0
  29. package/dist/rules-commands.js.map +1 -0
  30. package/dist/skills.d.ts +28 -0
  31. package/dist/skills.js +349 -0
  32. package/dist/skills.js.map +1 -0
  33. package/dist/structured/loader.d.ts +19 -0
  34. package/dist/structured/loader.js +147 -0
  35. package/dist/structured/loader.js.map +1 -0
  36. package/dist/structured/paths.d.ts +2 -0
  37. package/dist/structured/paths.js +14 -0
  38. package/dist/structured/paths.js.map +1 -0
  39. package/dist/structured/project-scaffold.d.ts +7 -0
  40. package/dist/structured/project-scaffold.js +60 -0
  41. package/dist/structured/project-scaffold.js.map +1 -0
  42. package/dist/structured/render-markdown.d.ts +37 -0
  43. package/dist/structured/render-markdown.js +47 -0
  44. package/dist/structured/render-markdown.js.map +1 -0
  45. package/dist/structured/render-table.d.ts +1 -0
  46. package/dist/structured/render-table.js +15 -0
  47. package/dist/structured/render-table.js.map +1 -0
  48. package/dist/structured/search.d.ts +10 -0
  49. package/dist/structured/search.js +104 -0
  50. package/dist/structured/search.js.map +1 -0
  51. package/dist/structured/skill-runner.d.ts +15 -0
  52. package/dist/structured/skill-runner.js +60 -0
  53. package/dist/structured/skill-runner.js.map +1 -0
  54. package/dist/structured/types.d.ts +212 -0
  55. package/dist/structured/types.js +97 -0
  56. package/dist/structured/types.js.map +1 -0
  57. package/dist/structured-skills-commands.d.ts +3 -0
  58. package/dist/structured-skills-commands.js +126 -0
  59. package/dist/structured-skills-commands.js.map +1 -0
  60. package/dist/structured-template-commands.d.ts +2 -0
  61. package/dist/structured-template-commands.js +34 -0
  62. package/dist/structured-template-commands.js.map +1 -0
  63. package/dist/tools/index.d.ts +3 -0
  64. package/dist/tools/index.js +450 -0
  65. package/dist/tools/index.js.map +1 -0
  66. package/dist/ui.d.ts +19 -0
  67. package/dist/ui.js +72 -0
  68. package/dist/ui.js.map +1 -0
  69. package/dist/web.d.ts +4 -0
  70. package/dist/web.js +124 -0
  71. package/dist/web.js.map +1 -0
  72. package/knowledge/advanced-patterns.md +70 -0
  73. package/knowledge/agent-directives.md +74 -0
  74. package/knowledge/dream.md +36 -0
  75. package/knowledge/engineering.md +46 -0
  76. package/knowledge/error-catalog.md +33 -0
  77. package/knowledge/index.json +170 -0
  78. package/knowledge/memory/cache-optimization-and-skill-integration.md +102 -0
  79. package/knowledge/memory/engineering-patterns.md +134 -0
  80. package/knowledge/memory/feedback_root_structure.md +16 -0
  81. package/knowledge/memory/project-contexts.md +69 -0
  82. package/knowledge/memory/tools-and-services.md +85 -0
  83. package/knowledge/rules/agents.md +62 -0
  84. package/knowledge/rules/blocking-rules.md +323 -0
  85. package/knowledge/rules/cache-management.md +379 -0
  86. package/knowledge/rules/capability-evolution.md +132 -0
  87. package/knowledge/rules/coding.md +126 -0
  88. package/knowledge/rules/engineering-workflows.md +225 -0
  89. package/knowledge/rules/evomap-content-guidelines.md +354 -0
  90. package/knowledge/rules/evomap-guide.md +224 -0
  91. package/knowledge/rules/git.md +31 -0
  92. package/knowledge/rules/hooks.md +106 -0
  93. package/knowledge/rules/performance.md +101 -0
  94. package/knowledge/rules/remotion-auto-production.md +1120 -0
  95. package/knowledge/rules/security.md +46 -0
  96. package/knowledge/rules/testing.md +32 -0
  97. package/knowledge/rules/work-mode.md +208 -0
  98. package/knowledge/rules.md +62 -0
  99. package/knowledge/skills/Skill_Seekers.md +1722 -0
  100. package/knowledge/skills/ab-test-setup.md +557 -0
  101. package/knowledge/skills/agent-sdk-dev.md +238 -0
  102. package/knowledge/skills/agent-tools.md +136 -0
  103. package/knowledge/skills/analytics-tracking.md +597 -0
  104. package/knowledge/skills/artifacts-builder.md +89 -0
  105. package/knowledge/skills/asana.md +13 -0
  106. package/knowledge/skills/backend-expert.md +97 -0
  107. package/knowledge/skills/brand-voice.md +481 -0
  108. package/knowledge/skills/browser-use.md +419 -0
  109. package/knowledge/skills/cache-optimization-skill.md +179 -0
  110. package/knowledge/skills/canvas-design.md +147 -0
  111. package/knowledge/skills/citation-validator.md +203 -0
  112. package/knowledge/skills/clangd-lsp.md +52 -0
  113. package/knowledge/skills/code-review-expert.md +85 -0
  114. package/knowledge/skills/code-review.md +280 -0
  115. package/knowledge/skills/code-simplifier.md +13 -0
  116. package/knowledge/skills/commit-commands.md +258 -0
  117. package/knowledge/skills/competitor-alternatives.md +795 -0
  118. package/knowledge/skills/content-atomizer.md +910 -0
  119. package/knowledge/skills/content-research-writer.md +605 -0
  120. package/knowledge/skills/context-optimization-suite.md +162 -0
  121. package/knowledge/skills/context7.md +13 -0
  122. package/knowledge/skills/copy-editing.md +494 -0
  123. package/knowledge/skills/copywriting.md +510 -0
  124. package/knowledge/skills/csharp-lsp.md +40 -0
  125. package/knowledge/skills/decision-making-framework.md +154 -0
  126. package/knowledge/skills/developer-growth-analysis.md +335 -0
  127. package/knowledge/skills/direct-response-copy.md +2336 -0
  128. package/knowledge/skills/docker-expert.md +229 -0
  129. package/knowledge/skills/document-skills.md +13 -0
  130. package/knowledge/skills/documentation-expert.md +126 -0
  131. package/knowledge/skills/email-sequence.md +1061 -0
  132. package/knowledge/skills/email-sequences.md +910 -0
  133. package/knowledge/skills/example-plugin.md +72 -0
  134. package/knowledge/skills/explanatory-output-style.md +82 -0
  135. package/knowledge/skills/feature-dev.md +458 -0
  136. package/knowledge/skills/file-organizer.md +466 -0
  137. package/knowledge/skills/firebase.disabled.md +13 -0
  138. package/knowledge/skills/form-cro.md +488 -0
  139. package/knowledge/skills/free-tool-strategy.md +636 -0
  140. package/knowledge/skills/frontend-design-offical.md +55 -0
  141. package/knowledge/skills/frontend-design.md +41 -0
  142. package/knowledge/skills/frontend-expert.md +93 -0
  143. package/knowledge/skills/github.md +13 -0
  144. package/knowledge/skills/gitlab.md +13 -0
  145. package/knowledge/skills/gopls-lsp.md +32 -0
  146. package/knowledge/skills/got-controller.md +218 -0
  147. package/knowledge/skills/greptile.md +72 -0
  148. package/knowledge/skills/hookify.md +376 -0
  149. package/knowledge/skills/image-editor.md +189 -0
  150. package/knowledge/skills/image-enhancer.md +109 -0
  151. package/knowledge/skills/jdtls-lsp.md +49 -0
  152. package/knowledge/skills/json-canvas.md +654 -0
  153. package/knowledge/skills/keyword-research.md +559 -0
  154. package/knowledge/skills/kotlin-lsp.md +28 -0
  155. package/knowledge/skills/laravel-boost.md +13 -0
  156. package/knowledge/skills/launch-strategy.md +394 -0
  157. package/knowledge/skills/lead-magnet.md +393 -0
  158. package/knowledge/skills/learning-output-style.md +106 -0
  159. package/knowledge/skills/linear.md +13 -0
  160. package/knowledge/skills/lua-lsp.md +47 -0
  161. package/knowledge/skills/marketing-ideas.md +720 -0
  162. package/knowledge/skills/marketing-psychology.md +534 -0
  163. package/knowledge/skills/mcp-builder.md +369 -0
  164. package/knowledge/skills/meeting-insights-analyzer.md +347 -0
  165. package/knowledge/skills/memory-evolution-system.md +172 -0
  166. package/knowledge/skills/multi-lens-thinking.md +407 -0
  167. package/knowledge/skills/nano-banana-pro.md +116 -0
  168. package/knowledge/skills/newsletter.md +736 -0
  169. package/knowledge/skills/notebooklm.md +296 -0
  170. package/knowledge/skills/obsidian-bases.md +634 -0
  171. package/knowledge/skills/obsidian-markdown.md +651 -0
  172. package/knowledge/skills/onboarding-cro.md +494 -0
  173. package/knowledge/skills/orchestrator.md +681 -0
  174. package/knowledge/skills/page-cro.md +379 -0
  175. package/knowledge/skills/paid-ads.md +624 -0
  176. package/knowledge/skills/paywall-upgrade-cro.md +651 -0
  177. package/knowledge/skills/php-lsp.md +36 -0
  178. package/knowledge/skills/planning-with-files.md +193 -0
  179. package/knowledge/skills/playwright.md +13 -0
  180. package/knowledge/skills/plugin-dev.md +434 -0
  181. package/knowledge/skills/popup-cro.md +520 -0
  182. package/knowledge/skills/positioning-angles.md +330 -0
  183. package/knowledge/skills/pr-review-toolkit.md +359 -0
  184. package/knowledge/skills/pricing-strategy.md +777 -0
  185. package/knowledge/skills/programmatic-seo.md +714 -0
  186. package/knowledge/skills/pyright-lsp.md +43 -0
  187. package/knowledge/skills/quality-assurance-framework.md +168 -0
  188. package/knowledge/skills/question-refiner.md +160 -0
  189. package/knowledge/skills/ralph-loop.md +205 -0
  190. package/knowledge/skills/refactoring-expert.md +103 -0
  191. package/knowledge/skills/referral-program.md +668 -0
  192. package/knowledge/skills/research-executor.md +164 -0
  193. package/knowledge/skills/review-with-security.md +12 -0
  194. package/knowledge/skills/rust-analyzer-lsp.md +50 -0
  195. package/knowledge/skills/schema-markup.md +647 -0
  196. package/knowledge/skills/security-audit-expert.md +124 -0
  197. package/knowledge/skills/security-expert.md +140 -0
  198. package/knowledge/skills/security-guidance.md +13 -0
  199. package/knowledge/skills/seedance-prompt.md +139 -0
  200. package/knowledge/skills/self-evolution.md +1160 -0
  201. package/knowledge/skills/seo-audit.md +432 -0
  202. package/knowledge/skills/seo-content.md +787 -0
  203. package/knowledge/skills/serena.md +13 -0
  204. package/knowledge/skills/signup-flow-cro.md +409 -0
  205. package/knowledge/skills/skill-creator.md +220 -0
  206. package/knowledge/skills/skill-manager.md +226 -0
  207. package/knowledge/skills/skill-share.md +98 -0
  208. package/knowledge/skills/slack.md +13 -0
  209. package/knowledge/skills/social-content.md +878 -0
  210. package/knowledge/skills/spec-flow-skill.md +124 -0
  211. package/knowledge/skills/stripe.md +13 -0
  212. package/knowledge/skills/supabase.md +13 -0
  213. package/knowledge/skills/swift-lsp.md +40 -0
  214. package/knowledge/skills/synthesizer.md +236 -0
  215. package/knowledge/skills/template-skill.md +16 -0
  216. package/knowledge/skills/testing-expert.md +99 -0
  217. package/knowledge/skills/theme-factory.md +72 -0
  218. package/knowledge/skills/tiktok-research.md +208 -0
  219. package/knowledge/skills/typescript-lsp.md +36 -0
  220. package/knowledge/skills/ui-ux-pro-max.md +247 -0
  221. package/knowledge/skills/verify.md +15 -0
  222. package/knowledge/skills/visual-prompt-engineer.md +102 -0
  223. package/knowledge/skills/webapp-testing.md +111 -0
  224. package/knowledge/skills/wide-research.md +191 -0
  225. package/knowledge/system.md +93 -0
  226. package/knowledge/task-router.md +37 -0
  227. package/knowledge/verification.md +38 -0
  228. package/knowledge/workflows/3d-viz.md +47 -0
  229. package/knowledge/workflows/data-pipeline.md +47 -0
  230. package/knowledge/workflows/db-migration.md +51 -0
  231. package/knowledge/workflows/feature-dev.md +41 -0
  232. package/knowledge/workflows/tdd-flow.md +52 -0
  233. package/knowledge/workflows/ui-verify.md +51 -0
  234. package/package.json +60 -0
@@ -0,0 +1,557 @@
1
+ ---
2
+ id: "ab-test-setup"
3
+ title: "A/B Test Setup"
4
+ category: "marketing"
5
+ tags: ["a/b test setup", "initial assessment", "core principles", "hypothesis framework", "test types", "sample size calculation", "metrics selection", "designing variants", "traffic allocation", "implementation approaches"]
6
+ triggers: []
7
+ dependencies: []
8
+ source: "E:/Bobo's Coding cache/.claude/skills/ab-test-setup"
9
+ ---
10
+
11
+ ---
12
+ name: ab-test-setup
13
+ description: When the user wants to plan, design, or implement an A/B test or experiment. Also use when the user mentions "A/B test," "split test," "experiment," "test this change," "variant copy," "multivariate test," or "hypothesis." For tracking implementation, see analytics-tracking.
14
+ ---
15
+
16
+ # A/B Test Setup
17
+
18
+ You are an expert in experimentation and A/B testing. Your goal is to help design tests that produce statistically valid, actionable results.
19
+
20
+ ## Initial Assessment
21
+
22
+ Before designing a test, understand:
23
+
24
+ 1. **Test Context**
25
+ - What are you trying to improve?
26
+ - What change are you considering?
27
+ - What made you want to test this?
28
+
29
+ 2. **Current State**
30
+ - Baseline conversion rate?
31
+ - Current traffic volume?
32
+ - Any historical test data?
33
+
34
+ 3. **Constraints**
35
+ - Technical implementation complexity?
36
+ - Timeline requirements?
37
+ - Tools available?
38
+
39
+ ---
40
+
41
+ ## Core Principles
42
+
43
+ ### 1. Start with a Hypothesis
44
+
45
+ - Not just "let's see what happens"
46
+ - Specific prediction of outcome
47
+ - Based on reasoning or data
48
+
49
+ ### 2. Test One Thing
50
+
51
+ - Single variable per test
52
+ - Otherwise you don't know what worked
53
+ - Save multivariate testing (MVT) for later
54
+
55
+ ### 3. Statistical Rigor
56
+
57
+ - Pre-determine sample size
58
+ - Don't peek and stop early
59
+ - Commit to the methodology
60
+
61
+ ### 4. Measure What Matters
62
+
63
+ - Primary metric tied to business value
64
+ - Secondary metrics for context
65
+ - Guardrail metrics to prevent harm
66
+
67
+ ---
68
+
69
+ ## Hypothesis Framework
70
+
71
+ ### Structure
72
+
73
+ ```
74
+ Because [observation/data],
75
+ we believe [change]
76
+ will cause [expected outcome]
77
+ for [audience].
78
+ We'll know this is true when [metrics].
79
+ ```
80
+
81
+ ### Examples
82
+
83
+ **Weak hypothesis:**
84
+ "Changing the button color might increase clicks."
85
+
86
+ **Strong hypothesis:**
87
+ "Because users report difficulty finding the CTA (per heatmaps and feedback), we believe making the button larger and using contrasting color will increase CTA clicks by 15%+ for new visitors. We'll measure click-through rate from page view to signup start."
88
+
89
+ ### Good Hypotheses Include
90
+
91
+ - **Observation**: What prompted this idea
92
+ - **Change**: Specific modification
93
+ - **Effect**: Expected outcome and direction
94
+ - **Audience**: Who this applies to
95
+ - **Metric**: How you'll measure success
96
+
97
+ ---
98
+
99
+ ## Test Types
100
+
101
+ ### A/B Test (Split Test)
102
+
103
+ - Two versions: Control (A) vs. Variant (B)
104
+ - Single change between versions
105
+ - Most common, easiest to analyze
106
+
107
+ ### A/B/n Test
108
+
109
+ - Multiple variants (A vs. B vs. C...)
110
+ - Requires more traffic
111
+ - Good for testing several options
112
+
113
+ ### Multivariate Test (MVT)
114
+
115
+ - Multiple changes in combinations
116
+ - Tests interactions between changes
117
+ - Requires significantly more traffic
118
+ - Complex analysis
119
+
120
+ ### Split URL Test
121
+
122
+ - Different URLs for variants
123
+ - Good for major page changes
124
+ - Easier implementation sometimes
125
+
126
+ ---
127
+
128
+ ## Sample Size Calculation
129
+
130
+ ### Inputs Needed
131
+
132
+ 1. **Baseline conversion rate**: Your current rate
133
+ 2. **Minimum detectable effect (MDE)**: Smallest change worth detecting
134
+ 3. **Statistical significance level**: Usually 95% confidence (α = 0.05)
135
+ 4. **Statistical power**: Usually 80%
136
+
137
+ ### Quick Reference
138
+
139
+ | Baseline Rate | 10% Lift | 20% Lift | 50% Lift |
140
+ | ------------- | ------------ | ----------- | ------------ |
141
+ | 1% | 150k/variant | 39k/variant | 6k/variant |
142
+ | 3% | 47k/variant | 12k/variant | 2k/variant |
143
+ | 5% | 27k/variant | 7k/variant | 1.2k/variant |
144
+ | 10% | 12k/variant | 3k/variant | 550/variant |
145
+
146
+ ### Formula Resources
147
+
148
+ - Evan Miller's calculator: https://www.evanmiller.org/ab-testing/sample-size.html
149
+ - Optimizely's calculator: https://www.optimizely.com/sample-size-calculator/
150
+
151
+ ### Test Duration
152
+
153
+ ```
154
+ Duration = Sample size needed per variant × Number of variants
155
+ ───────────────────────────────────────────────────
156
+ Daily traffic (visitors) to test page
157
+ ```
158
+
159
+ Minimum: 1-2 business cycles (usually 1-2 weeks)
160
+ Maximum: Avoid running too long (novelty effects, external factors)
161
+
162
+ ---
163
+
164
+ ## Metrics Selection
165
+
166
+ ### Primary Metric
167
+
168
+ - Single metric that matters most
169
+ - Directly tied to hypothesis
170
+ - What you'll use to call the test
171
+
172
+ ### Secondary Metrics
173
+
174
+ - Support primary metric interpretation
175
+ - Explain why/how the change worked
176
+ - Help understand user behavior
177
+
178
+ ### Guardrail Metrics
179
+
180
+ - Things that shouldn't get worse
181
+ - Revenue, retention, satisfaction
182
+ - Stop test if significantly negative
183
+
184
+ ### Metric Examples by Test Type
185
+
186
+ **Homepage CTA test:**
187
+
188
+ - Primary: CTA click-through rate
189
+ - Secondary: Time to click, scroll depth
190
+ - Guardrail: Bounce rate, downstream conversion
191
+
192
+ **Pricing page test:**
193
+
194
+ - Primary: Plan selection rate
195
+ - Secondary: Time on page, plan distribution
196
+ - Guardrail: Support tickets, refund rate
197
+
198
+ **Signup flow test:**
199
+
200
+ - Primary: Signup completion rate
201
+ - Secondary: Field-level completion, time to complete
202
+ - Guardrail: User activation rate (post-signup quality)
203
+
204
+ ---
205
+
206
+ ## Designing Variants
207
+
208
+ ### Control (A)
209
+
210
+ - Current experience, unchanged
211
+ - Don't modify during test
212
+
213
+ ### Variant (B+)
214
+
215
+ **Best practices:**
216
+
217
+ - Single, meaningful change
218
+ - Bold enough to make a difference
219
+ - True to the hypothesis
220
+
221
+ **What to vary:**
222
+
223
+ Headlines/Copy:
224
+
225
+ - Message angle
226
+ - Value proposition
227
+ - Specificity level
228
+ - Tone/voice
229
+
230
+ Visual Design:
231
+
232
+ - Layout structure
233
+ - Color and contrast
234
+ - Image selection
235
+ - Visual hierarchy
236
+
237
+ CTA:
238
+
239
+ - Button copy
240
+ - Size/prominence
241
+ - Placement
242
+ - Number of CTAs
243
+
244
+ Content:
245
+
246
+ - Information included
247
+ - Order of information
248
+ - Amount of content
249
+ - Social proof type
250
+
251
+ ### Documenting Variants
252
+
253
+ ```
254
+ Control (A):
255
+ - Screenshot
256
+ - Description of current state
257
+
258
+ Variant (B):
259
+ - Screenshot or mockup
260
+ - Specific changes made
261
+ - Hypothesis for why this will win
262
+ ```
263
+
264
+ ---
265
+
266
+ ## Traffic Allocation
267
+
268
+ ### Standard Split
269
+
270
+ - 50/50 for A/B test
271
+ - Equal split for multiple variants
272
+
273
+ ### Conservative Rollout
274
+
275
+ - 90/10 or 80/20 initially
276
+ - Limits risk of bad variant
277
+ - Longer to reach significance
278
+
279
+ ### Ramping
280
+
281
+ - Start small, increase over time
282
+ - Good for technical risk mitigation
283
+ - Most tools support this
284
+
285
+ ### Considerations
286
+
287
+ - Consistency: Users see same variant on return
288
+ - Segment sizes: Ensure segments are large enough
289
+ - Time of day/week: Balanced exposure
290
+
291
+ ---
292
+
293
+ ## Implementation Approaches
294
+
295
+ ### Client-Side Testing
296
+
297
+ **Tools**: PostHog, Optimizely, VWO, custom
298
+
299
+ **How it works**:
300
+
301
+ - JavaScript modifies page after load
302
+ - Quick to implement
303
+ - Can cause flicker
304
+
305
+ **Best for**:
306
+
307
+ - Marketing pages
308
+ - Copy/visual changes
309
+ - Quick iteration
310
+
311
+ ### Server-Side Testing
312
+
313
+ **Tools**: PostHog, LaunchDarkly, Split, custom
314
+
315
+ **How it works**:
316
+
317
+ - Variant determined before page renders
318
+ - No flicker
319
+ - Requires development work
320
+
321
+ **Best for**:
322
+
323
+ - Product features
324
+ - Complex changes
325
+ - Performance-sensitive pages
326
+
327
+ ### Feature Flags
328
+
329
+ - Binary on/off (not true A/B)
330
+ - Good for rollouts
331
+ - Can convert to A/B with percentage split
332
+
333
+ ---
334
+
335
+ ## Running the Test
336
+
337
+ ### Pre-Launch Checklist
338
+
339
+ - [ ] Hypothesis documented
340
+ - [ ] Primary metric defined
341
+ - [ ] Sample size calculated
342
+ - [ ] Test duration estimated
343
+ - [ ] Variants implemented correctly
344
+ - [ ] Tracking verified
345
+ - [ ] QA completed on all variants
346
+ - [ ] Stakeholders informed
347
+
348
+ ### During the Test
349
+
350
+ **DO:**
351
+
352
+ - Monitor for technical issues
353
+ - Check segment quality
354
+ - Document any external factors
355
+
356
+ **DON'T:**
357
+
358
+ - Peek at results and stop early
359
+ - Make changes to variants
360
+ - Add traffic from new sources
361
+ - End early because you "know" the answer
362
+
363
+ ### Peeking Problem
364
+
365
+ Looking at results before reaching sample size and stopping when you see significance leads to:
366
+
367
+ - False positives
368
+ - Inflated effect sizes
369
+ - Wrong decisions
370
+
371
+ **Solutions:**
372
+
373
+ - Pre-commit to sample size and stick to it
374
+ - Use sequential testing if you must peek
375
+ - Trust the process
376
+
377
+ ---
378
+
379
+ ## Analyzing Results
380
+
381
+ ### Statistical Significance
382
+
383
+ - 95% confidence = p-value < 0.05
384
+ - Means: if there were truly no difference, a result at least this extreme would occur <5% of the time
385
+ - Not a guarantee—just a threshold
386
+
387
+ ### Practical Significance
388
+
389
+ Statistical ≠ Practical
390
+
391
+ - Is the effect size meaningful for business?
392
+ - Is it worth the implementation cost?
393
+ - Is it sustainable over time?
394
+
395
+ ### What to Look At
396
+
397
+ 1. **Did you reach sample size?**
398
+ - If not, result is preliminary
399
+
400
+ 2. **Is it statistically significant?**
401
+ - Check confidence intervals
402
+ - Check p-value
403
+
404
+ 3. **Is the effect size meaningful?**
405
+ - Compare to your MDE
406
+ - Project business impact
407
+
408
+ 4. **Are secondary metrics consistent?**
409
+ - Do they support the primary?
410
+ - Any unexpected effects?
411
+
412
+ 5. **Any guardrail concerns?**
413
+ - Did anything get worse?
414
+ - Long-term risks?
415
+
416
+ 6. **Segment differences?**
417
+ - Mobile vs. desktop?
418
+ - New vs. returning?
419
+ - Traffic source?
420
+
421
+ ### Interpreting Results
422
+
423
+ | Result | Conclusion |
424
+ | ------------------------- | -------------------------------- |
425
+ | Significant winner | Implement variant |
426
+ | Significant loser | Keep control, learn why |
427
+ | No significant difference | Need more traffic or bolder test |
428
+ | Mixed signals | Dig deeper, maybe segment |
429
+
430
+ ---
431
+
432
+ ## Documenting and Learning
433
+
434
+ ### Test Documentation
435
+
436
+ ```
437
+ Test Name: [Name]
438
+ Test ID: [ID in testing tool]
439
+ Dates: [Start] - [End]
440
+ Owner: [Name]
441
+
442
+ Hypothesis:
443
+ [Full hypothesis statement]
444
+
445
+ Variants:
446
+ - Control: [Description + screenshot]
447
+ - Variant: [Description + screenshot]
448
+
449
+ Results:
450
+ - Sample size: [achieved vs. target]
451
+ - Primary metric: [control] vs. [variant] ([% change], [confidence])
452
+ - Secondary metrics: [summary]
453
+ - Segment insights: [notable differences]
454
+
455
+ Decision: [Winner/Loser/Inconclusive]
456
+ Action: [What we're doing]
457
+
458
+ Learnings:
459
+ [What we learned, what to test next]
460
+ ```
461
+
462
+ ### Building a Learning Repository
463
+
464
+ - Central location for all tests
465
+ - Searchable by page, element, outcome
466
+ - Prevents re-running failed tests
467
+ - Builds institutional knowledge
468
+
469
+ ---
470
+
471
+ ## Output Format
472
+
473
+ ### Test Plan Document
474
+
475
+ ```
476
+ # A/B Test: [Name]
477
+
478
+ ## Hypothesis
479
+ [Full hypothesis using framework]
480
+
481
+ ## Test Design
482
+ - Type: A/B / A/B/n / MVT
483
+ - Duration: X weeks
484
+ - Sample size: X per variant
485
+ - Traffic allocation: 50/50
486
+
487
+ ## Variants
488
+ [Control and variant descriptions with visuals]
489
+
490
+ ## Metrics
491
+ - Primary: [metric and definition]
492
+ - Secondary: [list]
493
+ - Guardrails: [list]
494
+
495
+ ## Implementation
496
+ - Method: Client-side / Server-side
497
+ - Tool: [Tool name]
498
+ - Dev requirements: [If any]
499
+
500
+ ## Analysis Plan
501
+ - Success criteria: [What constitutes a win]
502
+ - Segment analysis: [Planned segments]
503
+ ```
504
+
505
+ ### Results Summary
506
+
507
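+ Provide when the test is complete: sample size achieved vs. target, primary metric change with confidence, secondary metric and segment findings, and the decision (winner/loser/inconclusive).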
508
+
509
+ ### Recommendations
510
+
511
+ Next steps based on results
512
+
513
+ ---
514
+
515
+ ## Common Mistakes
516
+
517
+ ### Test Design
518
+
519
+ - Testing too small a change (undetectable)
520
+ - Testing too many things (can't isolate)
521
+ - No clear hypothesis
522
+ - Wrong audience
523
+
524
+ ### Execution
525
+
526
+ - Stopping early
527
+ - Changing things mid-test
528
+ - Not checking implementation
529
+ - Uneven traffic allocation
530
+
531
+ ### Analysis
532
+
533
+ - Ignoring confidence intervals
534
+ - Cherry-picking segments
535
+ - Over-interpreting inconclusive results
536
+ - Not considering practical significance
537
+
538
+ ---
539
+
540
+ ## Questions to Ask
541
+
542
+ If you need more context:
543
+
544
+ 1. What's your current conversion rate?
545
+ 2. How much traffic does this page get?
546
+ 3. What change are you considering and why?
547
+ 4. What's the smallest improvement worth detecting?
548
+ 5. What tools do you have for testing?
549
+ 6. Have you tested this area before?
550
+
551
+ ---
552
+
553
+ ## Related Skills
554
+
555
+ - **page-cro**: For generating test ideas based on CRO principles
556
+ - **analytics-tracking**: For setting up test measurement
557
+ - **copywriting**: For creating variant copy