mindforge-cc 11.5.1 → 11.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (214) hide show
  1. package/.agent/mindforge/skill-tdd.md +53 -0
  2. package/.agent/mindforge/skills-index.md +118 -0
  3. package/.agent/mindforge/systematic-debug.md +60 -0
  4. package/.agent/mindforge/wf-catalog.md +37 -0
  5. package/.agent/mindforge/wf-code-audit.md +31 -0
  6. package/.agent/mindforge/wf-competitive-analysis.md +31 -0
  7. package/.agent/mindforge/wf-deep-research.md +32 -0
  8. package/.agent/mindforge/wf-feature-planner.md +31 -0
  9. package/.agent/mindforge/wf-incident-response.md +31 -0
  10. package/.agent/mindforge/wf-onboard-codebase.md +31 -0
  11. package/.agent/mindforge/wf-perf-optimize.md +31 -0
  12. package/.agent/mindforge/wf-pr-review.md +31 -0
  13. package/.agent/mindforge/wf-refactor-plan.md +31 -0
  14. package/.agent/mindforge/wf-release-prep.md +31 -0
  15. package/.agent/mindforge/wf-tdd-sprint.md +31 -0
  16. package/.agent/mindforge/wf-tech-evaluation.md +31 -0
  17. package/.agent/skills/1password-skill/SKILL.md +156 -0
  18. package/.agent/skills/1password-skill/references/cli-examples.md +31 -0
  19. package/.agent/skills/1password-skill/references/get-started.md +21 -0
  20. package/.agent/skills/article-illustrator/SKILL.md +199 -0
  21. package/.agent/skills/article-illustrator/references/prompt-construction.md +426 -0
  22. package/.agent/skills/article-illustrator/references/style-presets.md +80 -0
  23. package/.agent/skills/article-illustrator/references/styles.md +224 -0
  24. package/.agent/skills/article-illustrator/references/usage.md +50 -0
  25. package/.agent/skills/article-illustrator/references/workflow.md +332 -0
  26. package/.agent/skills/arxiv/SKILL.md +275 -0
  27. package/.agent/skills/blogwatcher/SKILL.md +130 -0
  28. package/.agent/skills/code-wiki/SKILL.md +438 -0
  29. package/.agent/skills/code-wiki/templates/README.md +31 -0
  30. package/.agent/skills/code-wiki/templates/architecture.md +30 -0
  31. package/.agent/skills/code-wiki/templates/getting-started.md +47 -0
  32. package/.agent/skills/code-wiki/templates/module.md +38 -0
  33. package/.agent/skills/codebase-inspection/SKILL.md +109 -0
  34. package/.agent/skills/comic-creator/SKILL.md +240 -0
  35. package/.agent/skills/comic-creator/references/analysis-framework.md +176 -0
  36. package/.agent/skills/comic-creator/references/auto-selection.md +71 -0
  37. package/.agent/skills/comic-creator/references/base-prompt.md +98 -0
  38. package/.agent/skills/comic-creator/references/character-template.md +180 -0
  39. package/.agent/skills/comic-creator/references/ohmsha-guide.md +85 -0
  40. package/.agent/skills/comic-creator/references/partial-workflows.md +106 -0
  41. package/.agent/skills/comic-creator/references/storyboard-template.md +143 -0
  42. package/.agent/skills/comic-creator/references/workflow.md +401 -0
  43. package/.agent/skills/concept-diagrams/SKILL.md +355 -0
  44. package/.agent/skills/concept-diagrams/references/dashboard-patterns.md +43 -0
  45. package/.agent/skills/concept-diagrams/references/infrastructure-patterns.md +144 -0
  46. package/.agent/skills/concept-diagrams/references/physical-shape-cookbook.md +42 -0
  47. package/.agent/skills/creative-ideation/SKILL.md +144 -0
  48. package/.agent/skills/creative-ideation/references/full-prompt-library.md +110 -0
  49. package/.agent/skills/devops-cli/SKILL.md +149 -0
  50. package/.agent/skills/devops-cli/references/app-discovery.md +112 -0
  51. package/.agent/skills/devops-cli/references/authentication.md +59 -0
  52. package/.agent/skills/devops-cli/references/cli-reference.md +104 -0
  53. package/.agent/skills/devops-cli/references/running-apps.md +171 -0
  54. package/.agent/skills/devops-watchers/SKILL.md +103 -0
  55. package/.agent/skills/docker-management/SKILL.md +273 -0
  56. package/.agent/skills/domain-intel/SKILL.md +96 -0
  57. package/.agent/skills/duckduckgo-search/SKILL.md +230 -0
  58. package/.agent/skills/github-auth/SKILL.md +240 -0
  59. package/.agent/skills/github-code-review/SKILL.md +474 -0
  60. package/.agent/skills/github-code-review/references/review-output-template.md +74 -0
  61. package/.agent/skills/github-issues/SKILL.md +363 -0
  62. package/.agent/skills/github-issues/templates/bug-report.md +35 -0
  63. package/.agent/skills/github-issues/templates/feature-request.md +31 -0
  64. package/.agent/skills/github-pr-workflow/SKILL.md +360 -0
  65. package/.agent/skills/github-pr-workflow/references/ci-troubleshooting.md +183 -0
  66. package/.agent/skills/github-pr-workflow/references/conventional-commits.md +71 -0
  67. package/.agent/skills/github-pr-workflow/templates/pr-body-bugfix.md +35 -0
  68. package/.agent/skills/github-pr-workflow/templates/pr-body-feature.md +33 -0
  69. package/.agent/skills/github-repo-management/SKILL.md +509 -0
  70. package/.agent/skills/github-repo-management/references/github-api-cheatsheet.md +161 -0
  71. package/.agent/skills/godmode/SKILL.md +396 -0
  72. package/.agent/skills/godmode/references/jailbreak-templates.md +128 -0
  73. package/.agent/skills/godmode/references/refusal-detection.md +142 -0
  74. package/.agent/skills/hyperframes/SKILL.md +182 -0
  75. package/.agent/skills/hyperframes/references/cli.md +185 -0
  76. package/.agent/skills/hyperframes/references/composition.md +129 -0
  77. package/.agent/skills/hyperframes/references/features.md +289 -0
  78. package/.agent/skills/hyperframes/references/gsap.md +136 -0
  79. package/.agent/skills/hyperframes/references/troubleshooting.md +137 -0
  80. package/.agent/skills/hyperframes/references/website-to-video.md +145 -0
  81. package/.agent/skills/jupyter-live-kernel/SKILL.md +160 -0
  82. package/.agent/skills/kanban-orchestrator/SKILL.md +209 -0
  83. package/.agent/skills/kanban-worker/SKILL.md +188 -0
  84. package/.agent/skills/llm-wiki/SKILL.md +499 -0
  85. package/.agent/skills/meme-generation/SKILL.md +122 -0
  86. package/.agent/skills/node-inspect-debugger/SKILL.md +312 -0
  87. package/.agent/skills/obsidian/SKILL.md +60 -0
  88. package/.agent/skills/osint-investigation/SKILL.md +269 -0
  89. package/.agent/skills/osint-investigation/templates/source-template.md +59 -0
  90. package/.agent/skills/oss-forensics/SKILL.md +422 -0
  91. package/.agent/skills/oss-forensics/references/evidence-types.md +89 -0
  92. package/.agent/skills/oss-forensics/references/github-archive-guide.md +184 -0
  93. package/.agent/skills/oss-forensics/references/investigation-templates.md +131 -0
  94. package/.agent/skills/oss-forensics/references/recovery-techniques.md +164 -0
  95. package/.agent/skills/oss-forensics/templates/forensic-report.md +151 -0
  96. package/.agent/skills/oss-forensics/templates/malicious-package-report.md +43 -0
  97. package/.agent/skills/parallel-cli/SKILL.md +384 -0
  98. package/.agent/skills/pinggy-tunnel/SKILL.md +302 -0
  99. package/.agent/skills/pixel-art/SKILL.md +209 -0
  100. package/.agent/skills/pixel-art/references/palettes.md +49 -0
  101. package/.agent/skills/plan/SKILL.md +331 -0
  102. package/.agent/skills/polymarket/SKILL.md +75 -0
  103. package/.agent/skills/polymarket/references/api-endpoints.md +220 -0
  104. package/.agent/skills/python-debugpy/SKILL.md +368 -0
  105. package/.agent/skills/requesting-code-review/SKILL.md +273 -0
  106. package/.agent/skills/research-paper-writing/SKILL.md +2367 -0
  107. package/.agent/skills/research-paper-writing/references/autoreason-methodology.md +394 -0
  108. package/.agent/skills/research-paper-writing/references/checklists.md +434 -0
  109. package/.agent/skills/research-paper-writing/references/citation-workflow.md +563 -0
  110. package/.agent/skills/research-paper-writing/references/experiment-patterns.md +728 -0
  111. package/.agent/skills/research-paper-writing/references/human-evaluation.md +476 -0
  112. package/.agent/skills/research-paper-writing/references/paper-types.md +481 -0
  113. package/.agent/skills/research-paper-writing/references/reviewer-guidelines.md +433 -0
  114. package/.agent/skills/research-paper-writing/references/sources.md +191 -0
  115. package/.agent/skills/research-paper-writing/references/writing-guide.md +474 -0
  116. package/.agent/skills/research-paper-writing/templates/README.md +251 -0
  117. package/.agent/skills/rest-graphql-debug/SKILL.md +507 -0
  118. package/.agent/skills/s6-container-supervision/SKILL.md +171 -0
  119. package/.agent/skills/scrapling/SKILL.md +328 -0
  120. package/.agent/skills/sherlock/SKILL.md +186 -0
  121. package/.agent/skills/simplify-code/SKILL.md +168 -0
  122. package/.agent/skills/skill-authoring/SKILL.md +158 -0
  123. package/.agent/skills/spike/SKILL.md +190 -0
  124. package/.agent/skills/subagent-driven-development/SKILL.md +345 -0
  125. package/.agent/skills/subagent-driven-development/references/context-budget-discipline.md +53 -0
  126. package/.agent/skills/subagent-driven-development/references/gates-taxonomy.md +93 -0
  127. package/.agent/skills/systematic-debugging/SKILL.md +360 -0
  128. package/.agent/skills/test-driven-development/SKILL.md +336 -0
  129. package/.agent/skills/video-orchestrator/SKILL.md +194 -0
  130. package/.agent/skills/video-orchestrator/references/examples.md +227 -0
  131. package/.agent/skills/video-orchestrator/references/intake.md +166 -0
  132. package/.agent/skills/video-orchestrator/references/kanban-setup.md +278 -0
  133. package/.agent/skills/video-orchestrator/references/monitoring.md +180 -0
  134. package/.agent/skills/video-orchestrator/references/role-archetypes.md +298 -0
  135. package/.agent/skills/video-orchestrator/references/tool-matrix.md +317 -0
  136. package/.agent/skills/web-pentest/SKILL.md +332 -0
  137. package/.agent/skills/web-pentest/references/bypass-techniques.md +133 -0
  138. package/.agent/skills/web-pentest/references/exploitation-techniques.md +204 -0
  139. package/.agent/skills/web-pentest/references/scope-enforcement.md +110 -0
  140. package/.agent/skills/web-pentest/references/vuln-taxonomy.md +81 -0
  141. package/.agent/skills/web-pentest/templates/authorization.md +69 -0
  142. package/.agent/skills/web-pentest/templates/pentest-report.md +178 -0
  143. package/.claude/commands/mindforge/skill-tdd.md +53 -0
  144. package/.claude/commands/mindforge/skills-index.md +118 -0
  145. package/.claude/commands/mindforge/systematic-debug.md +60 -0
  146. package/.claude/commands/mindforge/wf-catalog.md +37 -0
  147. package/.claude/commands/mindforge/wf-code-audit.md +31 -0
  148. package/.claude/commands/mindforge/wf-competitive-analysis.md +31 -0
  149. package/.claude/commands/mindforge/wf-deep-research.md +32 -0
  150. package/.claude/commands/mindforge/wf-feature-planner.md +31 -0
  151. package/.claude/commands/mindforge/wf-incident-response.md +31 -0
  152. package/.claude/commands/mindforge/wf-onboard-codebase.md +31 -0
  153. package/.claude/commands/mindforge/wf-perf-optimize.md +31 -0
  154. package/.claude/commands/mindforge/wf-pr-review.md +31 -0
  155. package/.claude/commands/mindforge/wf-refactor-plan.md +31 -0
  156. package/.claude/commands/mindforge/wf-release-prep.md +31 -0
  157. package/.claude/commands/mindforge/wf-tdd-sprint.md +31 -0
  158. package/.claude/commands/mindforge/wf-tech-evaluation.md +31 -0
  159. package/.mindforge/config.json +2 -2
  160. package/.mindforge/dynamic-workflows/REGISTRY.md +65 -0
  161. package/.mindforge/dynamic-workflows/index.json +171 -0
  162. package/.mindforge/dynamic-workflows/scripts/code-audit.js +103 -0
  163. package/.mindforge/dynamic-workflows/scripts/competitive-analysis.js +85 -0
  164. package/.mindforge/dynamic-workflows/scripts/deep-research.js +151 -0
  165. package/.mindforge/dynamic-workflows/scripts/feature-planner.js +104 -0
  166. package/.mindforge/dynamic-workflows/scripts/incident-response.js +106 -0
  167. package/.mindforge/dynamic-workflows/scripts/onboard-codebase.js +102 -0
  168. package/.mindforge/dynamic-workflows/scripts/perf-optimize.js +128 -0
  169. package/.mindforge/dynamic-workflows/scripts/pr-review.js +87 -0
  170. package/.mindforge/dynamic-workflows/scripts/refactor-plan.js +121 -0
  171. package/.mindforge/dynamic-workflows/scripts/release-prep.js +102 -0
  172. package/.mindforge/dynamic-workflows/scripts/tdd-sprint.js +103 -0
  173. package/.mindforge/dynamic-workflows/scripts/tech-evaluation.js +72 -0
  174. package/.mindforge/memory/sync-manifest.json +1 -1
  175. package/.mindforge/skills/arxiv/SKILL.md +294 -0
  176. package/.mindforge/skills/blogwatcher/SKILL.md +147 -0
  177. package/.mindforge/skills/code-wiki/SKILL.md +457 -0
  178. package/.mindforge/skills/codebase-inspection/SKILL.md +126 -0
  179. package/.mindforge/skills/concept-diagrams/SKILL.md +373 -0
  180. package/.mindforge/skills/creative-ideation/SKILL.md +162 -0
  181. package/.mindforge/skills/domain-intel/SKILL.md +116 -0
  182. package/.mindforge/skills/duckduckgo-search/SKILL.md +249 -0
  183. package/.mindforge/skills/github-code-review/SKILL.md +493 -0
  184. package/.mindforge/skills/github-issues/SKILL.md +382 -0
  185. package/.mindforge/skills/github-pr-workflow/SKILL.md +379 -0
  186. package/.mindforge/skills/jupyter-live-kernel/SKILL.md +179 -0
  187. package/.mindforge/skills/kanban-orchestrator/SKILL.md +227 -0
  188. package/.mindforge/skills/kanban-worker/SKILL.md +206 -0
  189. package/.mindforge/skills/meme-generation/SKILL.md +141 -0
  190. package/.mindforge/skills/obsidian/SKILL.md +80 -0
  191. package/.mindforge/skills/osint-investigation/SKILL.md +288 -0
  192. package/.mindforge/skills/oss-forensics/SKILL.md +421 -0
  193. package/.mindforge/skills/pixel-art/SKILL.md +228 -0
  194. package/.mindforge/skills/plan/SKILL.md +350 -0
  195. package/.mindforge/skills/requesting-code-review/SKILL.md +292 -0
  196. package/.mindforge/skills/research-paper-writing/SKILL.md +2384 -0
  197. package/.mindforge/skills/scrapling/SKILL.md +345 -0
  198. package/.mindforge/skills/sherlock/SKILL.md +203 -0
  199. package/.mindforge/skills/simplify-code/SKILL.md +187 -0
  200. package/.mindforge/skills/spike/SKILL.md +209 -0
  201. package/.mindforge/skills/subagent-driven-development/SKILL.md +364 -0
  202. package/.mindforge/skills/systematic-debugging/SKILL.md +379 -0
  203. package/.mindforge/skills/test-driven-development/SKILL.md +355 -0
  204. package/.mindforge/skills/web-pentest/SKILL.md +327 -0
  205. package/CHANGELOG.md +71 -0
  206. package/MINDFORGE.md +2 -2
  207. package/README.md +72 -3
  208. package/RELEASENOTES.md +109 -0
  209. package/bin/installer-core.js +6 -2
  210. package/bin/mindforge-cli.js +7 -0
  211. package/bin/workflows/workflow-runner.js +110 -0
  212. package/docs/commands-reference.md +25 -0
  213. package/docs/getting-started.md +42 -5
  214. package/package.json +2 -1
@@ -0,0 +1,481 @@
1
+ # Paper Types Beyond Empirical ML
2
+
3
+ Guide for writing non-standard paper types: theory papers, survey/tutorial papers, benchmark/dataset papers, and position papers. Each type has distinct structure, evidence standards, and venue expectations.
4
+
5
+ ---
6
+
7
+ ## Contents
8
+
9
+ - [Theory Papers](#theory-papers)
10
+ - [Survey and Tutorial Papers](#survey-and-tutorial-papers)
11
+ - [Benchmark and Dataset Papers](#benchmark-and-dataset-papers)
12
+ - [Position Papers](#position-papers)
13
+ - [Reproducibility and Replication Papers](#reproducibility-and-replication-papers)
14
+
15
+ ---
16
+
17
+ ## Theory Papers
18
+
19
+ ### When to Write a Theory Paper
20
+
21
+ Your paper should be a theory paper if:
22
+ - The main contribution is a theorem, bound, impossibility result, or formal characterization
23
+ - Experiments are supplementary validation, not the core evidence
24
+ - The contribution advances understanding rather than achieving state-of-the-art numbers
25
+
26
+ ### Structure
27
+
28
+ ```
29
+ 1. Introduction (1-1.5 pages)
30
+ - Problem statement and motivation
31
+ - Informal statement of main results
32
+ - Comparison to prior theoretical work
33
+ - Contribution bullets (state theorems informally)
34
+
35
+ 2. Preliminaries (0.5-1 page)
36
+ - Notation table
37
+ - Formal definitions
38
+ - Assumptions (numbered, referenced later)
39
+ - Known results you build on
40
+
41
+ 3. Main Results (2-3 pages)
42
+ - Theorem statements (formal)
43
+ - Proof sketches (intuition + key steps)
44
+ - Corollaries and special cases
45
+ - Discussion of tightness / optimality
46
+
47
+ 4. Experimental Validation (1-2 pages, optional but recommended)
48
+ - Do theoretical predictions match empirical behavior?
49
+ - Synthetic experiments that isolate the phenomenon
50
+ - Comparison to bounds from prior work
51
+
52
+ 5. Related Work (1 page)
53
+ - Theoretical predecessors
54
+ - Empirical work your theory explains
55
+
56
+ 6. Discussion & Open Problems (0.5 page)
57
+ - Limitations of your results
58
+ - Conjectures suggested by your analysis
59
+ - Concrete open problems
60
+
61
+ Appendix:
62
+ - Full proofs
63
+ - Technical lemmas
64
+ - Extended experimental details
65
+ ```
66
+
67
+ ### Writing Theorems
68
+
69
+ **Template for a well-stated theorem:**
70
+
71
+ ```latex
72
+ \begin{assumption}[Bounded Gradients]\label{assum:bounded-grad}
73
+ There exists $G > 0$ such that $\|\nabla f(x)\| \leq G$ for all $x \in \mathcal{X}$.
74
+ \end{assumption}
75
+
76
+ \begin{theorem}[Convergence Rate]\label{thm:convergence}
77
+ Under Assumptions~\ref{assum:bounded-grad} and~\ref{assum:smoothness},
78
+ Algorithm~\ref{alg:method} with step size $\eta = \frac{1}{\sqrt{T}}$ satisfies
79
+ \[
80
+ \frac{1}{T}\sum_{t=1}^{T} \mathbb{E}\left[\|\nabla f(x_t)\|^2\right]
81
+ \leq \frac{2(f(x_1) - f^*)}{\sqrt{T}} + \frac{G^2}{\sqrt{T}}.
82
+ \]
83
+ In particular, after $T = O(1/\epsilon^2)$ iterations, we obtain an
84
+ $\epsilon$-stationary point.
85
+ \end{theorem}
86
+ ```
87
+
88
+ **Rules for theorem statements:**
89
+ - State all assumptions explicitly (numbered, with names)
90
+ - Include the formal bound, not just "converges at rate O(·)"
91
+ - Add a plain-language corollary: "In particular, this means..."
92
+ - Compare to known bounds: "This improves over [prior work]'s bound of O(·) by a factor of..."
93
+
94
+ ### Proof Sketches
95
+
96
+ The proof sketch is the most important part of the main text for a theory paper. Reviewers evaluate whether you have genuine insight or just mechanical derivation.
97
+
98
+ **Good proof sketch pattern:**
99
+
100
+ ```latex
101
+ \begin{proof}[Proof Sketch of Theorem~\ref{thm:convergence}]
102
+ The key insight is that [one sentence describing the main idea].
103
+
104
+ The proof proceeds in three steps:
105
+ \begin{enumerate}
106
+ \item \textbf{Decomposition.} We decompose the error into [term A]
107
+ and [term B] using [technique]. This reduces the problem to
108
+ bounding each term separately.
109
+
110
+ \item \textbf{Bounding [term A].} By [assumption/lemma], [term A]
111
+ is bounded by $O(\cdot)$. The critical observation is that
112
+ [specific insight that makes this non-trivial].
113
+
114
+ \item \textbf{Combining.} Choosing $\eta = 1/\sqrt{T}$ balances
115
+ the two terms, yielding the stated bound.
116
+ \end{enumerate}
117
+
118
+ The full proof, including the technical lemma for Step 2,
119
+ appears in Appendix~\ref{app:proofs}.
120
+ \end{proof}
121
+ ```
122
+
123
+ **Bad proof sketch**: Restating the theorem with slightly different notation, or just saying "the proof follows standard techniques."
124
+
125
+ ### Full Proofs in Appendix
126
+
127
+ ```latex
128
+ \appendix
129
+ \section{Proofs}\label{app:proofs}
130
+
131
+ \subsection{Proof of Theorem~\ref{thm:convergence}}
132
+
133
+ We first establish two technical lemmas.
134
+
135
+ \begin{lemma}[Descent Lemma]\label{lem:descent}
136
+ Under Assumption~\ref{assum:smoothness}, for any step size $\eta \leq 1/L$:
137
+ \[
138
+ f(x_{t+1}) \leq f(x_t) - \frac{\eta}{2}\|\nabla f(x_t)\|^2 + \frac{\eta^2 L}{2}\|\nabla f(x_t)\|^2.
139
+ \]
140
+ \end{lemma}
141
+
142
+ \begin{proof}
143
+ [Complete proof with all steps]
144
+ \end{proof}
145
+
146
+ % Continue with remaining lemmas and main theorem proof
147
+ ```
148
+
149
+ ### Common Theory Paper Pitfalls
150
+
151
+ | Pitfall | Problem | Fix |
152
+ |---------|---------|-----|
153
+ | Assumptions too strong | Trivializes the result | Discuss which assumptions are necessary; prove lower bounds |
154
+ | No comparison to existing bounds | Reviewers can't assess contribution | Add a comparison table of bounds |
155
+ | Proof sketch is just the full proof shortened | Doesn't convey insight | Focus on the 1-2 key ideas; defer mechanics to appendix |
156
+ | No experimental validation | Reviewers question practical relevance | Add synthetic experiments testing predictions |
157
+ | Notation inconsistency | Confuses reviewers | Create a notation table in Preliminaries |
158
+ | Overly complex proofs where simple ones exist | Reviewers suspect error | Prefer clarity over generality |
159
+
160
+ ### Venues for Theory Papers
161
+
162
+ | Venue | Theory Acceptance Rate | Notes |
163
+ |-------|----------------------|-------|
164
+ | **NeurIPS** | Moderate | Values theory with practical implications |
165
+ | **ICML** | High | Strong theory track |
166
+ | **ICLR** | Moderate | Prefers theory with empirical validation |
167
+ | **COLT** | High | Theory-focused venue |
168
+ | **ALT** | High | Algorithmic learning theory |
169
+ | **STOC/FOCS** | For TCS-flavored results | If contribution is primarily combinatorial/algorithmic |
170
+ | **JMLR** | High | No page limit; good for long proofs |
171
+
172
+ ---
173
+
174
+ ## Survey and Tutorial Papers
175
+
176
+ ### When to Write a Survey
177
+
178
+ - A subfield has matured enough that synthesis is valuable
179
+ - You've identified connections between works that individual papers don't make
180
+ - Newcomers to the area have no good entry point
181
+ - The landscape has changed significantly since the last survey
182
+
183
+ **Warning**: Surveys require genuine expertise. A survey by someone outside the field, however comprehensive, will miss nuances and mischaracterize work.
184
+
185
+ ### Structure
186
+
187
+ ```
188
+ 1. Introduction (1-2 pages)
189
+ - Scope definition (what's included and excluded, and why)
190
+ - Motivation for the survey now
191
+ - Overview of organization (often with a figure)
192
+
193
+ 2. Background / Problem Formulation (1-2 pages)
194
+ - Formal problem definition
195
+ - Notation (used consistently throughout)
196
+ - Historical context
197
+
198
+ 3. Taxonomy (the core contribution)
199
+ - Organize methods along meaningful axes
200
+ - Present taxonomy as a figure or table
201
+ - Each category gets a subsection
202
+
203
+ 4. Detailed Coverage (bulk of paper)
204
+ - For each category: representative methods, key ideas, strengths/weaknesses
205
+ - Comparison tables within and across categories
206
+ - Don't just describe — analyze and compare
207
+
208
+ 5. Experimental Comparison (if applicable)
209
+ - Standardized benchmark comparison
210
+ - Fair hyperparameter tuning for all methods
211
+ - Not always feasible but significantly strengthens the survey
212
+
213
+ 6. Open Problems & Future Directions (1-2 pages)
214
+ - Unsolved problems the field should tackle
215
+ - Promising but underexplored directions
216
+ - This section is what makes a survey a genuine contribution
217
+
218
+ 7. Conclusion
219
+ ```
220
+
221
+ ### Taxonomy Design
222
+
223
+ The taxonomy is the core intellectual contribution of a survey. It should:
224
+
225
+ - **Be meaningful**: Categories should correspond to real methodological differences, not arbitrary groupings
226
+ - **Be exhaustive**: Every relevant paper should fit somewhere
227
+ - **Be mutually exclusive** (ideally): Each paper belongs to one primary category
228
+ - **Have informative names**: "Attention-based methods" > "Category 3"
229
+ - **Be visualized**: A figure showing the taxonomy is almost always helpful
230
+
231
+ **Example taxonomy axes for "LLM Reasoning" survey:**
232
+ - By technique: chain-of-thought, tree-of-thought, self-consistency, tool use
233
+ - By training requirement: prompting-only, fine-tuned, RLHF
234
+ - By reasoning type: mathematical, commonsense, logical, causal
235
+
236
+ ### Writing Standards
237
+
238
+ - **Cite every relevant paper** — authors will check if their work is included
239
+ - **Be fair** — don't dismiss methods you don't prefer
240
+ - **Synthesize, don't just list** — identify patterns, trade-offs, open questions
241
+ - **Include a comparison table** — even if qualitative (features/properties checklist)
242
+ - **Update before submission** — check arXiv for papers published since you started writing
243
+
244
+ ### Venues for Surveys
245
+
246
+ | Venue | Notes |
247
+ |-------|-------|
248
+ | **TMLR** (Survey track) | Dedicated survey submissions; no page limit |
249
+ | **JMLR** | Long format, well-respected |
250
+ | **Foundations and Trends in ML** | Invited, but can be proposed |
251
+ | **ACM Computing Surveys** | Broad CS audience |
252
+ | **arXiv** (standalone) | No peer review but high visibility if well-done |
253
+ | **Conference tutorials** | Present as tutorial at NeurIPS/ICML/ACL; write up as paper |
254
+
255
+ ---
256
+
257
+ ## Benchmark and Dataset Papers
258
+
259
+ ### When to Write a Benchmark Paper
260
+
261
+ - Existing benchmarks don't measure what you think matters
262
+ - A new capability has emerged with no standard evaluation
263
+ - Existing benchmarks are saturated (all methods score >95%)
264
+ - You want to standardize evaluation in a fragmented subfield
265
+
266
+ ### Structure
267
+
268
+ ```
269
+ 1. Introduction
270
+ - What evaluation gap does this benchmark fill?
271
+ - Why existing benchmarks are insufficient
272
+
273
+ 2. Task Definition
274
+ - Formal task specification
275
+ - Input/output format
276
+ - Evaluation criteria (what makes a good answer?)
277
+
278
+ 3. Dataset Construction
279
+ - Data source and collection methodology
280
+ - Annotation process (if human-annotated)
281
+ - Quality control measures
282
+ - Dataset statistics (size, distribution, splits)
283
+
284
+ 4. Baseline Evaluation
285
+ - Run strong baselines (don't just report random/majority)
286
+ - Show the benchmark is challenging but not impossible
287
+ - Human performance baseline (if feasible)
288
+
289
+ 5. Analysis
290
+ - Error analysis on baselines
291
+ - What makes items hard/easy?
292
+ - Construct validity: does the benchmark measure what you claim?
293
+
294
+ 6. Intended Use & Limitations
295
+ - What should this benchmark be used for?
296
+ - What should it NOT be used for?
297
+ - Known biases or limitations
298
+
299
+ 7. Datasheet (Appendix)
300
+ - Full datasheet for datasets (Gebru et al.)
301
+ ```
302
+
303
+ ### Evidence Standards
304
+
305
+ Reviewers evaluate benchmarks on different criteria than methods papers:
306
+
307
+ | Criterion | What Reviewers Check |
308
+ |-----------|---------------------|
309
+ | **Novelty of evaluation** | Does this measure something existing benchmarks don't? |
310
+ | **Construct validity** | Does the benchmark actually measure the stated capability? |
311
+ | **Difficulty calibration** | Not too easy (saturated) or too hard (random performance) |
312
+ | **Annotation quality** | Agreement metrics, annotator qualifications, guidelines |
313
+ | **Documentation** | Datasheet, license, maintenance plan |
314
+ | **Reproducibility** | Can others use this benchmark easily? |
315
+ | **Ethical considerations** | Bias analysis, consent, sensitive content handling |
316
+
317
+ ### Dataset Documentation (Required)
318
+
319
+ Follow the Datasheets for Datasets framework (Gebru et al., 2021):
320
+
321
+ ```
322
+ Datasheet Questions:
323
+ 1. Motivation
324
+ - Why was this dataset created?
325
+ - Who created it and on behalf of whom?
326
+ - Who funded the creation?
327
+
328
+ 2. Composition
329
+ - What do the instances represent?
330
+ - How many instances are there?
331
+ - Does it contain all possible instances or a sample?
332
+ - Is there a label? If so, how was it determined?
333
+ - Are there recommended data splits?
334
+
335
+ 3. Collection Process
336
+ - How was the data collected?
337
+ - Who was involved in collection?
338
+ - Over what timeframe?
339
+ - Was ethical review conducted?
340
+
341
+ 4. Preprocessing
342
+ - What preprocessing was done?
343
+ - Was the "raw" data saved?
344
+
345
+ 5. Uses
346
+ - What tasks has this been used for?
347
+ - What should it NOT be used for?
348
+ - Are there other tasks it could be used for?
349
+
350
+ 6. Distribution
351
+ - How is it distributed?
352
+ - Under what license?
353
+ - Are there any restrictions?
354
+
355
+ 7. Maintenance
356
+ - Who maintains it?
357
+ - How can users contact the maintainer?
358
+ - Will it be updated? How?
359
+ - Is there an erratum?
360
+ ```
361
+
362
+ ### Venues for Benchmark Papers
363
+
364
+ | Venue | Notes |
365
+ |-------|-------|
366
+ | **NeurIPS Datasets & Benchmarks** | Dedicated track; best venue for this |
367
+ | **ACL** (Resource papers) | NLP-focused datasets |
368
+ | **LREC-COLING** | Language resources |
369
+ | **TMLR** | Good for benchmarks with analysis |
370
+
371
+ ---
372
+
373
+ ## Position Papers
374
+
375
+ ### When to Write a Position Paper
376
+
377
+ - You have an argument about how the field should develop
378
+ - You want to challenge a widely-held assumption
379
+ - You want to propose a research agenda based on analysis
380
+ - You've identified a systematic problem in current methodology
381
+
382
+ ### Structure
383
+
384
+ ```
385
+ 1. Introduction
386
+ - State your thesis clearly in the first paragraph
387
+ - Why this matters now
388
+
389
+ 2. Background
390
+ - Current state of the field
391
+ - Prevailing assumptions you're challenging
392
+
393
+ 3. Argument
394
+ - Present your thesis with supporting evidence
395
+ - Evidence can be: empirical data, theoretical analysis, logical argument,
396
+ case studies, historical precedent
397
+ - Be rigorous — this isn't an opinion piece
398
+
399
+ 4. Counterarguments
400
+ - Engage seriously with the strongest objections
401
+ - Explain why they don't undermine your thesis
402
+ - Concede where appropriate — it strengthens credibility
403
+
404
+ 5. Implications
405
+ - What should the field do differently?
406
+ - Concrete research directions your thesis suggests
407
+ - How should evaluation/methodology change?
408
+
409
+ 6. Conclusion
410
+ - Restate thesis
411
+ - Call to action
412
+ ```
413
+
414
+ ### Writing Standards
415
+
416
+ - **Lead with the strongest version of your argument** — don't hedge in the first paragraph
417
+ - **Engage with counterarguments honestly** — the best position papers address the strongest objections, not the weakest
418
+ - **Provide evidence** — a position paper without evidence is an editorial
419
+ - **Be concrete** — "the field should do X" is better than "more work is needed"
420
+ - **Don't straw-man existing work** — characterize opposing positions fairly
421
+
422
+ ### Venues for Position Papers
423
+
424
+ | Venue | Notes |
425
+ |-------|-------|
426
+ | **ICML** (Position track) | Dedicated track for position papers |
427
+ | **NeurIPS** (Workshop papers) | Workshops often welcome position pieces |
428
+ | **ACL** (Theme papers) | When your position aligns with the conference theme |
429
+ | **TMLR** | Accepts well-argued position papers |
430
+ | **CACM** | For broader CS audience |
431
+
432
+ ---
433
+
434
+ ## Reproducibility and Replication Papers
435
+
436
+ ### When to Write a Reproducibility Paper
437
+
438
+ - You attempted to reproduce a published result and succeeded/failed
439
+ - You want to verify claims under different conditions
440
+ - You've identified that a popular method's performance depends on unreported details
441
+
442
+ ### Structure
443
+
444
+ ```
445
+ 1. Introduction
446
+ - What paper/result are you reproducing?
447
+ - Why is this reproduction valuable?
448
+
449
+ 2. Original Claims
450
+ - State the exact claims from the original paper
451
+ - What evidence was provided?
452
+
453
+ 3. Methodology
454
+ - Your reproduction approach
455
+ - Differences from original (if any) and why
456
+ - What information was missing from the original paper?
457
+
458
+ 4. Results
459
+ - Side-by-side comparison with original results
460
+ - Statistical comparison (confidence intervals overlap?)
461
+ - What reproduced and what didn't?
462
+
463
+ 5. Analysis
464
+ - If results differ: why? What's sensitive?
465
+ - Hidden hyperparameters or implementation details?
466
+ - Robustness to seed, hardware, library versions?
467
+
468
+ 6. Recommendations
469
+ - For original authors: what should be clarified?
470
+ - For practitioners: what to watch out for?
471
+ - For the field: what reproducibility lessons emerge?
472
+ ```
473
+
474
+ ### Venues
475
+
476
+ | Venue | Notes |
477
+ |-------|-------|
478
+ | **ML Reproducibility Challenge** | Annual challenge at NeurIPS |
479
+ | **ReScience** | Journal dedicated to replications |
480
+ | **TMLR** | Accepts reproductions with analysis |
481
+ | **Workshops** | Reproducibility workshops at major conferences |