superlab 0.1.69 → 0.1.70

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -51,6 +51,21 @@ SOURCE_SECTION_PATH_MARKERS = (
51
51
  SOURCE_SECTION_CITATION_MARKERS = ("Citation:", "引用:")
52
52
  SOURCE_SECTION_ROLE_MARKERS = ("What it established:", "What it does:", "What it measures:", "做了什么:", "衡量什么:")
53
53
  SOURCE_SECTION_LIMITATION_MARKERS = ("Limitation", "局限")
54
+ METRIC_GUIDE_DETAIL_MARKERS = {
55
+ "evaluation target": ("Evaluation target:", "What is evaluated:", "评估对象:", "评估什么:"),
56
+ "test-set prediction": ("Test-set prediction used:", "Prediction used:", "测试集预测:", "预测量:"),
57
+ "ranking or grouping": ("Ranking or grouping step:", "Ranking step:", "Grouping step:", "排序或分组:", "排序步骤:", "分组步骤:"),
58
+ "calculation sketch": (
59
+ "Aggregation / calculation sketch:",
60
+ "Calculation sketch:",
61
+ "Approximate calculation:",
62
+ "大致计算:",
63
+ "近似公式:",
64
+ "聚合方式:",
65
+ ),
66
+ "direction and scale": ("Direction and scale:", "Metric direction:", "方向与尺度:", "方向:", "越高/越低:"),
67
+ "comparability boundary": ("Comparability boundary:", "What not to compare:", "可比性边界:", "不能比较:"),
68
+ }
54
69
 
55
70
 
56
71
  def parse_args():
@@ -99,6 +114,35 @@ def validate_source_sections(text: str, label: str) -> list[str]:
99
114
  return issues
100
115
 
101
116
 
117
def has_marker_with_value(body: str, markers: tuple[str, ...]) -> bool:
    """Report whether any line of ``body`` has a marker followed by real content.

    Each line is stripped and checked against every marker. The text after
    the first occurrence of a marker is the candidate value; it counts only
    when it is non-empty and is not one of the known placeholder tokens.

    Args:
        body: Section text to scan, line by line.
        markers: Label strings (for example ``"Evaluation target:"``) that
            may introduce the value.

    Returns:
        ``True`` as soon as one line carries a marker with a usable value,
        otherwise ``False``.
    """
    # Values that mean "not filled in yet"; the comparison is exact and
    # case-sensitive.
    placeholders = {"-", "—", "TODO", "TBD", "待补", "待定"}
    for raw_line in body.splitlines():
        candidate = raw_line.strip()
        for marker in markers:
            _, found, remainder = candidate.partition(marker)
            if not found:
                continue
            remainder = remainder.strip()
            if remainder and remainder not in placeholders:
                return True
    return False
127
+
128
+
129
def validate_metric_guide_detail(text: str, label: str) -> list[str]:
    """Check that the 'Metric Guide' section fills in every computation detail.

    The section body is obtained through ``extract_section_body`` using the
    headings registered under ``REPORT_REQUIRED_SECTIONS["Metric Guide"]``.
    When that body is empty the check is skipped and no issue is reported.

    Args:
        text: Full report text.
        label: Name used for the document in the issue message.

    Returns:
        An empty list when every detail in ``METRIC_GUIDE_DETAIL_MARKERS``
        has a marker with a value, otherwise a single-item list naming the
        missing details in dictionary order.
    """
    body = extract_section_body(text, REPORT_REQUIRED_SECTIONS["Metric Guide"])
    if not body:
        return []

    absent: list[str] = []
    for detail_name, markers in METRIC_GUIDE_DETAIL_MARKERS.items():
        if has_marker_with_value(body, markers):
            continue
        absent.append(detail_name)

    if absent:
        return [
            f"{label} section 'Metric Guide' must explain metric computation details: "
            f"{', '.join(absent)}"
        ]
    return []
144
+
145
+
102
146
  def validate(path_str: str, required_sections: dict[str, list[str]], label: str) -> list[str]:
103
147
  path = Path(path_str)
104
148
  if not path.exists():
@@ -108,7 +152,7 @@ def validate(path_str: str, required_sections: dict[str, list[str]], label: str)
108
152
  if missing:
109
153
  return [f"{label} is missing required sections: {', '.join(missing)}"]
110
154
  if label == "report.md":
111
- return validate_source_sections(text, label)
155
+ return validate_source_sections(text, label) + validate_metric_guide_detail(text, label)
112
156
  return []
113
157
 
114
158
 
@@ -38,6 +38,7 @@ REQUIRED_TABLE_NOTE_MARKERS = (
38
38
  "% Important caveat:",
39
39
  )
40
40
  WIDTH_CONTROL_NOTE_MARKER = "% Width control:"
41
+ WIDE_PLAIN_TABULAR_COLUMN_LIMIT = 7
41
42
  TABLE_ABBREVIATION_EXCEPTIONS = {"TODO", "TBD"}
42
43
  PLACEHOLDER_TABLE_NOTE_PREFIXES = (
43
44
  "explain ",
@@ -97,6 +98,109 @@ def contains_any(text: str, needles: tuple[str, ...]) -> bool:
97
98
  return any(needle.lower() in lowered for needle in needles)
98
99
 
99
100
 
101
+ def read_braced_group(text: str, start: int) -> tuple[str, int] | None:
102
+ if start >= len(text) or text[start] != "{":
103
+ return None
104
+ depth = 0
105
+ content_start = start + 1
106
+ for index in range(start, len(text)):
107
+ char = text[index]
108
+ if char == "{":
109
+ depth += 1
110
+ elif char == "}":
111
+ depth -= 1
112
+ if depth == 0:
113
+ return text[content_start:index], index + 1
114
+ return None
115
+
116
+
117
def skip_whitespace(text: str, index: int) -> int:
    """Return the first position at or after ``index`` that is not whitespace.

    Args:
        text: Text being scanned.
        index: Position to start from.

    Returns:
        The index of the first non-whitespace character, ``len(text)`` when
        only whitespace remains, or ``index`` unchanged when it already lies
        at or beyond the end of ``text``.
    """
    for position in range(index, len(text)):
        if not text[position].isspace():
            return position
    # Either the scan ran off the end, or ``index`` was already past it.
    return max(index, len(text))
121
+
122
+
123
def extract_plain_tabular_specs(text: str) -> list[str]:
    """Collect the column specification of every plain ``tabular`` environment.

    Only the literal ``\\begin{tabular}`` is matched, so ``tabularx`` and
    ``tabular*`` openings are not picked up. The optional vertical-position
    argument (``\\begin{tabular}[t]{...}``) is stepped over so that such
    tables are inspected as well.

    Args:
        text: LaTeX source to scan.

    Returns:
        The column-spec strings in order of appearance. An opening without a
        balanced ``{...}`` spec is skipped.
    """
    specs: list[str] = []
    needle = r"\begin{tabular}"
    search_from = 0
    while True:
        index = text.find(needle, search_from)
        if index == -1:
            return specs
        spec_start = skip_whitespace(text, index + len(needle))
        if spec_start < len(text) and text[spec_start] == "[":
            # Optional [pos] argument sits between the name and the spec.
            closing = text.find("]", spec_start)
            if closing != -1:
                spec_start = skip_whitespace(text, closing + 1)
        group = read_braced_group(text, spec_start)
        if group is not None:
            specs.append(group[0])
            search_from = group[1]
        else:
            # No usable spec here; resume just past this opening.
            search_from = index + len(needle)
138
+
139
+
140
def count_column_spec(spec: str) -> tuple[int, bool]:
    """Count the columns declared by a LaTeX column specification.

    Recognised tokens:

    * ``l``, ``c``, ``r`` count as one column each.
    * ``X`` counts as one column and marks the spec as width-aware.
    * ``p``, ``m``, ``b`` count as one column, mark the spec as width-aware,
      and have their ``{...}`` argument skipped.
    * ``*{n}{cols}`` adds ``n`` times the count of ``cols``; a repeat count
      that is not an integer is treated as ``1``.
    * ``@``, ``!``, ``<``, ``>`` have their ``{...}`` argument skipped and
      add no column.

    Every other character is ignored.

    Args:
        spec: The text between the braces of the column specification.

    Returns:
        ``(column_count, has_width_aware_column)``.
    """
    total = 0
    width_aware = False
    cursor = 0
    while cursor < len(spec):
        token = spec[cursor]

        if token == "*":
            cursor = skip_whitespace(spec, cursor + 1)
            times_group = read_braced_group(spec, cursor)
            if times_group is None:
                # Malformed repeat: carry on from the character after ``*``.
                continue
            times_text, cursor = times_group
            cursor = skip_whitespace(spec, cursor)
            body_group = read_braced_group(spec, cursor)
            if body_group is None:
                continue
            body_spec, cursor = body_group
            try:
                times = int(times_text.strip())
            except ValueError:
                times = 1
            inner_total, inner_width_aware = count_column_spec(body_spec)
            total += times * inner_total
            width_aware = width_aware or inner_width_aware
            continue

        if token in ("l", "c", "r", "X"):
            total += 1
            if token == "X":
                width_aware = True
            cursor += 1
            continue

        if token in ("p", "m", "b", "@", "!", "<", ">"):
            if token in ("p", "m", "b"):
                total += 1
                width_aware = True
            # Step over the braced argument so its letters are not counted.
            cursor = skip_whitespace(spec, cursor + 1)
            if cursor < len(spec) and spec[cursor] == "{":
                argument = read_braced_group(spec, cursor)
                cursor = argument[1] if argument is not None else cursor + 1
            continue

        cursor += 1
    return total, width_aware
190
+
191
+
192
def has_width_control_command(text: str) -> bool:
    """Report whether ``text`` contains any width-control LaTeX construct.

    Args:
        text: LaTeX source to inspect.

    Returns:
        ``True`` when the text contains a ``tabularx`` or ``tabular*``
        opening, a ``\\resizebox{`` call, or a ``\\tabcolsep`` length
        assignment; ``False`` otherwise.
    """
    width_control_tokens = (
        r"\begin{tabularx}",
        r"\begin{tabular*}",
        r"\resizebox{",
        r"\setlength{\tabcolsep}",
    )
    for token in width_control_tokens:
        if token in text:
            return True
    return False
202
+
203
+
100
204
  def find_workflow_config(start_path: Path) -> Path | None:
101
205
  search_roots = [start_path, *start_path.parents]
102
206
  for root in search_roots:
@@ -315,6 +419,18 @@ def check_table_file(path: Path, issues: list[str], label: str):
315
419
  continue
316
420
  if value < 3.0:
317
421
  issues.append(f"{label} sets \\tabcolsep below the safe range for paper-facing main tables")
422
+ for spec in extract_plain_tabular_specs(text):
423
+ column_count, has_width_aware_column = count_column_spec(spec)
424
+ if (
425
+ column_count >= WIDE_PLAIN_TABULAR_COLUMN_LIMIT
426
+ and not has_width_aware_column
427
+ and not has_width_control_command(text)
428
+ ):
429
+ issues.append(
430
+ f"{label} uses a wide plain tabular layout ({column_count} columns) without a width-aware strategy; "
431
+ "use tabularx or p columns, split the table, move secondary metrics to appendix, "
432
+ "or document last-resort width control"
433
+ )
318
434
 
319
435
 
320
436
  def check_figure_file(path: Path, issues: list[str], label: str):
@@ -241,6 +241,22 @@ INTERNAL_EXPERIMENT_PROVENANCE_PHRASES = (
241
241
  "调参运行",
242
242
  "调参轮次",
243
243
  )
244
# Regular expressions for sentences that read like internal experiment
# planning (future holdouts, gating, payload freezing, API budget notes).
# They are applied with ``re.IGNORECASE`` via ``re.search``.
INTERNAL_EXPERIMENT_PLANNING_PATTERNS = (
    r"current\s+[\d.]+\s+only\s+shows?.*need(?:s|ed)?\s+(?:a\s+)?(?:new\s+)?holdout",
    r"(?:new|additional)\s+holdout\s+(?:and|or)\s+(?:more\s+)?natural(?:ized)?\s+(?:payload|attack|statement)",
    r"(?:small[- ]batch|pilot[- ]batch).*(?:gate|gating)",
    r"(?:freeze|freezing).*(?:payload|attack statement|trigger)",
    # "API" must stand alone as a word: a bare "api" also matches inside
    # "rapid" or "therapist". ASCII-letter lookarounds are used instead of
    # ``\b`` so the token is still found when it directly touches CJK text.
    r"(?<![a-z])apis?(?![a-z]).*(?:budget|cost|scale)",
    r"新增\s*(?:holdout|外部|样本|实验).*验证",
    r"还需要\s*新增.*验证",
    r"后文.*边界",
    r"当前\s*[\d.]+\s*只能说明.*不能外推.*(?:还需要|需要)",
    r"小批量.*(?:门控|gate)",
    r"(?:冻结|固定).*(?:payload|载荷|攻击语句|触发语句)",
    r"(?:不能|不得).*边跑边调",
    r"API\s*(?:规模|预算|成本)",
    r"(?:按设计|设计上).*(?:失败|不通过).*(?:过拟合|调参)",
)
244
260
  INTERNAL_CONFIG_LABEL_PATTERN = re.compile(
245
261
  r"\b[a-z]{1,4}\d+(?:[-_][a-z]?\d+(?:\.\d+)?){1,4}\b",
246
262
  flags=re.IGNORECASE,
@@ -265,6 +281,10 @@ def check_common_section_gate_risks(text: str, issues: list[str]):
265
281
  issues.append(
266
282
  "reader-facing prose appears to contain internal experiment provenance or tuning/config labels; move run provenance to workflow notes or map it to paper-facing diagnostic terminology"
267
283
  )
284
+ if any(re.search(pattern, prose_text, flags=re.IGNORECASE) for pattern in INTERNAL_EXPERIMENT_PLANNING_PATTERNS):
285
+ issues.append(
286
+ "reader-facing prose appears to contain internal experiment planning or holdout-expansion rationale; keep plans, gates, payload-freezing notes, and future validation logistics in workflow artifacts instead of the manuscript"
287
+ )
268
288
  if contains_any(
269
289
  prose_text,
270
290
  (
@@ -51,6 +51,12 @@
51
51
  - Primary metric plain-language explanation:
52
52
  - Secondary metric plain-language explanation:
53
53
  - Health or support metrics and why they are not the main claim:
54
+ - Evaluation target:
55
+ - Test-set prediction used:
56
+ - Ranking or grouping step:
57
+ - Aggregation / calculation sketch:
58
+ - Direction and scale:
59
+ - Comparability boundary:
54
60
 
55
61
  ## Background Sources
56
62
 
@@ -17,6 +17,12 @@
17
17
  - Primary metric plain-language explanation:
18
18
  - Secondary metric plain-language explanation:
19
19
  - Health or support metrics and how to read them:
20
+ - Evaluation target:
21
+ - Test-set prediction used:
22
+ - Ranking or grouping step:
23
+ - Aggregation / calculation sketch:
24
+ - Direction and scale:
25
+ - Comparability boundary:
20
26
 
21
27
  ## Final Performance Summary
22
28
 
@@ -2,18 +2,18 @@
2
2
  \caption{One-sentence message of the table and the evaluation protocol.}
3
3
  \label{tab:placeholder}
4
4
  \centering
5
- \begin{tabular}{lcc}
5
+ \begin{tabularx}{\linewidth}{>{\raggedright\arraybackslash}Xcc}
6
6
  \toprule
7
7
  Method & Metric 1 $\uparrow$ & Metric 2 $\uparrow$ \\
8
8
  \midrule
9
9
  Ours & 0.0000 & 0.0000 \\
10
10
  Baseline & 0.0000 & 0.0000 \\
11
11
  \bottomrule
12
- \end{tabular}
12
+ \end{tabularx}
13
13
  % Rows: explain what each row represents.
14
14
  % Columns: explain what each column represents and its direction.
15
15
  % Metric definitions: expand local abbreviations, units, denominators, or event conditions.
16
16
  % Comparison scope: explain which setting, split, attack family, or benchmark scope this table covers.
17
17
  % Important caveat: state any omitted metrics, zero-valued metrics, or appendix-only reporting decision.
18
- % Width control: first shorten headers, move secondary metrics out of the main table, and reduce or split columns; only then adjust \setlength{\tabcolsep}{...} conservatively or use \resizebox{\linewidth}{!}{...} as a documented last resort.
18
+ % Width control: default to bounded columns with tabularx or p{...}; first shorten headers, move secondary metrics out of the main table, and reduce or split columns; only then adjust \setlength{\tabcolsep}{...} conservatively or use \resizebox{\linewidth}{!}{...} as a documented last resort.
19
19
  \end{table}
@@ -4,6 +4,8 @@
4
4
  \usepackage{hyperref}
5
5
  \usepackage{graphicx}
6
6
  \usepackage{booktabs}
7
+ \usepackage{array}
8
+ \usepackage{tabularx}
7
9
 
8
10
  \title{Paper Title}
9
11
  \author{Author Name}
@@ -86,6 +86,9 @@
86
86
  - Were all abbreviations expanded at local first mention:
87
87
  - Did each main table include a local table note:
88
88
  - Can a reader interpret rows and columns without chasing Method:
89
+ - Table width audit:
90
+ - Did any main table use a wide plain `tabular` layout:
91
+ - If width control was needed, was the table first shortened, split, moved partly to appendix, or converted to `tabularx` / bounded columns before using `\tabcolsep` or `\resizebox`:
89
92
  - If this section used canonical short names before their defining section, was a local naming bridge added:
90
93
  - Did model and ablation labels stay canonical instead of drifting into narrative aliases:
91
94
 
@@ -141,6 +144,7 @@
141
144
  - Did the round avoid copying reference wording, claims, metrics, captions, or conclusions:
142
145
  - Did final prose avoid service-style or AI-assistant meta language:
143
146
  - Did final prose avoid workflow-only placeholder language:
147
+ - Did final prose avoid internal experiment planning, future-holdout logistics, gates, payload-freezing notes, API-budget notes, and automation triage language:
144
148
  - Validator command and result:
145
149
 
146
150
  ## Decision
@@ -210,6 +210,7 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
210
210
  - Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, `.lab/context/evidence-index.md`, and `.lab/context/data-decisions.md` before drafting.
211
211
  - Read `.lab/context/eval-protocol.md` before choosing tables, thresholds, or final result framing.
212
212
  - Keep metric definitions, comparison semantics, and implementation references anchored to the approved evaluation protocol instead of re-deriving them during reporting.
213
+ - In `report.md`, explain each primary metric with a computation guide: what is evaluated, which test-set predictions or scores are used, whether examples are sorted, grouped, bucketed, or paired, how the value is aggregated or approximately calculated, what direction and scale mean, and what cannot be compared across datasets, splits, or implementations.
213
214
  - Aggregate them with `.lab/.managed/scripts/summarize_iterations.py`.
214
215
  - Write the final document with `.lab/.managed/templates/final-report.md`, the managed table summary with `.lab/.managed/templates/main-tables.md`, and the internal handoff with `.lab/.managed/templates/artifact-status.md`.
215
216
  - Keep failed attempts and limitations visible.
@@ -272,10 +273,12 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
272
273
  - Use the same metric names across Method, Experiments, captions, table headers, table notes, and result summaries; remove forbidden aliases from reader-facing LaTeX instead of letting legacy metric names drift.
273
274
  - Run `.lab/.managed/scripts/validate_metric_glossary.py` in metric-bearing draft, final-draft, or export rounds and record the result in the latest write iteration artifact.
274
275
  - Do not treat `\resizebox{\linewidth}{!}{...}` as the default main-table fit strategy.
275
- - Fit paper-facing main tables by redesign first: shorten headers, move secondary metrics out of the main table, reduce or split columns, then adjust `\tabcolsep` conservatively; only use `\resizebox` as a last resort and document why.
276
+ - Wide plain `tabular` layouts with many columns are not manuscript-ready by default; prefer `tabularx` or bounded `p{...}` columns for text-heavy or multi-metric tables.
277
+ - Fit paper-facing main tables by redesign first: shorten headers, move secondary metrics out of the main table, reduce or split columns, prefer `tabularx` or bounded columns, then adjust `\tabcolsep` conservatively; only use `\resizebox` as a last resort and document why.
276
278
  - Keep `\tabcolsep` adjustments conservative and avoid shrinking below a roughly readable floor for paper-facing main tables.
277
279
  - Do not rely on `\scriptsize` or `\tiny` as the default way to make a main table fit.
278
280
  - Keep internal identifiers, tuning-run labels, probe names, config strings, rerun ids, and package labels out of prose unless they are mapped once for the reader and then moved back out of prose.
281
+ - Keep internal experiment planning out of manuscript prose: future holdout expansion, small-batch gates, payload freezing, API budgets, automation decisions, and overfitting triage logic belong in lab artifacts, not paper-facing sections.
279
282
  - Do not rely on unexplained jargon density as a substitute for academic tone.
280
283
  - Bind each claim to evidence from `report`, iteration reports, or normalized summaries.
281
284
  - Use the write-stage contract in `.codex/skills/lab/stages/write.md` or `.claude/skills/lab/stages/write.md` as the single source of truth for template choice, paper-plan requirements, section-specific references, validator calls, asset coverage, and final manuscript gates.
@@ -122,6 +122,7 @@ These are paper-facing defaults. They are not project-specific branding rules.
122
122
  - Self-evaluations such as "结果也很清楚", "the defense results are very clear", or "the table is self-explanatory".
123
123
  - Layout-process commentary in scientific prose, such as "由于表列较多,这里采用页宽自适应排版" or "we use page-width adaptive layout here".
124
124
  - Claims that a table "proves" something when the evidence only supports a bounded empirical result.
125
+ - Internal experiment-planning prose, such as "还需要新增 holdout", "小批量门控", "冻结 payload", "不能边跑边调", "API 规模估计", or "if all scores are 1.0000, treat it as overfitting".
125
126
  - Service-style or AI-assistant meta language such as "用户说", "按你的要求", "我来解释", "let me explain", or "as requested by the user".
126
127
  - Workflow-only placeholder language such as "图的意图", "资产意图", "占位符", "workflow-language", or "sync this wording".
127
128
 
@@ -10,6 +10,7 @@
10
10
  - method overview
11
11
  - selected metrics summary
12
12
  - plain-language metric guide
13
+ - metric computation guide that explains what is evaluated, which test-set predictions are used, whether examples are sorted or grouped, how values are aggregated or approximately calculated, metric direction and scale, and comparability boundaries
13
14
  - background sources
14
15
  - method and baseline sources
15
16
  - metric sources
@@ -52,6 +53,8 @@
52
53
  - Do not restate metric definitions, baseline behavior, or comparison implementations from memory; use the approved evaluation protocol and its recorded sources.
53
54
  - Carry the approved `Primary metrics`, `Secondary metrics`, and `Required terminal evidence` into both the report and the managed main-tables artifact.
54
55
  - Explain the selected primary and secondary metrics in plain language for the user: what each metric measures, whether higher or lower is better, and whether it is a main result metric or only a health/support metric.
56
+ - For every primary metric, also explain enough of the computation for a collaborator to reproduce the idea without reading code: what is evaluated, which test-set predictions or scores are used, whether the examples are sorted, bucketed, grouped, or paired, how the resulting values are aggregated or approximately calculated, what direction and scale mean, and which comparisons are invalid across datasets, splits, or metric implementations.
57
+ - If a metric depends on ranking, the report must name the ranking score and the order. If it depends on a contrast, the report must name the compared conditions or groups. If it depends on an average, rate, area, threshold crossing, or recovery amount, the report must give a simple calculation sketch.
55
58
  - If coverage, completeness, confidence, or similar health metrics appear, explicitly say that they describe experimental reliability rather than the main scientific effect.
56
59
  - Pull the core background references, method or baseline references, and metric references out of the approved evaluation protocol instead of hiding them in `.lab/context/*`.
57
60
  - Treat `report.md` as an external-review-ready memo. Source sections must not rely on local file paths or internal provenance notes; they must give a few human-readable anchor references instead.
@@ -165,6 +165,8 @@ Do not enter prose polish until the current section has passed the reference-con
165
165
  - Do not use labels containing `_` or `-` in reader-facing prose.
166
166
  - Keep internal identifiers, config keys, and experiment package labels out of reader-facing prose unless they are mapped once for the reader and then moved back out of prose.
167
167
  - Keep run provenance such as tuning-run labels, probe names, internal config strings, rerun ids, and package labels out of reader-facing prose. If the evidence is useful, rewrite it as a bounded paper-facing diagnostic or move the raw provenance to workflow notes or appendix metadata.
168
+ - Keep internal experiment planning out of reader-facing prose. Do not write paper sentences that explain future holdout expansion, small-batch gates, payload freezing, API budget, "if all scores are 1.0000 then treat as overfitting", or why a next automation round is needed.
169
+ - When an experiment boundary matters, report only the scientific scope already supported by the evidence. Put the operational plan for collecting new attacks, new papers, new markers, or additional holdout cases into `.lab/changes/`, `.lab/iterations/`, or report artifacts, not into manuscript sections.
168
170
  - Do not use unexplained terminology density as a substitute for academic tone.
169
171
  - Keep service-style or AI-assistant meta language out of manuscript prose. Phrases such as "用户说", "按你的要求", "我来解释", "下面我", "this version", or "as requested by the user" belong in workflow notes, not in paper-facing sections, captions, table notes, or analysis assets.
170
172
  - Keep workflow-only placeholder language out of manuscript prose. Phrases such as "图的意图", "资产意图", "占位符", "workflow-language", "translation layer", or "sync this wording" belong in authoring artifacts, not in reader-facing LaTeX.
@@ -178,10 +180,12 @@ Do not enter prose polish until the current section has passed the reference-con
178
180
  - If a metric's denominator, event condition, score scale, or comparison scope differs by setting, define a separate entry or explicitly scope the metric in `.lab/writing/metric-glossary.md`.
179
181
  - Deprecated or forbidden metric aliases must be removed from reader-facing LaTeX instead of explained away locally.
180
182
  - Do not treat `\resizebox{\linewidth}{!}{...}` as the default way to fit a main table.
181
- - Main-table width control should follow this order: shorten headers while preserving local explanations, move secondary metrics to appendix-only, reduce or split columns, adjust `\tabcolsep` conservatively, and only then consider `\resizebox` as a last resort.
183
+ - Wide plain `tabular` layouts with many columns are not manuscript-ready by default; final/export validation should force a width-aware table design instead of silently accepting likely overfull tables.
184
+ - Main-table width control should follow this order: shorten headers while preserving local explanations, move secondary metrics to appendix-only, reduce or split columns, prefer `tabularx` or bounded `p{...}` columns, adjust `\tabcolsep` conservatively, and only then consider `\resizebox` as a last resort.
182
185
  - When `\tabcolsep` is adjusted for a paper-facing main table, keep it in a safe range and avoid shrinking below roughly `3pt`; prefer `4pt` or `5pt` when a small reduction is enough.
183
186
  - Do not use `\scriptsize` or `\tiny` as the default main-table fit strategy. If a table only fits after aggressive font shrinking, redesign the table instead of forcing it into the page.
184
187
  - If a paper-facing main table uses `\resizebox` or non-default width control, explain the width-control rationale in the same table note.
188
+ - Prefer `tabularx` for paper-facing main tables whose first column or text-heavy columns need bounded line wrapping; use plain `tabular` only for compact tables with a small column count.
185
189
  - Every main table should have a short table-introduction sentence before it and a short interpretation sentence after it so the reader knows what question the table answers and how to read the result.
186
190
  - Build the paper asset plan before prose when the section carries introduction, experimental, method, related-work, or conclusion claims:
187
191
  - record the asset coverage targets and gaps for the current paper
@@ -221,6 +225,7 @@ Do not enter prose polish until the current section has passed the reference-con
221
225
  - Table assets must also include a local table note that explains row meaning, column meaning, metric definitions, comparison scope, and any important caveat.
222
226
  - The local table note must contain real reader-facing explanations, not the default template phrases such as "explain what each row represents" or "expand local abbreviations".
223
227
  - Table assets must not rely on aggressive width hacks by default; if width control is still needed after table redesign, document it locally and keep it readable.
228
+ - Table assets with seven or more columns should be split, moved partly to appendix, or written with width-aware columns such as `tabularx` or `p{...}` instead of a plain `tabular` layout.
224
229
  - Figure placeholders may record what the final figure should show and why the reader needs it in authoring comments, the paper plan, or the write-iteration artifact, but the caption itself must remain paper-facing and must not contain "Figure intent", "图的意图", "asset intent", "占位符", or similar workflow language.
225
230
  - Core asset coverage for a paper-facing final draft should include a problem-setting or teaser figure, a method overview figure, a results overview figure, a main-results table, an ablation table, and one additional analysis asset.
226
231
  - Keep `.lab/writing/plan.md` synchronized with the current table plan, figure plan, citation plan, and section-to-asset map whenever manuscript assets change.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "superlab",
3
- "version": "0.1.69",
3
+ "version": "0.1.70",
4
4
  "description": "Strict /lab research workflow installer for Codex and Claude",
5
5
  "keywords": [
6
6
  "codex",