npm - superlab - Versions diffs - 0.1.24 → 0.1.25 - Mend

superlab 0.1.24 → 0.1.25

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

package/README.md +2 -1
package/README.zh-CN.md +2 -1
package/lib/auto_contracts.cjs +4 -2
package/lib/context.cjs +155 -13
package/lib/i18n.cjs +71 -14
package/lib/install.cjs +2 -0
package/package-assets/shared/lab/.managed/templates/artifact-status.md +28 -0
package/package-assets/shared/lab/.managed/templates/final-report.md +0 -11
package/package-assets/shared/lab/context/auto-mode.md +2 -2
package/package-assets/shared/lab/context/session-brief.md +1 -1
package/package-assets/shared/lab/context/state.md +19 -13
package/package-assets/shared/lab/context/workflow-state.md +19 -0
package/package-assets/shared/lab/system/core.md +4 -2
package/package-assets/shared/skills/lab/SKILL.md +10 -10
package/package-assets/shared/skills/lab/stages/report.md +5 -2
package/package.json +1 -1

package/README.md CHANGED Viewed

@@ -180,7 +180,7 @@ superlab auto stop
 - `run` and `iterate` must change persistent outputs under `results_root`
 - `review` must update canonical review context
-- `report` must write `<deliverables_root>/report.md` and `<deliverables_root>/main-tables.md`
+- `report` must write `<deliverables_root>/report.md`, `<deliverables_root>/main-tables.md`, and `<deliverables_root>/artifact-status.md`
 - `write` must produce LaTeX output under `<deliverables_root>/paper/`
 - a successful promotion must write back into `.lab/context/data-decisions.md`, `.lab/context/decisions.md`, `.lab/context/state.md`, and `.lab/context/session-brief.md`
 - every run must end with `.lab/context/auto-outcome.md`, including why it stopped, whether the terminal goal was reached, and which artifact is the final outcome
@@ -309,6 +309,7 @@ See the source command docs in [commands/codex/lab.md](/Users/zhouhao119/coding/
 - `docs/research/report.md`
 - `docs/research/main-tables.md`
+- `docs/research/artifact-status.md`
 - `docs/research/paper/main.tex`
 - `docs/research/paper/sections/*.tex`

package/README.zh-CN.md CHANGED Viewed

@@ -178,7 +178,7 @@ superlab auto stop
 - `run` 和 `iterate` 必须更新 `results_root` 下的持久输出
 - `review` 必须更新规范的审查上下文
-- `report` 必须写出 `<deliverables_root>/report.md` 和 `<deliverables_root>/main-tables.md`
+- `report` 必须写出 `<deliverables_root>/report.md`、`<deliverables_root>/main-tables.md` 和 `<deliverables_root>/artifact-status.md`
 - `write` 必须写出 `<deliverables_root>/paper/` 下的 LaTeX 论文产物
 - promotion 成功后必须写回 `.lab/context/data-decisions.md`、`.lab/context/decisions.md`、`.lab/context/state.md` 和 `.lab/context/session-brief.md`
 - 每次运行都必须写出 `.lab/context/auto-outcome.md`，记录为什么停止、是否达到终止目标，以及哪一个工件是最终结果
@@ -294,6 +294,7 @@ Codex 和 Claude 的命令入口不一样：
 - `docs/research/report.md`
 - `docs/research/main-tables.md`
+- `docs/research/artifact-status.md`
 - `docs/research/paper/main.tex`
 - `docs/research/paper/sections/*.tex`

package/lib/auto_contracts.cjs CHANGED Viewed

@@ -34,6 +34,7 @@ const FROZEN_CORE_ALIASES = {
 const REVIEW_CONTEXT_FILES = [
   path.join(".lab", "context", "decisions.md"),
   path.join(".lab", "context", "state.md"),
+  path.join(".lab", "context", "workflow-state.md"),
   path.join(".lab", "context", "open-questions.md"),
   path.join(".lab", "context", "evidence-index.md"),
 ];
@@ -288,6 +289,7 @@ function stageContractSnapshot(targetDir, stage) {
     report: [
       path.join(deliverablesRoot, "report.md"),
       path.join(deliverablesRoot, "main-tables.md"),
+      path.join(deliverablesRoot, "artifact-status.md"),
     ],
     write: [
       path.join(deliverablesRoot, "paper", "main.tex"),
@@ -318,7 +320,7 @@ function verifyStageContract({ stage, snapshot }) {
   if (stage === "review") {
     if (changedPaths.length === 0) {
       throw new Error(
-        "review stage did not update canonical review context (.lab/context/decisions.md, state.md, open-questions.md, or evidence-index.md)"
+        "review stage did not update canonical review context (.lab/context/decisions.md, state.md, workflow-state.md, open-questions.md, or evidence-index.md)"
       );
     }
     return;
@@ -327,7 +329,7 @@ function verifyStageContract({ stage, snapshot }) {
   if (stage === "report") {
     const missing = Array.from(snapshot.keys()).filter((absolutePath) => !changedPaths.includes(absolutePath));
     if (missing.length > 0) {
-      throw new Error("report stage did not produce the deliverable report.md and main-tables.md under deliverables_root");
+      throw new Error("report stage did not produce report.md, main-tables.md, and artifact-status.md under deliverables_root");
     }
     return;
   }

package/lib/context.cjs CHANGED Viewed

@@ -206,6 +206,30 @@ function isMeaningful(value) {
   return !PLACEHOLDER_VALUES.has((value || "").trim().toLowerCase());
 }
+function hasWorkflowStateShape(text) {
+  if (!text) {
+    return false;
+  }
+  return [
+    extractValue(text, ["Active stage", "当前阶段", "Stage"]),
+    extractValue(text, ["Current objective", "当前目标"]),
+    extractValue(text, ["Next required output", "Next required artifact", "下一项必要输出"]),
+    extractValue(text, ["Immediate action", "立即要做的动作"]),
+  ].some((value) => isMeaningful(value));
+}
+function readWorkflowStateContext(targetDir) {
+  const workflowState = readFileIfExists(contextFile(targetDir, "workflow-state.md"));
+  if (hasWorkflowStateShape(workflowState)) {
+    return workflowState;
+  }
+  const legacyState = readFileIfExists(contextFile(targetDir, "state.md"));
+  if (hasWorkflowStateShape(legacyState)) {
+    return legacyState;
+  }
+  return workflowState || legacyState;
+}
 function readWorkflowConfig(targetDir) {
   const configPath = path.join(targetDir, ".lab", "config", "workflow.json");
   if (!fs.existsSync(configPath)) {
@@ -232,6 +256,7 @@ function getCollaboratorDeliverablePaths(targetDir) {
     deliverablesRoot,
     reportPath: path.join(deliverablesRoot, "report.md"),
     mainTablesPath: path.join(deliverablesRoot, "main-tables.md"),
+    artifactStatusPath: path.join(deliverablesRoot, "artifact-status.md"),
   };
 }
@@ -610,11 +635,16 @@ function labelValue(text, englishLabels, chineseLabels = []) {
 function collectHydrationSources(targetDir) {
   const { reportPath, mainTablesPath } = getCollaboratorDeliverablePaths(targetDir);
+  const workflowStatePath = hasWorkflowStateShape(readFileIfExists(contextFile(targetDir, "workflow-state.md")))
+    ? ".lab/context/workflow-state.md"
+    : hasWorkflowStateShape(readFileIfExists(contextFile(targetDir, "state.md")))
+      ? ".lab/context/state.md"
+      : "";
   return [
     fs.existsSync(reportPath) ? path.relative(targetDir, reportPath) : "",
     fs.existsSync(mainTablesPath) ? path.relative(targetDir, mainTablesPath) : "",
     readFileIfExists(contextFile(targetDir, "data-decisions.md")) ? ".lab/context/data-decisions.md" : "",
-    readFileIfExists(contextFile(targetDir, "state.md")) ? ".lab/context/state.md" : "",
+    workflowStatePath,
     readFileIfExists(contextFile(targetDir, "evidence-index.md")) ? ".lab/context/evidence-index.md" : "",
   ].filter(Boolean);
 }
@@ -626,7 +656,7 @@ function hydrateMissionContext(targetDir) {
   const lang = readWorkflowLanguage(targetDir);
   const missionText = readFileIfExists(contextFile(targetDir, "mission.md"));
-  const stateText = readFileIfExists(contextFile(targetDir, "state.md"));
+  const workflowStateText = readWorkflowStateContext(targetDir);
   const evidenceText = readFileIfExists(contextFile(targetDir, "evidence-index.md"));
   const dataDecisions = readFileIfExists(contextFile(targetDir, "data-decisions.md"));
   const reportText = readFileIfExists(getCollaboratorDeliverablePaths(targetDir).reportPath);
@@ -637,7 +667,7 @@ function hydrateMissionContext(targetDir) {
     problem: mergePreferred(
       extractValue(missionText, ["One-sentence problem", "一句话问题"]),
       extractReportValue(reportText, "problem"),
-      extractValue(stateText, ["Current objective", "当前目标", "Current objective"])
+      extractValue(workflowStateText, ["Current objective", "当前目标", "Current objective"])
     ),
     whyItMatters: mergePreferred(
       extractValue(missionText, ["Why it matters", "为什么重要"]),
@@ -680,7 +710,7 @@ function hydrateMissionContext(targetDir) {
     currentOwner: extractValue(missionText, ["Current owner or session", "当前 owner 或会话"]),
     latestStage: mergePreferred(
       extractValue(missionText, ["Latest stage to update this mission", "最近一次允许更新 mission 的阶段"]),
-      extractValue(stateText, ["Active stage", "当前阶段", "Stage"])
+      extractValue(workflowStateText, ["Active stage", "当前阶段", "Stage"])
     ),
   };
@@ -935,6 +965,110 @@ function hydrateCanonicalContext(targetDir) {
   };
 }
+/**
+ * Renders the markdown for the research-state context document
+ * (refreshContext writes the result to `state.md`).
+ *
+ * When `lang` is "zh" the section headings are Chinese while the field labels
+ * stay in English; any other `lang` yields the fully English variant. Every
+ * field falls back with `||`, so any falsy value (including an empty string)
+ * is replaced by the next candidate and finally by the placeholder
+ * ("待补充" for zh, "TBD" otherwise).
+ *
+ * @param {string} lang - Workflow language code; only "zh" is special-cased.
+ * @param {object} data - Context snapshot; the properties read here are
+ *   problem, direction, claim, reportModeReason, question, risk,
+ *   immediateAction, evalPrimaryMetrics, threshold, datasetPackage,
+ *   benchmarkRole, boundary, evalClaimBoundary and humanDecision.
+ * @returns {string} Markdown text of the research-state document.
+ */
+function renderResearchState(lang, data) {
+  if (lang === "zh") {
+    return `# 研究状态
+## 已批准方向
+- One-sentence problem: ${data.problem || "待补充"}
+- Approved direction: ${data.direction || "待补充"}
+- Strongest supported claim: ${data.claim || "待补充"}
+## 证据边界
+- What the current evidence really supports: ${data.reportModeReason || data.direction || "待补充"}
+- What is still outside the boundary: ${data.question || "待补充"}
+- Biggest research risk: ${data.risk || "待补充"}
+## 当前研究主线
+- Current research focus: ${data.immediateAction || data.direction || "待补充"}
+- Primary metric: ${data.evalPrimaryMetrics || data.threshold || "待补充"}
+- Dataset or benchmark scope: ${data.datasetPackage || data.benchmarkRole || "待补充"}
+## 当前研究约束
+- Hard constraints: ${data.boundary || "待补充"}
+- Claim boundary: ${data.evalClaimBoundary || "待补充"}
+- Conditions that require reopening the direction: ${data.humanDecision || "待补充"}
+`;
+  }
+  return `# Research State
+## Approved Direction
+- One-sentence problem: ${data.problem || "TBD"}
+- Approved direction: ${data.direction || "TBD"}
+- Strongest supported claim: ${data.claim || "TBD"}
+## Evidence Boundary
+- What the current evidence really supports: ${data.reportModeReason || data.direction || "TBD"}
+- What is still outside the boundary: ${data.question || "TBD"}
+- Biggest research risk: ${data.risk || "TBD"}
+## Active Research Track
+- Current research focus: ${data.immediateAction || data.direction || "TBD"}
+- Primary metric: ${data.evalPrimaryMetrics || data.threshold || "TBD"}
+- Dataset or benchmark scope: ${data.datasetPackage || data.benchmarkRole || "TBD"}
+## Current Research Constraints
+- Hard constraints: ${data.boundary || "TBD"}
+- Claim boundary: ${data.evalClaimBoundary || "TBD"}
+- Conditions that require reopening the direction: ${data.humanDecision || "TBD"}
+`;
+}
+/**
+ * Renders the markdown for the workflow-state context document
+ * (refreshContext writes the result to `workflow-state.md`).
+ *
+ * When `lang` is "zh" the Chinese variant is produced (its first field keeps
+ * the English label "Active stage"); any other `lang` yields the English
+ * variant. Every field falls back with `||` to the placeholder ("待补充" for
+ * zh, "TBD" otherwise), so falsy values such as an empty string are replaced.
+ *
+ * NOTE(review): the English variant writes "Next required output" and
+ * "Immediate next action", while buildContextSnapshot reads these fields back
+ * using "Next required artifact" and "Immediate action". Confirm that
+ * extractValue matches loosely enough for a written file to round-trip;
+ * otherwise a refresh would reset those fields to the placeholder.
+ *
+ * @param {string} lang - Workflow language code; only "zh" is special-cased.
+ * @param {object} data - Context snapshot; the properties read here are stage,
+ *   workflowObjective, nextArtifact, latestAction, latestArtifactPath,
+ *   latestRunOrReportId, immediateAction, blocker and humanDecision.
+ * @returns {string} Markdown text of the workflow-state document.
+ */
+function renderWorkflowState(lang, data) {
+  if (lang === "zh") {
+    return `# 工作流状态
+## 当前阶段
+- Active stage: ${data.stage || "待补充"}
+- 当前目标：${data.workflowObjective || "待补充"}
+- 下一项必要输出：${data.nextArtifact || "待补充"}
+## 最近更新
+- 最近完成动作：${data.latestAction || "待补充"}
+- 最新工件路径：${data.latestArtifactPath || "待补充"}
+- 最新 run 或 report id：${data.latestRunOrReportId || "待补充"}
+## 下一步
+- 立即要做的动作：${data.immediateAction || "待补充"}
+- 当前阻塞：${data.blocker || "待补充"}
+- 是否需要人工决策：${data.humanDecision || "待补充"}
+`;
+  }
+  return `# Workflow State
+## Current Stage
+- Active stage: ${data.stage || "TBD"}
+- Current objective: ${data.workflowObjective || "TBD"}
+- Next required output: ${data.nextArtifact || "TBD"}
+## Latest Update
+- Last completed action: ${data.latestAction || "TBD"}
+- Latest artifact path: ${data.latestArtifactPath || "TBD"}
+- Latest run or report id: ${data.latestRunOrReportId || "TBD"}
+## Next Step
+- Immediate next action: ${data.immediateAction || "TBD"}
+- Blocking issue: ${data.blocker || "TBD"}
+- Human decision needed: ${data.humanDecision || "TBD"}
+`;
+}
 function renderSummary(lang, data) {
   if (lang === "zh") {
     return `# 研究摘要
@@ -1220,7 +1354,7 @@ ${data.problem || "待补充"}
 ## 先读这些文件
 1. \`.lab/context/mission.md\`
-2. \`.lab/context/state.md\`
+2. \`.lab/context/workflow-state.md\`
 3. \`.lab/context/evidence-index.md\`
 ## 不要静默修改
@@ -1309,7 +1443,7 @@ ${data.problem || "TBD"}
 ## Read First
 1. \`.lab/context/mission.md\`
-2. \`.lab/context/state.md\`
+2. \`.lab/context/workflow-state.md\`
 3. \`.lab/context/evidence-index.md\`
 ## Do Not Change Silently
@@ -1322,7 +1456,7 @@ ${data.problem || "TBD"}
 function buildContextSnapshot(targetDir) {
   const reportStatus = getCollaboratorReportStatus(targetDir);
   const mission = readFileIfExists(contextFile(targetDir, "mission.md"));
-  const state = readFileIfExists(contextFile(targetDir, "state.md"));
+  const workflowState = readWorkflowStateContext(targetDir);
   const evidence = readFileIfExists(contextFile(targetDir, "evidence-index.md"));
   const questions = readFileIfExists(contextFile(targetDir, "open-questions.md"));
   const dataDecisions = readFileIfExists(contextFile(targetDir, "data-decisions.md"));
@@ -1390,16 +1524,22 @@ function buildContextSnapshot(targetDir) {
   return {
     problem: extractValue(mission, ["One-sentence problem", "一句话问题"]),
     direction: extractValue(mission, ["Approved direction", "已批准方向"]),
-    stage: extractValue(state, ["Active stage", "当前阶段", "Stage"]),
-    nextArtifact: extractValue(state, ["Next required artifact", "下一项必要输出"]),
-    immediateAction: extractValue(state, ["Immediate action", "立即要做的动作"]),
-    blocker: extractValue(state, ["Current blocker", "当前阻塞"]),
-    humanDecision: extractValue(state, ["Human decision needed", "是否需要人工决策"]),
+    stage: extractValue(workflowState, ["Active stage", "当前阶段", "Stage"]),
+    workflowObjective: extractValue(workflowState, ["Current objective", "当前目标"]),
+    nextArtifact: extractValue(workflowState, ["Next required artifact", "下一项必要输出"]),
+    latestAction: extractValue(workflowState, ["Latest completed action", "Last completed action", "最近完成动作"]),
+    latestArtifactPath: extractValue(workflowState, ["Latest artifact path", "最新工件路径"]),
+    latestRunOrReportId: extractValue(workflowState, ["Latest run or report id", "最新 run 或 report id"]),
+    immediateAction: extractValue(workflowState, ["Immediate action", "立即要做的动作"]),
+    blocker: extractValue(workflowState, ["Current blocker", "Blocking issue", "当前阻塞"]),
+    humanDecision: extractValue(workflowState, ["Human decision needed", "是否需要人工决策"]),
     threshold: extractValue(mission, ["Success threshold", "成功阈值"]),
     boundary: extractValue(mission, ["Hard constraints", "硬约束"]),
     claim: extractClaim(evidence),
     question: extractOpenQuestion(questions),
-    risk: extractValue(questions, ["Why it matters", "为什么重要"]) || extractValue(state, ["Current blocker", "当前阻塞"]),
+    risk:
+      extractValue(questions, ["Why it matters", "为什么重要"]) ||
+      extractValue(workflowState, ["Current blocker", "Blocking issue", "当前阻塞"]),
     datasetPackage:
       extractValue(dataDecisions, ["Approved dataset package", "已批准数据集包"]) ||
       extractValue(dataDecisions, ["Approved datasets", "已批准数据集"]),
@@ -1583,6 +1723,8 @@ function refreshContext({ targetDir }) {
   hydrateCanonicalContext(targetDir);
   const lang = readWorkflowLanguage(targetDir);
   const snapshot = buildContextSnapshot(targetDir);
+  writeContextFile(targetDir, "state.md", renderResearchState(lang, snapshot));
+  writeContextFile(targetDir, "workflow-state.md", renderWorkflowState(lang, snapshot));
   writeContextFile(targetDir, "summary.md", renderSummary(lang, snapshot));
   writeContextFile(targetDir, "next-action.md", renderNextAction(lang, snapshot));
   writeContextFile(targetDir, "session-brief.md", renderSessionBrief(lang, snapshot));

package/lib/i18n.cjs CHANGED Viewed

@@ -55,7 +55,7 @@ const ZH_CONTENT = {
   [path.join(".codex", "prompts", "lab-report.md")]: codexPrompt(
     "基于验证后的迭代工件生成最终报告",
     "report context",
-    "使用已安装的 `lab` 技能：`.codex/skills/lab/SKILL.md`。\n\n立刻针对用户当前给出的参数执行 `/lab:report`，不要只推荐别的 `/lab` 阶段。只有在缺少阻塞性前提时，才明确指出缺什么，并且一次最多追问一个问题。\n\n本命令运行 `/lab:report` 阶段。它必须生成给用户直接阅读的最终实验报告和受管的 `main-tables.md`，明确写出主指标、次级指标和必要终局证据，并用白话解释这些指标分别衡量什么、哪些只是健康度或支持性指标、以及每张主表到底证明了什么和没证明什么。"
+    "使用已安装的 `lab` 技能：`.codex/skills/lab/SKILL.md`。\n\n立刻针对用户当前给出的参数执行 `/lab:report`，不要只推荐别的 `/lab` 阶段。只有在缺少阻塞性前提时，才明确指出缺什么，并且一次最多追问一个问题。\n\n本命令运行 `/lab:report` 阶段。它必须生成给用户直接阅读的最终实验报告、受管的 `main-tables.md`，以及单独的内部 `artifact-status.md`。主报告要明确写出主指标、次级指标和必要终局证据，并用白话解释这些指标分别衡量什么、哪些只是健康度或支持性指标、以及每张主表到底证明了什么和没证明什么。"
   ),
   [path.join(".codex", "prompts", "lab-write.md")]: codexPrompt(
     "把验证过的研究工件转成论文 section，并按小步方式修订",
@@ -102,7 +102,7 @@ const ZH_CONTENT = {
     "lab-report",
     "基于验证后的迭代工件生成最终报告",
     "report context",
-    "使用已安装的 `lab` 技能：`.claude/skills/lab/SKILL.md`。\n\n立刻针对用户当前给出的参数执行 `report` 阶段，不要只推荐别的 lab 阶段。只有在缺少阻塞性前提时，才明确指出缺什么，并且一次最多追问一个问题。\n\n本命令运行 lab workflow 的 `report` 阶段。它必须生成给用户直接阅读的最终实验报告和受管的 `main-tables.md`，明确写出主指标、次级指标和必要终局证据，并用白话解释这些指标分别衡量什么、哪些只是健康度或支持性指标、以及每张主表到底证明了什么和没证明什么。"
+    "使用已安装的 `lab` 技能：`.claude/skills/lab/SKILL.md`。\n\n立刻针对用户当前给出的参数执行 `report` 阶段，不要只推荐别的 lab 阶段。只有在缺少阻塞性前提时，才明确指出缺什么，并且一次最多追问一个问题。\n\n本命令运行 lab workflow 的 `report` 阶段。它必须生成给用户直接阅读的最终实验报告、受管的 `main-tables.md`，以及单独的内部 `artifact-status.md`。主报告要明确写出主指标、次级指标和必要终局证据，并用白话解释这些指标分别衡量什么、哪些只是健康度或支持性指标、以及每张主表到底证明了什么和没证明什么。"
   ),
   [path.join(".claude", "commands", "lab-write.md")]: claudeCommand(
     "lab-write",
@@ -300,6 +300,7 @@ const ZH_SKILL_FILES = {
 - 实验设置
 - 已验证主结果
 - 位于 \`<deliverables_root>/main-tables.md\` 的受管主表工件
+- 位于 \`<deliverables_root>/artifact-status.md\` 的内部工件状态
 - 怎么看主表的阅读指引
 - 消融
 - 失败尝试
@@ -311,6 +312,7 @@ const ZH_SKILL_FILES = {
 - \`.lab/context/mission.md\`
 - \`.lab/context/state.md\`
+- \`.lab/context/workflow-state.md\`
 - \`.lab/context/decisions.md\`
 - \`.lab/context/evidence-index.md\`
 - \`.lab/context/eval-protocol.md\`
@@ -320,6 +322,7 @@ const ZH_SKILL_FILES = {
 - \`.lab/context/mission.md\`
 - \`.lab/context/eval-protocol.md\`
 - \`.lab/context/state.md\`
+- \`.lab/context/workflow-state.md\`
 - \`.lab/context/evidence-index.md\`
 ## 证据规则
@@ -337,14 +340,14 @@ const ZH_SKILL_FILES = {
 - 方法概述必须用协作者能读懂的话说明：我们的方法大致怎么做、相对 closest prior work 或 strongest baseline 改了什么、这些 prior 方法各自做了什么，以及它们为什么在当前 claim 下仍然不够。
 - 只保留少量最关键的 prior work/baseline 锚点；每个锚点都要用一句话交代它做了什么和它的局限。
 - 在“背景来源”“方法与基线来源”“指标来源”里，每个锚点都必须包含：引用、它做了什么或衡量什么、以及至少一个局限或 caveat。
-- 内部 provenance 只能放到 \`工件状态\` 或 \`.lab/context/evidence-index.md\`，不能塞进来源章节。
+- 内部 provenance 只能放到 \`<deliverables_root>/artifact-status.md\` 或 \`.lab/context/evidence-index.md\`，不能塞进来源章节。
 - 在起草报告前，先检查 \`.lab/context/mission.md\` 和 \`.lab/context/eval-protocol.md\` 是否仍是模板空壳。
 - 如果 canonical context 还是空壳，要先根据 frozen result artifacts、data-decisions、evidence-index 和已批准上下文回填“最小可信版本”，再写报告。
 - 如果回填后仍缺少协作者可读所需的关键字段，就必须把输出降级成 \`artifact-anchored interim report\`，不能冒充最终协作者报告。
 - 如果现有的 \`report.md\` 或 \`main-tables.md\` 缺少受管模板要求的协作者可读章节，也必须视为报告缺陷；rerun 需要补齐这些缺失块，不能直接宣称“正文无变化”或把这次 rerun 当成 no-op。
 - 报告起草或 rerun 完成后，必须运行 \`.lab/.managed/scripts/validate_collaborator_report.py --report <deliverables_root>/report.md --main-tables <deliverables_root>/main-tables.md\`。如果校验失败，就继续补正文，不能停在“只新增审计痕迹”的状态。
 - 如果报告依赖了对原始指标或原始实现的偏差，必须明确写出这个偏差。
-- workflow 工件状态、rerun id 或 LaTeX 骨架状态不能混进“已验证主结果”；这些内容必须单列到工件状态部分。
+- workflow 工件状态、rerun id 或 LaTeX 骨架状态不能混进“已验证主结果”；这些内容必须单列到 \`<deliverables_root>/artifact-status.md\`。
 - 如果 workflow language 是中文，\`report.md\` 和 \`<deliverables_root>/main-tables.md\` 也应使用中文，除非文件路径、代码标识符或字面指标名必须保持原样。
 - 解释优先保守，不要写成营销文案。
 - 要给 \`/lab:write\` 留下清晰 handoff，尤其是 section draft 可以直接引用的证据链接。
@@ -814,11 +817,6 @@ const ZH_SKILL_FILES = {
 - 最终表现摘要：
 - 主表覆盖情况：
-## 工件状态
-- 已就绪的交付物或工作流工件：
-- 这些工件状态为什么不是科学结论：
 ## 主要结果
 - 主要发现 1：
@@ -833,6 +831,36 @@ const ZH_SKILL_FILES = {
 - Claim：
 - 缺失支持：
+`,
+  [path.join(".lab", ".managed", "templates", "artifact-status.md")]:
+`# 工件状态
+## 交付物状态
+- 协作者报告路径：
+- 受管主表路径：
+- 当前报告模式：
+- 为什么当前状态是合理的：
+## 工作流审计
+- 最近完成动作：
+- 最新工件路径：
+- 最新 run 或 report id：
+- rerun 或校验备注：
+## 内部溯源
+- 使用的冻结结果工件：
+- 已刷新 canonical context：
+- Evidence index 锚点：
+## 论文交接
+- 已可进入 \`/lab:write\` 的 sections：
+- 可引用的证据包：
+- 仍需要更强支持的 claims：
+- 仍未完成的 paper-finishing 项：
 `,
   [path.join(".lab", ".managed", "templates", "main-tables.md")]:
 `# 主表工件
@@ -1056,6 +1084,33 @@ const ZH_SKILL_FILES = {
 - 协作者可读状态：
 `,
   [path.join(".lab", "context", "state.md")]:
+`# 研究状态
+## 已批准方向
+- One-sentence problem:
+- Approved direction:
+- Strongest supported claim:
+## 证据边界
+- What the current evidence really supports:
+- What is still outside the boundary:
+- Biggest research risk:
+## 当前研究主线
+- Current research focus:
+- Primary metric:
+- Dataset or benchmark scope:
+## 当前研究约束
+- Hard constraints:
+- Claim boundary:
+- Conditions that require reopening the direction:
+`,
+  [path.join(".lab", "context", "workflow-state.md")]:
 `# 工作流状态
 ## 当前阶段
@@ -1172,8 +1227,8 @@ const ZH_SKILL_FILES = {
 - Run stage contract: write persistent outputs under \`results_root\`.
 - Iterate stage contract: update persistent outputs under \`results_root\`.
-- Review stage contract: update canonical review context such as \`.lab/context/decisions.md\`、\`state.md\`、\`open-questions.md\` or \`evidence-index.md\`.
-- Report stage contract: write the final report to \`<deliverables_root>/report.md\`.
+- Review stage contract: update canonical review context such as \`.lab/context/decisions.md\`、\`state.md\`、\`workflow-state.md\`、\`open-questions.md\` or \`evidence-index.md\`.
+- Report stage contract: write \`<deliverables_root>/report.md\`、\`<deliverables_root>/main-tables.md\` and \`<deliverables_root>/artifact-status.md\`.
 - Write stage contract: write LaTeX output under \`<deliverables_root>/paper/\`.
 ## 升格策略
@@ -1284,7 +1339,7 @@ ZH_CONTENT[path.join(".lab", "system", "core.md")] = `# Lab 系统核心
 1. \`.lab/context/session-brief.md\`
 2. \`.lab/context/mission.md\`
-3. \`.lab/context/state.md\`
+3. \`.lab/context/workflow-state.md\`
 4. \`.lab/context/evidence-index.md\`
 5. \`.lab/context/data-decisions.md\`（当问题涉及数据集、benchmark 或对比方法时）
 6. \`.lab/context/auto-mode.md\` 和 \`.lab/context/auto-status.md\`（当任务涉及自动模式时）
@@ -1293,13 +1348,15 @@ ZH_CONTENT[path.join(".lab", "system", "core.md")] = `# Lab 系统核心
 ## 工作流边界
-- \`.lab/context/\` 保存持久研究状态。
+- \`.lab/context/\` 同时保存持久研究状态和轻量工作流状态。
 - \`.lab/changes/\`、\`.lab/iterations/\`、\`.lab/writing/\` 保存工作流控制工件、轻量 manifest 和 change-local harness。
 - \`.lab/.managed/\` 保存工具托管模板和脚本。
 - 持久 run 输出应写到 \`results_root\`，不要写进 \`.lab/changes/\`。
 - 图表和可视化应写到 \`figures_root\`，不要写进 \`.lab/changes/\`。
 - 最终交付物应写到 \`deliverables_root\`，不要写进 \`.lab/context/\`。
 - change-local 的 \`data/\` 目录只应用来放轻量 manifest 或 batch spec，不要当正式数据集入口。
+- \`.lab/context/state.md\` 保存持久研究状态；\`.lab/context/workflow-state.md\` 保存当前工作流状态。
+- \`.lab/context/summary.md\` 是长期项目摘要；\`.lab/context/session-brief.md\` 是下一次会话启动简报。
 - \`.lab/context/auto-mode.md\` 定义自动模式边界，\`.lab/context/auto-status.md\` 记录自动运行状态，二者都属于项目状态。
 - 如果用户提供了 LaTeX 模板目录，先校验并通过 \`paper_template_root\` 接入，再开始写作。
 - 已接入的模板目录视为用户资产，默认不要改模板文件，除非用户明确要求。
@@ -1391,7 +1448,7 @@ ZH_CONTENT[path.join(".lab", "context", "session-brief.md")] = `# 会话简报
 ## 先读这些文件
 1. \`.lab/context/mission.md\`
-2. \`.lab/context/state.md\`
+2. \`.lab/context/workflow-state.md\`
 3. \`.lab/context/evidence-index.md\`
 ## 不要静默修改

package/lib/install.cjs CHANGED Viewed

@@ -36,6 +36,7 @@ const PROJECT_OWNED_LOCALIZED_PATHS = [
   path.join(".lab", "config", "workflow.json"),
   path.join(".lab", "context", "mission.md"),
   path.join(".lab", "context", "state.md"),
+  path.join(".lab", "context", "workflow-state.md"),
   path.join(".lab", "context", "decisions.md"),
   path.join(".lab", "context", "evidence-index.md"),
   path.join(".lab", "context", "open-questions.md"),
@@ -542,6 +543,7 @@ function localizeInstalledAssets(targetDir, lang, { newlyCreatedProjectOwnedPath
     path.join(".lab", ".managed", "templates", "review-checklist.md"),
     path.join(".lab", ".managed", "templates", "final-report.md"),
     path.join(".lab", ".managed", "templates", "main-tables.md"),
+    path.join(".lab", ".managed", "templates", "artifact-status.md"),
     path.join(".lab", ".managed", "templates", "paper-plan.md"),
     path.join(".lab", ".managed", "templates", "paper-section.md"),
     path.join(".lab", ".managed", "templates", "write-iteration.md"),

package/package-assets/shared/lab/.managed/templates/artifact-status.md ADDED Viewed

@@ -0,0 +1,28 @@
+# Artifact Status
+## Deliverable Status
+- Collaborator-facing report path:
+- Managed main tables path:
+- Current report mode:
+- Why this status is appropriate:
+## Workflow Audit
+- Latest completed action:
+- Latest artifact path:
+- Latest run or report id:
+- Rerun or validation notes:
+## Internal Provenance
+- Frozen result artifacts used:
+- Canonical context files refreshed:
+- Evidence index anchors:
+## Paper Handoff
+- Sections ready for `/lab:write`:
+- Evidence bundles to cite:
+- Claims that still need stronger support:
+- Paper-finishing items still open:

package/package-assets/shared/lab/.managed/templates/final-report.md CHANGED Viewed

@@ -105,11 +105,6 @@
 - Final performance summary:
 - Table coverage:
-## Artifact Status
-- Deliverables or workflow artifacts that are ready:
-- Artifact status notes that are not scientific findings:
 ## Main Results
 Summarize validated iteration outcomes.
@@ -129,9 +124,3 @@ Describe unresolved risks and external validity limits.
 ## Next Steps
 List concrete follow-up actions.
-## Paper Handoff
-- Sections ready for `/lab:write`:
-- Evidence bundles to cite:
-- Claims that still need stronger support:

package/package-assets/shared/lab/context/auto-mode.md CHANGED Viewed

@@ -51,8 +51,8 @@ If `eval-protocol.md` declares structured rung entries, auto mode follows those
 - Run stage contract: write persistent outputs under `results_root`.
 - Iterate stage contract: update persistent outputs under `results_root`.
-- Review stage contract: update canonical review context such as `.lab/context/decisions.md`, `state.md`, `open-questions.md`, or `evidence-index.md`.
-- Report stage contract: write the final report to `<deliverables_root>/report.md`.
+- Review stage contract: update canonical review context such as `.lab/context/decisions.md`, `state.md`, `workflow-state.md`, `open-questions.md`, or `evidence-index.md`.
+- Report stage contract: write `<deliverables_root>/report.md`, `<deliverables_root>/main-tables.md`, and `<deliverables_root>/artifact-status.md`.
 - Write stage contract: write LaTeX output under `<deliverables_root>/paper/`.
 ## Promotion Policy

package/package-assets/shared/lab/context/session-brief.md CHANGED Viewed

@@ -24,7 +24,7 @@ One sentence describing the active research mission.
 ## Read First
 1. `.lab/context/mission.md`
-2. `.lab/context/state.md`
+2. `.lab/context/workflow-state.md`
 3. `.lab/context/evidence-index.md`
 ## Do Not Change Silently

package/package-assets/shared/lab/context/state.md CHANGED Viewed

@@ -1,19 +1,25 @@
-# Workflow State
+# Research State
-## Current Stage
+## Approved Direction
-- Active stage:
-- Current objective:
-- Next required output:
+- One-sentence problem:
+- Approved direction:
+- Strongest supported claim:
-## Latest Update
+## Evidence Boundary
-- Last completed action:
-- Latest artifact path:
-- Latest run or report id:
+- What the current evidence really supports:
+- What is still outside the boundary:
+- Biggest research risk:
-## Next Step
+## Active Research Track
-- Immediate next action:
-- Blocking issue:
-- Human decision needed:
+- Current research focus:
+- Primary metric:
+- Dataset or benchmark scope:
+## Current Research Constraints
+- Hard constraints:
+- Claim boundary:
+- Conditions that require reopening the direction:

package/package-assets/shared/lab/context/workflow-state.md ADDED Viewed

@@ -0,0 +1,19 @@
+# Workflow State
+## Current Stage
+- Active stage:
+- Current objective:
+- Next required output:
+## Latest Update
+- Last completed action:
+- Latest artifact path:
+- Latest run or report id:
+## Next Step
+- Immediate next action:
+- Blocking issue:
+- Human decision needed:

package/package-assets/shared/lab/system/core.md CHANGED Viewed

@@ -8,7 +8,7 @@ For a new AI session, read these files in order:
 1. `.lab/context/session-brief.md`
 2. `.lab/context/mission.md`
-3. `.lab/context/state.md`
+3. `.lab/context/workflow-state.md`
 4. `.lab/context/evidence-index.md`
 Only expand to additional context when the brief points to it.
@@ -24,13 +24,15 @@ For auto-mode orchestration or long-running experiment campaigns, also read:
 ## Workflow Boundaries
-- `.lab/context/` holds durable project research state.
+- `.lab/context/` holds durable project research state plus lightweight workflow state.
 - `.lab/changes/`, `.lab/iterations/`, and `.lab/writing/` hold workflow control artifacts, lightweight manifests, and change-local harnesses.
 - `.lab/.managed/` holds tool-managed templates and scripts.
 - Durable run outputs belong under the configured `results_root`, not inside `.lab/changes/`.
 - Figures and plots belong under the configured `figures_root`, not inside `.lab/changes/`.
 - Deliverables belong under the configured `deliverables_root`, not inside `.lab/context/`.
 - Change-local `data/` directories may hold lightweight manifests or batch specs, but not the canonical dataset copy.
+- `.lab/context/state.md` holds durable research state; `.lab/context/workflow-state.md` holds live workflow state.
+- `.lab/context/summary.md` is the durable project summary; `.lab/context/session-brief.md` is the next-session startup brief.
 - `.lab/context/auto-mode.md` defines the bounded autonomous envelope; `.lab/context/auto-status.md` records live state for resume and handoff.
 - If the user provides a LaTeX template directory, validate it and attach it through `paper_template_root` before drafting.
 - Treat attached template directories as user-owned assets. Do not rewrite template files unless the user explicitly asks.

package/package-assets/shared/skills/lab/SKILL.md CHANGED Viewed

@@ -83,7 +83,7 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
 ### `/lab:auto`
 - Use this stage to orchestrate approved execution stages with bounded autonomy.
-- Read `.lab/config/workflow.json`, `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/decisions.md`, `.lab/context/data-decisions.md`, `.lab/context/evidence-index.md`, `.lab/context/terminology-lock.md`, `.lab/context/auto-mode.md`, and `.lab/context/auto-status.md` before acting.
+- Read `.lab/config/workflow.json`, `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, `.lab/context/data-decisions.md`, `.lab/context/evidence-index.md`, `.lab/context/terminology-lock.md`, `.lab/context/auto-mode.md`, and `.lab/context/auto-status.md` before acting.
 - Treat `.lab/context/auto-mode.md` as the control contract and `.lab/context/auto-status.md` as the live state file.
 - Require `Autonomy level` and `Approval status` in `.lab/context/auto-mode.md` before execution.
 - Treat `L1` as safe-run validation, `L2` as bounded iteration, and `L3` as aggressive campaign mode.
@@ -93,13 +93,13 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
 - You may add exploratory datasets, benchmarks, and comparison methods inside the approved exploration envelope.
 - You may promote an exploratory addition to the primary package only after the promotion policy in `auto-mode.md` is satisfied and the promotion is written back into `.lab/context/data-decisions.md`, `.lab/context/decisions.md`, `.lab/context/state.md`, and `.lab/context/session-brief.md`.
 - Poll long-running commands until they complete, time out, or hit a stop condition.
-- Update `.lab/context/auto-status.md`, `.lab/context/state.md`, `.lab/context/decisions.md`, `.lab/context/data-decisions.md`, `.lab/context/evidence-index.md`, and `.lab/context/session-brief.md` as the campaign advances.
+- Update `.lab/context/auto-status.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, `.lab/context/data-decisions.md`, `.lab/context/evidence-index.md`, and `.lab/context/session-brief.md` as the campaign advances.
 - Keep an explicit approval gate when a proposed action would leave the frozen core defined by the auto-mode contract.
 ### `/lab:spec`
 - Read `.lab/config/workflow.json` before drafting the change.
-- Read `.lab/context/mission.md`, `.lab/context/decisions.md`, `.lab/context/state.md`, and `.lab/context/data-decisions.md` before drafting the change.
+- Read `.lab/context/mission.md`, `.lab/context/decisions.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, and `.lab/context/data-decisions.md` before drafting the change.
 - Use `.lab/changes/<change-id>/` as the canonical lab change directory.
 - Convert the approved idea into lab change artifacts using `.lab/.managed/templates/proposal.md`, `.lab/.managed/templates/design.md`, `.lab/.managed/templates/spec.md`, and `.lab/.managed/templates/tasks.md`.
 - Update `.lab/context/state.md` and `.lab/context/decisions.md` after freezing the spec.
@@ -108,12 +108,12 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
 ### `/lab:run`
 - Start with the smallest meaningful experiment.
-- Read `.lab/context/mission.md`, `.lab/context/state.md`, and `.lab/context/data-decisions.md` before choosing the run.
+- Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, and `.lab/context/data-decisions.md` before choosing the run.
 - Register the run with `.lab/.managed/scripts/register_run.py`.
 - Normalize the result with `.lab/.managed/scripts/eval_report.py`.
 - Validate normalized output with `.lab/.managed/scripts/validate_results.py`.
 - Read `.lab/context/eval-protocol.md` before choosing the smallest run so the first experiment already targets the approved tables, metrics, and gates.
-- Update `.lab/context/state.md`, `.lab/context/evidence-index.md`, and `.lab/context/eval-protocol.md` after the run.
+- Update `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/evidence-index.md`, and `.lab/context/eval-protocol.md` after the run.
 - If the evaluation protocol is still skeletal, initialize the smallest trustworthy source-backed version before treating the run as the protocol anchor.
 ### `/lab:iterate`
@@ -128,13 +128,13 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
   - maximum iteration count
 - Only change implementation hypotheses within the loop.
 - Require a normalized evaluation report each round.
-- Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/decisions.md`, and `.lab/context/evidence-index.md` at the start of each round.
+- Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, and `.lab/context/evidence-index.md` at the start of each round.
 - Read `.lab/context/data-decisions.md` before changing benchmark-facing experiments.
 - Read `.lab/context/eval-protocol.md` before changing evaluation ladders, sample sizes, or promotion gates.
 - Keep metric definitions, baseline behavior, and comparison implementations anchored to the source-backed evaluation protocol before changing thresholds, gates, or ladder transitions.
 - Switch to diagnostic mode if risk increases for two consecutive rounds.
 - Write round reports with `.lab/.managed/templates/iteration-report.md`.
-- Update `.lab/context/state.md`, `.lab/context/decisions.md`, `.lab/context/evidence-index.md`, `.lab/context/open-questions.md`, and `.lab/context/eval-protocol.md` each round as needed.
+- Update `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, `.lab/context/evidence-index.md`, `.lab/context/open-questions.md`, and `.lab/context/eval-protocol.md` each round as needed.
 - Keep `.lab/context/eval-protocol.md` synchronized with accepted ladder changes, benchmark scope, and source-backed implementation deviations.
 - Stop at threshold success or iteration cap, and record blockers plus next-best actions when the campaign ends without success.
@@ -151,13 +151,13 @@ Use this skill when the user invokes `/lab:*` or asks for the structured researc
 ### `/lab:report`
 - Summarize all validated iteration summaries.
-- Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/decisions.md`, `.lab/context/evidence-index.md`, and `.lab/context/data-decisions.md` before drafting.
+- Read `.lab/context/mission.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, `.lab/context/decisions.md`, `.lab/context/evidence-index.md`, and `.lab/context/data-decisions.md` before drafting.
 - Read `.lab/context/eval-protocol.md` before choosing tables, thresholds, or final result framing.
 - Keep metric definitions, comparison semantics, and implementation references anchored to the approved evaluation protocol instead of re-deriving them during reporting.
 - Aggregate them with `.lab/.managed/scripts/summarize_iterations.py`.
-- Write the final document with `.lab/.managed/templates/final-report.md` and the managed table summary with `.lab/.managed/templates/main-tables.md`.
+- Write the final document with `.lab/.managed/templates/final-report.md`, the managed table summary with `.lab/.managed/templates/main-tables.md`, and the internal handoff with `.lab/.managed/templates/artifact-status.md`.
 - Keep failed attempts and limitations visible.
-- Update `.lab/context/mission.md`, `.lab/context/eval-protocol.md`, `.lab/context/state.md`, and `.lab/context/evidence-index.md` with report-level handoff notes.
+- Update `.lab/context/mission.md`, `.lab/context/eval-protocol.md`, `.lab/context/state.md`, `.lab/context/workflow-state.md`, and `.lab/context/evidence-index.md` with report-level handoff notes.
 - If canonical context is still skeletal, hydrate the smallest trustworthy version from frozen artifacts before finalizing the report.
 - If collaborator-critical fields remain missing after hydration, downgrade to an `artifact-anchored interim report` instead of presenting a final collaborator-ready report.

package/package-assets/shared/skills/lab/stages/report.md CHANGED Viewed

@@ -16,6 +16,7 @@
 - experiment setup
 - validated main results
 - managed main tables artifact under `<deliverables_root>/main-tables.md`
+- internal artifact-status handoff under `<deliverables_root>/artifact-status.md`
 - how-to-read-the-tables guide
 - ablations
 - failed attempts
@@ -27,6 +28,7 @@
 - `.lab/context/mission.md`
 - `.lab/context/state.md`
+- `.lab/context/workflow-state.md`
 - `.lab/context/decisions.md`
 - `.lab/context/evidence-index.md`
 - `.lab/context/data-decisions.md`
@@ -38,6 +40,7 @@
 - `.lab/context/mission.md`
 - `.lab/context/eval-protocol.md`
 - `.lab/context/state.md`
+- `.lab/context/workflow-state.md`
 - `.lab/context/evidence-index.md`
 ## Evidence Rules
@@ -56,7 +59,7 @@
 - When citing prior work or baselines in the method overview, include only the few anchor references a collaborator needs, and summarize their role and limitation in one short line each.
 - Report only the few references a collaborator needs to orient themselves quickly; do not turn `report.md` into a full bibliography dump.
 - In `Background Sources`, `Method and Baseline Sources`, and `Metric Sources`, every anchor must include a citation line, one short line about what it established or measures, and one limitation or caveat.
-- Internal provenance belongs in `Artifact Status` or `.lab/context/evidence-index.md`, not in the external-review-ready source sections.
+- Internal provenance belongs in `<deliverables_root>/artifact-status.md` or `.lab/context/evidence-index.md`, not in the external-review-ready source sections.
 - If the report depends on a deviation from an original metric or implementation, state that deviation explicitly instead of smoothing it over.
 - Carry the approved `Claim boundary` into the collaborator-facing report instead of implying broader validity than the protocol allows.
 - If the `Academic Validity Checks` or `Integrity self-check` sections are incomplete, contradictory, or obviously violated by the evidence, degrade the report instead of presenting it as collaborator-ready.
@@ -67,7 +70,7 @@
 - If collaborator-critical fields still remain missing after hydration, downgrade the output to an `artifact-anchored interim report` instead of presenting it as a final collaborator-ready report.
 - If the existing `report.md` or `main-tables.md` is missing required collaborator-facing sections from the managed templates, treat that as a report deficiency. A rerun must repair the missing sections instead of declaring "no content change" or treating the rerun as a no-op.
 - After drafting or rerunning the report, run `.lab/.managed/scripts/validate_collaborator_report.py --report <deliverables_root>/report.md --main-tables <deliverables_root>/main-tables.md`. If it fails, keep editing until it passes; do not stop at a no-op audit rerun.
-- Do not mix workflow deliverable status, rerun ids, or manuscript skeleton status into validated scientific findings; keep those in a separate artifact-status section.
+- Do not mix workflow deliverable status, rerun ids, or manuscript skeleton status into validated scientific findings; keep those in `<deliverables_root>/artifact-status.md`.
 - If `.lab/config/workflow.json` sets the workflow language to Chinese, write `<deliverables_root>/report.md` and `<deliverables_root>/main-tables.md` in Chinese unless a file path, code identifier, or literal metric name must remain unchanged.
 - Prefer conservative interpretation over marketing language.
 - Leave a clear handoff path into `/lab:write` with evidence links that section drafts can cite.

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "superlab",
-  "version": "0.1.24",
+  "version": "0.1.25",
   "description": "Strict /lab research workflow installer for Codex and Claude",
   "keywords": [
     "codex",