npm - @sanity/ailf - Versions diffs - 2.6.0 → 2.7.1 - Mend

@sanity/ailf 2.6.0 → 2.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

package/dist/_vendor/ailf-core/examples/index.d.ts +1 -1
package/dist/_vendor/ailf-core/examples/index.js +1 -1
package/dist/_vendor/ailf-core/types/index.d.ts +7 -2
package/dist/cli.js +2 -0
package/dist/commands/check-staleness.d.ts +14 -0
package/dist/commands/check-staleness.js +74 -0
package/dist/commands/init.js +2 -6
package/dist/orchestration/steps/publish-report-step.js +20 -2
package/package.json +3 -3

package/dist/_vendor/ailf-core/examples/index.d.ts CHANGED

@@ -433,6 +433,6 @@ export interface ExampleRecord {
 }
 export declare const EXAMPLES: Record<ExampleType, ExampleRecord>;
 /** GitHub Actions workflow template for AI Literacy evaluation */
-export declare const workflowYaml = "# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n# AI Literacy Evaluation \u2014 GitHub Actions workflow\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings \u2192 Secrets \u2192 Actions):\n#     AILF_API_KEY \u2014 your API key (starts with ailf_live_sk_)\n#     NPM_TOKEN   \u2014 npm token with read access to @sanity scope\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Check debug_mode for faster iteration (fewer tests)\n#   - See: https://github.com/sanity-labs/ai-literacy-framework\n# 
\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    # Runs on every PR to main by default. To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      debug_mode:\n        description: \"Run in debug mode (fewer tests, faster iteration)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Configure npm for @sanity scope\n        run:\n          echo \"//registry.npmjs.org/:_authToken=${{ secrets.NPM_TOKEN }}\" >>\n          ~/.npmrc\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.debug_mode && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n            const fs = require('fs');\n\n            // --- Constants ---\n            const MARKER = '<!-- ailf-score-report -->';\n            const HISTORY_START = '<!-- ailf-score-history -->';\n            const HISTORY_END = '<!-- /ailf-score-history -->';\n            
const MAX_HISTORY = 3; // keep at most 3 prior runs\n\n            // --- Read new report ---\n            let newReport;\n            try {\n              newReport = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n            } catch {\n              newReport = `## \u26A0\uFE0F AI Literacy Evaluation\\n\\nNo report generated. Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n\n            const prNumber = context.issue?.number || context.payload?.pull_request?.number;\n            if (!prNumber) {\n              console.log('No PR number found, skipping comment');\n              return;\n            }\n\n            // --- Find existing comment ---\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: prNumber,\n            });\n            const existing = comments.find(c => c.body?.includes(MARKER));\n\n            // --- Build history from previous comment ---\n            let historyEntries = [];\n            if (existing) {\n              const oldBody = existing.body || '';\n\n              // Collect existing collapsed history entries\n              const histStart = oldBody.indexOf(HISTORY_START);\n              const histEnd = oldBody.indexOf(HISTORY_END);\n              if (histStart !== -1 && histEnd !== -1) {\n                const historyContent = oldBody.slice(histStart + HISTORY_START.length, histEnd).trim();\n                // Split on </details> boundaries to get individual entries\n                if (historyContent) {\n                  historyEntries = historyContent\n                    .split(/<\\/details>\\s*/)\n                    .map(s => s.trim())\n                    .filter(s => s.startsWith('<details>'))\n                    .map(s => s + '\\n</details>');\n                }\n              }\n\n              // Extract the current 
report (will become the newest history entry)\n              let previousReport = '';\n              if (histStart !== -1) {\n                // Report is between MARKER and the \"Previous runs\" heading (or history section)\n                const markerIdx = oldBody.indexOf(MARKER);\n                // Find the --- separator before history\n                const separatorIdx = oldBody.lastIndexOf('---', histStart);\n                const endIdx = separatorIdx > markerIdx ? separatorIdx : histStart;\n                previousReport = oldBody.slice(markerIdx + MARKER.length, endIdx).trim();\n              } else {\n                // No history yet \u2014 everything after MARKER is the report\n                const markerIdx = oldBody.indexOf(MARKER);\n                if (markerIdx !== -1) {\n                  previousReport = oldBody.slice(markerIdx + MARKER.length).trim();\n                }\n              }\n\n              // Collapse the previous report into a <details> entry\n              if (previousReport) {\n                const scoreMatch = previousReport.match(/Overall:\\s*(\\d+)\\/100/);\n                const score = scoreMatch ? scoreMatch[1] : '?';\n                const dateMatch = previousReport.match(/Generated by.*?\u00B7\\s*([^\u00B7<\\n*]+)/);\n                const date = dateMatch\n                  ? dateMatch[1].trim()\n                  : new Date().toISOString().slice(0, 16).replace('T', ' ') + ' UTC';\n                const entry = `<details>\\n<summary>\uD83D\uDCDC ${date} \u2014 ${score}/100</summary>\\n\\n${previousReport}\\n\\n</details>`;\n                historyEntries.unshift(entry); // newest first\n              }\n\n              // Enforce max history limit\n              historyEntries = historyEntries.slice(0, MAX_HISTORY);\n            }\n\n            // --- Assemble final comment ---\n            const historySection = historyEntries.length > 0\n              ? 
`\\n\\n---\\n\\n### \uD83D\uDCDC Previous runs\\n\\n${HISTORY_START}\\n${historyEntries.join('\\n\\n')}\\n${HISTORY_END}`\n              : '';\n            const finalBody = `${MARKER}\\n${newReport}${historySection}`;\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                comment_id: existing.id, body: finalBody,\n              });\n              console.log(`Updated comment (${historyEntries.length} history entries)`);\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                issue_number: prNumber, body: finalBody,\n              });\n              console.log('Created new PR comment');\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## \u26A0\uFE0F AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
+export declare const workflowYaml = "# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n# AI Literacy Evaluation \u2014 GitHub Actions workflow\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings \u2192 Secrets \u2192 Actions):\n#     AILF_API_KEY \u2014 your API key (starts with ailf_live_sk_)\n#\n#   @sanity/ailf is published with public npm access, so no npm token is\n#   needed to install the CLI.\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Check debug_mode for faster iteration (fewer tests)\n#   - See: https://github.com/sanity-labs/ai-literacy-framework\n# 
\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    # Runs on every PR to main by default. To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      debug_mode:\n        description: \"Run in debug mode (fewer tests, faster iteration)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.debug_mode && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n            const fs = require('fs');\n\n            // --- Constants ---\n            const MARKER = '<!-- ailf-score-report -->';\n            const HISTORY_START = '<!-- ailf-score-history -->';\n            const HISTORY_END = '<!-- /ailf-score-history -->';\n            const MAX_HISTORY = 3; // keep at most 3 prior runs\n\n            // --- Read new report ---\n            let newReport;\n            try {\n              newReport = 
fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n            } catch {\n              newReport = `## \u26A0\uFE0F AI Literacy Evaluation\\n\\nNo report generated. Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n\n            const prNumber = context.issue?.number || context.payload?.pull_request?.number;\n            if (!prNumber) {\n              console.log('No PR number found, skipping comment');\n              return;\n            }\n\n            // --- Find existing comment ---\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: prNumber,\n            });\n            const existing = comments.find(c => c.body?.includes(MARKER));\n\n            // --- Build history from previous comment ---\n            let historyEntries = [];\n            if (existing) {\n              const oldBody = existing.body || '';\n\n              // Collect existing collapsed history entries\n              const histStart = oldBody.indexOf(HISTORY_START);\n              const histEnd = oldBody.indexOf(HISTORY_END);\n              if (histStart !== -1 && histEnd !== -1) {\n                const historyContent = oldBody.slice(histStart + HISTORY_START.length, histEnd).trim();\n                // Split on </details> boundaries to get individual entries\n                if (historyContent) {\n                  historyEntries = historyContent\n                    .split(/<\\/details>\\s*/)\n                    .map(s => s.trim())\n                    .filter(s => s.startsWith('<details>'))\n                    .map(s => s + '\\n</details>');\n                }\n              }\n\n              // Extract the current report (will become the newest history entry)\n              let previousReport = '';\n              if (histStart !== -1) {\n                // Report is between 
MARKER and the \"Previous runs\" heading (or history section)\n                const markerIdx = oldBody.indexOf(MARKER);\n                // Find the --- separator before history\n                const separatorIdx = oldBody.lastIndexOf('---', histStart);\n                const endIdx = separatorIdx > markerIdx ? separatorIdx : histStart;\n                previousReport = oldBody.slice(markerIdx + MARKER.length, endIdx).trim();\n              } else {\n                // No history yet \u2014 everything after MARKER is the report\n                const markerIdx = oldBody.indexOf(MARKER);\n                if (markerIdx !== -1) {\n                  previousReport = oldBody.slice(markerIdx + MARKER.length).trim();\n                }\n              }\n\n              // Collapse the previous report into a <details> entry\n              if (previousReport) {\n                const scoreMatch = previousReport.match(/Overall:\\s*(\\d+)\\/100/);\n                const score = scoreMatch ? scoreMatch[1] : '?';\n                const dateMatch = previousReport.match(/Generated by.*?\u00B7\\s*([^\u00B7<\\n*]+)/);\n                const date = dateMatch\n                  ? dateMatch[1].trim()\n                  : new Date().toISOString().slice(0, 16).replace('T', ' ') + ' UTC';\n                const entry = `<details>\\n<summary>\uD83D\uDCDC ${date} \u2014 ${score}/100</summary>\\n\\n${previousReport}\\n\\n</details>`;\n                historyEntries.unshift(entry); // newest first\n              }\n\n              // Enforce max history limit\n              historyEntries = historyEntries.slice(0, MAX_HISTORY);\n            }\n\n            // --- Assemble final comment ---\n            const historySection = historyEntries.length > 0\n              ? 
`\\n\\n---\\n\\n### \uD83D\uDCDC Previous runs\\n\\n${HISTORY_START}\\n${historyEntries.join('\\n\\n')}\\n${HISTORY_END}`\n              : '';\n            const finalBody = `${MARKER}\\n${newReport}${historySection}`;\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                comment_id: existing.id, body: finalBody,\n              });\n              console.log(`Updated comment (${historyEntries.length} history entries)`);\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                issue_number: prNumber, body: finalBody,\n              });\n              console.log('Created new PR comment');\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## \u26A0\uFE0F AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
 /** TypeScript project configuration template (ailf.config.ts) */
 export declare const ailfConfigTs = "/**\n * .ailf/ailf.config.ts \u2014 AI Literacy Framework project configuration.\n *\n * This file configures how the AILF evaluation pipeline runs in this\n * repository. Place it at .ailf/ailf.config.ts in your project root.\n *\n * Evaluations are submitted to the AILF API (ailf-api.sanity.build).\n * The API handles LLM calls, doc fetching, grading, and report\n * publishing. Your repo only needs one secret: AILF_API_KEY.\n *\n * Docs: https://github.com/sanity-labs/ai-literacy-framework\n */\n\nexport default {\n  /**\n   * Documentation source \u2014 which docs are being evaluated.\n   *\n   * This tells the pipeline which Sanity project and dataset contain\n   * the documentation under test. For most users, this is Sanity's own\n   * docs project.\n   */\n  source: {\n    /** Sanity project ID (find yours at sanity.io/manage) */\n    projectId: \"3do82whm\",\n    /** The dataset to query (e.g., \"production\", \"next\") */\n    dataset: \"next\",\n    /**\n     * The public URL of your documentation site.\n     * Used by agentic mode to test agent discoverability.\n     */\n    baseUrl: \"https://www.sanity.io/docs\",\n  },\n\n  /**\n   * Trigger configuration \u2014 when evaluations run automatically.\n   *\n   * Each key is a trigger context. The pipeline checks which trigger\n   * matches the current execution context (PR, merge, schedule, etc.)\n   * and applies its settings.\n   *\n   * Mode options:\n   *   \"validate-only\" \u2014 check that task files parse correctly (fast, no LLM calls)\n   *   \"eval\"          \u2014 run the full evaluation pipeline\n   */\n  triggers: {\n    /** On pull requests: just validate task files parse correctly. */\n    pr: {\n      mode: \"validate-only\",\n    },\n\n    /** When .ailf/ files change in a PR: run a real evaluation. */\n    \"pr-task-change\": {\n      mode: \"eval\",\n      paths: [\".ailf/**\"],\n    },\n\n    /** On merge to main: run evaluation (non-blocking). 
*/\n    main: {\n      mode: \"eval\",\n      blocking: false,\n      notify: true,\n    },\n  },\n}\n";

package/dist/_vendor/ailf-core/examples/index.js CHANGED

@@ -630,7 +630,7 @@ export const EXAMPLES = {
 // Raw file exports (non-data files, exported as raw strings)
 // ---------------------------------------------------------------------------
 /** GitHub Actions workflow template for AI Literacy evaluation */
-export const workflowYaml = "# ──────────────────────────────────────────────────────────────────────\n# AI Literacy Evaluation — GitHub Actions workflow\n# ──────────────────────────────────────────────────────────────────────\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings → Secrets → Actions):\n#     AILF_API_KEY — your API key (starts with ailf_live_sk_)\n#     NPM_TOKEN   — npm token with read access to @sanity scope\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Check debug_mode for faster iteration (fewer tests)\n#   - See: https://github.com/sanity-labs/ai-literacy-framework\n# ──────────────────────────────────────────────────────────────────────\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    # Runs on every PR to main by default. 
To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      debug_mode:\n        description: \"Run in debug mode (fewer tests, faster iteration)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Configure npm for @sanity scope\n        run:\n          echo \"//registry.npmjs.org/:_authToken=${{ secrets.NPM_TOKEN }}\" >>\n          ~/.npmrc\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.debug_mode && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n            const fs = require('fs');\n\n            // --- Constants ---\n            const MARKER = '<!-- ailf-score-report -->';\n            const HISTORY_START = '<!-- ailf-score-history -->';\n            const HISTORY_END = '<!-- /ailf-score-history -->';\n            const MAX_HISTORY = 3; // keep at most 3 prior runs\n\n            // --- Read new report ---\n            let newReport;\n            try {\n              newReport = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n            } catch {\n              newReport = `## ⚠️ AI Literacy Evaluation\\n\\nNo report generated. 
Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n\n            const prNumber = context.issue?.number || context.payload?.pull_request?.number;\n            if (!prNumber) {\n              console.log('No PR number found, skipping comment');\n              return;\n            }\n\n            // --- Find existing comment ---\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: prNumber,\n            });\n            const existing = comments.find(c => c.body?.includes(MARKER));\n\n            // --- Build history from previous comment ---\n            let historyEntries = [];\n            if (existing) {\n              const oldBody = existing.body || '';\n\n              // Collect existing collapsed history entries\n              const histStart = oldBody.indexOf(HISTORY_START);\n              const histEnd = oldBody.indexOf(HISTORY_END);\n              if (histStart !== -1 && histEnd !== -1) {\n                const historyContent = oldBody.slice(histStart + HISTORY_START.length, histEnd).trim();\n                // Split on </details> boundaries to get individual entries\n                if (historyContent) {\n                  historyEntries = historyContent\n                    .split(/<\\/details>\\s*/)\n                    .map(s => s.trim())\n                    .filter(s => s.startsWith('<details>'))\n                    .map(s => s + '\\n</details>');\n                }\n              }\n\n              // Extract the current report (will become the newest history entry)\n              let previousReport = '';\n              if (histStart !== -1) {\n                // Report is between MARKER and the \"Previous runs\" heading (or history section)\n                const markerIdx = oldBody.indexOf(MARKER);\n                // Find the --- separator 
before history\n                const separatorIdx = oldBody.lastIndexOf('---', histStart);\n                const endIdx = separatorIdx > markerIdx ? separatorIdx : histStart;\n                previousReport = oldBody.slice(markerIdx + MARKER.length, endIdx).trim();\n              } else {\n                // No history yet — everything after MARKER is the report\n                const markerIdx = oldBody.indexOf(MARKER);\n                if (markerIdx !== -1) {\n                  previousReport = oldBody.slice(markerIdx + MARKER.length).trim();\n                }\n              }\n\n              // Collapse the previous report into a <details> entry\n              if (previousReport) {\n                const scoreMatch = previousReport.match(/Overall:\\s*(\\d+)\\/100/);\n                const score = scoreMatch ? scoreMatch[1] : '?';\n                const dateMatch = previousReport.match(/Generated by.*?·\\s*([^·<\\n*]+)/);\n                const date = dateMatch\n                  ? dateMatch[1].trim()\n                  : new Date().toISOString().slice(0, 16).replace('T', ' ') + ' UTC';\n                const entry = `<details>\\n<summary>📜 ${date} — ${score}/100</summary>\\n\\n${previousReport}\\n\\n</details>`;\n                historyEntries.unshift(entry); // newest first\n              }\n\n              // Enforce max history limit\n              historyEntries = historyEntries.slice(0, MAX_HISTORY);\n            }\n\n            // --- Assemble final comment ---\n            const historySection = historyEntries.length > 0\n              ? 
`\\n\\n---\\n\\n### 📜 Previous runs\\n\\n${HISTORY_START}\\n${historyEntries.join('\\n\\n')}\\n${HISTORY_END}`\n              : '';\n            const finalBody = `${MARKER}\\n${newReport}${historySection}`;\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                comment_id: existing.id, body: finalBody,\n              });\n              console.log(`Updated comment (${historyEntries.length} history entries)`);\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                issue_number: prNumber, body: finalBody,\n              });\n              console.log('Created new PR comment');\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## ⚠️ AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
+export const workflowYaml = "# ──────────────────────────────────────────────────────────────────────\n# AI Literacy Evaluation — GitHub Actions workflow\n# ──────────────────────────────────────────────────────────────────────\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings → Secrets → Actions):\n#     AILF_API_KEY — your API key (starts with ailf_live_sk_)\n#\n#   @sanity/ailf is published with public npm access, so no npm token is\n#   needed to install the CLI.\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Check debug_mode for faster iteration (fewer tests)\n#   - See: https://github.com/sanity-labs/ai-literacy-framework\n# ──────────────────────────────────────────────────────────────────────\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    # Runs on every PR to main by default. 
To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      debug_mode:\n        description: \"Run in debug mode (fewer tests, faster iteration)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.debug_mode && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n            const fs = require('fs');\n\n            // --- Constants ---\n            const MARKER = '<!-- ailf-score-report -->';\n            const HISTORY_START = '<!-- ailf-score-history -->';\n            const HISTORY_END = '<!-- /ailf-score-history -->';\n            const MAX_HISTORY = 3; // keep at most 3 prior runs\n\n            // --- Read new report ---\n            let newReport;\n            try {\n              newReport = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n            } catch {\n              newReport = `## ⚠️ AI Literacy Evaluation\\n\\nNo report generated. 
Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n\n            const prNumber = context.issue?.number || context.payload?.pull_request?.number;\n            if (!prNumber) {\n              console.log('No PR number found, skipping comment');\n              return;\n            }\n\n            // --- Find existing comment ---\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: prNumber,\n            });\n            const existing = comments.find(c => c.body?.includes(MARKER));\n\n            // --- Build history from previous comment ---\n            let historyEntries = [];\n            if (existing) {\n              const oldBody = existing.body || '';\n\n              // Collect existing collapsed history entries\n              const histStart = oldBody.indexOf(HISTORY_START);\n              const histEnd = oldBody.indexOf(HISTORY_END);\n              if (histStart !== -1 && histEnd !== -1) {\n                const historyContent = oldBody.slice(histStart + HISTORY_START.length, histEnd).trim();\n                // Split on </details> boundaries to get individual entries\n                if (historyContent) {\n                  historyEntries = historyContent\n                    .split(/<\\/details>\\s*/)\n                    .map(s => s.trim())\n                    .filter(s => s.startsWith('<details>'))\n                    .map(s => s + '\\n</details>');\n                }\n              }\n\n              // Extract the current report (will become the newest history entry)\n              let previousReport = '';\n              if (histStart !== -1) {\n                // Report is between MARKER and the \"Previous runs\" heading (or history section)\n                const markerIdx = oldBody.indexOf(MARKER);\n                // Find the --- separator 
before history\n                const separatorIdx = oldBody.lastIndexOf('---', histStart);\n                const endIdx = separatorIdx > markerIdx ? separatorIdx : histStart;\n                previousReport = oldBody.slice(markerIdx + MARKER.length, endIdx).trim();\n              } else {\n                // No history yet — everything after MARKER is the report\n                const markerIdx = oldBody.indexOf(MARKER);\n                if (markerIdx !== -1) {\n                  previousReport = oldBody.slice(markerIdx + MARKER.length).trim();\n                }\n              }\n\n              // Collapse the previous report into a <details> entry\n              if (previousReport) {\n                const scoreMatch = previousReport.match(/Overall:\\s*(\\d+)\\/100/);\n                const score = scoreMatch ? scoreMatch[1] : '?';\n                const dateMatch = previousReport.match(/Generated by.*?·\\s*([^·<\\n*]+)/);\n                const date = dateMatch\n                  ? dateMatch[1].trim()\n                  : new Date().toISOString().slice(0, 16).replace('T', ' ') + ' UTC';\n                const entry = `<details>\\n<summary>📜 ${date} — ${score}/100</summary>\\n\\n${previousReport}\\n\\n</details>`;\n                historyEntries.unshift(entry); // newest first\n              }\n\n              // Enforce max history limit\n              historyEntries = historyEntries.slice(0, MAX_HISTORY);\n            }\n\n            // --- Assemble final comment ---\n            const historySection = historyEntries.length > 0\n              ? 
`\\n\\n---\\n\\n### 📜 Previous runs\\n\\n${HISTORY_START}\\n${historyEntries.join('\\n\\n')}\\n${HISTORY_END}`\n              : '';\n            const finalBody = `${MARKER}\\n${newReport}${historySection}`;\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                comment_id: existing.id, body: finalBody,\n              });\n              console.log(`Updated comment (${historyEntries.length} history entries)`);\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner, repo: context.repo.repo,\n                issue_number: prNumber, body: finalBody,\n              });\n              console.log('Created new PR comment');\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## ⚠️ AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
 // ---------------------------------------------------------------------------
 // TypeScript template exports (for ailf init --output-format ts)
 // ---------------------------------------------------------------------------

package/dist/_vendor/ailf-core/types/index.d.ts CHANGED Viewed

@@ -309,8 +309,13 @@ export interface StoredTestResult {
      * API error, or refusal). Same semantics as GraderJudgment.outputFailure.
      */
     outputFailure?: boolean;
-    /** The model's generated code/response (truncated to 8000 chars) */
-    responseOutput: string;
+    /**
+     * The model's generated code/response (truncated to 8000 chars).
+     * Populated by the scoring step and used by uploadTestOutputs. Stripped
+     * from the inline shape after upload (D0030) — the full value lives in
+     * the GCS artifact, keyed by `{taskId}::{modelId}`.
+     */
+    responseOutput?: string;
     /** True when responseOutput was truncated from a longer response */
     responseOutputTruncated?: boolean;
     /** Task description (e.g. "Functions - Webhook handler (gold)") */

package/dist/cli.js CHANGED Viewed

@@ -147,6 +147,8 @@ import { createAgentReportCommand } from "./commands/agent-report.js";
 program.addCommand(createAgentReportCommand().helpGroup(CommandGroup.AnalysisReports));
 import { createWeeklyDigestCommand } from "./commands/weekly-digest.js";
 program.addCommand(createWeeklyDigestCommand().helpGroup(CommandGroup.AnalysisReports));
+import { createCheckStalenessCommand } from "./commands/check-staleness.js";
+program.addCommand(createCheckStalenessCommand().helpGroup(CommandGroup.AnalysisReports));
 // ── Grader Reliability ────────────────────────────────────────────────
 import { createGraderCommand } from "./commands/grader/index.js";
 program.addCommand(createGraderCommand().helpGroup(CommandGroup.GraderReliability));

package/dist/commands/check-staleness.d.ts ADDED Viewed

@@ -0,0 +1,14 @@
+/**
+ * check-staleness command — verifies recent evaluation reports exist.
+ *
+ * Exits 0 when the most recent report in the Sanity Content Lake is within
+ * the max-age window, 1 otherwise (including "no reports at all"). Emits a
+ * single JSON line on stdout summarizing the decision so CI can pipe it
+ * directly into an alert payload.
+ *
+ * Used by the scheduled staleness workflow to detect silent pipeline
+ * failures — cases where scheduled evaluations stop producing reports but
+ * no workflow run fails loudly enough to be noticed.
+ */
+import { Command } from "commander";
+export declare function createCheckStalenessCommand(): Command;

package/dist/commands/check-staleness.js ADDED Viewed

@@ -0,0 +1,74 @@
+/**
+ * check-staleness command — verifies recent evaluation reports exist.
+ *
+ * Exits 0 when the most recent report in the Sanity Content Lake is within
+ * the max-age window, 1 otherwise (including "no reports at all"). Emits a
+ * single JSON line on stdout summarizing the decision so CI can pipe it
+ * directly into an alert payload.
+ *
+ * Used by the scheduled staleness workflow to detect silent pipeline
+ * failures — cases where scheduled evaluations stop producing reports but
+ * no workflow run fails loudly enough to be noticed.
+ */
+import { Command } from "commander";
+/**
+ * Build the `check-staleness` CLI command.
+ *
+ * The action fetches the most recent `ailf.report` document, prints a single
+ * JSON line describing the verdict to stdout, and sets `process.exitCode` to
+ * 1 when the newest report is older than `--max-age` days (or no usable
+ * report is found) and to 0 otherwise.
+ *
+ * @returns The configured commander `Command` instance.
+ * @throws {Error} From the action when `--max-age` does not parse to a
+ *   non-negative number, so a mistyped flag fails with a clear message
+ *   instead of an opaque `RangeError` from `Date#toISOString`.
+ */
+export function createCheckStalenessCommand() {
+    return new Command("check-staleness")
+        .description("Exit 1 if no evaluation report has been produced within the max-age window")
+        .option("--max-age <days>", "Max age in days before reports are considered stale", (v) => Number.parseInt(v, 10), 3)
+        .action(async (opts) => {
+        const MS_PER_DAY = 24 * 60 * 60 * 1000;
+        const maxAgeDays = opts.maxAge;
+        // Validate before any I/O. `Number.parseInt` yields NaN for
+        // non-numeric input; NaN would propagate into `floorDays` and make
+        // `new Date(NaN).toISOString()` throw "Invalid time value". A
+        // negative window is equally meaningless, so reject both up front.
+        if (!Number.isFinite(maxAgeDays) || maxAgeDays < 0) {
+            throw new Error(`--max-age must be a non-negative integer number of days (got ${String(maxAgeDays)})`);
+        }
+        const { getSanityClient } = await import("../sanity/client.js");
+        // Resolve report-store credentials with the same precedence as
+        // weekly-digest.ts and composition-root.ts — AILF_REPORT_* wins over
+        // the evaluated-source SANITY_* defaults so the staleness probe tracks
+        // the actual report dataset even when it diverges from the eval source.
+        const client = getSanityClient({
+            dataset: process.env.AILF_REPORT_DATASET,
+            projectId: process.env.AILF_REPORT_PROJECT_ID,
+            token: process.env.AILF_REPORT_SANITY_API_TOKEN ??
+                process.env.SANITY_API_TOKEN,
+        });
+        // Bound the GROQ sort with a `completedAt > $floor` filter. Beyond
+        // ~10,000 reports the unbounded `order(completedAt desc)[0]` scan
+        // becomes a noticeable cost; a floor proportional to the max-age
+        // window keeps the scan cheap regardless of corpus size. The factor
+        // of 10× max-age gives plenty of headroom — if the last report
+        // predates the floor, the absence of any result still yields the
+        // correct "stale" verdict.
+        const floorDays = Math.max(maxAgeDays * 10, 30);
+        const floor = new Date(Date.now() - floorDays * MS_PER_DAY).toISOString();
+        const QUERY = `*[_type == "ailf.report" && completedAt > $floor] | order(completedAt desc)[0]{
+        "reportId": reportId,
+        "completedAt": completedAt,
+        "tag": tag
+      }`;
+        const latest = await client.fetch(QUERY, { floor });
+        // Use `process.exitCode` + `return` rather than `process.exit()` so
+        // stdout flushes cleanly when the caller captures via `$(...)` — a
+        // hard exit can drop buffered output on piped captures. Matches the
+        // pattern used by agent-report.ts, capture-list.ts, etc.
+        if (!latest || !latest.completedAt) {
+            console.log(JSON.stringify({
+                floorDays,
+                maxAgeDays,
+                reason: "no-reports",
+                stale: true,
+            }));
+            process.exitCode = 1;
+            return;
+        }
+        const ageMs = Date.now() - new Date(latest.completedAt).getTime();
+        // An unparsable `completedAt` makes `ageMs` NaN, and `NaN > maxAgeDays`
+        // is false — which would report "fresh" and exit 0. A staleness probe
+        // must fail closed, so treat a timestamp we cannot read as stale.
+        if (Number.isNaN(ageMs)) {
+            console.log(JSON.stringify({
+                floorDays,
+                latestCompletedAt: latest.completedAt,
+                latestReportId: latest.reportId,
+                latestTag: latest.tag,
+                maxAgeDays,
+                reason: "invalid-completed-at",
+                stale: true,
+            }));
+            process.exitCode = 1;
+            return;
+        }
+        const ageDays = Number((ageMs / MS_PER_DAY).toFixed(2));
+        const stale = ageDays > maxAgeDays;
+        console.log(JSON.stringify({
+            ageDays,
+            floorDays,
+            latestCompletedAt: latest.completedAt,
+            latestReportId: latest.reportId,
+            latestTag: latest.tag,
+            maxAgeDays,
+            stale,
+        }));
+        process.exitCode = stale ? 1 : 0;
+    });
+}

package/dist/commands/init.js CHANGED Viewed

@@ -250,10 +250,9 @@ async function runInit(opts) {
     console.log(`  1. Edit the example tasks in ${rel(targetDir, tasksDir)}/ — update`);
     console.log("     slugs and prompts for your documentation");
     console.log(`  2. Validate locally: npx @sanity/ailf@latest validate-tasks .ailf/tasks/`);
-    console.log("  3. Add two GitHub Actions secrets");
+    console.log("  3. Add a GitHub Actions secret");
     console.log("     (Settings → Secrets and variables → Actions):");
     console.log("     • AILF_API_KEY — your API key (starts with ailf_live_sk_)");
-    console.log("     • NPM_TOKEN   — npm token with read access to @sanity scope");
     console.log("  4. Push — the workflow at .github/workflows/ailf-eval.yml runs");
     console.log("     automatically on PRs");
     if (format === "ts") {
@@ -262,14 +261,11 @@ async function runInit(opts) {
         console.log("     via defineTask() from @sanity/ailf-core.");
     }
     console.log();
-    console.log("  🔑 Retrieve secrets from 1Password (Sanity employees):");
+    console.log("  🔑 Retrieve the API key from 1Password (Sanity employees):");
     console.log();
     console.log("     # Shared dev API key (for local testing and CI)");
     console.log('     op read "op://Shared/AI Literacy Framework - Shared API Tokens/AILF_API_KEY_DEV"');
     console.log();
-    console.log("     # npm token (read access to @sanity scope)");
-    console.log('     op read "op://Shared/AI Literacy Framework - Shared API Tokens/NPM_TOKEN"');
-    console.log();
     console.log("     Not a Sanity employee? Request an API key from the AILF team.");
     console.log();
     console.log("  💡 Test locally before pushing:");

package/dist/orchestration/steps/publish-report-step.js CHANGED Viewed

@@ -113,11 +113,20 @@ export class PublishReportStep {
             tag: this.options.publishTag ?? ctx.config.publishTag,
             title,
         };
-        // Upload test output artifacts to GCS (D0030 — non-blocking, P5)
+        // Upload test output artifacts to GCS (D0030 — non-blocking, P5).
+        // When upload succeeds, strip responseOutput from the inline
+        // testResults[] so the Content Lake document carries only the slim
+        // shape; the full output lives in the GCS artifact. When upload
+        // fails, leave the inline shape intact so Studio's drill-down UI
+        // still works via the backward-compat fallback.
         if (ctx.artifactUploader && summary.testResults?.length) {
             const artifactRef = await uploadTestOutputs(ctx.artifactUploader, reportId, now, summary.testResults);
             if (artifactRef) {
                 report.artifacts = { testOutputs: artifactRef };
+                report.summary = {
+                    ...summary,
+                    testResults: summary.testResults.map(slimTestResult),
+                };
             }
         }
         // Share reportId with downstream steps (CallbackStep + orchestrator job update)
@@ -218,6 +227,15 @@ function buildProvenanceInput(summary, ctx, options, autoScope) {
         taskIds,
     };
 }
+/**
+ * Strip the large responseOutput fields from a StoredTestResult so the
+ * remaining object is safe to inline in the Content Lake document (D0030).
+ * The full output lives in the GCS artifact uploaded by uploadTestOutputs.
+ *
+ * The input is not mutated: the result is a new object built by rest
+ * destructuring, i.e. a shallow copy of every own enumerable property
+ * except `responseOutput` and `responseOutputTruncated`.
+ *
+ * @param tr - The test result to slim down.
+ * @returns A shallow copy of `tr` without `responseOutput` and
+ *   `responseOutputTruncated`.
+ */
+function slimTestResult(tr) {
+    const { responseOutput: _o, responseOutputTruncated: _t, ...rest } = tr;
+    return rest;
+}
 /**
  * Extract test outputs from StoredTestResult[] and upload as a single
  * JSON artifact to GCS. The artifact is keyed by `{taskId}::{modelId}`
@@ -230,7 +248,7 @@ async function uploadTestOutputs(uploader, reportId, createdAt, testResults) {
     for (const tr of testResults) {
         const key = `${tr.taskId}::${tr.modelId}`;
         entries[key] = {
-            responseOutput: tr.responseOutput,
+            responseOutput: tr.responseOutput ?? "",
             responseOutputTruncated: tr.responseOutputTruncated ?? false,
         };
     }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@sanity/ailf",
-  "version": "2.6.0",
+  "version": "2.7.1",
   "private": false,
   "publishConfig": {
     "access": "public"
@@ -52,8 +52,8 @@
     "@types/node": "^22.13.1",
     "tsx": "^4.19.2",
     "typescript": "^5.7.3",
-    "@sanity/ailf-core": "0.1.0",
-    "@sanity/ailf-shared": "0.1.0"
+    "@sanity/ailf-shared": "0.1.0",
+    "@sanity/ailf-core": "0.1.0"
   },
   "scripts": {
     "build": "tsc && tsx scripts/bundle-workspace-deps.ts",