npm - @sanity/ailf - Versions diffs - 0.1.5 → 0.1.7 - Mend

@sanity/ailf 0.1.5 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54) hide show

package/dist/_vendor/ailf-core/examples/index.d.ts +1 -1
package/dist/_vendor/ailf-core/examples/index.js +1 -1
package/dist/_vendor/ailf-core/ports/context.d.ts +6 -0
package/dist/_vendor/ailf-core/schemas/pipeline-request.d.ts +1 -53
package/dist/_vendor/ailf-core/schemas/pipeline-request.js +1 -2
package/dist/_vendor/ailf-tasks/cli.d.ts +8 -0
package/dist/_vendor/ailf-tasks/cli.js +61 -0
package/dist/_vendor/ailf-tasks/index.d.ts +13 -0
package/dist/_vendor/ailf-tasks/index.js +16 -0
package/dist/_vendor/ailf-tasks/parser.d.ts +27 -0
package/dist/_vendor/ailf-tasks/parser.js +73 -0
package/dist/_vendor/ailf-tasks/schemas.d.ts +186 -0
package/dist/_vendor/ailf-tasks/schemas.js +176 -0
package/dist/_vendor/ailf-tasks/validation.d.ts +47 -0
package/dist/_vendor/ailf-tasks/validation.js +162 -0
package/dist/adapters/api-client/api-client.d.ts +75 -0
package/dist/adapters/api-client/api-client.js +201 -0
package/dist/adapters/api-client/build-request.d.ts +75 -0
package/dist/adapters/api-client/build-request.js +176 -0
package/dist/adapters/api-client/errors.d.ts +43 -0
package/dist/adapters/api-client/errors.js +68 -0
package/dist/adapters/api-client/format-error.d.ts +22 -0
package/dist/adapters/api-client/format-error.js +48 -0
package/dist/adapters/api-client/index.d.ts +13 -0
package/dist/adapters/api-client/index.js +12 -0
package/dist/adapters/api-client/progress.d.ts +26 -0
package/dist/adapters/api-client/progress.js +69 -0
package/dist/adapters/api-client/remediation.d.ts +19 -0
package/dist/adapters/api-client/remediation.js +76 -0
package/dist/adapters/api-client/types.d.ts +98 -0
package/dist/adapters/api-client/types.js +14 -0
package/dist/adapters/config-sources/file-config-adapter.js +2 -0
package/dist/adapters/task-sources/repo-schemas.d.ts +16 -181
package/dist/adapters/task-sources/repo-schemas.js +27 -184
package/dist/adapters/task-sources/repo-validation.d.ts +5 -46
package/dist/adapters/task-sources/repo-validation.js +5 -161
package/dist/commands/calculate-scores.js +2 -0
package/dist/commands/explain-handler.js +6 -0
package/dist/commands/fetch-docs.js +2 -0
package/dist/commands/generate-configs.js +2 -0
package/dist/commands/init.js +9 -9
package/dist/commands/pipeline-action.d.ts +3 -0
package/dist/commands/pipeline-action.js +13 -0
package/dist/commands/pipeline.d.ts +2 -0
package/dist/commands/pipeline.js +2 -0
package/dist/commands/pr-comment.js +2 -0
package/dist/commands/publish.js +2 -0
package/dist/commands/remote-pipeline.d.ts +27 -0
package/dist/commands/remote-pipeline.js +133 -0
package/dist/commands/remote-results.d.ts +33 -0
package/dist/commands/remote-results.js +97 -0
package/dist/orchestration/build-app-context.js +3 -0
package/dist/pipeline/map-request-to-config.js +2 -0
package/package.json +2 -1

package/dist/_vendor/ailf-core/examples/index.d.ts CHANGED Viewed

@@ -191,4 +191,4 @@ export interface ExampleRecord {
 }
 export declare const EXAMPLES: Record<ExampleType, ExampleRecord>;
 /** GitHub Actions workflow template for AI Literacy evaluation */
-export declare const workflowYaml = "# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n# AI Literacy Evaluation \u2014 GitHub Actions workflow\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n#\n# This workflow submits evaluations to the AILF API when task or config\n# files change in a pull request. 
The API handles all processing\n# (LLM calls, doc fetching, grading, report publishing).\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings \u2192 Secrets \u2192 Actions):\n#     AILF_API_KEY \u2014 your API key (starts with ailf_live_sk_)\n#\n# Customization:\n#   - Adjust `paths` to match your documentation file locations\n#   - Set full_eval to true for comprehensive (slower) evaluation\n#   - See: https://github.com/sanity-labs/ai-literacy-framework/blob/main/docs/API_GATEWAY.md\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    paths:\n      - \".ailf/**\"\n\n  # Manual trigger from the Actions tab\n  workflow_dispatch:\n    inputs:\n      full_eval:\n        description: \"Run full evaluation (all tests, slower)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      pull-requests: write\n    steps:\n      # \u2500\u2500\u2500 Submit evaluation to the AILF API \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n      - name: Submit evaluation\n        id: submit\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          FULL_EVAL: ${{ inputs.full_eval || 'false' }}\n        run: |\n          if [ \"$FULL_EVAL\" = \"true\" ]; then\n            DEBUG_FIELD=\"\"\n          else\n            
DEBUG_FIELD='\"debug\": { \"enabled\": true, \"firstN\": 2 },'\n          fi\n\n          PAYLOAD=$(cat <<EOF\n          {\n            \"mode\": \"baseline\",\n            ${DEBUG_FIELD}\n            \"publish\": true,\n            \"compare\": true\n          }\n          EOF\n          )\n\n          RESPONSE=$(curl -sf -X POST \\\n            -H \"Authorization: Bearer $AILF_API_KEY\" \\\n            -H \"Content-Type: application/json\" \\\n            https://ailf-api.sanity.build/v1/pipeline \\\n            -d \"$PAYLOAD\")\n\n          JOB_ID=$(echo \"$RESPONSE\" | jq -r '.jobId')\n          echo \"job_id=$JOB_ID\" >> $GITHUB_OUTPUT\n          echo \"\uD83D\uDCCB Submitted job: $JOB_ID\"\n\n      # \u2500\u2500\u2500 Poll for results (long-polling) \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n      - name: Wait for results\n        id: results\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n        run: |\n          for i in $(seq 1 40); do\n            RESPONSE=$(curl -s \\\n              -H \"Authorization: Bearer $AILF_API_KEY\" \\\n              -H \"Prefer: wait=25\" \\\n              \"https://ailf-api.sanity.build/v1/jobs/$JOB_ID\")\n\n            STATUS=$(echo \"$RESPONSE\" | jq -r '.status')\n\n            case \"$STATUS\" in\n              completed)\n                echo \"status=completed\" >> $GITHUB_OUTPUT\n                echo \"report_id=$(echo $RESPONSE | jq -r '.reportId // empty')\" >> $GITHUB_OUTPUT\n                echo \"score=$(echo $RESPONSE | jq -r '.score // empty')\" >> $GITHUB_OUTPUT\n                echo \"\u2705 Evaluation completed\"\n                exit 0\n                ;;\n              failed|timed-out)\n                echo \"status=$STATUS\" >> $GITHUB_OUTPUT\n                echo \"::error::Evaluation $STATUS\"\n                exit 1\n                
;;\n              *)\n                echo \"\u23F3 [$i/40] $STATUS\"\n                ;;\n            esac\n          done\n\n          echo \"::error::Timed out waiting for evaluation\"\n          exit 1\n\n      # \u2500\u2500\u2500 Fetch the markdown report \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n      - name: Fetch markdown report\n        id: markdown\n        if: steps.results.outputs.report_id != ''\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          REPORT_ID: ${{ steps.results.outputs.report_id }}\n        run: |\n          REPORT_MD=$(curl -sf \\\n            -H \"Authorization: Bearer $AILF_API_KEY\" \\\n            \"https://ailf-api.sanity.build/v1/reports/$REPORT_ID/markdown\")\n\n          if [ $? -eq 0 ] && [ -n \"$REPORT_MD\" ]; then\n            # Write to a temp file to avoid shell quoting issues\n            echo \"$REPORT_MD\" > /tmp/ailf-report.md\n            echo \"fetched=true\" >> $GITHUB_OUTPUT\n          else\n            echo \"fetched=false\" >> $GITHUB_OUTPUT\n            echo \"::warning::Could not fetch markdown report\"\n          fi\n\n      # \u2500\u2500\u2500 Post results to PR \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n      - name: Post PR comment\n        if: >-\n          always() && github.event_name == 'pull_request' &&\n          steps.submit.outputs.job_id != ''\n        uses: actions/github-script@v7\n        env:\n          JOB_STATUS: ${{ steps.results.outputs.status || 'unknown' }}\n          REPORT_ID: ${{ steps.results.outputs.report_id || '' }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n          SCORE: ${{ steps.results.outputs.score || '' }}\n          
MARKDOWN_FETCHED: ${{ steps.markdown.outputs.fetched || 'false' }}\n        with:\n          script: |\n            const fs = require('fs');\n            const marker = '<!-- ailf-score-report -->';\n            const status = process.env.JOB_STATUS;\n            const reportId = process.env.REPORT_ID;\n            const jobId = process.env.JOB_ID;\n            const score = process.env.SCORE;\n            const mdFetched = process.env.MARKDOWN_FETCHED === 'true';\n\n            let body;\n\n            if (status === 'completed' && mdFetched) {\n              // Use the full markdown report from the API\n              const reportMd = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n              body = `${marker}\\n${reportMd}`;\n              if (reportId) {\n                body += `\\n\uD83D\uDD17 [View in Studio](https://admin.sanity.io/ailf/report/${reportId})`;\n              }\n              body += `\\n\\n<sub>Job: \\`${jobId}\\`</sub>\\n`;\n            } else {\n              // Fallback: minimal comment when markdown is unavailable\n              let icon, message;\n              if (status === 'completed') {\n                icon = '\u2705';\n                message = score\n                  ? 
`Evaluation completed \u2014 score: **${score}/100**`\n                  : 'Evaluation completed successfully.';\n              } else if (status === 'failed' || status === 'timed-out') {\n                icon = '\u26A0\uFE0F';\n                message = `Evaluation ${status}.`;\n              } else {\n                icon = '\u23F3';\n                message = 'Evaluation status unknown (may still be running).';\n              }\n\n              body = `${marker}\\n## ${icon} AI Literacy Evaluation\\n\\n${message}\\n`;\n              if (reportId) {\n                body += `\\n\uD83D\uDD17 [View in Studio](https://admin.sanity.io/ailf/report/${reportId})\\n`;\n              }\n              body += `\\n<sub>Job: \\`${jobId}\\`</sub>\\n`;\n            }\n\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner,\n              repo: context.repo.repo,\n              issue_number: context.issue.number,\n            });\n            const existing = comments.find(c => c.body?.includes(marker));\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner,\n                repo: context.repo.repo,\n                comment_id: existing.id,\n                body,\n              });\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner,\n                repo: context.repo.repo,\n                issue_number: context.issue.number,\n                body,\n              });\n            }\n\n      # \u2500\u2500\u2500 Job summary \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n      - name: Summary\n        if: always()\n        env:\n          JOB_STATUS: ${{ 
steps.results.outputs.status || 'unknown' }}\n          REPORT_ID: ${{ steps.results.outputs.report_id || '' }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n          SCORE: ${{ steps.results.outputs.score || '' }}\n          MARKDOWN_FETCHED: ${{ steps.markdown.outputs.fetched || 'false' }}\n        run: |\n          if [ \"$JOB_STATUS\" = \"completed\" ] && [ \"$MARKDOWN_FETCHED\" = \"true\" ] && [ -f /tmp/ailf-report.md ]; then\n            # Use the full markdown report as the job summary\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            [ -n \"$REPORT_ID\" ] && echo \"\uD83D\uDD17 [View in Studio](https://admin.sanity.io/ailf/report/$REPORT_ID)\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"<sub>Job: \\`$JOB_ID\\`</sub>\" >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            # Fallback: minimal table\n            {\n              echo \"## \uD83D\uDCCA AI Literacy Evaluation\"\n              echo \"\"\n              echo \"| Field | Value |\"\n              echo \"|-------|-------|\"\n              echo \"| Job | \\`$JOB_ID\\` |\"\n              echo \"| Status | $JOB_STATUS |\"\n              [ -n \"$SCORE\" ] && echo \"| Score | $SCORE/100 |\"\n              [ -n \"$REPORT_ID\" ] && echo \"| Report | [$REPORT_ID](https://admin.sanity.io/ailf/report/$REPORT_ID) |\"\n            } >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
+export declare const workflowYaml = "# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n# AI Literacy Evaluation \u2014 GitHub Actions workflow\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings \u2192 Secrets \u2192 Actions):\n#     AILF_API_KEY \u2014 your API key (starts with ailf_live_sk_)\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Set full_eval to true for comprehensive evaluation\n#   - See: https://github.com/sanity-io/ai-literacy-framework\n# \u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    
branches: [main]\n    # Runs on every PR to main by default. To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      full_eval:\n        description: \"Run full evaluation (all tests, slower)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.full_eval != 'true' && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n            const fs = require('fs');\n            const marker = '<!-- ailf-score-report -->';\n            let body;\n            try {\n              const report = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n              body = `${marker}\\n${report}`;\n            } catch {\n              body = `${marker}\\n## \u26A0\uFE0F AI Literacy Evaluation\\n\\nNo report generated. 
Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: context.issue.number,\n            });\n            const existing = comments.find(c => c.body?.includes(marker));\n            const params = {\n              owner: context.repo.owner, repo: context.repo.repo,\n              body,\n            };\n            if (existing) {\n              await github.rest.issues.updateComment({ ...params, comment_id: existing.id });\n            } else {\n              await github.rest.issues.createComment({ ...params, issue_number: context.issue.number });\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## \u26A0\uFE0F AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";

package/dist/_vendor/ailf-core/examples/index.js CHANGED Viewed

@@ -289,4 +289,4 @@ export const EXAMPLES = {
 // Raw file exports (non-data files, exported as raw strings)
 // ---------------------------------------------------------------------------
 /** GitHub Actions workflow template for AI Literacy evaluation */
-export const workflowYaml = "# ──────────────────────────────────────────────────────────────────────\n# AI Literacy Evaluation — GitHub Actions workflow\n# ──────────────────────────────────────────────────────────────────────\n#\n# This workflow submits evaluations to the AILF API when task or config\n# files change in a pull request. The API handles all processing\n# (LLM calls, doc fetching, grading, report publishing).\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings → Secrets → Actions):\n#     AILF_API_KEY — your API key (starts with ailf_live_sk_)\n#\n# Customization:\n#   - Adjust `paths` to match your documentation file locations\n#   - Set full_eval to true for comprehensive (slower) evaluation\n#   - See: https://github.com/sanity-labs/ai-literacy-framework/blob/main/docs/API_GATEWAY.md\n# ──────────────────────────────────────────────────────────────────────\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    paths:\n      - \".ailf/**\"\n\n  # Manual trigger from the Actions tab\n  workflow_dispatch:\n    inputs:\n      full_eval:\n        description: \"Run full evaluation (all tests, slower)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      pull-requests: write\n    steps:\n      # ─── Submit evaluation to the AILF API ─────────────────────\n      - name: Submit evaluation\n        id: submit\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          FULL_EVAL: ${{ inputs.full_eval || 'false' }}\n        run: |\n          if [ \"$FULL_EVAL\" = \"true\" ]; then\n            DEBUG_FIELD=\"\"\n          else\n            DEBUG_FIELD='\"debug\": { \"enabled\": true, \"firstN\": 2 },'\n          fi\n\n          PAYLOAD=$(cat <<EOF\n          {\n            \"mode\": 
\"baseline\",\n            ${DEBUG_FIELD}\n            \"publish\": true,\n            \"compare\": true\n          }\n          EOF\n          )\n\n          RESPONSE=$(curl -sf -X POST \\\n            -H \"Authorization: Bearer $AILF_API_KEY\" \\\n            -H \"Content-Type: application/json\" \\\n            https://ailf-api.sanity.build/v1/pipeline \\\n            -d \"$PAYLOAD\")\n\n          JOB_ID=$(echo \"$RESPONSE\" | jq -r '.jobId')\n          echo \"job_id=$JOB_ID\" >> $GITHUB_OUTPUT\n          echo \"📋 Submitted job: $JOB_ID\"\n\n      # ─── Poll for results (long-polling) ───────────────────────\n      - name: Wait for results\n        id: results\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n        run: |\n          for i in $(seq 1 40); do\n            RESPONSE=$(curl -s \\\n              -H \"Authorization: Bearer $AILF_API_KEY\" \\\n              -H \"Prefer: wait=25\" \\\n              \"https://ailf-api.sanity.build/v1/jobs/$JOB_ID\")\n\n            STATUS=$(echo \"$RESPONSE\" | jq -r '.status')\n\n            case \"$STATUS\" in\n              completed)\n                echo \"status=completed\" >> $GITHUB_OUTPUT\n                echo \"report_id=$(echo $RESPONSE | jq -r '.reportId // empty')\" >> $GITHUB_OUTPUT\n                echo \"score=$(echo $RESPONSE | jq -r '.score // empty')\" >> $GITHUB_OUTPUT\n                echo \"✅ Evaluation completed\"\n                exit 0\n                ;;\n              failed|timed-out)\n                echo \"status=$STATUS\" >> $GITHUB_OUTPUT\n                echo \"::error::Evaluation $STATUS\"\n                exit 1\n                ;;\n              *)\n                echo \"⏳ [$i/40] $STATUS\"\n                ;;\n            esac\n          done\n\n          echo \"::error::Timed out waiting for evaluation\"\n          exit 1\n\n      # ─── Fetch the markdown report ─────────────────────────────\n      - name: Fetch 
markdown report\n        id: markdown\n        if: steps.results.outputs.report_id != ''\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n          REPORT_ID: ${{ steps.results.outputs.report_id }}\n        run: |\n          REPORT_MD=$(curl -sf \\\n            -H \"Authorization: Bearer $AILF_API_KEY\" \\\n            \"https://ailf-api.sanity.build/v1/reports/$REPORT_ID/markdown\")\n\n          if [ $? -eq 0 ] && [ -n \"$REPORT_MD\" ]; then\n            # Write to a temp file to avoid shell quoting issues\n            echo \"$REPORT_MD\" > /tmp/ailf-report.md\n            echo \"fetched=true\" >> $GITHUB_OUTPUT\n          else\n            echo \"fetched=false\" >> $GITHUB_OUTPUT\n            echo \"::warning::Could not fetch markdown report\"\n          fi\n\n      # ─── Post results to PR ────────────────────────────────────\n      - name: Post PR comment\n        if: >-\n          always() && github.event_name == 'pull_request' &&\n          steps.submit.outputs.job_id != ''\n        uses: actions/github-script@v7\n        env:\n          JOB_STATUS: ${{ steps.results.outputs.status || 'unknown' }}\n          REPORT_ID: ${{ steps.results.outputs.report_id || '' }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n          SCORE: ${{ steps.results.outputs.score || '' }}\n          MARKDOWN_FETCHED: ${{ steps.markdown.outputs.fetched || 'false' }}\n        with:\n          script: |\n            const fs = require('fs');\n            const marker = '<!-- ailf-score-report -->';\n            const status = process.env.JOB_STATUS;\n            const reportId = process.env.REPORT_ID;\n            const jobId = process.env.JOB_ID;\n            const score = process.env.SCORE;\n            const mdFetched = process.env.MARKDOWN_FETCHED === 'true';\n\n            let body;\n\n            if (status === 'completed' && mdFetched) {\n              // Use the full markdown report from the API\n              const reportMd = 
fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n              body = `${marker}\\n${reportMd}`;\n              if (reportId) {\n                body += `\\n🔗 [View in Studio](https://admin.sanity.io/ailf/report/${reportId})`;\n              }\n              body += `\\n\\n<sub>Job: \\`${jobId}\\`</sub>\\n`;\n            } else {\n              // Fallback: minimal comment when markdown is unavailable\n              let icon, message;\n              if (status === 'completed') {\n                icon = '✅';\n                message = score\n                  ? `Evaluation completed — score: **${score}/100**`\n                  : 'Evaluation completed successfully.';\n              } else if (status === 'failed' || status === 'timed-out') {\n                icon = '⚠️';\n                message = `Evaluation ${status}.`;\n              } else {\n                icon = '⏳';\n                message = 'Evaluation status unknown (may still be running).';\n              }\n\n              body = `${marker}\\n## ${icon} AI Literacy Evaluation\\n\\n${message}\\n`;\n              if (reportId) {\n                body += `\\n🔗 [View in Studio](https://admin.sanity.io/ailf/report/${reportId})\\n`;\n              }\n              body += `\\n<sub>Job: \\`${jobId}\\`</sub>\\n`;\n            }\n\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner,\n              repo: context.repo.repo,\n              issue_number: context.issue.number,\n            });\n            const existing = comments.find(c => c.body?.includes(marker));\n\n            if (existing) {\n              await github.rest.issues.updateComment({\n                owner: context.repo.owner,\n                repo: context.repo.repo,\n                comment_id: existing.id,\n                body,\n              });\n            } else {\n              await github.rest.issues.createComment({\n                owner: context.repo.owner,\n         
       repo: context.repo.repo,\n                issue_number: context.issue.number,\n                body,\n              });\n            }\n\n      # ─── Job summary ───────────────────────────────────────────\n      - name: Summary\n        if: always()\n        env:\n          JOB_STATUS: ${{ steps.results.outputs.status || 'unknown' }}\n          REPORT_ID: ${{ steps.results.outputs.report_id || '' }}\n          JOB_ID: ${{ steps.submit.outputs.job_id }}\n          SCORE: ${{ steps.results.outputs.score || '' }}\n          MARKDOWN_FETCHED: ${{ steps.markdown.outputs.fetched || 'false' }}\n        run: |\n          if [ \"$JOB_STATUS\" = \"completed\" ] && [ \"$MARKDOWN_FETCHED\" = \"true\" ] && [ -f /tmp/ailf-report.md ]; then\n            # Use the full markdown report as the job summary\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            [ -n \"$REPORT_ID\" ] && echo \"🔗 [View in Studio](https://admin.sanity.io/ailf/report/$REPORT_ID)\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"<sub>Job: \\`$JOB_ID\\`</sub>\" >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            # Fallback: minimal table\n            {\n              echo \"## 📊 AI Literacy Evaluation\"\n              echo \"\"\n              echo \"| Field | Value |\"\n              echo \"|-------|-------|\"\n              echo \"| Job | \\`$JOB_ID\\` |\"\n              echo \"| Status | $JOB_STATUS |\"\n              [ -n \"$SCORE\" ] && echo \"| Score | $SCORE/100 |\"\n              [ -n \"$REPORT_ID\" ] && echo \"| Report | [$REPORT_ID](https://admin.sanity.io/ailf/report/$REPORT_ID) |\"\n            } >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";
+export const workflowYaml = "# ──────────────────────────────────────────────────────────────────────\n# AI Literacy Evaluation — GitHub Actions workflow\n# ──────────────────────────────────────────────────────────────────────\n#\n# Evaluates your documentation quality on every pull request.\n# The AILF CLI reads your .ailf/tasks/ definitions, submits them\n# to the AILF API for evaluation, and writes a score report.\n#\n# Prerequisites:\n#   Add one secret to your repository (Settings → Secrets → Actions):\n#     AILF_API_KEY — your API key (starts with ailf_live_sk_)\n#\n# Customization:\n#   - Narrow the trigger paths to reduce cost (see comment below)\n#   - Set full_eval to true for comprehensive evaluation\n#   - See: https://github.com/sanity-io/ai-literacy-framework\n# ──────────────────────────────────────────────────────────────────────\n\nname: AI Literacy Eval\n\non:\n  pull_request:\n    branches: [main]\n    # Runs on every PR to main by default. To reduce cost:\n    #   paths: [\".ailf/**\", \"docs/**\"]\n\n  workflow_dispatch:\n    inputs:\n      full_eval:\n        description: \"Run full evaluation (all tests, slower)\"\n        type: boolean\n        default: false\n\nconcurrency:\n  group: ailf-eval-${{ github.event.pull_request.number || github.ref }}\n  cancel-in-progress: true\n\njobs:\n  evaluate:\n    name: AI Literacy Evaluation\n    runs-on: ubuntu-latest\n    permissions:\n      contents: read\n      pull-requests: write\n    steps:\n      - uses: actions/checkout@v4\n\n      - name: Run evaluation\n        id: eval\n        env:\n          AILF_API_KEY: ${{ secrets.AILF_API_KEY }}\n        run: |\n          npx @sanity/ailf@latest pipeline --remote \\\n            --output /tmp/ailf-report.md \\\n            ${{ inputs.full_eval != 'true' && '--debug' || '' }}\n\n      - name: Post PR comment\n        if: always() && github.event_name == 'pull_request'\n        uses: actions/github-script@v7\n        with:\n          script: |\n       
     const fs = require('fs');\n            const marker = '<!-- ailf-score-report -->';\n            let body;\n            try {\n              const report = fs.readFileSync('/tmp/ailf-report.md', 'utf-8');\n              body = `${marker}\\n${report}`;\n            } catch {\n              body = `${marker}\\n## ⚠️ AI Literacy Evaluation\\n\\nNo report generated. Check the [workflow logs](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}).`;\n            }\n            const { data: comments } = await github.rest.issues.listComments({\n              owner: context.repo.owner, repo: context.repo.repo,\n              issue_number: context.issue.number,\n            });\n            const existing = comments.find(c => c.body?.includes(marker));\n            const params = {\n              owner: context.repo.owner, repo: context.repo.repo,\n              body,\n            };\n            if (existing) {\n              await github.rest.issues.updateComment({ ...params, comment_id: existing.id });\n            } else {\n              await github.rest.issues.createComment({ ...params, issue_number: context.issue.number });\n            }\n\n      - name: Summary\n        if: always()\n        run: |\n          if [ -f /tmp/ailf-report.md ]; then\n            cat /tmp/ailf-report.md >> \"$GITHUB_STEP_SUMMARY\"\n          else\n            echo \"## ⚠️ AI Literacy Evaluation\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"\" >> \"$GITHUB_STEP_SUMMARY\"\n            echo \"No report generated. Check the workflow logs.\" >> \"$GITHUB_STEP_SUMMARY\"\n          fi\n";

package/dist/_vendor/ailf-core/ports/context.d.ts CHANGED Viewed

@@ -106,6 +106,12 @@ export interface ResolvedConfig {
     };
     /** Job ID for tracking API-triggered evaluations in the Content Lake */
     jobId?: string;
+    /** Whether to run in remote mode (submit to AILF API) */
+    remote: boolean;
+    /** AILF API base URL */
+    apiUrl: string;
+    /** AILF API key (from AILF_API_KEY env var) */
+    apiKey?: string;
 }
 /**
  * Application context — the complete dependency carrier.

package/dist/_vendor/ailf-core/schemas/pipeline-request.d.ts CHANGED Viewed

@@ -40,59 +40,7 @@ export declare const PipelineRequestSchema: z.ZodObject<{
     gapAnalysis: z.ZodOptional<z.ZodBoolean>;
     graderReplications: z.ZodOptional<z.ZodNumber>;
     headers: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodString>>;
-    inlineTasks: z.ZodOptional<z.ZodArray<z.ZodObject<{
-        assert: z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
-            criteria: z.ZodArray<z.ZodString>;
-            template: z.ZodString;
-            type: z.ZodLiteral<"llm-rubric">;
-            weight: z.ZodOptional<z.ZodNumber>;
-        }, z.core.$strip>, z.ZodObject<{
-            type: z.ZodLiteral<"contains">;
-            value: z.ZodString;
-            weight: z.ZodOptional<z.ZodNumber>;
-        }, z.core.$strip>, z.ZodObject<{
-            type: z.ZodLiteral<"contains-any">;
-            value: z.ZodArray<z.ZodString>;
-            weight: z.ZodOptional<z.ZodNumber>;
-        }, z.core.$strip>, z.ZodObject<{
-            type: z.ZodLiteral<"not-contains">;
-            value: z.ZodString;
-            weight: z.ZodOptional<z.ZodNumber>;
-        }, z.core.$strip>, z.ZodObject<{
-            type: z.ZodLiteral<"javascript">;
-            value: z.ZodString;
-            weight: z.ZodOptional<z.ZodNumber>;
-        }, z.core.$strip>]>>;
-        baseline: z.ZodOptional<z.ZodObject<{
-            enabled: z.ZodOptional<z.ZodBoolean>;
-            rubric: z.ZodOptional<z.ZodEnum<{
-                full: "full";
-                abbreviated: "abbreviated";
-                none: "none";
-            }>>;
-        }, z.core.$strip>>;
-        canonical_docs: z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
-            reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
-            slug: z.ZodString;
-        }, z.core.$strip>, z.ZodObject<{
-            path: z.ZodString;
-            reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
-        }, z.core.$strip>, z.ZodObject<{
-            id: z.ZodString;
-            reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
-        }, z.core.$strip>, z.ZodObject<{
-            perspective: z.ZodString;
-            reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
-        }, z.core.$strip>]>>;
-        description: z.ZodString;
-        doc_coverage: z.ZodOptional<z.ZodBoolean>;
-        id: z.ZodString;
-        reference_solution: z.ZodString;
-        vars: z.ZodObject<{
-            docs: z.ZodString;
-            task: z.ZodString;
-        }, z.core.$loose>;
-    }, z.core.$strip>>>;
+    inlineTasks: z.ZodOptional<z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>>>;
     jobId: z.ZodOptional<z.ZodString>;
     mode: z.ZodOptional<z.ZodEnum<{
         agentic: "agentic";

package/dist/_vendor/ailf-core/schemas/pipeline-request.js CHANGED Viewed

@@ -13,7 +13,6 @@
  * @see packages/eval/src/pipeline/map-request-to-config.ts — maps to ResolvedConfig
  */
 import { z } from "zod";
-import { SingleTaskSchema } from "./pipeline.js";
 // ---------------------------------------------------------------------------
 // Debug options — boolean shorthand or structured object
 // ---------------------------------------------------------------------------
@@ -49,7 +48,7 @@ export const PipelineRequestSchema = z.object({
     gapAnalysis: z.boolean().optional(),
     graderReplications: z.number().int().positive().optional(),
     headers: z.record(z.string(), z.string()).optional(),
-    inlineTasks: z.array(SingleTaskSchema).optional(),
+    inlineTasks: z.array(z.record(z.string(), z.unknown())).optional(),
     jobId: z.string().optional(),
     mode: z.enum(["baseline", "agentic", "observed", "full"]).optional(),
     noCache: z.boolean().optional(),

package/dist/_vendor/ailf-tasks/cli.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+/**
+ * cli.ts — Minimal CLI for standalone task validation.
+ *
+ * Usage:
+ *   npx @sanity/ailf-tasks validate .ailf/tasks/
+ *   npx @sanity/ailf-tasks validate             # defaults to .ailf/tasks/
+ */
+/**
+ * CLI entry point: reads the command from `process.argv` and dispatches it.
+ *
+ * `validate [dir]` validates task files (dir defaults to `.ailf/tasks`);
+ * `--help`, `-h`, or no command prints usage; any other command prints an
+ * error plus usage and exits the process with code 1.
+ */
+export declare function run(): void;

package/dist/_vendor/ailf-tasks/cli.js ADDED Viewed

@@ -0,0 +1,61 @@
+/**
+ * cli.ts — Minimal CLI for standalone task validation.
+ *
+ * Usage:
+ *   npx @sanity/ailf-tasks validate .ailf/tasks/
+ *   npx @sanity/ailf-tasks validate             # defaults to .ailf/tasks/
+ */
+import { loadTaskDir } from "./parser.js";
+import { formatValidationResult, validateRepoTasks } from "./validation.js";
+export function run() {
+    const args = process.argv.slice(2);
+    const command = args[0];
+    if (command === "validate") {
+        const dir = args[1] ?? ".ailf/tasks";
+        validateCommand(dir);
+    }
+    else if (command === "--help" ||
+        command === "-h" ||
+        command === undefined) {
+        printUsage();
+    }
+    else {
+        console.error(`Unknown command: ${command}`);
+        printUsage();
+        process.exit(1);
+    }
+}
+function validateCommand(dir) {
+    try {
+        const tasks = loadTaskDir(dir);
+        // Run semantic validation
+        const result = validateRepoTasks(tasks);
+        const formatted = formatValidationResult(result);
+        console.log(`✅ ${tasks.length} task(s) validated from ${dir}`);
+        for (const task of tasks) {
+            console.log(`   ${task.id} — ${task.description}`);
+        }
+        if (result.warnings.length > 0 || result.errors.length > 0) {
+            console.log("");
+            console.log(formatted);
+        }
+        if (!result.valid) {
+            process.exit(1);
+        }
+    }
+    catch (err) {
+        console.error(`❌ ${err instanceof Error ? err.message : String(err)}`);
+        process.exit(1);
+    }
+}
+function printUsage() {
+    console.log("Usage: ailf-tasks <command> [options]");
+    console.log("");
+    console.log("Commands:");
+    console.log("  validate [dir]  Validate task YAML files (default: .ailf/tasks/)");
+    console.log("");
+    console.log("Examples:");
+    console.log("  ailf-tasks validate");
+    console.log("  ailf-tasks validate .ailf/tasks/");
+    console.log("  ailf-tasks validate /path/to/tasks/");
+}

package/dist/_vendor/ailf-tasks/index.d.ts ADDED Viewed

@@ -0,0 +1,13 @@
+/**
+ * @sanity/ailf-tasks — Task definition schemas and YAML parser.
+ *
+ * Lightweight package for parsing and validating .ailf/tasks/*.yaml files
+ * without depending on the full AILF CLI or its heavyweight dependencies
+ * (Promptfoo, LLM SDKs, Sanity client).
+ *
+ * Usage:
+ *   import { parseTaskFile, loadTaskDir, RepoTaskSchema } from '@sanity/ailf-tasks'
+ */
+export { CURATED_ASSERTION_TYPES, RepoTaskFileSchema, RepoTaskSchema, RUBRIC_TEMPLATE_NAMES, type CuratedAssertionType, type RepoTask, type RubricTemplateName, } from "./schemas.js";
+export { loadTaskDir, parseTaskFile } from "./parser.js";
+export { detectSnakeCaseFields, formatValidationResult, validateRepoTasks, type ValidationMessage, type ValidationResult, } from "./validation.js";

package/dist/_vendor/ailf-tasks/index.js ADDED Viewed

@@ -0,0 +1,16 @@
+/**
+ * @sanity/ailf-tasks — Task definition schemas and YAML parser.
+ *
+ * Lightweight package for parsing and validating .ailf/tasks/*.yaml files
+ * without depending on the full AILF CLI or its heavyweight dependencies
+ * (Promptfoo, LLM SDKs, Sanity client).
+ *
+ * Usage:
+ *   import { parseTaskFile, loadTaskDir, RepoTaskSchema } from '@sanity/ailf-tasks'
+ */
+// Schemas and types
+export { CURATED_ASSERTION_TYPES, RepoTaskFileSchema, RepoTaskSchema, RUBRIC_TEMPLATE_NAMES, } from "./schemas.js";
+// Parsing
+export { loadTaskDir, parseTaskFile } from "./parser.js";
+// Validation
+export { detectSnakeCaseFields, formatValidationResult, validateRepoTasks, } from "./validation.js";

package/dist/_vendor/ailf-tasks/parser.d.ts ADDED Viewed

@@ -0,0 +1,27 @@
+/**
+ * parser.ts — Standalone task file and directory parsing.
+ *
+ * High-level functions for loading and validating .ailf/tasks/ YAML
+ * files without any dependency on the eval pipeline.
+ *
+ * Usage:
+ *   import { parseTaskFile, loadTaskDir } from '@sanity/ailf-tasks'
+ */
+import { type RepoTask } from "./schemas.js";
+/**
+ * Parse a single task YAML string and return validated tasks.
+ *
+ * The top level of the document must be a YAML array of task definitions.
+ *
+ * @param content - Raw YAML string content
+ * @param filename - Source filename, used only in error messages
+ *   (defaults to `"<string>"`)
+ * @returns Validated array of RepoTask objects
+ * @throws Error if YAML parsing fails, the document is not an array, or
+ *   Zod validation fails
+ */
+export declare function parseTaskFile(content: string, filename?: string): RepoTask[];
+/**
+ * Load and parse all task YAML files from a directory.
+ *
+ * Only direct entries whose names end in `.yaml` or `.yml` are read; names
+ * starting with `.` are skipped. Files are processed in sorted filename order.
+ *
+ * @param dirPath - Path to directory containing .yaml/.yml files
+ * @returns All validated tasks, concatenated in sorted-filename order
+ * @throws Error if directory not found, no YAML files, or validation fails
+ */
+export declare function loadTaskDir(dirPath: string): RepoTask[];

package/dist/_vendor/ailf-tasks/parser.js ADDED Viewed

@@ -0,0 +1,73 @@
+/**
+ * parser.ts — Standalone task file and directory parsing.
+ *
+ * High-level functions for loading and validating .ailf/tasks/ YAML
+ * files without any dependency on the eval pipeline.
+ *
+ * Usage:
+ *   import { parseTaskFile, loadTaskDir } from '@sanity/ailf-tasks'
+ */
+import { existsSync, readdirSync, readFileSync } from "fs";
+import { resolve } from "path";
+import { load } from "js-yaml";
+import { RepoTaskFileSchema } from "./schemas.js";
+// ---------------------------------------------------------------------------
+// Public API
+// ---------------------------------------------------------------------------
+/**
+ * Parse a single task YAML string and return validated tasks.
+ *
+ * @param content - Raw YAML string content
+ * @param filename - Source filename (for error messages)
+ * @returns Validated array of RepoTask objects
+ * @throws Error if YAML parsing or Zod validation fails
+ */
+export function parseTaskFile(content, filename = "<string>") {
+    const parsed = load(content);
+    if (!Array.isArray(parsed)) {
+        throw new Error(`${filename} did not parse to an array of tasks. ` +
+            "Task files must contain a YAML array of task definitions.");
+    }
+    const result = RepoTaskFileSchema.safeParse(parsed);
+    if (!result.success) {
+        const messages = result.error.issues
+            .map((i) => `  [${i.path.join(".")}]: ${i.message}`)
+            .join("\n");
+        throw new Error(`Invalid task file "${filename}":\n${messages}`);
+    }
+    return result.data;
+}
+/**
+ * Load and parse all task YAML files from a directory.
+ *
+ * @param dirPath - Path to directory containing .yaml/.yml files
+ * @returns All validated tasks, sorted by filename
+ * @throws Error if directory not found, no YAML files, or validation fails
+ */
+export function loadTaskDir(dirPath) {
+    if (!existsSync(dirPath)) {
+        throw new Error(`Tasks directory not found: ${dirPath}\n` +
+            "  Expected a directory containing .ailf/tasks/*.yaml files.");
+    }
+    const yamlFiles = readdirSync(dirPath)
+        .filter((f) => (f.endsWith(".yaml") || f.endsWith(".yml")) && !f.startsWith("."))
+        .sort();
+    if (yamlFiles.length === 0) {
+        throw new Error(`No YAML files found in ${dirPath}\n` +
+            "  Expected .ailf/tasks/*.yaml files with task definitions.");
+    }
+    const allTasks = [];
+    for (const file of yamlFiles) {
+        const filePath = resolve(dirPath, file);
+        const content = readFileSync(filePath, "utf-8");
+        try {
+            const tasks = parseTaskFile(content, file);
+            allTasks.push(...tasks);
+        }
+        catch (err) {
+            const msg = err instanceof Error ? err.message : String(err);
+            throw new Error(`Failed to load ${file}:\n${msg}`, { cause: err });
+        }
+    }
+    return allTasks;
+}

package/dist/_vendor/ailf-tasks/schemas.d.ts ADDED Viewed

@@ -0,0 +1,186 @@
+/**
+ * schemas.ts — Zod schemas for repo-based task definitions.
+ *
+ * Validates .ailf/tasks/*.yaml task files from external repositories.
+ * These schemas are the contract between external repos and the AILF eval
+ * pipeline — they define exactly what fields are accepted, with friendly
+ * error messages for authors writing task YAML by hand.
+ *
+ * This module is the single source of truth for task schemas. The eval
+ * package re-exports from here to avoid duplication.
+ *
+ * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
+ */
+import { z } from "zod";
+/**
+ * The set of assertion types allowed in repo-based task files.
+ *
+ * This is a curated subset of Promptfoo assertion types — we expose only the
+ * types that are stable, well-documented, and useful for external authors.
+ *
+ * Declared as a readonly tuple of string literals so the literal union can
+ * be derived from it (see CuratedAssertionType).
+ */
+export declare const CURATED_ASSERTION_TYPES: readonly ["llm-rubric", "contains", "contains-any", "contains-all", "not-contains", "icontains", "icontains-any", "regex", "javascript", "similar", "cost", "latency"];
+/** Union of the string literals listed in CURATED_ASSERTION_TYPES. */
+export type CuratedAssertionType = (typeof CURATED_ASSERTION_TYPES)[number];
+/**
+ * Valid rubric template names — must match keys in config/rubrics.yaml.
+ *
+ * Declared as a readonly tuple of string literals so the literal union can
+ * be derived from it (see RubricTemplateName).
+ */
+export declare const RUBRIC_TEMPLATE_NAMES: readonly ["task-completion", "code-correctness", "doc-coverage"];
+/** Union of the string literals listed in RUBRIC_TEMPLATE_NAMES. */
+export type RubricTemplateName = (typeof RUBRIC_TEMPLATE_NAMES)[number];
+/**
+ * Zod schema for a single repo-based task definition.
+ *
+ * This is the external-author-facing contract. Field names are camelCase
+ * to match the Content Lake document schema (ailf.task).
+ *
+ * Required fields per this declaration: `id`, `description`, `featureArea`,
+ * and `assert`. Every other field is optional and/or carries a default.
+ */
+export declare const RepoTaskSchema: z.ZodObject<{
+    id: z.ZodString;
+    description: z.ZodString;
+    featureArea: z.ZodString;
+    tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
+    // Optional with a default. Each entry identifies a document by `id`,
+    // `slug`, `path`, or `perspective`; `reason` is optional with a default.
+    canonicalDocs: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
+        id: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+        slug: z.ZodOptional<z.ZodString>;
+        path: z.ZodOptional<z.ZodString>;
+    }, z.core.$strip>, z.ZodObject<{
+        slug: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>, z.ZodObject<{
+        path: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>, z.ZodObject<{
+        perspective: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>]>>>>;
+    // Optional; when present `task` is a required string. `$loose` means
+    // keys beyond `task` are accepted rather than stripped.
+    vars: z.ZodOptional<z.ZodObject<{
+        task: z.ZodString;
+    }, z.core.$loose>>;
+    // Union of two assertion shapes: a structured `llm-rubric` entry
+    // (template + criteria), then a generic entry keyed by `type`.
+    // NOTE(review): the generic branch's `type` enum also lists "llm-rubric",
+    // so an llm-rubric entry that fails the first branch (e.g. an unknown
+    // template) may still validate against the second — confirm intended.
+    assert: z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
+        type: z.ZodLiteral<"llm-rubric">;
+        template: z.ZodEnum<{
+            "task-completion": "task-completion";
+            "code-correctness": "code-correctness";
+            "doc-coverage": "doc-coverage";
+        }>;
+        criteria: z.ZodArray<z.ZodString>;
+        weight: z.ZodOptional<z.ZodNumber>;
+    }, z.core.$strip>, z.ZodObject<{
+        type: z.ZodEnum<{
+            "llm-rubric": "llm-rubric";
+            contains: "contains";
+            "contains-any": "contains-any";
+            "contains-all": "contains-all";
+            "not-contains": "not-contains";
+            icontains: "icontains";
+            "icontains-any": "icontains-any";
+            regex: "regex";
+            javascript: "javascript";
+            similar: "similar";
+            cost: "cost";
+            latency: "latency";
+        }>;
+        value: z.ZodOptional<z.ZodUnknown>;
+        threshold: z.ZodOptional<z.ZodNumber>;
+        weight: z.ZodOptional<z.ZodNumber>;
+    }, z.core.$loose>]>>;
+    baseline: z.ZodOptional<z.ZodObject<{
+        enabled: z.ZodOptional<z.ZodBoolean>;
+        rubric: z.ZodOptional<z.ZodEnum<{
+            abbreviated: "abbreviated";
+            full: "full";
+            none: "none";
+        }>>;
+    }, z.core.$strip>>;
+    docCoverage: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+    referenceSolution: z.ZodOptional<z.ZodString>;
+    // Optional execution settings; `enabled` and `blocking` carry defaults.
+    execution: z.ZodOptional<z.ZodObject<{
+        enabled: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+        blocking: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+        threshold: z.ZodOptional<z.ZodObject<{
+            score: z.ZodOptional<z.ZodNumber>;
+        }, z.core.$strip>>;
+        trigger: z.ZodOptional<z.ZodObject<{
+            branches: z.ZodOptional<z.ZodArray<z.ZodString>>;
+            paths: z.ZodOptional<z.ZodArray<z.ZodString>>;
+        }, z.core.$strip>>;
+        source: z.ZodOptional<z.ZodString>;
+    }, z.core.$strip>>;
+}, z.core.$strip>;
+/** Output type of RepoTaskSchema (a validated task). */
+export type RepoTask = z.infer<typeof RepoTaskSchema>;
+/**
+ * Schema for an array of repo tasks — what a single .ailf/tasks/*.yaml file
+ * contains. Each file must define at least one task.
+ *
+ * The element type spelled out below is the same object shape declared for
+ * RepoTaskSchema.
+ *
+ * NOTE(review): the "at least one task" requirement is not visible in this
+ * declared type (a plain ZodArray); presumably it is enforced at runtime in
+ * schemas.js — confirm.
+ */
+export declare const RepoTaskFileSchema: z.ZodArray<z.ZodObject<{
+    id: z.ZodString;
+    description: z.ZodString;
+    featureArea: z.ZodString;
+    tags: z.ZodOptional<z.ZodArray<z.ZodString>>;
+    canonicalDocs: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
+        id: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+        slug: z.ZodOptional<z.ZodString>;
+        path: z.ZodOptional<z.ZodString>;
+    }, z.core.$strip>, z.ZodObject<{
+        slug: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>, z.ZodObject<{
+        path: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>, z.ZodObject<{
+        perspective: z.ZodString;
+        reason: z.ZodDefault<z.ZodOptional<z.ZodString>>;
+    }, z.core.$strip>]>>>>;
+    vars: z.ZodOptional<z.ZodObject<{
+        task: z.ZodString;
+    }, z.core.$loose>>;
+    assert: z.ZodArray<z.ZodUnion<readonly [z.ZodObject<{
+        type: z.ZodLiteral<"llm-rubric">;
+        template: z.ZodEnum<{
+            "task-completion": "task-completion";
+            "code-correctness": "code-correctness";
+            "doc-coverage": "doc-coverage";
+        }>;
+        criteria: z.ZodArray<z.ZodString>;
+        weight: z.ZodOptional<z.ZodNumber>;
+    }, z.core.$strip>, z.ZodObject<{
+        type: z.ZodEnum<{
+            "llm-rubric": "llm-rubric";
+            contains: "contains";
+            "contains-any": "contains-any";
+            "contains-all": "contains-all";
+            "not-contains": "not-contains";
+            icontains: "icontains";
+            "icontains-any": "icontains-any";
+            regex: "regex";
+            javascript: "javascript";
+            similar: "similar";
+            cost: "cost";
+            latency: "latency";
+        }>;
+        value: z.ZodOptional<z.ZodUnknown>;
+        threshold: z.ZodOptional<z.ZodNumber>;
+        weight: z.ZodOptional<z.ZodNumber>;
+    }, z.core.$loose>]>>;
+    baseline: z.ZodOptional<z.ZodObject<{
+        enabled: z.ZodOptional<z.ZodBoolean>;
+        rubric: z.ZodOptional<z.ZodEnum<{
+            abbreviated: "abbreviated";
+            full: "full";
+            none: "none";
+        }>>;
+    }, z.core.$strip>>;
+    docCoverage: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+    referenceSolution: z.ZodOptional<z.ZodString>;
+    execution: z.ZodOptional<z.ZodObject<{
+        enabled: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+        blocking: z.ZodDefault<z.ZodOptional<z.ZodBoolean>>;
+        threshold: z.ZodOptional<z.ZodObject<{
+            score: z.ZodOptional<z.ZodNumber>;
+        }, z.core.$strip>>;
+        trigger: z.ZodOptional<z.ZodObject<{
+            branches: z.ZodOptional<z.ZodArray<z.ZodString>>;
+            paths: z.ZodOptional<z.ZodArray<z.ZodString>>;
+        }, z.core.$strip>>;
+        source: z.ZodOptional<z.ZodString>;
+    }, z.core.$strip>>;
+}, z.core.$strip>>;