npm - @skill-graph/cli - Versions diffs - 0.5.6 - Mend

@skill-graph/cli 0.5.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (330) hide show

package/CHANGELOG.md +247 -0
package/LICENSE +200 -0
package/NOTICE +62 -0
package/README.md +398 -0
package/SKILL_GRAPH.md +443 -0
package/bin/skill-graph.js +374 -0
package/docs/ADOPTION.md +117 -0
package/docs/CONFORMANCE.md +66 -0
package/docs/PRIMER.md +384 -0
package/docs/QUICKSTART-30MIN.md +333 -0
package/docs/ROUTING-METRICS.md +120 -0
package/docs/SKILL-MD-FORMAT-COMPATIBILITY.md +127 -0
package/docs/SKILL_AUDIT_CHECKLIST.md +199 -0
package/docs/SKILL_AUDIT_LOOP.md +195 -0
package/docs/SKILL_METADATA_PROTOCOL.md +609 -0
package/docs/_archived/marketplace-publication-priority-2026-05-18.md +239 -0
package/docs/adr/0001-predicate-set.md +69 -0
package/docs/adr/0002-json-ld-context.md +82 -0
package/docs/adr/0003-ontoclean-rigidity-tags.md +65 -0
package/docs/adr/0004-persistent-identifiers.md +74 -0
package/docs/adr/0005-freshness-consolidation.md +70 -0
package/docs/adr/0006-revise-predicate-rename.md +105 -0
package/docs/adr/0007-audit-loop-cadence.md +99 -0
package/docs/adr/0008-skill-surface-split-and-curation-policy.md +93 -0
package/docs/category-consumers.md +168 -0
package/docs/concept-map.md +194 -0
package/docs/diagrams/drift-states.mmd +21 -0
package/docs/diagrams/manifest-pipeline.mmd +25 -0
package/docs/diagrams/routing-harness.mmd +41 -0
package/docs/diagrams/starter-graph.mmd +53 -0
package/docs/field-decision-guide.md +315 -0
package/docs/field-rationale.md +211 -0
package/docs/field-reference.generated.md +624 -0
package/docs/field-reference.md +1426 -0
package/docs/glossary.md +190 -0
package/docs/head-noun-glossary.md +63 -0
package/docs/images/audit-phases.png +0 -0
package/docs/images/drift-states.png +0 -0
package/docs/images/graded-mode.png +0 -0
package/docs/images/manifest-pipeline.png +0 -0
package/docs/images/routing-harness.png +0 -0
package/docs/images/skill-anatomy.png +0 -0
package/docs/images/starter-graph.png +0 -0
package/docs/images/system-model.png +0 -0
package/docs/integrations/github-actions.md +155 -0
package/docs/manifest-field-mapping.md +443 -0
package/docs/marketplace-publication-queue.generated.md +240 -0
package/docs/marketplace-release-agent-prompt.md +82 -0
package/docs/marketplace-skill-candidate-list.md +272 -0
package/docs/marketplace-syndication.md +222 -0
package/docs/migration-sample-review.md +155 -0
package/docs/migrations/v4-to-v5.md +168 -0
package/docs/migrations/v5-to-v6.md +221 -0
package/docs/name-exceptions.yaml +37 -0
package/docs/plans/marketplace-p1-public-migration-plan.md +41 -0
package/docs/plans/multi-root-workspace.md +148 -0
package/docs/plans/scripts-roadmap.md +107 -0
package/docs/plans/v4-schema-bump.md +160 -0
package/docs/plans/wave-2-extraction.md +122 -0
package/docs/positioning-vs-marketplaces.md +175 -0
package/docs/proposals/skill-audit-loop-positioning.md +160 -0
package/docs/quality-doctrine.md +138 -0
package/docs/recommended-skills.md +150 -0
package/docs/research/skill-comprehension-eval-research.md +1830 -0
package/docs/research/skill-retrieval-evidence.md +66 -0
package/docs/skill-metadata-protocol.md +471 -0
package/docs/skills-sh-maintainer-cleanup-request.md +80 -0
package/examples/audits/a11y/findings.md +52 -0
package/examples/audits/a11y/scorecard.md +21 -0
package/examples/audits/a11y/verdict.md +44 -0
package/examples/audits/debugging/findings.md +59 -0
package/examples/audits/debugging/scorecard.md +22 -0
package/examples/audits/debugging/verdict.md +33 -0
package/examples/audits/documentation/findings.md +59 -0
package/examples/audits/documentation/scorecard.md +22 -0
package/examples/audits/documentation/verdict.md +33 -0
package/examples/evals/a11y.json +140 -0
package/examples/evals/api-design.json +52 -0
package/examples/evals/code-review.json +52 -0
package/examples/evals/data-modeling.json +52 -0
package/examples/evals/database-migration.json +52 -0
package/examples/evals/debugging.json +118 -0
package/examples/evals/dependency-architecture.json +52 -0
package/examples/evals/design-system-architecture.json +52 -0
package/examples/evals/error-tracking.json +52 -0
package/examples/evals/event-contract-design.json +52 -0
package/examples/evals/form-ux-architecture.json +52 -0
package/examples/evals/framework-fit-analysis.json +52 -0
package/examples/evals/graph-audit.json +139 -0
package/examples/evals/information-architecture.json +52 -0
package/examples/evals/interaction-feedback.json +52 -0
package/examples/evals/interaction-patterns.json +52 -0
package/examples/evals/layout-composition.json +52 -0
package/examples/evals/lint-overlay.json +117 -0
package/examples/evals/microcopy.json +52 -0
package/examples/evals/observability-modeling.json +52 -0
package/examples/evals/pattern-recognition.json +96 -0
package/examples/evals/performance-engineering.json +52 -0
package/examples/evals/refactor.json +128 -0
package/examples/evals/semiotics.json +52 -0
package/examples/evals/skill-infrastructure.json +96 -0
package/examples/evals/skill-router.json +140 -0
package/examples/evals/skill-router.routing.json +113 -0
package/examples/evals/system-interface-contracts.json +52 -0
package/examples/evals/task-analysis.json +52 -0
package/examples/evals/testing-strategy.json +118 -0
package/examples/evals/type-safety.json +249 -0
package/examples/evals/visual-design-foundations.json +52 -0
package/examples/evals/webhook-integration.json +52 -0
package/examples/exports/a11y.skill-md.md +80 -0
package/examples/exports/debugging.skill-md.md +80 -0
package/examples/exports/refactor.skill-md.md +78 -0
package/examples/exports/testing-strategy.skill-md.md +81 -0
package/examples/projects/markdown-static-site/README.md +115 -0
package/examples/projects/markdown-static-site/skills/content-source-router/SKILL.md +131 -0
package/examples/projects/markdown-static-site/skills/image-optimization-pipeline-config/SKILL.md +132 -0
package/examples/projects/markdown-static-site/skills/link-rot-detection/SKILL.md +103 -0
package/examples/projects/markdown-static-site/skills/markdown-post-frontmatter-validation/SKILL.md +133 -0
package/examples/projects/markdown-static-site/skills/migrate-posts-to-v2-frontmatter/SKILL.md +140 -0
package/examples/projects/saas-stripe-postgres/README.md +208 -0
package/examples/projects/saas-stripe-postgres/db/migrations/0004_canonicalize_orders.sql +37 -0
package/examples/projects/saas-stripe-postgres/db/schema.sql +112 -0
package/examples/projects/saas-stripe-postgres/skills/migrate-orders-to-canonical-schema/SKILL.md +149 -0
package/examples/projects/saas-stripe-postgres/skills/nextjs-server-action-validation/SKILL.md +154 -0
package/examples/projects/saas-stripe-postgres/skills/payment-provider-router/SKILL.md +153 -0
package/examples/projects/saas-stripe-postgres/skills/postgres-rls-pattern/SKILL.md +163 -0
package/examples/projects/saas-stripe-postgres/skills/stripe-webhook-signature-verification/SKILL.md +137 -0
package/examples/protocol/skill-metadata-template.md +301 -0
package/examples/protocol/skills.manifest.sample.json +13245 -0
package/examples/skill-metadata-template.md +317 -0
package/examples/skills.manifest.sample.json +13519 -0
package/examples/tests/v3-1-skos-fixture/SKILL.md +93 -0
package/marketplace/README.md +17 -0
package/marketplace/skills/a11y/SKILL.md +66 -0
package/marketplace/skills/acid-fundamentals/SKILL.md +106 -0
package/marketplace/skills/agent-engineering/SKILL.md +386 -0
package/marketplace/skills/agent-eval-design/SKILL.md +55 -0
package/marketplace/skills/ai-native-development/SKILL.md +294 -0
package/marketplace/skills/api-design/SKILL.md +60 -0
package/marketplace/skills/architecture-decision-records/SKILL.md +55 -0
package/marketplace/skills/background-jobs/SKILL.md +265 -0
package/marketplace/skills/bounded-context-mapping/SKILL.md +55 -0
package/marketplace/skills/cap-theorem-tradeoffs/SKILL.md +127 -0
package/marketplace/skills/client-server-boundary/SKILL.md +187 -0
package/marketplace/skills/code-review/SKILL.md +120 -0
package/marketplace/skills/color-system-design/SKILL.md +43 -0
package/marketplace/skills/component-architecture/SKILL.md +126 -0
package/marketplace/skills/compression/SKILL.md +112 -0
package/marketplace/skills/conceptual-modeling/SKILL.md +181 -0
package/marketplace/skills/connection-pooling/SKILL.md +105 -0
package/marketplace/skills/constraint-awareness/SKILL.md +287 -0
package/marketplace/skills/content-monitor/SKILL.md +209 -0
package/marketplace/skills/context-engineering/SKILL.md +320 -0
package/marketplace/skills/context-graph/SKILL.md +174 -0
package/marketplace/skills/context-management/SKILL.md +174 -0
package/marketplace/skills/context-window/SKILL.md +239 -0
package/marketplace/skills/contract-testing/SKILL.md +120 -0
package/marketplace/skills/cron-scheduling/SKILL.md +223 -0
package/marketplace/skills/dark-mode-implementation/SKILL.md +47 -0
package/marketplace/skills/data-modeling/SKILL.md +59 -0
package/marketplace/skills/data-modeling-fundamentals/SKILL.md +117 -0
package/marketplace/skills/database-migration/SKILL.md +429 -0
package/marketplace/skills/debugging/SKILL.md +67 -0
package/marketplace/skills/dependency-architecture/SKILL.md +58 -0
package/marketplace/skills/design-module-composition/SKILL.md +43 -0
package/marketplace/skills/design-system-architecture/SKILL.md +61 -0
package/marketplace/skills/design-thinking/SKILL.md +44 -0
package/marketplace/skills/diagnosis/SKILL.md +296 -0
package/marketplace/skills/diff-analysis/SKILL.md +188 -0
package/marketplace/skills/e2e-test-design/SKILL.md +113 -0
package/marketplace/skills/entity-relationship-modeling/SKILL.md +218 -0
package/marketplace/skills/epistemic-grounding/SKILL.md +112 -0
package/marketplace/skills/error-boundary/SKILL.md +235 -0
package/marketplace/skills/error-tracking/SKILL.md +261 -0
package/marketplace/skills/eval-driven-development/SKILL.md +147 -0
package/marketplace/skills/evaluation/SKILL.md +113 -0
package/marketplace/skills/event-contract-design/SKILL.md +60 -0
package/marketplace/skills/event-storming/SKILL.md +56 -0
package/marketplace/skills/form-ux-architecture/SKILL.md +60 -0
package/marketplace/skills/framework-fit-analysis/SKILL.md +59 -0
package/marketplace/skills/frontend-architecture/SKILL.md +43 -0
package/marketplace/skills/generative-ui/SKILL.md +118 -0
package/marketplace/skills/graph-audit/SKILL.md +81 -0
package/marketplace/skills/guardrails/SKILL.md +118 -0
package/marketplace/skills/hooks-patterns/SKILL.md +185 -0
package/marketplace/skills/http-semantics/SKILL.md +136 -0
package/marketplace/skills/ideation/SKILL.md +41 -0
package/marketplace/skills/indexing-strategy/SKILL.md +108 -0
package/marketplace/skills/information-architecture/SKILL.md +59 -0
package/marketplace/skills/integration-test-design/SKILL.md +111 -0
package/marketplace/skills/intent-recognition/SKILL.md +136 -0
package/marketplace/skills/interaction-feedback/SKILL.md +59 -0
package/marketplace/skills/interaction-patterns/SKILL.md +59 -0
package/marketplace/skills/journey-mapping/SKILL.md +41 -0
package/marketplace/skills/keywords/SKILL.md +213 -0
package/marketplace/skills/knowledge-modeling/SKILL.md +232 -0
package/marketplace/skills/layout-composition/SKILL.md +59 -0
package/marketplace/skills/linguistics/SKILL.md +429 -0
package/marketplace/skills/lint-overlay/SKILL.md +76 -0
package/marketplace/skills/mental-models/SKILL.md +126 -0
package/marketplace/skills/merge-queue/SKILL.md +94 -0
package/marketplace/skills/methodology/SKILL.md +317 -0
package/marketplace/skills/microcopy/SKILL.md +232 -0
package/marketplace/skills/middleware-patterns/SKILL.md +363 -0
package/marketplace/skills/mobile-responsive-ux/SKILL.md +287 -0
package/marketplace/skills/mutation-testing/SKILL.md +112 -0
package/marketplace/skills/naming-conventions/SKILL.md +112 -0
package/marketplace/skills/observability-modeling/SKILL.md +59 -0
package/marketplace/skills/ontology-modeling/SKILL.md +67 -0
package/marketplace/skills/owasp-security/SKILL.md +153 -0
package/marketplace/skills/pattern-recognition/SKILL.md +472 -0
package/marketplace/skills/performance-budgets/SKILL.md +185 -0
package/marketplace/skills/performance-engineering/SKILL.md +58 -0
package/marketplace/skills/performance-testing/SKILL.md +125 -0
package/marketplace/skills/printify/SKILL.md +42 -0
package/marketplace/skills/prioritization/SKILL.md +118 -0
package/marketplace/skills/problem-framing/SKILL.md +41 -0
package/marketplace/skills/problem-locating-solving/SKILL.md +203 -0
package/marketplace/skills/project-knowledge-extraction/SKILL.md +54 -0
package/marketplace/skills/prompt-craft/SKILL.md +134 -0
package/marketplace/skills/prompt-injection-defense/SKILL.md +132 -0
package/marketplace/skills/property-based-testing/SKILL.md +100 -0
package/marketplace/skills/prototyping/SKILL.md +43 -0
package/marketplace/skills/query-optimization/SKILL.md +144 -0
package/marketplace/skills/real-time-updates/SKILL.md +324 -0
package/marketplace/skills/ref-patterns/SKILL.md +284 -0
package/marketplace/skills/refactor/SKILL.md +65 -0
package/marketplace/skills/rendering-models/SKILL.md +142 -0
package/marketplace/skills/replication-patterns/SKILL.md +110 -0
package/marketplace/skills/research-synthesis/SKILL.md +41 -0
package/marketplace/skills/route-handler-design/SKILL.md +347 -0
package/marketplace/skills/schema-evolution/SKILL.md +140 -0
package/marketplace/skills/security-fundamentals/SKILL.md +139 -0
package/marketplace/skills/semantic-center/SKILL.md +194 -0
package/marketplace/skills/semantic-relations/SKILL.md +250 -0
package/marketplace/skills/semantics/SKILL.md +366 -0
package/marketplace/skills/semiotics/SKILL.md +230 -0
package/marketplace/skills/seo-strategy/SKILL.md +260 -0
package/marketplace/skills/server-actions-design/SKILL.md +243 -0
package/marketplace/skills/server-components-design/SKILL.md +190 -0
package/marketplace/skills/sharding-strategy/SKILL.md +123 -0
package/marketplace/skills/shopify/SKILL.md +42 -0
package/marketplace/skills/skill-infrastructure/SKILL.md +320 -0
package/marketplace/skills/skill-router/SKILL.md +71 -0
package/marketplace/skills/skill-scaffold/SKILL.md +105 -0
package/marketplace/skills/snapshot-testing/SKILL.md +120 -0
package/marketplace/skills/spec-driven-development/SKILL.md +148 -0
package/marketplace/skills/state-machine-modeling/SKILL.md +56 -0
package/marketplace/skills/state-management/SKILL.md +134 -0
package/marketplace/skills/streaming-architecture/SKILL.md +194 -0
package/marketplace/skills/summarization/SKILL.md +156 -0
package/marketplace/skills/suspense-patterns/SKILL.md +265 -0
package/marketplace/skills/system-interface-contracts/SKILL.md +59 -0
package/marketplace/skills/task-analysis/SKILL.md +201 -0
package/marketplace/skills/taxonomy-design/SKILL.md +66 -0
package/marketplace/skills/test-coverage-strategy/SKILL.md +108 -0
package/marketplace/skills/test-doubles-design/SKILL.md +98 -0
package/marketplace/skills/test-driven-development/SKILL.md +96 -0
package/marketplace/skills/testing-strategy/SKILL.md +67 -0
package/marketplace/skills/theme-system-design/SKILL.md +43 -0
package/marketplace/skills/tool-call-flow/SKILL.md +229 -0
package/marketplace/skills/tool-call-strategy/SKILL.md +292 -0
package/marketplace/skills/transaction-isolation/SKILL.md +98 -0
package/marketplace/skills/type-safety/SKILL.md +177 -0
package/marketplace/skills/typography-system/SKILL.md +43 -0
package/marketplace/skills/usability-testing/SKILL.md +43 -0
package/marketplace/skills/user-research/SKILL.md +43 -0
package/marketplace/skills/vercel-composition-patterns/SKILL.md +157 -0
package/marketplace/skills/version-control/SKILL.md +233 -0
package/marketplace/skills/visual-design-foundations/SKILL.md +59 -0
package/marketplace/skills/visual-hierarchy/SKILL.md +43 -0
package/marketplace/skills/webhook-integration/SKILL.md +331 -0
package/marketplace/skills/writing-humanizer/SKILL.md +380 -0
package/package.json +67 -0
package/schemas/manifest.schema.json +811 -0
package/schemas/manifest.v2.schema.json +164 -0
package/schemas/manifest.v3.schema.json +758 -0
package/schemas/manifest.v4.schema.json +755 -0
package/schemas/manifest.v5.schema.json +755 -0
package/schemas/manifest.v6.schema.json +811 -0
package/schemas/skill.context.jsonld +279 -0
package/schemas/skill.schema.json +919 -0
package/schemas/skill.v2.schema.json +201 -0
package/schemas/skill.v3.schema.json +827 -0
package/schemas/skill.v4.schema.json +822 -0
package/schemas/skill.v5.schema.json +830 -0
package/schemas/skill.v6.schema.json +946 -0
package/schemas/vocabulary/keywords.json +180 -0
package/schemas/vocabulary/workspace_tags.json +23 -0
package/scripts/__tests__/migrate-skill-v2-to-v3.test.js +161 -0
package/scripts/__tests__/migrate-skill-v3-to-v4.test.js +158 -0
package/scripts/__tests__/test-export-parser-drift.js +149 -0
package/scripts/__tests__/test-marketplace-export.js +114 -0
package/scripts/__tests__/test-router-paths.js +82 -0
package/scripts/__tests__/test-stability-promotion.js +244 -0
package/scripts/__tests__/test-v3-1-alias-contract.js +109 -0
package/scripts/__tests__/test-v3-1-skos-runtime.js +116 -0
package/scripts/backfill-schema-version.js +198 -0
package/scripts/build-field-reference.js +160 -0
package/scripts/build-retrieval-baseline.js +511 -0
package/scripts/check-markdown-links.js +211 -0
package/scripts/check-protocol-consistency.js +979 -0
package/scripts/export-marketplace-skills.js +610 -0
package/scripts/export-skill.js +374 -0
package/scripts/generate-manifest.js +787 -0
package/scripts/lib/alias-contract.js +83 -0
package/scripts/lib/audit-prompt-builder.js +771 -0
package/scripts/lib/mock-grader.js +134 -0
package/scripts/lib/parse-frontmatter.js +429 -0
package/scripts/lib/roots.js +119 -0
package/scripts/lint/check-archetype-sections.js +185 -0
package/scripts/lint/check-category-enum.js +83 -0
package/scripts/lint/check-routing-eval.js +146 -0
package/scripts/lint/check-routing-quality.js +211 -0
package/scripts/lint/check-stability-promotion.js +220 -0
package/scripts/lint/format-code-frame.js +206 -0
package/scripts/marketplace-install.js +125 -0
package/scripts/migrate-category-to-enum.js +169 -0
package/scripts/migrate-skill-v2-to-v3.js +424 -0
package/scripts/migrate-skill-v3-to-v4.js +200 -0
package/scripts/migrate-skill-v5-to-v6.js +304 -0
package/scripts/restructure-by-category.js +85 -0
package/scripts/seed-publication-classification.js +282 -0
package/scripts/skill-audit.js +893 -0
package/scripts/skill-graph-drift.js +483 -0
package/scripts/skill-graph-route.js +766 -0
package/scripts/skill-graph-routing-eval.js +393 -0
package/scripts/skill-lint.js +1317 -0
package/scripts/skill-overlap.js +213 -0
package/scripts/verify-skill-md-export.js +201 -0

package/examples/evals/database-migration.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "database-migration",
+  "subject": "Safe database migration design for expand-contract rollout, locks, backfills, deploy ordering, rollback, and verification",
+  "adjacent_concepts": ["data-modeling", "testing-strategy", "debugging", "owasp-security"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A migration adds a NOT NULL column to a large production table. Which skill owns the rollout sequence and lock-risk analysis?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/database-migration/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "The schema change needs an expand-contract path, a backfill, application deploy ordering, and rollback conditions. What should database-migration produce?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/database-migration/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The team is still deciding entity relationships and normalized shape before any DDL is drafted. Should database-migration accept or hand off?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/database-migration/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "A production query is slow and the user asks for profiling and caching strategy, not schema rollout. Which boundary should database-migration respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/database-migration/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/debugging.json ADDED Viewed

@@ -0,0 +1,118 @@
+{
+  "skill_name": "debugging",
+  "subject": "Failure-driven diagnosis workflow: reproduction, scope reduction, evidence capture, root-cause isolation, fix verification, and regression-test creation",
+  "adjacent_concepts": ["testing-strategy", "refactor"],
+  "grounding_note": "This skill is deliberately self-grounding. The debugging workflow is a synthesis of industry practice rather than a derivation from a single canonical text, so truth_sources cite skills/debugging/SKILL.md line ranges rather than external references. The `checkEvalTruthSourceRanges` lint check (D2 in scripts/skill-lint.js) catches citation drift by verifying that every cited line range still exists in the file. Attach external truth_sources only when the skill is later narrowed to a specific methodology (e.g., the SRE debugging runbook).",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A bug report says \"checkout sometimes fails.\" An engineer is tempted to start reading the checkout code. According to the debugging skill's Workflow table, what is step 1 and why must it come before any hypothesis?",
+      "dimension": "definition",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:82-89"]
+    },
+    {
+      "id": 2,
+      "prompt": "The debugging skill's Philosophy section warns that \"a clever fix that skips the reproduction step ships the same bug again under a different name.\" Explain the causal chain behind that claim — why does skipping reproduction make the same failure likely to reappear?",
+      "dimension": "mental_model",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:74-76"]
+    },
+    {
+      "id": 3,
+      "prompt": "A team wants to plan test coverage for a newly built billing module that has not yet failed in production. Should they reach for the debugging skill or a different one? Cite the negative-routing rule that decides this.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:109-115"]
+    },
+    {
+      "id": 4,
+      "prompt": "An engineer has a working hypothesis that explains why the error is visible but not why a related field is simultaneously empty. Per the debugging skill's step 4, can they proceed to step 5? If not, what do they do instead and why?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "critical",
+      "truth_sources": ["skills/debugging/SKILL.md:82-89"]
+    },
+    {
+      "id": 5,
+      "prompt": "The debugging skill requires that a regression test both fail without the fix and pass with it. Why is \"passes with the fix\" alone insufficient, and what failure mode does the two-way check prevent?",
+      "dimension": "purpose",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:82-89", "skills/debugging/SKILL.md:101-107"]
+    },
+    {
+      "id": 6,
+      "prompt": "An engineer has spent 90 minutes trying to reproduce a production intermittent failure on their laptop without success. According to the debugging skill's \"When to stop and escalate\" guidance, what does this symptom suggest and what is the correct next move?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:91-95"]
+    },
+    {
+      "id": 7,
+      "prompt": "An engineer opens a PR that renames three variables, inlines a helper, and reorders parameter lists inside a module whose test suite is entirely green. No failure has been reported. The engineer asks the debugging skill to review it as a debugging task. Should the skill accept or refuse, and which `Do NOT Use When` row decides this?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/debugging/SKILL.md:109-115"]
+    },
+    {
+      "id": 8,
+      "prompt": "A bug reproduces only when the full application runs — the engineer cannot isolate it to a single module or test. According to Workflow step 2 (Scope), what is the prescribed move, and why is halving preferable to sequentially reading every file in the suspected path?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:82-89"]
+    },
+    {
+      "id": 9,
+      "prompt": "A fix has been written and verified against the original failure path (step 5 passes). The engineer is now at step 6. Describe the concrete authoring procedure for the regression test — what input, what assertion, what two-way run — that would satisfy step 6's \"fails without the fix and passes with it\" gate. Distinguish this from merely asserting the fix is present.",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/debugging/SKILL.md:82-89", "skills/debugging/SKILL.md:101-107"]
+    },
+    {
+      "id": 10,
+      "prompt": "An on-call engineer is debugging a production cart-abandonment spike. They notice a null dereference in the checkout path, wrap it in a `try { ... } catch { return null }`, deploy the patch, and the error rate drops. Two weeks later, a different symptom appears (orders with empty line items) that traces back to the same swallowed null. According to the debugging skill's Philosophy and Workflow step 4, is the original patch a valid fix? Name the specific failure mode this commits, explain why the cart-abandonment rate dropping is not evidence the fix was correct, and describe what step 4 required instead.",
+      "dimension": "anti_pattern",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "critical",
+      "truth_sources": ["skills/debugging/SKILL.md:74-76", "skills/debugging/SKILL.md:82-89"]
+    }
+  ]
+}

package/examples/evals/dependency-architecture.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "dependency-architecture",
+  "subject": "Dependency graph architecture for package boundaries, direct and transitive dependencies, adapters, duplicate-purpose libraries, lock-in, upgrades, and supply-chain risk",
+  "adjacent_concepts": ["framework-fit-analysis", "owasp-security", "refactor", "architecture-decision-records"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A monorepo imports provider SDKs directly from many packages and the team wants dependency boundary rules. Which skill owns the architecture review?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/dependency-architecture/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "The repo has two libraries that solve the same problem and one should be wrapped behind an adapter. What should dependency-architecture inspect?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/dependency-architecture/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The team has not chosen whether to use Next.js, Remix, or Astro for a new app. Should dependency-architecture accept the framework selection task?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/dependency-architecture/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The request is a vulnerability-only scan of installed packages. Which boundary should dependency-architecture respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/dependency-architecture/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/design-system-architecture.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "design-system-architecture",
+  "subject": "Design-system architecture for token taxonomy, semantic tokens, component APIs, variants, theming, accessibility contracts, governance, and migration",
+  "adjacent_concepts": ["a11y", "microcopy", "layout-composition", "visual-design-foundations"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A product needs semantic tokens for statuses, chart colors, surfaces, and dark mode before teams keep hardcoding raw colors. Which skill owns this?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/design-system-architecture/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A component library has inconsistent props, missing state contracts, and no migration path for deprecated tokens. What should design-system-architecture verify?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/design-system-architecture/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The task is to decide page hierarchy, sitemap, and navigation labels for a product. Should design-system-architecture accept or hand off?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/design-system-architecture/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The task is to rewrite button labels and empty-state copy, not component APIs or tokens. Which boundary should design-system-architecture respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/design-system-architecture/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/error-tracking.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "error-tracking",
+  "subject": "Exception-reporting pipeline design for error boundaries, centralized tracker wrappers, environment gating, PII sanitization, breadcrumbs, and capture verification",
+  "adjacent_concepts": ["observability-modeling", "a11y", "debugging", "owasp-security"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A React app needs component, route, global, and manual exception reporting paths wired through one sanitized wrapper. Which skill owns the design?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/error-tracking/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "The tracker is receiving customer emails in payloads. According to error-tracking, what must happen before any external send?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/error-tracking/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The user needs accessible error-message copy and recovery UI for a 404 page. Should error-tracking accept the task?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/error-tracking/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "An observed production exception already exists in the tracker and the task is to find its root cause. Which boundary should error-tracking respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/error-tracking/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/event-contract-design.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "event-contract-design",
+  "subject": "Asynchronous event contract design for schemas, envelopes, topics, compatibility, idempotency, ordering, replay, and observability",
+  "adjacent_concepts": ["event-storming", "system-interface-contracts", "webhook-integration", "api-design"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while the new skill settles.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "The team has selected OrderPaid as a domain event and now needs topic name, envelope fields, payload schema, idempotency, and versioning. Which skill owns this?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/event-contract-design/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A team is still discovering commands, policies, aggregates, and the timeline for a business process. Should event-contract-design take over?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/event-contract-design/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "An outbound webhook product sends customer-facing events, but there are no compatibility rules or negative fixtures. Which verification gates fail?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/event-contract-design/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "A provider sends inbound webhook deliveries and the handler must verify HMAC signatures on raw bytes. Which skill owns that mechanics work?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/event-contract-design/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/form-ux-architecture.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "form-ux-architecture",
+  "subject": "Form structure and validation UX across field grouping, validation timing, submission lifecycle, recovery, and client/server split",
+  "adjacent_concepts": ["a11y", "microcopy", "api-design", "data-modeling"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while the new skill settles.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A checkout form asks for 24 fields before shipping can be estimated. How should form-ux-architecture decide what stays, defers, or becomes progressive disclosure?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/form-ux-architecture/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A form validates every keystroke and shows red errors while the user is still typing. Which validation-timing rule should be applied?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/form-ux-architecture/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "A developer says client-side validation is enough because the browser blocks malformed input. What boundary or philosophy point should form-ux-architecture enforce?",
+      "dimension": "mental_model",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "critical",
+      "truth_sources": ["skills/form-ux-architecture/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The team asks for final inline validation text after the form lifecycle is settled. Which skill owns that wording?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/form-ux-architecture/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/framework-fit-analysis.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "framework-fit-analysis",
+  "subject": "Technology fit analysis for choosing, replacing, or justifying frameworks, libraries, SDKs, runtimes, databases, UI kits, and platforms",
+  "adjacent_concepts": ["dependency-architecture", "architecture-decision-records", "performance-engineering", "owasp-security"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A team must choose between Next.js route handlers, server actions, and a separate API service under real deployment constraints. Which skill owns the fit analysis?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/framework-fit-analysis/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "Before adding a charting library, the team wants to weigh ecosystem maturity, migration cost, bundle impact, lock-in, and exit cost. What should framework-fit-analysis evaluate?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/framework-fit-analysis/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The framework was already chosen and the task is routine dependency hygiene for duplicate packages. Should framework-fit-analysis accept?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/framework-fit-analysis/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The team has already decided and now needs the formal ADR. Which boundary should framework-fit-analysis respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/framework-fit-analysis/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/graph-audit.json ADDED Viewed

@@ -0,0 +1,139 @@
+{
+  "skill_name": "graph-audit",
+  "subject": "Skill metadata and manifest consistency auditing for the Skill Graph repository",
+  "adjacent_concepts": ["documentation", "refactor", "testing-strategy"],
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A contributor adds a new skill and sets `eval_artifacts: present` in the frontmatter, but does not create a corresponding eval artifact under `examples/evals/`. What does the graph-audit skill say will happen when `node scripts/skill-lint.js` runs, and which specific check catches this?",
+      "dimension": "definition",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "scripts/skill-lint.js"]
+    },
+    {
+      "id": 2,
+      "prompt": "A skill with `scope: codebase` is missing its `grounding` block entirely. According to the graph-audit skill, which two enforcement layers catch this violation — name them and explain the role of each.",
+      "dimension": "mental_model",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "schemas/skill.schema.json"]
+    },
+    {
+      "id": 3,
+      "prompt": "When should an agent use the graph-audit skill instead of the refactor skill to address a problem found in a SKILL.md file? Cite the negative-routing boundary that decides this.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/graph-audit/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "A skill names `relations.verify_with: [missing-skill]` where `missing-skill` does not exist as a directory under `skills/`. What does the graph-audit skill say is the correct fix, and what is the category of this failure mode?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "scripts/skill-lint.js"]
+    },
+    {
+      "id": 5,
+      "prompt": "Why does the graph-audit skill set `grounding.grounding_mode: repo_specific` rather than `universal`? What concrete truth sources does this ground it to, and what would be lost if those files changed?",
+      "dimension": "purpose",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "docs/skill-metadata-protocol.md"]
+    },
+    {
+      "id": 6,
+      "prompt": "A contributor renames `skills/shopify/` to `skills/shopify-integration/` but forgets to update the `name:` field inside `skills/shopify-integration/SKILL.md` (which still reads `name: shopify`). According to the graph-audit skill, what does `scripts/skill-lint.js` do with this skill, why does this matter for SKILL.md compatibility, and what is the correct fix?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "scripts/skill-lint.js", "docs/skill-metadata-protocol.md"]
+    },
+    {
+      "id": 7,
+      "prompt": "An agent regenerates `examples/skills.manifest.sample.json` but uses a different `generated_at` timestamp each time, so the sample drifts from whatever `scripts/generate-manifest.js` would produce on the next run. How does the graph-audit skill say this drift is caught, and why does manifest-sample drift matter even when no real consumer reads the sample?",
+      "dimension": "mental_model",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "scripts/generate-manifest.js", "examples/skills.manifest.sample.json"]
+    },
+    {
+      "id": 8,
+      "prompt": "Given the following synthetic SKILL.md frontmatter excerpt:\n\n```yaml\nschema_version: 3\nname: example\ntype: capability\nbrowse_category: quality\nscope: portable\nowner: maintainer\nfreshness: \"2026-04-19\"\ndrift_check:\n  last_verified: \"2026-04-19\"\neval_artifacts: pending\neval_state: passing\nrouting_eval: absent\n```\n\nPredict which check in `scripts/skill-lint.js` will fire first when this skill is linted, what the exact error category will be (per the eleven-check list), and what the underlying rule is. (Hint: one required field has a value that is not in the schema's allowed enum.)",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "output_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "schemas/skill.schema.json", "scripts/skill-lint.js"]
+    },
+    {
+      "id": 9,
+      "prompt": "A skill ships with `schema_version: 2` while the current schema locks `schema_version: const 3`. According to the graph-audit skill, which of the eleven lint checks detects this specifically, and why does `additionalProperties: false` in the schema matter for catching schema drift beyond just the version field?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "schemas/skill.schema.json", "scripts/skill-lint.js"]
+    },
+    {
+      "id": 10,
+      "prompt": "A contributor runs `node scripts/skill-lint.js skills/a11y` on a correct skill and receives exit code 0, then introduces a typo changing `eval_artifacts: present` to `eval_artifacts: presnt` (misspelled enum value) and re-runs the same command. According to the graph-audit skill's `## Verification` gate, describe the end-to-end behavioral outcome: what exit code returns, what output category surfaces, which specific check produces the error, and what decision should the contributor's CI make based on the non-zero exit? This is a behavioral assertion — the answer is an observable CI outcome, not a skill-quotation.",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "output_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/graph-audit/SKILL.md", "scripts/skill-lint.js", "schemas/skill.schema.json"]
+    },
+    {
+      "id": 11,
+      "prompt": "A contributor asks graph-audit to debug why their agent is looping infinitely when it tries to resolve a relation target. Should graph-audit take this task? Cite the `Do NOT Use When` row that decides this and name the correct skill.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/graph-audit/SKILL.md"]
+    },
+    {
+      "id": 12,
+      "prompt": "A contributor asks graph-audit to help rewrite the `## Coverage` prose in an existing SKILL.md to read more naturally — no schema change, no manifest change, just prose polish. Should graph-audit take this task? Cite the `Do NOT Use When` row that decides this and name the correct skill.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/graph-audit/SKILL.md"]
+    }
+  ]
+}