npm - @skill-graph/cli - Versions diffs - 0.5.6 - Mend

@skill-graph/cli 0.5.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (330) hide show

package/CHANGELOG.md +247 -0
package/LICENSE +200 -0
package/NOTICE +62 -0
package/README.md +398 -0
package/SKILL_GRAPH.md +443 -0
package/bin/skill-graph.js +374 -0
package/docs/ADOPTION.md +117 -0
package/docs/CONFORMANCE.md +66 -0
package/docs/PRIMER.md +384 -0
package/docs/QUICKSTART-30MIN.md +333 -0
package/docs/ROUTING-METRICS.md +120 -0
package/docs/SKILL-MD-FORMAT-COMPATIBILITY.md +127 -0
package/docs/SKILL_AUDIT_CHECKLIST.md +199 -0
package/docs/SKILL_AUDIT_LOOP.md +195 -0
package/docs/SKILL_METADATA_PROTOCOL.md +609 -0
package/docs/_archived/marketplace-publication-priority-2026-05-18.md +239 -0
package/docs/adr/0001-predicate-set.md +69 -0
package/docs/adr/0002-json-ld-context.md +82 -0
package/docs/adr/0003-ontoclean-rigidity-tags.md +65 -0
package/docs/adr/0004-persistent-identifiers.md +74 -0
package/docs/adr/0005-freshness-consolidation.md +70 -0
package/docs/adr/0006-revise-predicate-rename.md +105 -0
package/docs/adr/0007-audit-loop-cadence.md +99 -0
package/docs/adr/0008-skill-surface-split-and-curation-policy.md +93 -0
package/docs/category-consumers.md +168 -0
package/docs/concept-map.md +194 -0
package/docs/diagrams/drift-states.mmd +21 -0
package/docs/diagrams/manifest-pipeline.mmd +25 -0
package/docs/diagrams/routing-harness.mmd +41 -0
package/docs/diagrams/starter-graph.mmd +53 -0
package/docs/field-decision-guide.md +315 -0
package/docs/field-rationale.md +211 -0
package/docs/field-reference.generated.md +624 -0
package/docs/field-reference.md +1426 -0
package/docs/glossary.md +190 -0
package/docs/head-noun-glossary.md +63 -0
package/docs/images/audit-phases.png +0 -0
package/docs/images/drift-states.png +0 -0
package/docs/images/graded-mode.png +0 -0
package/docs/images/manifest-pipeline.png +0 -0
package/docs/images/routing-harness.png +0 -0
package/docs/images/skill-anatomy.png +0 -0
package/docs/images/starter-graph.png +0 -0
package/docs/images/system-model.png +0 -0
package/docs/integrations/github-actions.md +155 -0
package/docs/manifest-field-mapping.md +443 -0
package/docs/marketplace-publication-queue.generated.md +240 -0
package/docs/marketplace-release-agent-prompt.md +82 -0
package/docs/marketplace-skill-candidate-list.md +272 -0
package/docs/marketplace-syndication.md +222 -0
package/docs/migration-sample-review.md +155 -0
package/docs/migrations/v4-to-v5.md +168 -0
package/docs/migrations/v5-to-v6.md +221 -0
package/docs/name-exceptions.yaml +37 -0
package/docs/plans/marketplace-p1-public-migration-plan.md +41 -0
package/docs/plans/multi-root-workspace.md +148 -0
package/docs/plans/scripts-roadmap.md +107 -0
package/docs/plans/v4-schema-bump.md +160 -0
package/docs/plans/wave-2-extraction.md +122 -0
package/docs/positioning-vs-marketplaces.md +175 -0
package/docs/proposals/skill-audit-loop-positioning.md +160 -0
package/docs/quality-doctrine.md +138 -0
package/docs/recommended-skills.md +150 -0
package/docs/research/skill-comprehension-eval-research.md +1830 -0
package/docs/research/skill-retrieval-evidence.md +66 -0
package/docs/skill-metadata-protocol.md +471 -0
package/docs/skills-sh-maintainer-cleanup-request.md +80 -0
package/examples/audits/a11y/findings.md +52 -0
package/examples/audits/a11y/scorecard.md +21 -0
package/examples/audits/a11y/verdict.md +44 -0
package/examples/audits/debugging/findings.md +59 -0
package/examples/audits/debugging/scorecard.md +22 -0
package/examples/audits/debugging/verdict.md +33 -0
package/examples/audits/documentation/findings.md +59 -0
package/examples/audits/documentation/scorecard.md +22 -0
package/examples/audits/documentation/verdict.md +33 -0
package/examples/evals/a11y.json +140 -0
package/examples/evals/api-design.json +52 -0
package/examples/evals/code-review.json +52 -0
package/examples/evals/data-modeling.json +52 -0
package/examples/evals/database-migration.json +52 -0
package/examples/evals/debugging.json +118 -0
package/examples/evals/dependency-architecture.json +52 -0
package/examples/evals/design-system-architecture.json +52 -0
package/examples/evals/error-tracking.json +52 -0
package/examples/evals/event-contract-design.json +52 -0
package/examples/evals/form-ux-architecture.json +52 -0
package/examples/evals/framework-fit-analysis.json +52 -0
package/examples/evals/graph-audit.json +139 -0
package/examples/evals/information-architecture.json +52 -0
package/examples/evals/interaction-feedback.json +52 -0
package/examples/evals/interaction-patterns.json +52 -0
package/examples/evals/layout-composition.json +52 -0
package/examples/evals/lint-overlay.json +117 -0
package/examples/evals/microcopy.json +52 -0
package/examples/evals/observability-modeling.json +52 -0
package/examples/evals/pattern-recognition.json +96 -0
package/examples/evals/performance-engineering.json +52 -0
package/examples/evals/refactor.json +128 -0
package/examples/evals/semiotics.json +52 -0
package/examples/evals/skill-infrastructure.json +96 -0
package/examples/evals/skill-router.json +140 -0
package/examples/evals/skill-router.routing.json +113 -0
package/examples/evals/system-interface-contracts.json +52 -0
package/examples/evals/task-analysis.json +52 -0
package/examples/evals/testing-strategy.json +118 -0
package/examples/evals/type-safety.json +249 -0
package/examples/evals/visual-design-foundations.json +52 -0
package/examples/evals/webhook-integration.json +52 -0
package/examples/exports/a11y.skill-md.md +80 -0
package/examples/exports/debugging.skill-md.md +80 -0
package/examples/exports/refactor.skill-md.md +78 -0
package/examples/exports/testing-strategy.skill-md.md +81 -0
package/examples/projects/markdown-static-site/README.md +115 -0
package/examples/projects/markdown-static-site/skills/content-source-router/SKILL.md +131 -0
package/examples/projects/markdown-static-site/skills/image-optimization-pipeline-config/SKILL.md +132 -0
package/examples/projects/markdown-static-site/skills/link-rot-detection/SKILL.md +103 -0
package/examples/projects/markdown-static-site/skills/markdown-post-frontmatter-validation/SKILL.md +133 -0
package/examples/projects/markdown-static-site/skills/migrate-posts-to-v2-frontmatter/SKILL.md +140 -0
package/examples/projects/saas-stripe-postgres/README.md +208 -0
package/examples/projects/saas-stripe-postgres/db/migrations/0004_canonicalize_orders.sql +37 -0
package/examples/projects/saas-stripe-postgres/db/schema.sql +112 -0
package/examples/projects/saas-stripe-postgres/skills/migrate-orders-to-canonical-schema/SKILL.md +149 -0
package/examples/projects/saas-stripe-postgres/skills/nextjs-server-action-validation/SKILL.md +154 -0
package/examples/projects/saas-stripe-postgres/skills/payment-provider-router/SKILL.md +153 -0
package/examples/projects/saas-stripe-postgres/skills/postgres-rls-pattern/SKILL.md +163 -0
package/examples/projects/saas-stripe-postgres/skills/stripe-webhook-signature-verification/SKILL.md +137 -0
package/examples/protocol/skill-metadata-template.md +301 -0
package/examples/protocol/skills.manifest.sample.json +13245 -0
package/examples/skill-metadata-template.md +317 -0
package/examples/skills.manifest.sample.json +13519 -0
package/examples/tests/v3-1-skos-fixture/SKILL.md +93 -0
package/marketplace/README.md +17 -0
package/marketplace/skills/a11y/SKILL.md +66 -0
package/marketplace/skills/acid-fundamentals/SKILL.md +106 -0
package/marketplace/skills/agent-engineering/SKILL.md +386 -0
package/marketplace/skills/agent-eval-design/SKILL.md +55 -0
package/marketplace/skills/ai-native-development/SKILL.md +294 -0
package/marketplace/skills/api-design/SKILL.md +60 -0
package/marketplace/skills/architecture-decision-records/SKILL.md +55 -0
package/marketplace/skills/background-jobs/SKILL.md +265 -0
package/marketplace/skills/bounded-context-mapping/SKILL.md +55 -0
package/marketplace/skills/cap-theorem-tradeoffs/SKILL.md +127 -0
package/marketplace/skills/client-server-boundary/SKILL.md +187 -0
package/marketplace/skills/code-review/SKILL.md +120 -0
package/marketplace/skills/color-system-design/SKILL.md +43 -0
package/marketplace/skills/component-architecture/SKILL.md +126 -0
package/marketplace/skills/compression/SKILL.md +112 -0
package/marketplace/skills/conceptual-modeling/SKILL.md +181 -0
package/marketplace/skills/connection-pooling/SKILL.md +105 -0
package/marketplace/skills/constraint-awareness/SKILL.md +287 -0
package/marketplace/skills/content-monitor/SKILL.md +209 -0
package/marketplace/skills/context-engineering/SKILL.md +320 -0
package/marketplace/skills/context-graph/SKILL.md +174 -0
package/marketplace/skills/context-management/SKILL.md +174 -0
package/marketplace/skills/context-window/SKILL.md +239 -0
package/marketplace/skills/contract-testing/SKILL.md +120 -0
package/marketplace/skills/cron-scheduling/SKILL.md +223 -0
package/marketplace/skills/dark-mode-implementation/SKILL.md +47 -0
package/marketplace/skills/data-modeling/SKILL.md +59 -0
package/marketplace/skills/data-modeling-fundamentals/SKILL.md +117 -0
package/marketplace/skills/database-migration/SKILL.md +429 -0
package/marketplace/skills/debugging/SKILL.md +67 -0
package/marketplace/skills/dependency-architecture/SKILL.md +58 -0
package/marketplace/skills/design-module-composition/SKILL.md +43 -0
package/marketplace/skills/design-system-architecture/SKILL.md +61 -0
package/marketplace/skills/design-thinking/SKILL.md +44 -0
package/marketplace/skills/diagnosis/SKILL.md +296 -0
package/marketplace/skills/diff-analysis/SKILL.md +188 -0
package/marketplace/skills/e2e-test-design/SKILL.md +113 -0
package/marketplace/skills/entity-relationship-modeling/SKILL.md +218 -0
package/marketplace/skills/epistemic-grounding/SKILL.md +112 -0
package/marketplace/skills/error-boundary/SKILL.md +235 -0
package/marketplace/skills/error-tracking/SKILL.md +261 -0
package/marketplace/skills/eval-driven-development/SKILL.md +147 -0
package/marketplace/skills/evaluation/SKILL.md +113 -0
package/marketplace/skills/event-contract-design/SKILL.md +60 -0
package/marketplace/skills/event-storming/SKILL.md +56 -0
package/marketplace/skills/form-ux-architecture/SKILL.md +60 -0
package/marketplace/skills/framework-fit-analysis/SKILL.md +59 -0
package/marketplace/skills/frontend-architecture/SKILL.md +43 -0
package/marketplace/skills/generative-ui/SKILL.md +118 -0
package/marketplace/skills/graph-audit/SKILL.md +81 -0
package/marketplace/skills/guardrails/SKILL.md +118 -0
package/marketplace/skills/hooks-patterns/SKILL.md +185 -0
package/marketplace/skills/http-semantics/SKILL.md +136 -0
package/marketplace/skills/ideation/SKILL.md +41 -0
package/marketplace/skills/indexing-strategy/SKILL.md +108 -0
package/marketplace/skills/information-architecture/SKILL.md +59 -0
package/marketplace/skills/integration-test-design/SKILL.md +111 -0
package/marketplace/skills/intent-recognition/SKILL.md +136 -0
package/marketplace/skills/interaction-feedback/SKILL.md +59 -0
package/marketplace/skills/interaction-patterns/SKILL.md +59 -0
package/marketplace/skills/journey-mapping/SKILL.md +41 -0
package/marketplace/skills/keywords/SKILL.md +213 -0
package/marketplace/skills/knowledge-modeling/SKILL.md +232 -0
package/marketplace/skills/layout-composition/SKILL.md +59 -0
package/marketplace/skills/linguistics/SKILL.md +429 -0
package/marketplace/skills/lint-overlay/SKILL.md +76 -0
package/marketplace/skills/mental-models/SKILL.md +126 -0
package/marketplace/skills/merge-queue/SKILL.md +94 -0
package/marketplace/skills/methodology/SKILL.md +317 -0
package/marketplace/skills/microcopy/SKILL.md +232 -0
package/marketplace/skills/middleware-patterns/SKILL.md +363 -0
package/marketplace/skills/mobile-responsive-ux/SKILL.md +287 -0
package/marketplace/skills/mutation-testing/SKILL.md +112 -0
package/marketplace/skills/naming-conventions/SKILL.md +112 -0
package/marketplace/skills/observability-modeling/SKILL.md +59 -0
package/marketplace/skills/ontology-modeling/SKILL.md +67 -0
package/marketplace/skills/owasp-security/SKILL.md +153 -0
package/marketplace/skills/pattern-recognition/SKILL.md +472 -0
package/marketplace/skills/performance-budgets/SKILL.md +185 -0
package/marketplace/skills/performance-engineering/SKILL.md +58 -0
package/marketplace/skills/performance-testing/SKILL.md +125 -0
package/marketplace/skills/printify/SKILL.md +42 -0
package/marketplace/skills/prioritization/SKILL.md +118 -0
package/marketplace/skills/problem-framing/SKILL.md +41 -0
package/marketplace/skills/problem-locating-solving/SKILL.md +203 -0
package/marketplace/skills/project-knowledge-extraction/SKILL.md +54 -0
package/marketplace/skills/prompt-craft/SKILL.md +134 -0
package/marketplace/skills/prompt-injection-defense/SKILL.md +132 -0
package/marketplace/skills/property-based-testing/SKILL.md +100 -0
package/marketplace/skills/prototyping/SKILL.md +43 -0
package/marketplace/skills/query-optimization/SKILL.md +144 -0
package/marketplace/skills/real-time-updates/SKILL.md +324 -0
package/marketplace/skills/ref-patterns/SKILL.md +284 -0
package/marketplace/skills/refactor/SKILL.md +65 -0
package/marketplace/skills/rendering-models/SKILL.md +142 -0
package/marketplace/skills/replication-patterns/SKILL.md +110 -0
package/marketplace/skills/research-synthesis/SKILL.md +41 -0
package/marketplace/skills/route-handler-design/SKILL.md +347 -0
package/marketplace/skills/schema-evolution/SKILL.md +140 -0
package/marketplace/skills/security-fundamentals/SKILL.md +139 -0
package/marketplace/skills/semantic-center/SKILL.md +194 -0
package/marketplace/skills/semantic-relations/SKILL.md +250 -0
package/marketplace/skills/semantics/SKILL.md +366 -0
package/marketplace/skills/semiotics/SKILL.md +230 -0
package/marketplace/skills/seo-strategy/SKILL.md +260 -0
package/marketplace/skills/server-actions-design/SKILL.md +243 -0
package/marketplace/skills/server-components-design/SKILL.md +190 -0
package/marketplace/skills/sharding-strategy/SKILL.md +123 -0
package/marketplace/skills/shopify/SKILL.md +42 -0
package/marketplace/skills/skill-infrastructure/SKILL.md +320 -0
package/marketplace/skills/skill-router/SKILL.md +71 -0
package/marketplace/skills/skill-scaffold/SKILL.md +105 -0
package/marketplace/skills/snapshot-testing/SKILL.md +120 -0
package/marketplace/skills/spec-driven-development/SKILL.md +148 -0
package/marketplace/skills/state-machine-modeling/SKILL.md +56 -0
package/marketplace/skills/state-management/SKILL.md +134 -0
package/marketplace/skills/streaming-architecture/SKILL.md +194 -0
package/marketplace/skills/summarization/SKILL.md +156 -0
package/marketplace/skills/suspense-patterns/SKILL.md +265 -0
package/marketplace/skills/system-interface-contracts/SKILL.md +59 -0
package/marketplace/skills/task-analysis/SKILL.md +201 -0
package/marketplace/skills/taxonomy-design/SKILL.md +66 -0
package/marketplace/skills/test-coverage-strategy/SKILL.md +108 -0
package/marketplace/skills/test-doubles-design/SKILL.md +98 -0
package/marketplace/skills/test-driven-development/SKILL.md +96 -0
package/marketplace/skills/testing-strategy/SKILL.md +67 -0
package/marketplace/skills/theme-system-design/SKILL.md +43 -0
package/marketplace/skills/tool-call-flow/SKILL.md +229 -0
package/marketplace/skills/tool-call-strategy/SKILL.md +292 -0
package/marketplace/skills/transaction-isolation/SKILL.md +98 -0
package/marketplace/skills/type-safety/SKILL.md +177 -0
package/marketplace/skills/typography-system/SKILL.md +43 -0
package/marketplace/skills/usability-testing/SKILL.md +43 -0
package/marketplace/skills/user-research/SKILL.md +43 -0
package/marketplace/skills/vercel-composition-patterns/SKILL.md +157 -0
package/marketplace/skills/version-control/SKILL.md +233 -0
package/marketplace/skills/visual-design-foundations/SKILL.md +59 -0
package/marketplace/skills/visual-hierarchy/SKILL.md +43 -0
package/marketplace/skills/webhook-integration/SKILL.md +331 -0
package/marketplace/skills/writing-humanizer/SKILL.md +380 -0
package/package.json +67 -0
package/schemas/manifest.schema.json +811 -0
package/schemas/manifest.v2.schema.json +164 -0
package/schemas/manifest.v3.schema.json +758 -0
package/schemas/manifest.v4.schema.json +755 -0
package/schemas/manifest.v5.schema.json +755 -0
package/schemas/manifest.v6.schema.json +811 -0
package/schemas/skill.context.jsonld +279 -0
package/schemas/skill.schema.json +919 -0
package/schemas/skill.v2.schema.json +201 -0
package/schemas/skill.v3.schema.json +827 -0
package/schemas/skill.v4.schema.json +822 -0
package/schemas/skill.v5.schema.json +830 -0
package/schemas/skill.v6.schema.json +946 -0
package/schemas/vocabulary/keywords.json +180 -0
package/schemas/vocabulary/workspace_tags.json +23 -0
package/scripts/__tests__/migrate-skill-v2-to-v3.test.js +161 -0
package/scripts/__tests__/migrate-skill-v3-to-v4.test.js +158 -0
package/scripts/__tests__/test-export-parser-drift.js +149 -0
package/scripts/__tests__/test-marketplace-export.js +114 -0
package/scripts/__tests__/test-router-paths.js +82 -0
package/scripts/__tests__/test-stability-promotion.js +244 -0
package/scripts/__tests__/test-v3-1-alias-contract.js +109 -0
package/scripts/__tests__/test-v3-1-skos-runtime.js +116 -0
package/scripts/backfill-schema-version.js +198 -0
package/scripts/build-field-reference.js +160 -0
package/scripts/build-retrieval-baseline.js +511 -0
package/scripts/check-markdown-links.js +211 -0
package/scripts/check-protocol-consistency.js +979 -0
package/scripts/export-marketplace-skills.js +610 -0
package/scripts/export-skill.js +374 -0
package/scripts/generate-manifest.js +787 -0
package/scripts/lib/alias-contract.js +83 -0
package/scripts/lib/audit-prompt-builder.js +771 -0
package/scripts/lib/mock-grader.js +134 -0
package/scripts/lib/parse-frontmatter.js +429 -0
package/scripts/lib/roots.js +119 -0
package/scripts/lint/check-archetype-sections.js +185 -0
package/scripts/lint/check-category-enum.js +83 -0
package/scripts/lint/check-routing-eval.js +146 -0
package/scripts/lint/check-routing-quality.js +211 -0
package/scripts/lint/check-stability-promotion.js +220 -0
package/scripts/lint/format-code-frame.js +206 -0
package/scripts/marketplace-install.js +125 -0
package/scripts/migrate-category-to-enum.js +169 -0
package/scripts/migrate-skill-v2-to-v3.js +424 -0
package/scripts/migrate-skill-v3-to-v4.js +200 -0
package/scripts/migrate-skill-v5-to-v6.js +304 -0
package/scripts/restructure-by-category.js +85 -0
package/scripts/seed-publication-classification.js +282 -0
package/scripts/skill-audit.js +893 -0
package/scripts/skill-graph-drift.js +483 -0
package/scripts/skill-graph-route.js +766 -0
package/scripts/skill-graph-routing-eval.js +393 -0
package/scripts/skill-lint.js +1317 -0
package/scripts/skill-overlap.js +213 -0
package/scripts/verify-skill-md-export.js +201 -0

package/examples/evals/information-architecture.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "information-architecture",
+  "subject": "Information architecture for navigation, page hierarchy, sitemaps, wayfinding, labeling systems, content grouping, and findability",
+  "adjacent_concepts": ["task-analysis", "taxonomy-design", "layout-composition", "microcopy"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A docs site has useful content but users cannot find setup instructions. Which skill owns navigation, grouping, and wayfinding improvements?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/information-architecture/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A product team is deciding whether information belongs in top-level nav, tabs, filters, or a page section. What should information-architecture inspect?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/information-architecture/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The task is to build a formal category taxonomy and assignment rules for the skill library. Should information-architecture accept?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/information-architecture/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The route hierarchy is known and the next task is responsive grid and breakpoint composition. Which boundary should information-architecture respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/information-architecture/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/interaction-feedback.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "interaction-feedback",
+  "subject": "UI feedback-state staging for user actions, asynchronous work, success, failure, retry, undo, and perceived latency",
+  "adjacent_concepts": ["microcopy", "a11y", "state-machine-modeling", "performance-engineering"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while the new skill settles.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A user clicks Export and nothing changes for 8 seconds before a file appears. Which feedback states should interaction-feedback design before wording is written?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/interaction-feedback/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A toast message is too vague and needs better copy. Should interaction-feedback own the words?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/interaction-feedback/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "A save action updates the UI optimistically, then the server rejects the change. What must the interaction-feedback verification cover?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/interaction-feedback/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "An order lifecycle has pending, paid, fulfilled, refunded, and cancelled states with legal transitions. Should interaction-feedback define the lifecycle itself?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/interaction-feedback/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/interaction-patterns.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "interaction-patterns",
+  "subject": "Choosing and auditing UI interaction patterns and controls before implementation",
+  "adjacent_concepts": ["a11y", "task-analysis", "interaction-feedback", "design-system-architecture"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while the new skill settles.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A user needs to compare five mutually exclusive pricing options before choosing one. Should the interface hide them in a dropdown? Apply the interaction-patterns method.",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/interaction-patterns/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A custom combobox has already been chosen and now needs ARIA roles, focus behavior, and keyboard support. Which skill owns that next step?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/interaction-patterns/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "A flow uses a modal to edit a record while the user needs to compare values in the table behind it. What should interaction-patterns inspect before recommending inline edit, drawer, or modal?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/interaction-patterns/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "A team asks interaction-patterns to define component props and semantic tokens for the selected control. Should the skill continue or hand off?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/interaction-patterns/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/layout-composition.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "layout-composition",
+  "subject": "Responsive layout and screen composition for page structure, scan pattern, breakpoints, and stable viewport hierarchy",
+  "adjacent_concepts": ["task-analysis", "information-architecture", "visual-design-foundations", "design-system-architecture"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while the new skill settles.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A route contract already names primary, secondary, and supporting content. The user asks how to order the sections on desktop and mobile. Which skill owns the next step, and what should it produce?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/layout-composition/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "A dashboard looks fine at 1440px but the chart controls jump above the title and the table overflows on mobile. According to the layout-composition skill, what verification gates are failing?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/layout-composition/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The user asks for a color palette and type scale after the grid is already settled. Should layout-composition accept the task or route elsewhere?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/layout-composition/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "A card grid changes height when a status label appears, causing nearby buttons to move. Which layout-composition principle applies?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "normal",
+      "truth_sources": ["skills/layout-composition/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/lint-overlay.json ADDED Viewed

@@ -0,0 +1,117 @@
+{
+  "skill_name": "lint-overlay",
+  "subject": "Overlay for testing-strategy covering lint as verification: rule selection, gate placement, failure triage, and migration planning when introducing rules to an existing codebase",
+  "adjacent_concepts": ["testing-strategy", "refactor", "debugging"],
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A contributor loads lint-overlay alone and asks it to decide whether lint belongs in a change's verification plan at all. According to the overlay's Extends section, is that a valid use? If not, what does the overlay say must be loaded alongside it and why?",
+      "dimension": "definition",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "critical",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:65-82"]
+    },
+    {
+      "id": 2,
+      "prompt": "The overlay says \"effort-to-risk matching\" is NOT overridden — the base testing-strategy skill still decides whether to lint before this overlay decides how. Explain why the overlay deliberately leaves that decision to the base rather than re-deriving it.",
+      "dimension": "mental_model",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:65-82"]
+    },
+    {
+      "id": 3,
+      "prompt": "An engineer is staring at a single failing ESLint rule in one file and wants help fixing that specific violation. Should they load lint-overlay? Cite the negative-routing rule that decides this and name the skill that should be loaded instead.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:118-124"]
+    },
+    {
+      "id": 4,
+      "prompt": "A team wants to introduce a new `no-console` lint rule to an existing codebase that already has ~200 violations. According to the lint-overlay's Overlay Rules table, what is the correct migration approach and why does adding a rule that immediately fails on ~200 existing violations count as a scope change rather than a test?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112"]
+    },
+    {
+      "id": 5,
+      "prompt": "The lint-overlay places lint after unit tests but before integration tests in the verification sequence. Why this specific ordering? What property of lint failures makes running lint earlier than integration tests a win, and what property of unit tests justifies running them earlier still?",
+      "dimension": "purpose",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112"]
+    },
+    {
+      "id": 6,
+      "prompt": "A reviewer argues that lint failures on pre-existing violations should be downgraded to warnings because the current change did not introduce them. According to the lint-overlay, is that correct? Cite the rule it would invoke instead.",
+      "dimension": "application",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112"]
+    },
+    {
+      "id": 7,
+      "prompt": "A team asks the lint-overlay to help decide whether their codebase should have lint at all. Should the overlay answer directly? Cite what the overlay says about the scope of decisions it adds vs. the scope it leaves to the base skill.",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "critical",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:65-82", "skills/lint-overlay/SKILL.md:118-124"]
+    },
+    {
+      "id": 8,
+      "prompt": "A CI pipeline currently runs lint across the entire repository tree on every pull request, including files the current change did not touch. According to the lint-overlay's `Lint scope matches the test scope` rule, is this the correct posture? When is tree-wide lint justified, and when should it be restricted to changed files?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112", "skills/lint-overlay/SKILL.md:92-100"]
+    },
+    {
+      "id": 9,
+      "prompt": "A team configures their CI so that lint produces output but does not fail the build — the rationale is \"developers will see the warnings and fix them eventually.\" According to the lint-overlay's `Lint failures are blocking, not advisory` rule, is this posture consistent with the overlay's doctrine? What is the overlay's position on warn-only lint, and when (if ever) is it acceptable?",
+      "dimension": "application",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112", "skills/lint-overlay/SKILL.md:92-100"]
+    },
+    {
+      "id": 10,
+      "prompt": "A team wants to introduce `react-hooks/exhaustive-deps` as a new ESLint rule. The codebase currently has ~150 files that would newly fail this rule, across 8 feature teams, on code paths that range from new (<1 month old) to legacy (>3 years, unowned). According to the lint-overlay's `New lint rules require a migration plan` rule, produce the migration plan the overlay would require — including phased gates, cleanup ownership, timeline, and the explicit artifact(s) the plan must ship with. Distinguish this from the adjacent `Only enforce rules that were green before the change` rule: what does the migration plan add beyond pinning pre-change green state?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "workflow",
+      "criticality": "high",
+      "truth_sources": ["skills/lint-overlay/SKILL.md:102-112"]
+    }
+  ]
+}

package/examples/evals/microcopy.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "microcopy",
+  "subject": "Functional UI text for action labels, empty states, tooltips, dialogs, loading messages, toasts, validation, permissions, and onboarding steps",
+  "adjacent_concepts": ["semiotics", "a11y", "interaction-feedback", "writing-humanizer"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A destructive dialog says Submit and the team needs a specific, consequence-first action label. Which skill owns the wording pattern?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/microcopy/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "An empty state needs to acknowledge what is missing, explain why, and guide the next action in one compact UI surface. What should microcopy produce?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/microcopy/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The task is marketing persuasion for the pricing-page headline. Should microcopy accept the work?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/microcopy/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The task is to decide the loading, success, retry, and undo state sequence, not the words inside those states. Which boundary should microcopy respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/microcopy/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/observability-modeling.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "observability-modeling",
+  "subject": "Telemetry semantics for diagnostic questions, logs, metrics, traces, spans, attributes, correlation IDs, SLOs, alert signals, cardinality, privacy, and sampling",
+  "adjacent_concepts": ["error-tracking", "event-contract-design", "performance-engineering", "debugging"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A background ingestion pipeline needs logs, metrics, spans, correlation IDs, and alert signals designed before implementation. Which skill owns the telemetry model?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/observability-modeling/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "The team has diagnostic questions but no event attributes or SLO signals. What should observability-modeling turn those questions into?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/observability-modeling/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The task is to configure Sentry error boundaries and sanitized exception capture only. Should observability-modeling accept?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/observability-modeling/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "There is a live production incident and the user wants root-cause debugging. Which boundary should observability-modeling respect?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/observability-modeling/SKILL.md"]
+    }
+  ]
+}

package/examples/evals/pattern-recognition.json ADDED Viewed

@@ -0,0 +1,96 @@
+{
+  "skill_name": "pattern-recognition",
+  "subject": "Recurring-structure recognition across code, errors, board state, conventions, and domain encodings",
+  "adjacent_concepts": ["debugging", "code-review", "diagnosis", "lint-overlay"],
+  "grounding_note": "This portable skill is grounded in its own method description and cited public pattern-recognition sources rather than repo-local implementation files. These evals exercise the recurring-instance threshold, clustering discipline, prevention loop, lifecycle states, and negative-routing boundaries.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "The same SQL string interpolation bug appears in three route handlers. Should the agent fix only the latest one?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:61-80"]
+    },
+    {
+      "id": 2,
+      "prompt": "An agent saw one strange failure once in the logs and wants to write a lint rule immediately. Is that pattern recognition?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:72-80", "skills/pattern-recognition/SKILL.md:462-481"]
+    },
+    {
+      "id": 3,
+      "prompt": "Twelve component files contain hardcoded hex colors outside the design-token source. What is the pattern-recognition response?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:233-279"]
+    },
+    {
+      "id": 4,
+      "prompt": "A session log contains many errors that differ only by timestamps, file paths, and line numbers. How should the agent reason about them?",
+      "dimension": "mental_model",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:155-187"]
+    },
+    {
+      "id": 5,
+      "prompt": "A board has many stale In Progress tasks, WIP overflow, and duplicate-looking tickets. Is that random clutter?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:197-231"]
+    },
+    {
+      "id": 6,
+      "prompt": "The same dashboard NaN display bug keeps coming back. A developer proposes adding `|| 0` at every callsite. What should pattern-recognition say?",
+      "dimension": "purpose",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "critical",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:281-329", "skills/pattern-recognition/SKILL.md:366-395"]
+    },
+    {
+      "id": 7,
+      "prompt": "A detection rule for an old import path now returns zero matches every week after the migration finished. What state is that pattern in?",
+      "dimension": "taxonomy",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:397-429"]
+    },
+    {
+      "id": 8,
+      "prompt": "The user asks: 'Review this PR for semantic correctness and maintainability.' Should this skill take over?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/pattern-recognition/SKILL.md:483-494"]
+    }
+  ]
+}

package/examples/evals/performance-engineering.json ADDED Viewed

@@ -0,0 +1,52 @@
+{
+  "skill_name": "performance-engineering",
+  "subject": "Performance measurement and improvement for latency, throughput, Core Web Vitals, database queries, caching, bundle size, concurrency, resource use, and regressions",
+  "adjacent_concepts": ["observability-modeling", "testing-strategy", "api-design", "data-modeling"],
+  "grounding_note": "Truth sources cite the whole SKILL.md file to keep the initial eval surface stable while routing boundaries are tightened.",
+  "evals": [
+    {
+      "id": 1,
+      "prompt": "A dashboard is slow and the team needs measurement, bottleneck analysis, and a decision about what to optimize first. Which skill owns the work?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "process",
+      "truth_mode": "process_correctness",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/performance-engineering/SKILL.md"]
+    },
+    {
+      "id": 2,
+      "prompt": "An endpoint risks N+1 queries and cache mistakes, and the team wants regression prevention. What should performance-engineering verify?",
+      "dimension": "application",
+      "substance": "domain",
+      "calibration": "semantic",
+      "truth_mode": "conceptual_correctness_plus_repo_application",
+      "skill_type": "concept",
+      "criticality": "high",
+      "truth_sources": ["skills/performance-engineering/SKILL.md"]
+    },
+    {
+      "id": 3,
+      "prompt": "The task is to design logs, metrics, spans, and correlation IDs before implementation, not optimize a measured bottleneck. Should performance-engineering accept?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/performance-engineering/SKILL.md"]
+    },
+    {
+      "id": 4,
+      "prompt": "The user asks for random micro-optimizations without a measurement or bottleneck. Which performance-engineering guardrail applies?",
+      "dimension": "boundary",
+      "substance": "contradiction-check",
+      "calibration": "semantic",
+      "truth_mode": "code_verification",
+      "skill_type": "concept",
+      "criticality": "normal",
+      "truth_sources": ["skills/performance-engineering/SKILL.md"]
+    }
+  ]
+}