cli-jaw 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +21 -0
- package/README.ko.md +411 -0
- package/README.md +416 -0
- package/README.zh-CN.md +411 -0
- package/dist/bin/cli-jaw.js +108 -0
- package/dist/bin/cli-jaw.js.map +1 -0
- package/dist/bin/commands/browser.js +241 -0
- package/dist/bin/commands/browser.js.map +1 -0
- package/dist/bin/commands/chat.js +878 -0
- package/dist/bin/commands/chat.js.map +1 -0
- package/dist/bin/commands/doctor.js +152 -0
- package/dist/bin/commands/doctor.js.map +1 -0
- package/dist/bin/commands/employee.js +70 -0
- package/dist/bin/commands/employee.js.map +1 -0
- package/dist/bin/commands/init.js +110 -0
- package/dist/bin/commands/init.js.map +1 -0
- package/dist/bin/commands/mcp.js +219 -0
- package/dist/bin/commands/mcp.js.map +1 -0
- package/dist/bin/commands/memory.js +105 -0
- package/dist/bin/commands/memory.js.map +1 -0
- package/dist/bin/commands/reset.js +109 -0
- package/dist/bin/commands/reset.js.map +1 -0
- package/dist/bin/commands/serve.js +75 -0
- package/dist/bin/commands/serve.js.map +1 -0
- package/dist/bin/commands/skill.js +232 -0
- package/dist/bin/commands/skill.js.map +1 -0
- package/dist/bin/commands/status.js +51 -0
- package/dist/bin/commands/status.js.map +1 -0
- package/dist/bin/postinstall.js +218 -0
- package/dist/bin/postinstall.js.map +1 -0
- package/dist/lib/mcp-sync.js +639 -0
- package/dist/lib/mcp-sync.js.map +1 -0
- package/dist/lib/quota-copilot.js +62 -0
- package/dist/lib/quota-copilot.js.map +1 -0
- package/dist/lib/upload.js +72 -0
- package/dist/lib/upload.js.map +1 -0
- package/dist/server.js +832 -0
- package/dist/server.js.map +1 -0
- package/dist/src/agent/args.js +66 -0
- package/dist/src/agent/args.js.map +1 -0
- package/dist/src/agent/events.js +328 -0
- package/dist/src/agent/events.js.map +1 -0
- package/dist/src/agent/spawn.js +646 -0
- package/dist/src/agent/spawn.js.map +1 -0
- package/dist/src/browser/actions.js +168 -0
- package/dist/src/browser/actions.js.map +1 -0
- package/dist/src/browser/connection.js +79 -0
- package/dist/src/browser/connection.js.map +1 -0
- package/dist/src/browser/index.js +4 -0
- package/dist/src/browser/index.js.map +1 -0
- package/dist/src/browser/vision.js +128 -0
- package/dist/src/browser/vision.js.map +1 -0
- package/dist/src/cli/acp-client.js +298 -0
- package/dist/src/cli/acp-client.js.map +1 -0
- package/dist/src/cli/commands.js +267 -0
- package/dist/src/cli/commands.js.map +1 -0
- package/dist/src/cli/handlers.js +405 -0
- package/dist/src/cli/handlers.js.map +1 -0
- package/dist/src/cli/registry.js +87 -0
- package/dist/src/cli/registry.js.map +1 -0
- package/dist/src/command-contract/catalog.js +36 -0
- package/dist/src/command-contract/catalog.js.map +1 -0
- package/dist/src/command-contract/help-renderer.js +39 -0
- package/dist/src/command-contract/help-renderer.js.map +1 -0
- package/dist/src/command-contract/policy.js +34 -0
- package/dist/src/command-contract/policy.js.map +1 -0
- package/dist/src/core/bus.js +17 -0
- package/dist/src/core/bus.js.map +1 -0
- package/dist/src/core/config.js +198 -0
- package/dist/src/core/config.js.map +1 -0
- package/dist/src/core/db.js +97 -0
- package/dist/src/core/db.js.map +1 -0
- package/dist/src/core/i18n.js +86 -0
- package/dist/src/core/i18n.js.map +1 -0
- package/dist/src/core/logger.js +14 -0
- package/dist/src/core/logger.js.map +1 -0
- package/dist/src/core/settings-merge.js +40 -0
- package/dist/src/core/settings-merge.js.map +1 -0
- package/dist/src/http/async-handler.js +6 -0
- package/dist/src/http/async-handler.js.map +1 -0
- package/dist/src/http/error-middleware.js +24 -0
- package/dist/src/http/error-middleware.js.map +1 -0
- package/dist/src/http/response.js +16 -0
- package/dist/src/http/response.js.map +1 -0
- package/dist/src/memory/heartbeat.js +106 -0
- package/dist/src/memory/heartbeat.js.map +1 -0
- package/dist/src/memory/memory.js +119 -0
- package/dist/src/memory/memory.js.map +1 -0
- package/dist/src/memory/worklog.js +154 -0
- package/dist/src/memory/worklog.js.map +1 -0
- package/dist/src/orchestrator/distribute.js +310 -0
- package/dist/src/orchestrator/distribute.js.map +1 -0
- package/dist/src/orchestrator/parser.js +118 -0
- package/dist/src/orchestrator/parser.js.map +1 -0
- package/dist/src/orchestrator/pipeline.js +343 -0
- package/dist/src/orchestrator/pipeline.js.map +1 -0
- package/dist/src/prompt/builder.js +531 -0
- package/dist/src/prompt/builder.js.map +1 -0
- package/dist/src/routes/browser.js +126 -0
- package/dist/src/routes/browser.js.map +1 -0
- package/dist/src/routes/quota.js +94 -0
- package/dist/src/routes/quota.js.map +1 -0
- package/dist/src/security/decode.js +23 -0
- package/dist/src/security/decode.js.map +1 -0
- package/dist/src/security/path-guards.js +62 -0
- package/dist/src/security/path-guards.js.map +1 -0
- package/dist/src/telegram/bot.js +469 -0
- package/dist/src/telegram/bot.js.map +1 -0
- package/dist/src/telegram/forwarder.js +93 -0
- package/dist/src/telegram/forwarder.js.map +1 -0
- package/package.json +80 -0
- package/public/css/chat.css +571 -0
- package/public/css/layout.css +350 -0
- package/public/css/markdown.css +270 -0
- package/public/css/modals.css +172 -0
- package/public/css/sidebar.css +225 -0
- package/public/css/variables.css +142 -0
- package/public/index.html +470 -0
- package/public/js/api.js +55 -0
- package/public/js/constants.js +119 -0
- package/public/js/features/appname.js +43 -0
- package/public/js/features/chat.js +242 -0
- package/public/js/features/employees.js +120 -0
- package/public/js/features/heartbeat.js +80 -0
- package/public/js/features/i18n.js +125 -0
- package/public/js/features/memory.js +85 -0
- package/public/js/features/settings.js +512 -0
- package/public/js/features/sidebar.js +88 -0
- package/public/js/features/skills.js +68 -0
- package/public/js/features/slash-commands.js +231 -0
- package/public/js/features/theme.js +40 -0
- package/public/js/locale.js +23 -0
- package/public/js/main.js +281 -0
- package/public/js/render.js +294 -0
- package/public/js/state.js +16 -0
- package/public/js/ui.js +172 -0
- package/public/js/ws.js +76 -0
- package/public/locales/en.json +180 -0
- package/public/locales/ko.json +180 -0
- package/public/theme-test.html +545 -0
- package/skills_ref/1password/SKILL.md +70 -0
- package/skills_ref/agents-sdk/SKILL.md +155 -0
- package/skills_ref/agents-sdk/references/callable.md +92 -0
- package/skills_ref/agents-sdk/references/codemode.md +207 -0
- package/skills_ref/agents-sdk/references/email.md +146 -0
- package/skills_ref/agents-sdk/references/mcp.md +154 -0
- package/skills_ref/agents-sdk/references/state-scheduling.md +164 -0
- package/skills_ref/agents-sdk/references/streaming-chat.md +178 -0
- package/skills_ref/agents-sdk/references/workflows.md +132 -0
- package/skills_ref/algorithmic-art/LICENSE.txt +202 -0
- package/skills_ref/algorithmic-art/SKILL.md +405 -0
- package/skills_ref/algorithmic-art/templates/generator_template.js +223 -0
- package/skills_ref/algorithmic-art/templates/viewer.html +599 -0
- package/skills_ref/apple-notes/SKILL.md +77 -0
- package/skills_ref/apple-reminders/SKILL.md +118 -0
- package/skills_ref/atlas/SKILL.md +99 -0
- package/skills_ref/brainstorming/SKILL.md +96 -0
- package/skills_ref/browser/SKILL.md +179 -0
- package/skills_ref/canvas-design/LICENSE.txt +202 -0
- package/skills_ref/canvas-design/SKILL.md +130 -0
- package/skills_ref/canvas-design/canvas-fonts/ArsenalSC-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/ArsenalSC-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Boldonse-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Boldonse-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/DMMono-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/DMMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/EricaOne-OFL.txt +94 -0
- package/skills_ref/canvas-design/canvas-fonts/EricaOne-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Gloock-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Gloock-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSerif-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSerif-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Italiana-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Italiana-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-Light.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/LibreBaskerville-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/LibreBaskerville-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NothingYouCouldDo-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/NothingYouCouldDo-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Outfit-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Outfit-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Outfit-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/PixelifySans-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/PixelifySans-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/PoiretOne-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/PoiretOne-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Silkscreen-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Silkscreen-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/SmoochSans-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/SmoochSans-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Tektur-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Tektur-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/Tektur-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/YoungSerif-OFL.txt +93 -0
- package/skills_ref/canvas-design/canvas-fonts/YoungSerif-Regular.ttf +0 -0
- package/skills_ref/changelog-generator/SKILL.md +104 -0
- package/skills_ref/cloudflare-deploy/SKILL.md +207 -0
- package/skills_ref/codebase-orientation/SKILL.md +29 -0
- package/skills_ref/config-file-explainer/SKILL.md +26 -0
- package/skills_ref/context-compression/SKILL.md +265 -0
- package/skills_ref/context-compression/references/evaluation-framework.md +213 -0
- package/skills_ref/context-compression/scripts/compression_evaluator.py +658 -0
- package/skills_ref/data-structure-chooser/SKILL.md +26 -0
- package/skills_ref/debugging-checklist/SKILL.md +26 -0
- package/skills_ref/debugging-helpers/CREATION-LOG.md +119 -0
- package/skills_ref/debugging-helpers/SKILL.md +296 -0
- package/skills_ref/debugging-helpers/condition-based-waiting-example.ts +158 -0
- package/skills_ref/debugging-helpers/condition-based-waiting.md +115 -0
- package/skills_ref/debugging-helpers/defense-in-depth.md +122 -0
- package/skills_ref/debugging-helpers/find-polluter.sh +63 -0
- package/skills_ref/debugging-helpers/root-cause-tracing.md +169 -0
- package/skills_ref/debugging-helpers/test-academic.md +14 -0
- package/skills_ref/debugging-helpers/test-pressure-1.md +58 -0
- package/skills_ref/debugging-helpers/test-pressure-2.md +68 -0
- package/skills_ref/debugging-helpers/test-pressure-3.md +69 -0
- package/skills_ref/deep-research/.env.example +7 -0
- package/skills_ref/deep-research/README.md +246 -0
- package/skills_ref/deep-research/SKILL.md +106 -0
- package/skills_ref/deep-research/requirements.txt +2 -0
- package/skills_ref/deep-research/scripts/research.py +692 -0
- package/skills_ref/dependency-install-helper/SKILL.md +26 -0
- package/skills_ref/dev/SKILL.md +65 -0
- package/skills_ref/dev-backend/SKILL.md +61 -0
- package/skills_ref/dev-data/SKILL.md +76 -0
- package/skills_ref/dev-frontend/LICENSE.txt +177 -0
- package/skills_ref/dev-frontend/SKILL.md +42 -0
- package/skills_ref/dev-testing/LICENSE.txt +202 -0
- package/skills_ref/dev-testing/SKILL.md +96 -0
- package/skills_ref/dev-testing/examples/console_logging.py +35 -0
- package/skills_ref/dev-testing/examples/element_discovery.py +40 -0
- package/skills_ref/dev-testing/examples/static_html_automation.py +33 -0
- package/skills_ref/dev-testing/scripts/with_server.py +106 -0
- package/skills_ref/develop-web-game/SKILL.md +149 -0
- package/skills_ref/differential-review/.claude-plugin/plugin.json +10 -0
- package/skills_ref/differential-review/README.md +109 -0
- package/skills_ref/differential-review/commands/diff-review.md +21 -0
- package/skills_ref/differential-review/skills/differential-review/SKILL.md +220 -0
- package/skills_ref/differential-review/skills/differential-review/adversarial.md +203 -0
- package/skills_ref/differential-review/skills/differential-review/methodology.md +234 -0
- package/skills_ref/differential-review/skills/differential-review/patterns.md +300 -0
- package/skills_ref/differential-review/skills/differential-review/reporting.md +369 -0
- package/skills_ref/dispatching-parallel-agents/SKILL.md +180 -0
- package/skills_ref/doc-coauthoring/SKILL.md +375 -0
- package/skills_ref/docx/LICENSE.txt +30 -0
- package/skills_ref/docx/SKILL.md +481 -0
- package/skills_ref/docx/scripts/__init__.py +1 -0
- package/skills_ref/docx/scripts/accept_changes.py +135 -0
- package/skills_ref/docx/scripts/comment.py +318 -0
- package/skills_ref/docx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/docx/scripts/office/helpers/merge_runs.py +199 -0
- package/skills_ref/docx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/skills_ref/docx/scripts/office/pack.py +159 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/skills_ref/docx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/skills_ref/docx/scripts/office/soffice.py +183 -0
- package/skills_ref/docx/scripts/office/unpack.py +132 -0
- package/skills_ref/docx/scripts/office/validate.py +111 -0
- package/skills_ref/docx/scripts/office/validators/__init__.py +15 -0
- package/skills_ref/docx/scripts/office/validators/base.py +847 -0
- package/skills_ref/docx/scripts/office/validators/docx.py +446 -0
- package/skills_ref/docx/scripts/office/validators/pptx.py +275 -0
- package/skills_ref/docx/scripts/office/validators/redlining.py +247 -0
- package/skills_ref/docx/scripts/templates/comments.xml +3 -0
- package/skills_ref/docx/scripts/templates/commentsExtended.xml +3 -0
- package/skills_ref/docx/scripts/templates/commentsExtensible.xml +3 -0
- package/skills_ref/docx/scripts/templates/commentsIds.xml +3 -0
- package/skills_ref/docx/scripts/templates/people.xml +3 -0
- package/skills_ref/durable-objects/SKILL.md +186 -0
- package/skills_ref/durable-objects/references/rules.md +286 -0
- package/skills_ref/durable-objects/references/testing.md +264 -0
- package/skills_ref/durable-objects/references/workers.md +346 -0
- package/skills_ref/email-draft-polish/SKILL.md +24 -0
- package/skills_ref/error-message-explainer/SKILL.md +27 -0
- package/skills_ref/fal-image-edit/SKILL.md +249 -0
- package/skills_ref/fal-image-edit/scripts/edit-image.sh +199 -0
- package/skills_ref/figma-implement-design/SKILL.md +264 -0
- package/skills_ref/git-worktrees/SKILL.md +218 -0
- package/skills_ref/github/SKILL.md +210 -0
- package/skills_ref/gog/SKILL.md +116 -0
- package/skills_ref/goplaces/SKILL.md +52 -0
- package/skills_ref/himalaya/SKILL.md +257 -0
- package/skills_ref/hugging-face-cli/SKILL.md +186 -0
- package/skills_ref/hugging-face-cli/references/commands.md +954 -0
- package/skills_ref/hugging-face-cli/references/examples.md +374 -0
- package/skills_ref/hugging-face-evaluation/SKILL.md +651 -0
- package/skills_ref/hugging-face-evaluation/examples/.env.example +7 -0
- package/skills_ref/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
- package/skills_ref/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
- package/skills_ref/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
- package/skills_ref/hugging-face-evaluation/examples/metric_mapping.json +50 -0
- package/skills_ref/hugging-face-evaluation/requirements.txt +20 -0
- package/skills_ref/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
- package/skills_ref/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
- package/skills_ref/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
- package/skills_ref/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
- package/skills_ref/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
- package/skills_ref/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
- package/skills_ref/hugging-face-evaluation/scripts/test_extraction.py +206 -0
- package/skills_ref/hugging-face-model-trainer/SKILL.md +718 -0
- package/skills_ref/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
- package/skills_ref/hugging-face-model-trainer/references/hardware_guide.md +283 -0
- package/skills_ref/hugging-face-model-trainer/references/hub_saving.md +364 -0
- package/skills_ref/hugging-face-model-trainer/references/reliability_principles.md +371 -0
- package/skills_ref/hugging-face-model-trainer/references/trackio_guide.md +189 -0
- package/skills_ref/hugging-face-model-trainer/references/training_methods.md +150 -0
- package/skills_ref/hugging-face-model-trainer/references/training_patterns.md +203 -0
- package/skills_ref/hugging-face-model-trainer/references/troubleshooting.md +282 -0
- package/skills_ref/hugging-face-model-trainer/references/unsloth.md +313 -0
- package/skills_ref/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
- package/skills_ref/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
- package/skills_ref/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
- package/skills_ref/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
- package/skills_ref/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
- package/skills_ref/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
- package/skills_ref/hugging-face-model-trainer/scripts/unsloth_sft_example.py +512 -0
- package/skills_ref/imagegen/SKILL.md +174 -0
- package/skills_ref/insecure-defaults/.claude-plugin/plugin.json +10 -0
- package/skills_ref/insecure-defaults/README.md +45 -0
- package/skills_ref/insecure-defaults/skills/insecure-defaults/SKILL.md +117 -0
- package/skills_ref/insecure-defaults/skills/insecure-defaults/references/examples.md +409 -0
- package/skills_ref/jupyter-notebook/SKILL.md +107 -0
- package/skills_ref/linear/SKILL.md +87 -0
- package/skills_ref/linter-fix-guide/SKILL.md +27 -0
- package/skills_ref/log-summarizer/SKILL.md +27 -0
- package/skills_ref/mcp-builder/LICENSE.txt +202 -0
- package/skills_ref/mcp-builder/SKILL.md +236 -0
- package/skills_ref/mcp-builder/reference/evaluation.md +602 -0
- package/skills_ref/mcp-builder/reference/mcp_best_practices.md +249 -0
- package/skills_ref/mcp-builder/reference/node_mcp_server.md +970 -0
- package/skills_ref/mcp-builder/reference/python_mcp_server.md +719 -0
- package/skills_ref/mcp-builder/scripts/connections.py +151 -0
- package/skills_ref/mcp-builder/scripts/evaluation.py +373 -0
- package/skills_ref/mcp-builder/scripts/example_evaluation.xml +22 -0
- package/skills_ref/mcp-builder/scripts/requirements.txt +2 -0
- package/skills_ref/memory/SKILL.md +129 -0
- package/skills_ref/modern-python/.claude-plugin/plugin.json +10 -0
- package/skills_ref/modern-python/README.md +66 -0
- package/skills_ref/modern-python/hooks/hooks.json +16 -0
- package/skills_ref/modern-python/hooks/setup-shims.bats +70 -0
- package/skills_ref/modern-python/hooks/setup-shims.sh +24 -0
- package/skills_ref/modern-python/hooks/shims/pip +27 -0
- package/skills_ref/modern-python/hooks/shims/pip-shim.bats +45 -0
- package/skills_ref/modern-python/hooks/shims/pip3 +27 -0
- package/skills_ref/modern-python/hooks/shims/pipx +41 -0
- package/skills_ref/modern-python/hooks/shims/pipx-shim.bats +64 -0
- package/skills_ref/modern-python/hooks/shims/python +26 -0
- package/skills_ref/modern-python/hooks/shims/python-shim.bats +53 -0
- package/skills_ref/modern-python/hooks/shims/python3 +26 -0
- package/skills_ref/modern-python/hooks/shims/uv +27 -0
- package/skills_ref/modern-python/hooks/shims/uv-shim.bats +47 -0
- package/skills_ref/modern-python/skills/modern-python/SKILL.md +333 -0
- package/skills_ref/modern-python/skills/modern-python/references/dependabot.md +43 -0
- package/skills_ref/modern-python/skills/modern-python/references/migration-checklist.md +141 -0
- package/skills_ref/modern-python/skills/modern-python/references/pep723-scripts.md +259 -0
- package/skills_ref/modern-python/skills/modern-python/references/prek.md +211 -0
- package/skills_ref/modern-python/skills/modern-python/references/pyproject.md +254 -0
- package/skills_ref/modern-python/skills/modern-python/references/ruff-config.md +240 -0
- package/skills_ref/modern-python/skills/modern-python/references/security-setup.md +255 -0
- package/skills_ref/modern-python/skills/modern-python/references/testing.md +284 -0
- package/skills_ref/modern-python/skills/modern-python/references/uv-commands.md +200 -0
- package/skills_ref/modern-python/skills/modern-python/templates/dependabot.yml +36 -0
- package/skills_ref/modern-python/skills/modern-python/templates/pre-commit-config.yaml +66 -0
- package/skills_ref/nano-banana-pro/SKILL.md +58 -0
- package/skills_ref/netlify-deploy/SKILL.md +233 -0
- package/skills_ref/notion/SKILL.md +304 -0
- package/skills_ref/notion-knowledge-capture/SKILL.md +56 -0
- package/skills_ref/notion-meeting-intelligence/SKILL.md +60 -0
- package/skills_ref/notion-research-documentation/SKILL.md +59 -0
- package/skills_ref/notion-spec-to-implementation/SKILL.md +58 -0
- package/skills_ref/obsidian/SKILL.md +81 -0
- package/skills_ref/openai-docs/SKILL.md +56 -0
- package/skills_ref/openhue/SKILL.md +112 -0
- package/skills_ref/pdf/SKILL.md +69 -0
- package/skills_ref/postgres/README.md +77 -0
- package/skills_ref/postgres/SKILL.md +129 -0
- package/skills_ref/postgres/connections.example.json +34 -0
- package/skills_ref/postgres/requirements.txt +1 -0
- package/skills_ref/postgres/scripts/query.py +262 -0
- package/skills_ref/pptx/LICENSE.txt +30 -0
- package/skills_ref/pptx/SKILL.md +232 -0
- package/skills_ref/pptx/editing.md +205 -0
- package/skills_ref/pptx/pptxgenjs.md +420 -0
- package/skills_ref/pptx/scripts/__init__.py +0 -0
- package/skills_ref/pptx/scripts/add_slide.py +195 -0
- package/skills_ref/pptx/scripts/clean.py +286 -0
- package/skills_ref/pptx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/pptx/scripts/office/helpers/merge_runs.py +199 -0
- package/skills_ref/pptx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/skills_ref/pptx/scripts/office/pack.py +159 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/skills_ref/pptx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/skills_ref/pptx/scripts/office/soffice.py +183 -0
- package/skills_ref/pptx/scripts/office/unpack.py +132 -0
- package/skills_ref/pptx/scripts/office/validate.py +111 -0
- package/skills_ref/pptx/scripts/office/validators/__init__.py +15 -0
- package/skills_ref/pptx/scripts/office/validators/base.py +847 -0
- package/skills_ref/pptx/scripts/office/validators/docx.py +446 -0
- package/skills_ref/pptx/scripts/office/validators/pptx.py +275 -0
- package/skills_ref/pptx/scripts/office/validators/redlining.py +247 -0
- package/skills_ref/pptx/scripts/thumbnail.py +289 -0
- package/skills_ref/property-based-testing/.claude-plugin/plugin.json +9 -0
- package/skills_ref/property-based-testing/README.md +47 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/README.md +88 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/SKILL.md +123 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/design.md +191 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/generating.md +204 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/interpreting-failures.md +239 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/libraries.md +130 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/refactoring.md +181 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/reviewing.md +209 -0
- package/skills_ref/property-based-testing/skills/property-based-testing/references/strategies.md +124 -0
- package/skills_ref/react-best-practices/AGENTS.md +2934 -0
- package/skills_ref/react-best-practices/README.md +123 -0
- package/skills_ref/react-best-practices/SKILL.md +136 -0
- package/skills_ref/react-best-practices/metadata.json +15 -0
- package/skills_ref/react-best-practices/rules/_sections.md +46 -0
- package/skills_ref/react-best-practices/rules/_template.md +28 -0
- package/skills_ref/react-best-practices/rules/advanced-event-handler-refs.md +55 -0
- package/skills_ref/react-best-practices/rules/advanced-init-once.md +42 -0
- package/skills_ref/react-best-practices/rules/advanced-use-latest.md +39 -0
- package/skills_ref/react-best-practices/rules/async-api-routes.md +38 -0
- package/skills_ref/react-best-practices/rules/async-defer-await.md +80 -0
- package/skills_ref/react-best-practices/rules/async-dependencies.md +51 -0
- package/skills_ref/react-best-practices/rules/async-parallel.md +28 -0
- package/skills_ref/react-best-practices/rules/async-suspense-boundaries.md +99 -0
- package/skills_ref/react-best-practices/rules/bundle-barrel-imports.md +59 -0
- package/skills_ref/react-best-practices/rules/bundle-conditional.md +31 -0
- package/skills_ref/react-best-practices/rules/bundle-defer-third-party.md +49 -0
- package/skills_ref/react-best-practices/rules/bundle-dynamic-imports.md +35 -0
- package/skills_ref/react-best-practices/rules/bundle-preload.md +50 -0
- package/skills_ref/react-best-practices/rules/client-event-listeners.md +74 -0
- package/skills_ref/react-best-practices/rules/client-localstorage-schema.md +71 -0
- package/skills_ref/react-best-practices/rules/client-passive-event-listeners.md +48 -0
- package/skills_ref/react-best-practices/rules/client-swr-dedup.md +56 -0
- package/skills_ref/react-best-practices/rules/js-batch-dom-css.md +107 -0
- package/skills_ref/react-best-practices/rules/js-cache-function-results.md +80 -0
- package/skills_ref/react-best-practices/rules/js-cache-property-access.md +28 -0
- package/skills_ref/react-best-practices/rules/js-cache-storage.md +70 -0
- package/skills_ref/react-best-practices/rules/js-combine-iterations.md +32 -0
- package/skills_ref/react-best-practices/rules/js-early-exit.md +50 -0
- package/skills_ref/react-best-practices/rules/js-hoist-regexp.md +45 -0
- package/skills_ref/react-best-practices/rules/js-index-maps.md +37 -0
- package/skills_ref/react-best-practices/rules/js-length-check-first.md +49 -0
- package/skills_ref/react-best-practices/rules/js-min-max-loop.md +82 -0
- package/skills_ref/react-best-practices/rules/js-set-map-lookups.md +24 -0
- package/skills_ref/react-best-practices/rules/js-tosorted-immutable.md +57 -0
- package/skills_ref/react-best-practices/rules/rendering-activity.md +26 -0
- package/skills_ref/react-best-practices/rules/rendering-animate-svg-wrapper.md +47 -0
- package/skills_ref/react-best-practices/rules/rendering-conditional-render.md +40 -0
- package/skills_ref/react-best-practices/rules/rendering-content-visibility.md +38 -0
- package/skills_ref/react-best-practices/rules/rendering-hoist-jsx.md +46 -0
- package/skills_ref/react-best-practices/rules/rendering-hydration-no-flicker.md +82 -0
- package/skills_ref/react-best-practices/rules/rendering-hydration-suppress-warning.md +30 -0
- package/skills_ref/react-best-practices/rules/rendering-svg-precision.md +28 -0
- package/skills_ref/react-best-practices/rules/rendering-usetransition-loading.md +75 -0
- package/skills_ref/react-best-practices/rules/rerender-defer-reads.md +39 -0
- package/skills_ref/react-best-practices/rules/rerender-dependencies.md +45 -0
- package/skills_ref/react-best-practices/rules/rerender-derived-state-no-effect.md +40 -0
- package/skills_ref/react-best-practices/rules/rerender-derived-state.md +29 -0
- package/skills_ref/react-best-practices/rules/rerender-functional-setstate.md +74 -0
- package/skills_ref/react-best-practices/rules/rerender-lazy-state-init.md +58 -0
- package/skills_ref/react-best-practices/rules/rerender-memo-with-default-value.md +38 -0
- package/skills_ref/react-best-practices/rules/rerender-memo.md +44 -0
- package/skills_ref/react-best-practices/rules/rerender-move-effect-to-event.md +45 -0
- package/skills_ref/react-best-practices/rules/rerender-simple-expression-in-memo.md +35 -0
- package/skills_ref/react-best-practices/rules/rerender-transitions.md +40 -0
- package/skills_ref/react-best-practices/rules/rerender-use-ref-transient-values.md +73 -0
- package/skills_ref/react-best-practices/rules/server-after-nonblocking.md +73 -0
- package/skills_ref/react-best-practices/rules/server-auth-actions.md +96 -0
- package/skills_ref/react-best-practices/rules/server-cache-lru.md +41 -0
- package/skills_ref/react-best-practices/rules/server-cache-react.md +76 -0
- package/skills_ref/react-best-practices/rules/server-dedup-props.md +65 -0
- package/skills_ref/react-best-practices/rules/server-parallel-fetching.md +83 -0
- package/skills_ref/react-best-practices/rules/server-serialization.md +38 -0
- package/skills_ref/receiving-code-review/SKILL.md +213 -0
- package/skills_ref/registry.json +1493 -0
- package/skills_ref/render-deploy/SKILL.md +462 -0
- package/skills_ref/requesting-code-review/SKILL.md +105 -0
- package/skills_ref/requesting-code-review/code-reviewer.md +146 -0
- package/skills_ref/screen-capture/SKILL.md +162 -0
- package/skills_ref/security-best-practices/LICENSE.txt +201 -0
- package/skills_ref/security-best-practices/SKILL.md +86 -0
- package/skills_ref/security-best-practices/agents/openai.yaml +4 -0
- package/skills_ref/security-best-practices/references/golang-general-backend-security.md +826 -0
- package/skills_ref/security-best-practices/references/javascript-express-web-server-security.md +1158 -0
- package/skills_ref/security-best-practices/references/javascript-general-web-frontend-security.md +747 -0
- package/skills_ref/security-best-practices/references/javascript-jquery-web-frontend-security.md +678 -0
- package/skills_ref/security-best-practices/references/javascript-typescript-nextjs-web-server-security.md +1144 -0
- package/skills_ref/security-best-practices/references/javascript-typescript-react-web-frontend-security.md +990 -0
- package/skills_ref/security-best-practices/references/javascript-typescript-vue-web-frontend-security.md +791 -0
- package/skills_ref/security-best-practices/references/python-django-web-server-security.md +882 -0
- package/skills_ref/security-best-practices/references/python-fastapi-web-server-security.md +1036 -0
- package/skills_ref/security-best-practices/references/python-flask-web-server-security.md +705 -0
- package/skills_ref/security-ownership-map/LICENSE.txt +201 -0
- package/skills_ref/security-ownership-map/SKILL.md +206 -0
- package/skills_ref/security-ownership-map/agents/openai.yaml +4 -0
- package/skills_ref/security-ownership-map/references/neo4j-import.md +60 -0
- package/skills_ref/security-ownership-map/scripts/build_ownership_map.py +956 -0
- package/skills_ref/security-ownership-map/scripts/community_maintainers.py +544 -0
- package/skills_ref/security-ownership-map/scripts/query_ownership.py +483 -0
- package/skills_ref/security-ownership-map/scripts/run_ownership_map.py +200 -0
- package/skills_ref/security-threat-model/LICENSE.txt +201 -0
- package/skills_ref/security-threat-model/SKILL.md +81 -0
- package/skills_ref/security-threat-model/agents/openai.yaml +4 -0
- package/skills_ref/security-threat-model/references/prompt-template.md +255 -0
- package/skills_ref/security-threat-model/references/security-controls-and-assets.md +32 -0
- package/skills_ref/sentry/SKILL.md +123 -0
- package/skills_ref/skill-creator/SKILL.md +372 -0
- package/skills_ref/sora/SKILL.md +153 -0
- package/skills_ref/speech/SKILL.md +144 -0
- package/skills_ref/spotify-player/SKILL.md +64 -0
- package/skills_ref/static-analysis/.claude-plugin/plugin.json +8 -0
- package/skills_ref/static-analysis/README.md +65 -0
- package/skills_ref/static-analysis/agents/semgrep-scanner.md +71 -0
- package/skills_ref/static-analysis/agents/semgrep-triager.md +107 -0
- package/skills_ref/static-analysis/skills/codeql/SKILL.md +119 -0
- package/skills_ref/static-analysis/skills/codeql/references/diagnostic-query-templates.md +339 -0
- package/skills_ref/static-analysis/skills/codeql/references/language-details.md +207 -0
- package/skills_ref/static-analysis/skills/codeql/references/performance-tuning.md +111 -0
- package/skills_ref/static-analysis/skills/codeql/references/ruleset-catalog.md +63 -0
- package/skills_ref/static-analysis/skills/codeql/references/threat-models.md +44 -0
- package/skills_ref/static-analysis/skills/codeql/workflows/build-database.md +669 -0
- package/skills_ref/static-analysis/skills/codeql/workflows/create-data-extensions.md +536 -0
- package/skills_ref/static-analysis/skills/codeql/workflows/run-analysis.md +436 -0
- package/skills_ref/static-analysis/skills/sarif-parsing/SKILL.md +479 -0
- package/skills_ref/static-analysis/skills/sarif-parsing/resources/jq-queries.md +162 -0
- package/skills_ref/static-analysis/skills/sarif-parsing/resources/sarif_helpers.py +331 -0
- package/skills_ref/static-analysis/skills/semgrep/SKILL.md +431 -0
- package/skills_ref/static-analysis/skills/semgrep/references/rulesets.md +162 -0
- package/skills_ref/static-analysis/skills/semgrep/references/scanner-task-prompt.md +102 -0
- package/skills_ref/static-analysis/skills/semgrep/references/triage-task-prompt.md +122 -0
- package/skills_ref/static-analysis/skills/semgrep/scripts/merge_triaged_sarif.py +252 -0
- package/skills_ref/summarize/SKILL.md +87 -0
- package/skills_ref/tdd/SKILL.md +371 -0
- package/skills_ref/tdd/testing-anti-patterns.md +299 -0
- package/skills_ref/telegram-send/SKILL.md +99 -0
- package/skills_ref/terraform/README.md +105 -0
- package/skills_ref/terraform/code-generation/.claude-plugin/plugin.json +30 -0
- package/skills_ref/terraform/code-generation/skills/azure-verified-modules/SKILL.md +613 -0
- package/skills_ref/terraform/code-generation/skills/terraform-style-guide/SKILL.md +353 -0
- package/skills_ref/terraform/code-generation/skills/terraform-test/SKILL.md +1669 -0
- package/skills_ref/terraform/module-generation/.claude-plugin/plugin.json +30 -0
- package/skills_ref/terraform/module-generation/skills/refactor-module/SKILL.md +538 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/SKILL.md +468 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/api-monitoring.md +543 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/component-blocks.md +476 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/deployment-blocks.md +391 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/examples.md +1529 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/linked-stacks.md +187 -0
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/troubleshooting.md +671 -0
- package/skills_ref/terraform/provider-development/.claude-plugin/plugin.json +13 -0
- package/skills_ref/terraform/provider-development/skills/new-terraform-provider/SKILL.md +25 -0
- package/skills_ref/terraform/provider-development/skills/new-terraform-provider/assets/main.go +40 -0
- package/skills_ref/terraform/provider-development/skills/provider-actions/SKILL.md +478 -0
- package/skills_ref/terraform/provider-development/skills/provider-resources/SKILL.md +599 -0
- package/skills_ref/terraform/provider-development/skills/run-acceptance-tests/SKILL.md +41 -0
- package/skills_ref/theme-factory/LICENSE.txt +202 -0
- package/skills_ref/theme-factory/SKILL.md +59 -0
- package/skills_ref/theme-factory/theme-showcase.pdf +0 -0
- package/skills_ref/theme-factory/themes/arctic-frost.md +19 -0
- package/skills_ref/theme-factory/themes/botanical-garden.md +19 -0
- package/skills_ref/theme-factory/themes/desert-rose.md +19 -0
- package/skills_ref/theme-factory/themes/forest-canopy.md +19 -0
- package/skills_ref/theme-factory/themes/golden-hour.md +19 -0
- package/skills_ref/theme-factory/themes/midnight-galaxy.md +19 -0
- package/skills_ref/theme-factory/themes/modern-minimalist.md +19 -0
- package/skills_ref/theme-factory/themes/ocean-depths.md +19 -0
- package/skills_ref/theme-factory/themes/sunset-boulevard.md +19 -0
- package/skills_ref/theme-factory/themes/tech-innovation.md +19 -0
- package/skills_ref/things-mac/SKILL.md +86 -0
- package/skills_ref/tmux/SKILL.md +153 -0
- package/skills_ref/transcribe/SKILL.md +81 -0
- package/skills_ref/trello/SKILL.md +95 -0
- package/skills_ref/tts/SKILL.md +99 -0
- package/skills_ref/vercel-deploy/SKILL.md +115 -0
- package/skills_ref/video-downloader/SKILL.md +99 -0
- package/skills_ref/video-downloader/scripts/download_video.py +145 -0
- package/skills_ref/video-frames/SKILL.md +46 -0
- package/skills_ref/vision-click/SKILL.md +128 -0
- package/skills_ref/weather/SKILL.md +112 -0
- package/skills_ref/web-artifacts-builder/LICENSE.txt +202 -0
- package/skills_ref/web-artifacts-builder/SKILL.md +74 -0
- package/skills_ref/web-artifacts-builder/scripts/bundle-artifact.sh +54 -0
- package/skills_ref/web-artifacts-builder/scripts/init-artifact.sh +322 -0
- package/skills_ref/web-artifacts-builder/scripts/shadcn-components.tar.gz +0 -0
- package/skills_ref/web-perf/SKILL.md +193 -0
- package/skills_ref/web-routing/SKILL.md +26 -0
- package/skills_ref/whatsapp/SKILL.md +255 -0
- package/skills_ref/whatsapp/assets/agent-app-integration-example.json +35 -0
- package/skills_ref/whatsapp/assets/databases-example.json +11 -0
- package/skills_ref/whatsapp/assets/function-decide-route-interactive-buttons.json +6 -0
- package/skills_ref/whatsapp/assets/functions-example.json +5 -0
- package/skills_ref/whatsapp/assets/workflow-agent-simple.json +31 -0
- package/skills_ref/whatsapp/assets/workflow-api-template-wait-agent.json +59 -0
- package/skills_ref/whatsapp/assets/workflow-customer-support-intake-agent.json +56 -0
- package/skills_ref/whatsapp/assets/workflow-decision.json +83 -0
- package/skills_ref/whatsapp/assets/workflow-interactive-buttons-decide-ai.json +89 -0
- package/skills_ref/whatsapp/assets/workflow-interactive-buttons-decide-function.json +88 -0
- package/skills_ref/whatsapp/assets/workflow-linear.json +53 -0
- package/skills_ref/whatsapp/package.json +10 -0
- package/skills_ref/whatsapp/references/app-integrations.md +89 -0
- package/skills_ref/whatsapp/references/databases-reference.md +21 -0
- package/skills_ref/whatsapp/references/execution-context.md +42 -0
- package/skills_ref/whatsapp/references/function-contracts.md +55 -0
- package/skills_ref/whatsapp/references/functions-payloads.md +87 -0
- package/skills_ref/whatsapp/references/functions-reference.md +133 -0
- package/skills_ref/whatsapp/references/graph-contract.md +145 -0
- package/skills_ref/whatsapp/references/node-types.md +430 -0
- package/skills_ref/whatsapp/references/triggers.md +20 -0
- package/skills_ref/whatsapp/references/workflow-overview.md +22 -0
- package/skills_ref/whatsapp/references/workflow-reference.md +123 -0
- package/skills_ref/whatsapp/scripts/configure-prop.js +113 -0
- package/skills_ref/whatsapp/scripts/create-connect-token.js +38 -0
- package/skills_ref/whatsapp/scripts/create-function.js +64 -0
- package/skills_ref/whatsapp/scripts/create-integration.js +137 -0
- package/skills_ref/whatsapp/scripts/create-row.js +47 -0
- package/skills_ref/whatsapp/scripts/create-trigger.js +88 -0
- package/skills_ref/whatsapp/scripts/create-workflow.js +85 -0
- package/skills_ref/whatsapp/scripts/delete-integration.js +44 -0
- package/skills_ref/whatsapp/scripts/delete-row.js +49 -0
- package/skills_ref/whatsapp/scripts/delete-trigger.js +44 -0
- package/skills_ref/whatsapp/scripts/deploy-function.js +47 -0
- package/skills_ref/whatsapp/scripts/edit-graph.js +289 -0
- package/skills_ref/whatsapp/scripts/get-action-schema.js +44 -0
- package/skills_ref/whatsapp/scripts/get-context-value.js +80 -0
- package/skills_ref/whatsapp/scripts/get-execution-event.js +55 -0
- package/skills_ref/whatsapp/scripts/get-execution.js +44 -0
- package/skills_ref/whatsapp/scripts/get-function.js +43 -0
- package/skills_ref/whatsapp/scripts/get-graph.js +85 -0
- package/skills_ref/whatsapp/scripts/get-table.js +45 -0
- package/skills_ref/whatsapp/scripts/get-workflow.js +44 -0
- package/skills_ref/whatsapp/scripts/invoke-function.js +60 -0
- package/skills_ref/whatsapp/scripts/lib/databases/args.js +87 -0
- package/skills_ref/whatsapp/scripts/lib/databases/filters.js +30 -0
- package/skills_ref/whatsapp/scripts/lib/databases/kapso-api.js +70 -0
- package/skills_ref/whatsapp/scripts/lib/functions/args.js +55 -0
- package/skills_ref/whatsapp/scripts/lib/functions/kapso-api.js +70 -0
- package/skills_ref/whatsapp/scripts/lib/workflows/args.js +53 -0
- package/skills_ref/whatsapp/scripts/lib/workflows/kapso-api.js +123 -0
- package/skills_ref/whatsapp/scripts/lib/workflows/result.js +16 -0
- package/skills_ref/whatsapp/scripts/list-accounts.js +62 -0
- package/skills_ref/whatsapp/scripts/list-apps.js +42 -0
- package/skills_ref/whatsapp/scripts/list-execution-events.js +61 -0
- package/skills_ref/whatsapp/scripts/list-executions.js +53 -0
- package/skills_ref/whatsapp/scripts/list-function-invocations.js +53 -0
- package/skills_ref/whatsapp/scripts/list-functions.js +41 -0
- package/skills_ref/whatsapp/scripts/list-integrations.js +41 -0
- package/skills_ref/whatsapp/scripts/list-provider-models.js +48 -0
- package/skills_ref/whatsapp/scripts/list-tables.js +41 -0
- package/skills_ref/whatsapp/scripts/list-triggers.js +44 -0
- package/skills_ref/whatsapp/scripts/list-whatsapp-phone-numbers.js +56 -0
- package/skills_ref/whatsapp/scripts/list-workflows.js +44 -0
- package/skills_ref/whatsapp/scripts/openapi-explore.mjs +1273 -0
- package/skills_ref/whatsapp/scripts/query-rows.js +71 -0
- package/skills_ref/whatsapp/scripts/reload-props.js +110 -0
- package/skills_ref/whatsapp/scripts/resume-execution.js +75 -0
- package/skills_ref/whatsapp/scripts/search-actions.js +64 -0
- package/skills_ref/whatsapp/scripts/update-execution-status.js +51 -0
- package/skills_ref/whatsapp/scripts/update-function.js +65 -0
- package/skills_ref/whatsapp/scripts/update-graph.js +154 -0
- package/skills_ref/whatsapp/scripts/update-integration.js +82 -0
- package/skills_ref/whatsapp/scripts/update-row.js +51 -0
- package/skills_ref/whatsapp/scripts/update-trigger.js +60 -0
- package/skills_ref/whatsapp/scripts/update-workflow-settings.js +67 -0
- package/skills_ref/whatsapp/scripts/upsert-row.js +64 -0
- package/skills_ref/whatsapp/scripts/validate-graph.js +293 -0
- package/skills_ref/whatsapp/scripts/variables-delete.js +37 -0
- package/skills_ref/whatsapp/scripts/variables-list.js +55 -0
- package/skills_ref/whatsapp/scripts/variables-set.js +39 -0
- package/skills_ref/writing-plans/SKILL.md +116 -0
- package/skills_ref/xlsx/LICENSE.txt +30 -0
- package/skills_ref/xlsx/SKILL.md +292 -0
- package/skills_ref/xlsx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/xlsx/scripts/office/helpers/merge_runs.py +199 -0
- package/skills_ref/xlsx/scripts/office/helpers/simplify_redlines.py +197 -0
- package/skills_ref/xlsx/scripts/office/pack.py +159 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +1499 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +146 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +1085 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +11 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +3081 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +23 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +185 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +287 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +1676 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +28 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +144 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +174 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +25 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +18 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +59 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +56 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +195 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +582 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +25 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +4439 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +570 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +509 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +12 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +108 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +96 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +3646 -0
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +116 -0
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +42 -0
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +50 -0
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +49 -0
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +33 -0
- package/skills_ref/xlsx/scripts/office/schemas/mce/mc.xsd +75 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2010.xsd +560 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2012.xsd +67 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2018.xsd +14 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +20 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +13 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +4 -0
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +8 -0
- package/skills_ref/xlsx/scripts/office/soffice.py +183 -0
- package/skills_ref/xlsx/scripts/office/unpack.py +132 -0
- package/skills_ref/xlsx/scripts/office/validate.py +111 -0
- package/skills_ref/xlsx/scripts/office/validators/__init__.py +15 -0
- package/skills_ref/xlsx/scripts/office/validators/base.py +847 -0
- package/skills_ref/xlsx/scripts/office/validators/docx.py +446 -0
- package/skills_ref/xlsx/scripts/office/validators/pptx.py +275 -0
- package/skills_ref/xlsx/scripts/office/validators/redlining.py +247 -0
- package/skills_ref/xlsx/scripts/recalc.py +184 -0
- package/skills_ref/xurl/SKILL.md +461 -0
|
@@ -0,0 +1,382 @@
|
|
|
1
|
+
# Usage Examples
|
|
2
|
+
|
|
3
|
+
This document provides practical examples for both methods of adding evaluations to Hugging Face model cards.
|
|
4
|
+
|
|
5
|
+
## Table of Contents
|
|
6
|
+
1. [Setup](#setup)
|
|
7
|
+
2. [Method 1: Extract from README](#method-1-extract-from-readme)
|
|
8
|
+
3. [Method 2: Import from Artificial Analysis](#method-2-import-from-artificial-analysis)
|
|
9
|
+
4. [Standalone vs Integrated](#standalone-vs-integrated)
|
|
10
|
+
5. [Common Workflows](#common-workflows)
|
|
11
|
+
|
|
12
|
+
## Setup
|
|
13
|
+
|
|
14
|
+
### Initial Configuration
|
|
15
|
+
|
|
16
|
+
```bash
|
|
17
|
+
# Navigate to skill directory
|
|
18
|
+
cd hf_evaluation_skill
|
|
19
|
+
|
|
20
|
+
# Install dependencies
|
|
21
|
+
uv add huggingface_hub python-dotenv pyyaml requests
|
|
22
|
+
|
|
23
|
+
# Configure environment variables
|
|
24
|
+
cp examples/.env.example .env
|
|
25
|
+
# Edit .env with your tokens
|
|
26
|
+
```
|
|
27
|
+
|
|
28
|
+
Your `.env` file should contain:
|
|
29
|
+
```env
|
|
30
|
+
HF_TOKEN=hf_your_write_token_here
|
|
31
|
+
AA_API_KEY=aa_your_api_key_here # Optional: only needed for AA imports
|
|
32
|
+
```
|
|
33
|
+
|
|
34
|
+
### Verify Installation
|
|
35
|
+
|
|
36
|
+
```bash
|
|
37
|
+
cd scripts
|
|
38
|
+
python3 test_extraction.py
|
|
39
|
+
```
|
|
40
|
+
|
|
41
|
+
## Method 1: Extract from README
|
|
42
|
+
|
|
43
|
+
Extract evaluation tables from your model's existing README.
|
|
44
|
+
|
|
45
|
+
### Basic Extraction
|
|
46
|
+
|
|
47
|
+
```bash
|
|
48
|
+
# Preview what will be extracted (dry run)
|
|
49
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
50
|
+
--repo-id "meta-llama/Llama-3.3-70B-Instruct" \
|
|
51
|
+
--dry-run
|
|
52
|
+
```
|
|
53
|
+
|
|
54
|
+
### Apply Extraction to Your Model
|
|
55
|
+
|
|
56
|
+
```bash
|
|
57
|
+
# Extract and update model card directly
|
|
58
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
59
|
+
--repo-id "your-username/your-model-7b"
|
|
60
|
+
```
|
|
61
|
+
|
|
62
|
+
### Custom Task and Dataset Names
|
|
63
|
+
|
|
64
|
+
```bash
|
|
65
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
66
|
+
--repo-id "your-username/your-model-7b" \
|
|
67
|
+
--task-type "text-generation" \
|
|
68
|
+
--dataset-name "Standard Benchmarks" \
|
|
69
|
+
--dataset-type "llm_benchmarks"
|
|
70
|
+
```
|
|
71
|
+
|
|
72
|
+
### Create Pull Request (for models you don't own)
|
|
73
|
+
|
|
74
|
+
```bash
|
|
75
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
76
|
+
--repo-id "organization/community-model" \
|
|
77
|
+
--create-pr
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
### Example README Format
|
|
81
|
+
|
|
82
|
+
Your model README should contain tables like:
|
|
83
|
+
|
|
84
|
+
```markdown
|
|
85
|
+
## Evaluation Results
|
|
86
|
+
|
|
87
|
+
| Benchmark | Score |
|
|
88
|
+
|---------------|-------|
|
|
89
|
+
| MMLU | 85.2 |
|
|
90
|
+
| HumanEval | 72.5 |
|
|
91
|
+
| GSM8K | 91.3 |
|
|
92
|
+
| HellaSwag | 88.9 |
|
|
93
|
+
```
|
|
94
|
+
|
|
95
|
+
## Method 2: Import from Artificial Analysis
|
|
96
|
+
|
|
97
|
+
Fetch benchmark scores directly from the Artificial Analysis API.
|
|
98
|
+
|
|
99
|
+
### Integrated Approach (Recommended)
|
|
100
|
+
|
|
101
|
+
```bash
|
|
102
|
+
# Import scores for Claude Sonnet 4
|
|
103
|
+
python3 scripts/evaluation_manager.py import-aa \
|
|
104
|
+
--creator-slug "anthropic" \
|
|
105
|
+
--model-name "claude-sonnet-4" \
|
|
106
|
+
--repo-id "your-username/claude-mirror"
|
|
107
|
+
```
|
|
108
|
+
|
|
109
|
+
### With Pull Request
|
|
110
|
+
|
|
111
|
+
```bash
|
|
112
|
+
# Create PR instead of direct commit
|
|
113
|
+
python3 scripts/evaluation_manager.py import-aa \
|
|
114
|
+
--creator-slug "openai" \
|
|
115
|
+
--model-name "gpt-4" \
|
|
116
|
+
--repo-id "your-username/gpt-4-mirror" \
|
|
117
|
+
--create-pr
|
|
118
|
+
```
|
|
119
|
+
|
|
120
|
+
### Standalone Script
|
|
121
|
+
|
|
122
|
+
For simple, one-off imports, use the standalone script:
|
|
123
|
+
|
|
124
|
+
```bash
|
|
125
|
+
# Navigate to examples directory
|
|
126
|
+
cd examples
|
|
127
|
+
|
|
128
|
+
# Run standalone script
|
|
129
|
+
AA_API_KEY="your-key" HF_TOKEN="your-token" \
|
|
130
|
+
python3 artificial_analysis_to_hub.py \
|
|
131
|
+
--creator-slug "anthropic" \
|
|
132
|
+
--model-name "claude-sonnet-4" \
|
|
133
|
+
--repo-id "your-username/your-repo"
|
|
134
|
+
```
|
|
135
|
+
|
|
136
|
+
### Finding Creator Slug and Model Name
|
|
137
|
+
|
|
138
|
+
1. Visit [Artificial Analysis](https://artificialanalysis.ai/)
|
|
139
|
+
2. Navigate to the model you want to import
|
|
140
|
+
3. The URL format is: `https://artificialanalysis.ai/models/{creator-slug}/{model-name}`
|
|
141
|
+
4. Or check their [API documentation](https://artificialanalysis.ai/api)
|
|
142
|
+
|
|
143
|
+
Common examples:
|
|
144
|
+
- Anthropic: `--creator-slug "anthropic" --model-name "claude-sonnet-4"`
|
|
145
|
+
- OpenAI: `--creator-slug "openai" --model-name "gpt-4-turbo"`
|
|
146
|
+
- Meta: `--creator-slug "meta" --model-name "llama-3-70b"`
|
|
147
|
+
|
|
148
|
+
## Standalone vs Integrated
|
|
149
|
+
|
|
150
|
+
### Standalone Script Features
|
|
151
|
+
- ✓ Simple, single-purpose
|
|
152
|
+
- ✓ Can run via `uv run` from URL
|
|
153
|
+
- ✓ Minimal dependencies
|
|
154
|
+
- ✗ No README extraction
|
|
155
|
+
- ✗ No validation
|
|
156
|
+
- ✗ No dry-run mode
|
|
157
|
+
|
|
158
|
+
**Use when:** You only need AA imports and want a simple script.
|
|
159
|
+
|
|
160
|
+
### Integrated Script Features
|
|
161
|
+
- ✓ Both README extraction AND AA import
|
|
162
|
+
- ✓ Validation and show commands
|
|
163
|
+
- ✓ Dry-run preview mode
|
|
164
|
+
- ✓ Better error handling
|
|
165
|
+
- ✓ Merge with existing evaluations
|
|
166
|
+
- ✓ More flexible options
|
|
167
|
+
|
|
168
|
+
**Use when:** You want full evaluation management capabilities.
|
|
169
|
+
|
|
170
|
+
## Common Workflows
|
|
171
|
+
|
|
172
|
+
### Workflow 1: New Model with README Tables
|
|
173
|
+
|
|
174
|
+
You've just created a model with evaluation tables in the README.
|
|
175
|
+
|
|
176
|
+
```bash
|
|
177
|
+
# Step 1: Preview extraction
|
|
178
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
179
|
+
--repo-id "your-username/new-model-7b" \
|
|
180
|
+
--dry-run
|
|
181
|
+
|
|
182
|
+
# Step 2: Apply if it looks good
|
|
183
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
184
|
+
--repo-id "your-username/new-model-7b"
|
|
185
|
+
|
|
186
|
+
# Step 3: Validate
|
|
187
|
+
python3 scripts/evaluation_manager.py validate \
|
|
188
|
+
--repo-id "your-username/new-model-7b"
|
|
189
|
+
|
|
190
|
+
# Step 4: View results
|
|
191
|
+
python3 scripts/evaluation_manager.py show \
|
|
192
|
+
--repo-id "your-username/new-model-7b"
|
|
193
|
+
```
|
|
194
|
+
|
|
195
|
+
### Workflow 2: Model Benchmarked on AA
|
|
196
|
+
|
|
197
|
+
Your model appears on Artificial Analysis with fresh benchmarks.
|
|
198
|
+
|
|
199
|
+
```bash
|
|
200
|
+
# Import scores and create PR for review
|
|
201
|
+
python3 scripts/evaluation_manager.py import-aa \
|
|
202
|
+
--creator-slug "your-org" \
|
|
203
|
+
--model-name "your-model" \
|
|
204
|
+
--repo-id "your-org/your-model-hf" \
|
|
205
|
+
--create-pr
|
|
206
|
+
```
|
|
207
|
+
|
|
208
|
+
### Workflow 3: Combine Both Methods
|
|
209
|
+
|
|
210
|
+
You have README tables AND AA scores.
|
|
211
|
+
|
|
212
|
+
```bash
|
|
213
|
+
# Step 1: Extract from README
|
|
214
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
215
|
+
--repo-id "your-username/hybrid-model"
|
|
216
|
+
|
|
217
|
+
# Step 2: Import from AA (will merge with existing)
|
|
218
|
+
python3 scripts/evaluation_manager.py import-aa \
|
|
219
|
+
--creator-slug "your-org" \
|
|
220
|
+
--model-name "hybrid-model" \
|
|
221
|
+
--repo-id "your-username/hybrid-model"
|
|
222
|
+
|
|
223
|
+
# Step 3: View combined results
|
|
224
|
+
python3 scripts/evaluation_manager.py show \
|
|
225
|
+
--repo-id "your-username/hybrid-model"
|
|
226
|
+
```
|
|
227
|
+
|
|
228
|
+
### Workflow 4: Contributing to Community Models
|
|
229
|
+
|
|
230
|
+
Help improve community models by adding missing evaluations.
|
|
231
|
+
|
|
232
|
+
```bash
|
|
233
|
+
# Find a model with evaluations in README but no model-index
|
|
234
|
+
# Example: community/awesome-7b
|
|
235
|
+
|
|
236
|
+
# Create PR with extracted evaluations
|
|
237
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
238
|
+
--repo-id "community/awesome-7b" \
|
|
239
|
+
--create-pr
|
|
240
|
+
|
|
241
|
+
# The Hugging Face Hub will notify the repository owner
|
|
242
|
+
# They can review and merge your PR
|
|
243
|
+
```
|
|
244
|
+
|
|
245
|
+
### Workflow 5: Batch Processing
|
|
246
|
+
|
|
247
|
+
Update multiple models at once.
|
|
248
|
+
|
|
249
|
+
```bash
|
|
250
|
+
# Create a list of repos
|
|
251
|
+
cat > models.txt << EOF
|
|
252
|
+
your-org/model-1-7b
|
|
253
|
+
your-org/model-2-13b
|
|
254
|
+
your-org/model-3-70b
|
|
255
|
+
EOF
|
|
256
|
+
|
|
257
|
+
# Process each
|
|
258
|
+
while read repo_id; do
|
|
259
|
+
echo "Processing $repo_id..."
|
|
260
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
261
|
+
--repo-id "$repo_id"
|
|
262
|
+
done < models.txt
|
|
263
|
+
```
|
|
264
|
+
|
|
265
|
+
### Workflow 6: Automated Updates (CI/CD)
|
|
266
|
+
|
|
267
|
+
Set up automatic evaluation updates using GitHub Actions.
|
|
268
|
+
|
|
269
|
+
```yaml
|
|
270
|
+
# .github/workflows/update-evals.yml
|
|
271
|
+
name: Update Evaluations Weekly
|
|
272
|
+
on:
|
|
273
|
+
schedule:
|
|
274
|
+
- cron: '0 0 * * 0' # Every Sunday
|
|
275
|
+
workflow_dispatch: # Manual trigger
|
|
276
|
+
|
|
277
|
+
jobs:
|
|
278
|
+
update:
|
|
279
|
+
runs-on: ubuntu-latest
|
|
280
|
+
steps:
|
|
281
|
+
- uses: actions/checkout@v4
|
|
282
|
+
|
|
283
|
+
- name: Set up Python
|
|
284
|
+
uses: actions/setup-python@v4
|
|
285
|
+
with:
|
|
286
|
+
python-version: '3.13'
|
|
287
|
+
|
|
288
|
+
- name: Install dependencies
|
|
289
|
+
run: |
|
|
290
|
+
pip install huggingface-hub python-dotenv pyyaml requests
|
|
291
|
+
|
|
292
|
+
- name: Update from Artificial Analysis
|
|
293
|
+
env:
|
|
294
|
+
AA_API_KEY: ${{ secrets.AA_API_KEY }}
|
|
295
|
+
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
|
296
|
+
run: |
|
|
297
|
+
python scripts/evaluation_manager.py import-aa \
|
|
298
|
+
--creator-slug "${{ vars.AA_CREATOR_SLUG }}" \
|
|
299
|
+
--model-name "${{ vars.AA_MODEL_NAME }}" \
|
|
300
|
+
--repo-id "${{ github.repository }}" \
|
|
301
|
+
--create-pr
|
|
302
|
+
```
|
|
303
|
+
|
|
304
|
+
## Verification and Validation
|
|
305
|
+
|
|
306
|
+
### Check Current Evaluations
|
|
307
|
+
|
|
308
|
+
```bash
|
|
309
|
+
python3 scripts/evaluation_manager.py show \
|
|
310
|
+
--repo-id "your-username/your-model"
|
|
311
|
+
```
|
|
312
|
+
|
|
313
|
+
### Validate Format
|
|
314
|
+
|
|
315
|
+
```bash
|
|
316
|
+
python3 scripts/evaluation_manager.py validate \
|
|
317
|
+
--repo-id "your-username/your-model"
|
|
318
|
+
```
|
|
319
|
+
|
|
320
|
+
### View in HuggingFace UI
|
|
321
|
+
|
|
322
|
+
After updating, visit:
|
|
323
|
+
```
|
|
324
|
+
https://huggingface.co/your-username/your-model
|
|
325
|
+
```
|
|
326
|
+
|
|
327
|
+
The evaluation widget should display your scores automatically.
|
|
328
|
+
|
|
329
|
+
## Troubleshooting Examples
|
|
330
|
+
|
|
331
|
+
### Problem: No tables found
|
|
332
|
+
|
|
333
|
+
```bash
|
|
334
|
+
# Check what tables exist in your README
|
|
335
|
+
python3 scripts/evaluation_manager.py extract-readme \
|
|
336
|
+
--repo-id "your-username/your-model" \
|
|
337
|
+
--dry-run
|
|
338
|
+
|
|
339
|
+
# If no output, ensure your README has markdown tables with numeric scores
|
|
340
|
+
```
|
|
341
|
+
|
|
342
|
+
### Problem: AA model not found
|
|
343
|
+
|
|
344
|
+
```bash
|
|
345
|
+
# Verify the creator and model slugs
|
|
346
|
+
# Check the AA website URL or API directly
|
|
347
|
+
curl -H "x-api-key: $AA_API_KEY" \
|
|
348
|
+
https://artificialanalysis.ai/api/v2/data/llms/models | jq
|
|
349
|
+
```
|
|
350
|
+
|
|
351
|
+
### Problem: Token permission error
|
|
352
|
+
|
|
353
|
+
```bash
|
|
354
|
+
# Verify your token has write access
|
|
355
|
+
# Generate a new token at: https://huggingface.co/settings/tokens
|
|
356
|
+
# Ensure "Write" scope is enabled
|
|
357
|
+
```
|
|
358
|
+
|
|
359
|
+
## Tips and Best Practices
|
|
360
|
+
|
|
361
|
+
1. **Always dry-run first**: Use `--dry-run` to preview changes
|
|
362
|
+
2. **Use PRs for others' repos**: Always use `--create-pr` for repositories you don't own
|
|
363
|
+
3. **Validate after updates**: Run `validate` to ensure proper formatting
|
|
364
|
+
4. **Keep evaluations current**: Set up automated updates for AA scores
|
|
365
|
+
5. **Document sources**: The tool automatically adds source attribution
|
|
366
|
+
6. **Check the UI**: Always verify the evaluation widget displays correctly
|
|
367
|
+
|
|
368
|
+
## Getting Help
|
|
369
|
+
|
|
370
|
+
```bash
|
|
371
|
+
# General help
|
|
372
|
+
python3 scripts/evaluation_manager.py --help
|
|
373
|
+
|
|
374
|
+
# Command-specific help
|
|
375
|
+
python3 scripts/evaluation_manager.py extract-readme --help
|
|
376
|
+
python3 scripts/evaluation_manager.py import-aa --help
|
|
377
|
+
```
|
|
378
|
+
|
|
379
|
+
For issues or questions, consult:
|
|
380
|
+
- `../SKILL.md` - Complete documentation
|
|
381
|
+
- `../README.md` - Troubleshooting guide
|
|
382
|
+
- `../QUICKSTART.md` - Quick start guide
|
|
@@ -0,0 +1,141 @@
|
|
|
1
|
+
# /// script
|
|
2
|
+
# requires-python = ">=3.13"
|
|
3
|
+
# dependencies = [
|
|
4
|
+
# "huggingface-hub>=1.1.4",
|
|
5
|
+
# "python-dotenv>=1.2.1",
|
|
6
|
+
# "pyyaml>=6.0.3",
|
|
7
|
+
# "requests>=2.32.5",
|
|
8
|
+
# ]
|
|
9
|
+
# ///
|
|
10
|
+
|
|
11
|
+
"""
|
|
12
|
+
Add Artificial Analysis evaluations to a Hugging Face model card.
|
|
13
|
+
|
|
14
|
+
NOTE: This is a standalone reference script. For integrated functionality
|
|
15
|
+
with additional features (README extraction, validation, etc.), use:
|
|
16
|
+
../scripts/evaluation_manager.py import-aa [options]
|
|
17
|
+
|
|
18
|
+
STANDALONE USAGE:
|
|
19
|
+
AA_API_KEY="<your-api-key>" HF_TOKEN="<your-huggingface-token>" \
|
|
20
|
+
python artificial_analysis_to_hub.py \
|
|
21
|
+
--creator-slug <artificial-analysis-creator-slug> \
|
|
22
|
+
--model-name <artificial-analysis-model-name> \
|
|
23
|
+
--repo-id <huggingface-repo-id>
|
|
24
|
+
|
|
25
|
+
INTEGRATED USAGE (Recommended):
|
|
26
|
+
python ../scripts/evaluation_manager.py import-aa \
|
|
27
|
+
--creator-slug <creator-slug> \
|
|
28
|
+
--model-name <model-name> \
|
|
29
|
+
--repo-id <repo-id> \
|
|
30
|
+
[--create-pr]
|
|
31
|
+
"""
|
|
32
|
+
|
|
33
|
+
import argparse
|
|
34
|
+
import os
|
|
35
|
+
|
|
36
|
+
import requests
|
|
37
|
+
import dotenv
|
|
38
|
+
from huggingface_hub import ModelCard
|
|
39
|
+
|
|
40
|
+
# Pull AA_API_KEY / HF_TOKEN from a local .env file when one is present.
dotenv.load_dotenv()

# Endpoint queried for the Artificial Analysis model list.
URL = "https://artificialanalysis.ai/api/v2/data/llms/models"

# Credentials are read from the environment once, at import time.
API_KEY = os.getenv("AA_API_KEY")
HF_TOKEN = os.getenv("HF_TOKEN")

# Fail fast: both credentials are mandatory for this script.
if not API_KEY:
    raise ValueError("AA_API_KEY is not set")
if not HF_TOKEN:
    raise ValueError("HF_TOKEN is not set")

# Header sent with every request to URL.
HEADERS = {"x-api-key": API_KEY}
|
|
51
|
+
|
|
52
|
+
|
|
53
|
+
def get_model_evaluations_data(creator_slug, model_name, timeout=30):
    """Return the Artificial Analysis record for one model.

    Requests the model list from ``URL`` (authenticated with ``HEADERS``) and
    returns the first entry whose ``model_creator.slug`` equals
    ``creator_slug`` and whose ``slug`` equals ``model_name``.

    Args:
        creator_slug: Creator slug to match against ``model["model_creator"]["slug"]``.
        model_name: Model slug to match against ``model["slug"]``.
        timeout: Seconds to wait for the HTTP request before giving up.

    Returns:
        The matching model dictionary from the response's ``"data"`` list.

    Raises:
        requests.HTTPError: If the API answers with an error status.
        ValueError: If no entry matches both slugs.
    """
    # A timeout keeps the script from hanging forever on a stalled connection.
    response = requests.get(URL, headers=HEADERS, timeout=timeout)
    # Surface auth / rate-limit failures directly instead of a confusing
    # KeyError or JSON decoding error further down.
    response.raise_for_status()

    response_data = response.json()["data"]
    for model in response_data:
        if (
            model["model_creator"]["slug"] == creator_slug
            and model["slug"] == model_name
        ):
            return model
    raise ValueError(f"Model {model_name} not found")
|
|
63
|
+
|
|
64
|
+
|
|
65
|
+
def aa_evaluations_to_model_index(
    model,
    dataset_name="Artificial Analysis Benchmarks",
    dataset_type="artificial_analysis",
    task_type="evaluation",
):
    """Convert an Artificial Analysis model record into a model-index list.

    Args:
        model: Mapping with an optional ``"name"`` / ``"slug"`` and an
            ``"evaluations"`` mapping of benchmark key -> score.
        dataset_name: Value stored under ``dataset.name`` in the result.
        dataset_type: Value stored under ``dataset.type`` in the result.
        task_type: Value stored under ``task.type`` in the result.

    Returns:
        A one-element list holding ``{"name": ..., "results": [...]}`` where
        the single result carries the task, dataset, metrics and source.

    Raises:
        ValueError: If ``model`` is empty or ``None``.
    """
    if not model:
        raise ValueError("Model data is required")

    model_name = model.get("name", model.get("slug", "unknown-model"))
    # ``or {}`` also covers an explicit null "evaluations" field, which
    # ``.get(key, {})`` alone would pass through as None and crash on .items().
    evaluations = model.get("evaluations") or {}

    # Benchmarks without a score (None) are skipped: a metric entry with no
    # value carries no information for the model card.
    metrics = [
        {
            "name": key.replace("_", " ").title(),
            "type": key,
            "value": value,
        }
        for key, value in evaluations.items()
        if value is not None
    ]

    model_index = [
        {
            "name": model_name,
            "results": [
                {
                    "task": {"type": task_type},
                    "dataset": {"name": dataset_name, "type": dataset_type},
                    "metrics": metrics,
                    "source": {
                        "name": "Artificial Analysis API",
                        "url": "https://artificialanalysis.ai",
                    },
                }
            ],
        }
    ]

    return model_index
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
def main():
    """Command-line entry point.

    Parses ``--creator-slug``, ``--model-name`` and ``--repo-id`` (all
    required), fetches the matching Artificial Analysis record, converts it
    to a model-index, stores it on the repository's model card and pushes
    the card back to the Hub as a pull request.
    """
    cli = argparse.ArgumentParser()
    for flag in ("--creator-slug", "--model-name", "--repo-id"):
        cli.add_argument(flag, type=str, required=True)
    args = cli.parse_args()

    # Fetch and convert before touching the Hub, so a lookup failure
    # aborts the run without loading the card.
    aa_model = get_model_evaluations_data(
        creator_slug=args.creator_slug, model_name=args.model_name
    )
    new_index = aa_evaluations_to_model_index(model=aa_model)

    card = ModelCard.load(args.repo_id)
    # Replaces whatever model-index the card already carried.
    card.data["model-index"] = new_index

    card.push_to_hub(
        args.repo_id,
        token=HF_TOKEN,
        commit_message=f"Add Artificial Analysis evaluations for {args.model_name}",
        commit_description=(
            f"This commit adds the Artificial Analysis evaluations for the {args.model_name} model to this repository. "
            "To see the scores, visit the [Artificial Analysis](https://artificialanalysis.ai) website."
        ),
        create_pr=True,
    )
|
|
138
|
+
|
|
139
|
+
|
|
140
|
+
if __name__ == "__main__":
|
|
141
|
+
main()
|
|
@@ -0,0 +1,135 @@
|
|
|
1
|
+
# Example Evaluation Table Formats
|
|
2
|
+
|
|
3
|
+
This file shows various formats of evaluation tables that can be extracted from model README files.
|
|
4
|
+
|
|
5
|
+
## Format 1: Benchmarks as Rows (Most Common)
|
|
6
|
+
|
|
7
|
+
```markdown
|
|
8
|
+
| Benchmark | Score |
|
|
9
|
+
|-----------|-------|
|
|
10
|
+
| MMLU | 85.2 |
|
|
11
|
+
| HumanEval | 72.5 |
|
|
12
|
+
| GSM8K | 91.3 |
|
|
13
|
+
| HellaSwag | 88.9 |
|
|
14
|
+
```
|
|
15
|
+
|
|
16
|
+
## Format 2: Multiple Metric Columns
|
|
17
|
+
|
|
18
|
+
```markdown
|
|
19
|
+
| Benchmark | Accuracy | F1 Score |
|
|
20
|
+
|-----------|----------|----------|
|
|
21
|
+
| MMLU | 85.2 | 0.84 |
|
|
22
|
+
| GSM8K | 91.3 | 0.91 |
|
|
23
|
+
| DROP | 78.5 | 0.77 |
|
|
24
|
+
```
|
|
25
|
+
|
|
26
|
+
## Format 3: Benchmarks as Columns
|
|
27
|
+
|
|
28
|
+
```markdown
|
|
29
|
+
| MMLU | HumanEval | GSM8K | HellaSwag |
|
|
30
|
+
|------|-----------|-------|-----------|
|
|
31
|
+
| 85.2 | 72.5 | 91.3 | 88.9 |
|
|
32
|
+
```
|
|
33
|
+
|
|
34
|
+
## Format 4: Percentage Values
|
|
35
|
+
|
|
36
|
+
```markdown
|
|
37
|
+
| Benchmark | Score |
|
|
38
|
+
|---------------|----------|
|
|
39
|
+
| MMLU | 85.2% |
|
|
40
|
+
| HumanEval | 72.5% |
|
|
41
|
+
| GSM8K | 91.3% |
|
|
42
|
+
| TruthfulQA | 68.7% |
|
|
43
|
+
```
|
|
44
|
+
|
|
45
|
+
## Format 5: Mixed Format with Categories
|
|
46
|
+
|
|
47
|
+
```markdown
|
|
48
|
+
### Reasoning
|
|
49
|
+
|
|
50
|
+
| Benchmark | Score |
|
|
51
|
+
|-----------|-------|
|
|
52
|
+
| MMLU | 85.2 |
|
|
53
|
+
| BBH | 82.4 |
|
|
54
|
+
| GPQA | 71.3 |
|
|
55
|
+
|
|
56
|
+
### Coding
|
|
57
|
+
|
|
58
|
+
| Benchmark | Score |
|
|
59
|
+
|-----------|-------|
|
|
60
|
+
| HumanEval | 72.5 |
|
|
61
|
+
| MBPP | 78.9 |
|
|
62
|
+
|
|
63
|
+
### Math
|
|
64
|
+
|
|
65
|
+
| Benchmark | Score |
|
|
66
|
+
|-----------|-------|
|
|
67
|
+
| GSM8K | 91.3 |
|
|
68
|
+
| MATH | 65.8 |
|
|
69
|
+
```
|
|
70
|
+
|
|
71
|
+
## Format 6: With Additional Columns
|
|
72
|
+
|
|
73
|
+
```markdown
|
|
74
|
+
| Benchmark | Score | Rank | Notes |
|
|
75
|
+
|-----------|-------|------|--------------------|
|
|
76
|
+
| MMLU | 85.2 | #5 | 5-shot |
|
|
77
|
+
| HumanEval | 72.5 | #8 | pass@1 |
|
|
78
|
+
| GSM8K | 91.3 | #3 | 8-shot, maj@1 |
|
|
79
|
+
```
|
|
80
|
+
|
|
81
|
+
## How the Extractor Works
|
|
82
|
+
|
|
83
|
+
The script will:
|
|
84
|
+
1. Find all markdown tables in the README
|
|
85
|
+
2. Identify which tables contain evaluation results
|
|
86
|
+
3. Parse the table structure (rows vs columns)
|
|
87
|
+
4. Extract numeric values as scores
|
|
88
|
+
5. Convert to model-index YAML format
|
|
89
|
+
|
|
90
|
+
## Tips for README Authors
|
|
91
|
+
|
|
92
|
+
To ensure your evaluation tables are properly extracted:
|
|
93
|
+
|
|
94
|
+
1. **Use clear headers**: Include "Benchmark", "Score", or similar terms
|
|
95
|
+
2. **Keep it simple**: Stick to benchmark name + score columns
|
|
96
|
+
3. **Use standard formats**: Follow markdown table syntax
|
|
97
|
+
4. **Include numeric values**: Ensure scores are parseable numbers
|
|
98
|
+
5. **Be consistent**: Use the same format across multiple tables
|
|
99
|
+
|
|
100
|
+
## Example Complete README Section
|
|
101
|
+
|
|
102
|
+
```markdown
|
|
103
|
+
# Model Card for MyModel-7B
|
|
104
|
+
|
|
105
|
+
## Evaluation Results
|
|
106
|
+
|
|
107
|
+
Our model was evaluated on several standard benchmarks:
|
|
108
|
+
|
|
109
|
+
| Benchmark | Score |
|
|
110
|
+
|---------------|-------|
|
|
111
|
+
| MMLU | 85.2 |
|
|
112
|
+
| HumanEval | 72.5 |
|
|
113
|
+
| GSM8K | 91.3 |
|
|
114
|
+
| HellaSwag | 88.9 |
|
|
115
|
+
| ARC-Challenge | 81.7 |
|
|
116
|
+
| TruthfulQA | 68.7 |
|
|
117
|
+
|
|
118
|
+
### Detailed Results
|
|
119
|
+
|
|
120
|
+
For more detailed results and methodology, see our [paper](link).
|
|
121
|
+
```
|
|
122
|
+
|
|
123
|
+
## Running the Extractor
|
|
124
|
+
|
|
125
|
+
```bash
|
|
126
|
+
# Extract from this example
|
|
127
|
+
python scripts/evaluation_manager.py extract-readme \
|
|
128
|
+
--repo-id "your-username/your-model" \
|
|
129
|
+
--dry-run
|
|
130
|
+
|
|
131
|
+
# Apply to your model card
|
|
132
|
+
python scripts/evaluation_manager.py extract-readme \
|
|
133
|
+
--repo-id "your-username/your-model" \
|
|
134
|
+
--task-type "text-generation"
|
|
135
|
+
```
|
|
@@ -0,0 +1,50 @@
|
|
|
1
|
+
{
|
|
2
|
+
"MMLU": {
|
|
3
|
+
"type": "mmlu",
|
|
4
|
+
"name": "Massive Multitask Language Understanding"
|
|
5
|
+
},
|
|
6
|
+
"HumanEval": {
|
|
7
|
+
"type": "humaneval",
|
|
8
|
+
"name": "Code Generation (HumanEval)"
|
|
9
|
+
},
|
|
10
|
+
"GSM8K": {
|
|
11
|
+
"type": "gsm8k",
|
|
12
|
+
"name": "Grade School Math"
|
|
13
|
+
},
|
|
14
|
+
"HellaSwag": {
|
|
15
|
+
"type": "hellaswag",
|
|
16
|
+
"name": "HellaSwag Common Sense"
|
|
17
|
+
},
|
|
18
|
+
"ARC-C": {
|
|
19
|
+
"type": "arc_challenge",
|
|
20
|
+
"name": "ARC Challenge"
|
|
21
|
+
},
|
|
22
|
+
"ARC-E": {
|
|
23
|
+
"type": "arc_easy",
|
|
24
|
+
"name": "ARC Easy"
|
|
25
|
+
},
|
|
26
|
+
"Winogrande": {
|
|
27
|
+
"type": "winogrande",
|
|
28
|
+
"name": "Winogrande"
|
|
29
|
+
},
|
|
30
|
+
"TruthfulQA": {
|
|
31
|
+
"type": "truthfulqa",
|
|
32
|
+
"name": "TruthfulQA"
|
|
33
|
+
},
|
|
34
|
+
"GPQA": {
|
|
35
|
+
"type": "gpqa",
|
|
36
|
+
"name": "Graduate-Level Google-Proof Q&A"
|
|
37
|
+
},
|
|
38
|
+
"DROP": {
|
|
39
|
+
"type": "drop",
|
|
40
|
+
"name": "Discrete Reasoning Over Paragraphs"
|
|
41
|
+
},
|
|
42
|
+
"BBH": {
|
|
43
|
+
"type": "bbh",
|
|
44
|
+
"name": "Big Bench Hard"
|
|
45
|
+
},
|
|
46
|
+
"MATH": {
|
|
47
|
+
"type": "math",
|
|
48
|
+
"name": "MATH Dataset"
|
|
49
|
+
}
|
|
50
|
+
}
|