cli-jaw 0.1.6 → 0.1.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.ko.md +68 -71
- package/README.md +123 -92
- package/README.zh-CN.md +68 -73
- package/dist/bin/cli-claw.js +96 -0
- package/dist/bin/cli-claw.js.map +1 -0
- package/dist/bin/cli-jaw.js +0 -0
- package/dist/bin/commands/doctor.js +3 -0
- package/dist/bin/commands/doctor.js.map +1 -1
- package/dist/bin/commands/init.js +36 -19
- package/dist/bin/commands/init.js.map +1 -1
- package/dist/bin/postinstall.js +175 -104
- package/dist/bin/postinstall.js.map +1 -1
- package/dist/lib/mcp-sync.js +43 -4
- package/dist/lib/mcp-sync.js.map +1 -1
- package/dist/server.js +22 -103
- package/dist/server.js.map +1 -1
- package/dist/src/cli/acp-client.js +1 -1
- package/dist/src/cli/command-context.js +73 -0
- package/dist/src/cli/command-context.js.map +1 -0
- package/dist/src/core/db.js +1 -1
- package/dist/src/memory/heartbeat.js +2 -1
- package/dist/src/memory/heartbeat.js.map +1 -1
- package/dist/src/orchestrator/collect.js +53 -0
- package/dist/src/orchestrator/collect.js.map +1 -0
- package/dist/src/orchestrator/gateway.js +49 -0
- package/dist/src/orchestrator/gateway.js.map +1 -0
- package/dist/src/telegram/bot.js +32 -119
- package/dist/src/telegram/bot.js.map +1 -1
- package/package.json +7 -7
- package/public/css/sidebar.css +14 -0
- package/public/dist/bundle.js +21 -21
- package/public/dist/bundle.js.map +3 -3
- package/public/index.html +2 -2
- package/public/js/features/settings.js +1 -2
- package/public/js/main.js +0 -1
- package/scripts/check-copilot-gap.js +57 -0
- package/scripts/check-deps-offline.mjs +75 -0
- package/scripts/check-deps-online.sh +26 -0
- package/scripts/i18n-registry.py +208 -0
- package/scripts/postinstall-guard.cjs +63 -0
- package/scripts/release.sh +30 -0
- package/skills_ref/1password/SKILL.md +0 -70
- package/skills_ref/agents-sdk/SKILL.md +0 -155
- package/skills_ref/agents-sdk/references/callable.md +0 -92
- package/skills_ref/agents-sdk/references/codemode.md +0 -207
- package/skills_ref/agents-sdk/references/email.md +0 -146
- package/skills_ref/agents-sdk/references/mcp.md +0 -154
- package/skills_ref/agents-sdk/references/state-scheduling.md +0 -164
- package/skills_ref/agents-sdk/references/streaming-chat.md +0 -178
- package/skills_ref/agents-sdk/references/workflows.md +0 -132
- package/skills_ref/algorithmic-art/LICENSE.txt +0 -202
- package/skills_ref/algorithmic-art/SKILL.md +0 -405
- package/skills_ref/algorithmic-art/templates/generator_template.js +0 -223
- package/skills_ref/algorithmic-art/templates/viewer.html +0 -599
- package/skills_ref/apple-notes/SKILL.md +0 -77
- package/skills_ref/apple-reminders/SKILL.md +0 -118
- package/skills_ref/atlas/SKILL.md +0 -99
- package/skills_ref/brainstorming/SKILL.md +0 -96
- package/skills_ref/browser/SKILL.md +0 -179
- package/skills_ref/canvas-design/LICENSE.txt +0 -202
- package/skills_ref/canvas-design/SKILL.md +0 -130
- package/skills_ref/canvas-design/canvas-fonts/ArsenalSC-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/ArsenalSC-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/BigShoulders-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Boldonse-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Boldonse-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/BricolageGrotesque-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/CrimsonPro-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/DMMono-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/DMMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/EricaOne-OFL.txt +0 -94
- package/skills_ref/canvas-design/canvas-fonts/EricaOne-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/GeistMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Gloock-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Gloock-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/IBMPlexSerif-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSans-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSerif-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/InstrumentSerif-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Italiana-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Italiana-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/JetBrainsMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-Light.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Jura-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/LibreBaskerville-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/LibreBaskerville-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Lora-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Lora-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/NationalPark-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/NothingYouCouldDo-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/NothingYouCouldDo-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Outfit-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Outfit-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Outfit-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/PixelifySans-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/PixelifySans-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/PoiretOne-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/PoiretOne-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/RedHatMono-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Silkscreen-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Silkscreen-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/SmoochSans-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/SmoochSans-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Tektur-Medium.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/Tektur-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/Tektur-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Bold.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-BoldItalic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Italic.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/WorkSans-Regular.ttf +0 -0
- package/skills_ref/canvas-design/canvas-fonts/YoungSerif-OFL.txt +0 -93
- package/skills_ref/canvas-design/canvas-fonts/YoungSerif-Regular.ttf +0 -0
- package/skills_ref/changelog-generator/SKILL.md +0 -104
- package/skills_ref/cloudflare-deploy/SKILL.md +0 -207
- package/skills_ref/codebase-orientation/SKILL.md +0 -29
- package/skills_ref/config-file-explainer/SKILL.md +0 -26
- package/skills_ref/context-compression/SKILL.md +0 -265
- package/skills_ref/context-compression/references/evaluation-framework.md +0 -213
- package/skills_ref/context-compression/scripts/compression_evaluator.py +0 -658
- package/skills_ref/data-structure-chooser/SKILL.md +0 -26
- package/skills_ref/debugging-checklist/SKILL.md +0 -26
- package/skills_ref/debugging-helpers/CREATION-LOG.md +0 -119
- package/skills_ref/debugging-helpers/SKILL.md +0 -296
- package/skills_ref/debugging-helpers/condition-based-waiting-example.ts +0 -158
- package/skills_ref/debugging-helpers/condition-based-waiting.md +0 -115
- package/skills_ref/debugging-helpers/defense-in-depth.md +0 -122
- package/skills_ref/debugging-helpers/find-polluter.sh +0 -63
- package/skills_ref/debugging-helpers/root-cause-tracing.md +0 -169
- package/skills_ref/debugging-helpers/test-academic.md +0 -14
- package/skills_ref/debugging-helpers/test-pressure-1.md +0 -58
- package/skills_ref/debugging-helpers/test-pressure-2.md +0 -68
- package/skills_ref/debugging-helpers/test-pressure-3.md +0 -69
- package/skills_ref/deep-research/.env.example +0 -7
- package/skills_ref/deep-research/README.md +0 -246
- package/skills_ref/deep-research/SKILL.md +0 -106
- package/skills_ref/deep-research/requirements.txt +0 -2
- package/skills_ref/deep-research/scripts/research.py +0 -692
- package/skills_ref/dependency-install-helper/SKILL.md +0 -26
- package/skills_ref/dev/SKILL.md +0 -65
- package/skills_ref/dev-backend/SKILL.md +0 -61
- package/skills_ref/dev-data/SKILL.md +0 -76
- package/skills_ref/dev-frontend/LICENSE.txt +0 -177
- package/skills_ref/dev-frontend/SKILL.md +0 -42
- package/skills_ref/dev-testing/LICENSE.txt +0 -202
- package/skills_ref/dev-testing/SKILL.md +0 -96
- package/skills_ref/dev-testing/examples/console_logging.py +0 -35
- package/skills_ref/dev-testing/examples/element_discovery.py +0 -40
- package/skills_ref/dev-testing/examples/static_html_automation.py +0 -33
- package/skills_ref/dev-testing/scripts/with_server.py +0 -106
- package/skills_ref/develop-web-game/SKILL.md +0 -149
- package/skills_ref/differential-review/.claude-plugin/plugin.json +0 -10
- package/skills_ref/differential-review/README.md +0 -109
- package/skills_ref/differential-review/commands/diff-review.md +0 -21
- package/skills_ref/differential-review/skills/differential-review/SKILL.md +0 -220
- package/skills_ref/differential-review/skills/differential-review/adversarial.md +0 -203
- package/skills_ref/differential-review/skills/differential-review/methodology.md +0 -234
- package/skills_ref/differential-review/skills/differential-review/patterns.md +0 -300
- package/skills_ref/differential-review/skills/differential-review/reporting.md +0 -369
- package/skills_ref/dispatching-parallel-agents/SKILL.md +0 -180
- package/skills_ref/doc-coauthoring/SKILL.md +0 -375
- package/skills_ref/docx/LICENSE.txt +0 -30
- package/skills_ref/docx/SKILL.md +0 -481
- package/skills_ref/docx/scripts/__init__.py +0 -1
- package/skills_ref/docx/scripts/accept_changes.py +0 -135
- package/skills_ref/docx/scripts/comment.py +0 -318
- package/skills_ref/docx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/docx/scripts/office/helpers/merge_runs.py +0 -199
- package/skills_ref/docx/scripts/office/helpers/simplify_redlines.py +0 -197
- package/skills_ref/docx/scripts/office/pack.py +0 -159
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +0 -1499
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +0 -146
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +0 -1085
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +0 -11
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +0 -3081
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +0 -23
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +0 -185
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +0 -287
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +0 -1676
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +0 -28
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +0 -144
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +0 -174
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +0 -25
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +0 -18
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +0 -59
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +0 -56
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +0 -195
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +0 -582
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +0 -25
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +0 -4439
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +0 -570
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +0 -509
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +0 -12
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +0 -108
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +0 -96
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +0 -3646
- package/skills_ref/docx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +0 -116
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +0 -42
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +0 -50
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +0 -49
- package/skills_ref/docx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +0 -33
- package/skills_ref/docx/scripts/office/schemas/mce/mc.xsd +0 -75
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2010.xsd +0 -560
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2012.xsd +0 -67
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-2018.xsd +0 -14
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +0 -20
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +0 -13
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +0 -4
- package/skills_ref/docx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +0 -8
- package/skills_ref/docx/scripts/office/soffice.py +0 -183
- package/skills_ref/docx/scripts/office/unpack.py +0 -132
- package/skills_ref/docx/scripts/office/validate.py +0 -111
- package/skills_ref/docx/scripts/office/validators/__init__.py +0 -15
- package/skills_ref/docx/scripts/office/validators/base.py +0 -847
- package/skills_ref/docx/scripts/office/validators/docx.py +0 -446
- package/skills_ref/docx/scripts/office/validators/pptx.py +0 -275
- package/skills_ref/docx/scripts/office/validators/redlining.py +0 -247
- package/skills_ref/docx/scripts/templates/comments.xml +0 -3
- package/skills_ref/docx/scripts/templates/commentsExtended.xml +0 -3
- package/skills_ref/docx/scripts/templates/commentsExtensible.xml +0 -3
- package/skills_ref/docx/scripts/templates/commentsIds.xml +0 -3
- package/skills_ref/docx/scripts/templates/people.xml +0 -3
- package/skills_ref/durable-objects/SKILL.md +0 -186
- package/skills_ref/durable-objects/references/rules.md +0 -286
- package/skills_ref/durable-objects/references/testing.md +0 -264
- package/skills_ref/durable-objects/references/workers.md +0 -346
- package/skills_ref/email-draft-polish/SKILL.md +0 -24
- package/skills_ref/error-message-explainer/SKILL.md +0 -27
- package/skills_ref/fal-image-edit/SKILL.md +0 -249
- package/skills_ref/fal-image-edit/scripts/edit-image.sh +0 -199
- package/skills_ref/figma-implement-design/SKILL.md +0 -264
- package/skills_ref/git-worktrees/SKILL.md +0 -218
- package/skills_ref/github/SKILL.md +0 -210
- package/skills_ref/gog/SKILL.md +0 -116
- package/skills_ref/goplaces/SKILL.md +0 -52
- package/skills_ref/himalaya/SKILL.md +0 -257
- package/skills_ref/hugging-face-cli/SKILL.md +0 -186
- package/skills_ref/hugging-face-cli/references/commands.md +0 -954
- package/skills_ref/hugging-face-cli/references/examples.md +0 -374
- package/skills_ref/hugging-face-evaluation/SKILL.md +0 -651
- package/skills_ref/hugging-face-evaluation/examples/.env.example +0 -7
- package/skills_ref/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +0 -382
- package/skills_ref/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +0 -141
- package/skills_ref/hugging-face-evaluation/examples/example_readme_tables.md +0 -135
- package/skills_ref/hugging-face-evaluation/examples/metric_mapping.json +0 -50
- package/skills_ref/hugging-face-evaluation/requirements.txt +0 -20
- package/skills_ref/hugging-face-evaluation/scripts/evaluation_manager.py +0 -1374
- package/skills_ref/hugging-face-evaluation/scripts/inspect_eval_uv.py +0 -104
- package/skills_ref/hugging-face-evaluation/scripts/inspect_vllm_uv.py +0 -317
- package/skills_ref/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +0 -303
- package/skills_ref/hugging-face-evaluation/scripts/run_eval_job.py +0 -98
- package/skills_ref/hugging-face-evaluation/scripts/run_vllm_eval_job.py +0 -331
- package/skills_ref/hugging-face-evaluation/scripts/test_extraction.py +0 -206
- package/skills_ref/hugging-face-model-trainer/SKILL.md +0 -718
- package/skills_ref/hugging-face-model-trainer/references/gguf_conversion.md +0 -296
- package/skills_ref/hugging-face-model-trainer/references/hardware_guide.md +0 -283
- package/skills_ref/hugging-face-model-trainer/references/hub_saving.md +0 -364
- package/skills_ref/hugging-face-model-trainer/references/reliability_principles.md +0 -371
- package/skills_ref/hugging-face-model-trainer/references/trackio_guide.md +0 -189
- package/skills_ref/hugging-face-model-trainer/references/training_methods.md +0 -150
- package/skills_ref/hugging-face-model-trainer/references/training_patterns.md +0 -203
- package/skills_ref/hugging-face-model-trainer/references/troubleshooting.md +0 -282
- package/skills_ref/hugging-face-model-trainer/references/unsloth.md +0 -313
- package/skills_ref/hugging-face-model-trainer/scripts/convert_to_gguf.py +0 -424
- package/skills_ref/hugging-face-model-trainer/scripts/dataset_inspector.py +0 -417
- package/skills_ref/hugging-face-model-trainer/scripts/estimate_cost.py +0 -150
- package/skills_ref/hugging-face-model-trainer/scripts/train_dpo_example.py +0 -106
- package/skills_ref/hugging-face-model-trainer/scripts/train_grpo_example.py +0 -89
- package/skills_ref/hugging-face-model-trainer/scripts/train_sft_example.py +0 -122
- package/skills_ref/hugging-face-model-trainer/scripts/unsloth_sft_example.py +0 -512
- package/skills_ref/imagegen/SKILL.md +0 -174
- package/skills_ref/insecure-defaults/.claude-plugin/plugin.json +0 -10
- package/skills_ref/insecure-defaults/README.md +0 -45
- package/skills_ref/insecure-defaults/skills/insecure-defaults/SKILL.md +0 -117
- package/skills_ref/insecure-defaults/skills/insecure-defaults/references/examples.md +0 -409
- package/skills_ref/jupyter-notebook/SKILL.md +0 -107
- package/skills_ref/linear/SKILL.md +0 -87
- package/skills_ref/linter-fix-guide/SKILL.md +0 -27
- package/skills_ref/log-summarizer/SKILL.md +0 -27
- package/skills_ref/mcp-builder/LICENSE.txt +0 -202
- package/skills_ref/mcp-builder/SKILL.md +0 -236
- package/skills_ref/mcp-builder/reference/evaluation.md +0 -602
- package/skills_ref/mcp-builder/reference/mcp_best_practices.md +0 -249
- package/skills_ref/mcp-builder/reference/node_mcp_server.md +0 -970
- package/skills_ref/mcp-builder/reference/python_mcp_server.md +0 -719
- package/skills_ref/mcp-builder/scripts/connections.py +0 -151
- package/skills_ref/mcp-builder/scripts/evaluation.py +0 -373
- package/skills_ref/mcp-builder/scripts/example_evaluation.xml +0 -22
- package/skills_ref/mcp-builder/scripts/requirements.txt +0 -2
- package/skills_ref/memory/SKILL.md +0 -129
- package/skills_ref/modern-python/.claude-plugin/plugin.json +0 -10
- package/skills_ref/modern-python/README.md +0 -66
- package/skills_ref/modern-python/hooks/hooks.json +0 -16
- package/skills_ref/modern-python/hooks/setup-shims.bats +0 -70
- package/skills_ref/modern-python/hooks/setup-shims.sh +0 -24
- package/skills_ref/modern-python/hooks/shims/pip +0 -27
- package/skills_ref/modern-python/hooks/shims/pip-shim.bats +0 -45
- package/skills_ref/modern-python/hooks/shims/pip3 +0 -27
- package/skills_ref/modern-python/hooks/shims/pipx +0 -41
- package/skills_ref/modern-python/hooks/shims/pipx-shim.bats +0 -64
- package/skills_ref/modern-python/hooks/shims/python +0 -26
- package/skills_ref/modern-python/hooks/shims/python-shim.bats +0 -53
- package/skills_ref/modern-python/hooks/shims/python3 +0 -26
- package/skills_ref/modern-python/hooks/shims/uv +0 -27
- package/skills_ref/modern-python/hooks/shims/uv-shim.bats +0 -47
- package/skills_ref/modern-python/skills/modern-python/SKILL.md +0 -333
- package/skills_ref/modern-python/skills/modern-python/references/dependabot.md +0 -43
- package/skills_ref/modern-python/skills/modern-python/references/migration-checklist.md +0 -141
- package/skills_ref/modern-python/skills/modern-python/references/pep723-scripts.md +0 -259
- package/skills_ref/modern-python/skills/modern-python/references/prek.md +0 -211
- package/skills_ref/modern-python/skills/modern-python/references/pyproject.md +0 -254
- package/skills_ref/modern-python/skills/modern-python/references/ruff-config.md +0 -240
- package/skills_ref/modern-python/skills/modern-python/references/security-setup.md +0 -255
- package/skills_ref/modern-python/skills/modern-python/references/testing.md +0 -284
- package/skills_ref/modern-python/skills/modern-python/references/uv-commands.md +0 -200
- package/skills_ref/modern-python/skills/modern-python/templates/dependabot.yml +0 -36
- package/skills_ref/modern-python/skills/modern-python/templates/pre-commit-config.yaml +0 -66
- package/skills_ref/nano-banana-pro/SKILL.md +0 -58
- package/skills_ref/netlify-deploy/SKILL.md +0 -233
- package/skills_ref/notion/SKILL.md +0 -304
- package/skills_ref/notion-knowledge-capture/SKILL.md +0 -56
- package/skills_ref/notion-meeting-intelligence/SKILL.md +0 -60
- package/skills_ref/notion-research-documentation/SKILL.md +0 -59
- package/skills_ref/notion-spec-to-implementation/SKILL.md +0 -58
- package/skills_ref/obsidian/SKILL.md +0 -81
- package/skills_ref/openai-docs/SKILL.md +0 -56
- package/skills_ref/openhue/SKILL.md +0 -112
- package/skills_ref/pdf/SKILL.md +0 -69
- package/skills_ref/postgres/README.md +0 -77
- package/skills_ref/postgres/SKILL.md +0 -129
- package/skills_ref/postgres/connections.example.json +0 -34
- package/skills_ref/postgres/requirements.txt +0 -1
- package/skills_ref/postgres/scripts/query.py +0 -262
- package/skills_ref/pptx/LICENSE.txt +0 -30
- package/skills_ref/pptx/SKILL.md +0 -232
- package/skills_ref/pptx/editing.md +0 -205
- package/skills_ref/pptx/pptxgenjs.md +0 -420
- package/skills_ref/pptx/scripts/__init__.py +0 -0
- package/skills_ref/pptx/scripts/add_slide.py +0 -195
- package/skills_ref/pptx/scripts/clean.py +0 -286
- package/skills_ref/pptx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/pptx/scripts/office/helpers/merge_runs.py +0 -199
- package/skills_ref/pptx/scripts/office/helpers/simplify_redlines.py +0 -197
- package/skills_ref/pptx/scripts/office/pack.py +0 -159
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +0 -1499
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +0 -146
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +0 -1085
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +0 -11
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +0 -3081
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +0 -23
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +0 -185
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +0 -287
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +0 -1676
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +0 -28
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +0 -144
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +0 -174
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +0 -25
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +0 -18
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +0 -59
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +0 -56
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +0 -195
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +0 -582
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +0 -25
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +0 -4439
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +0 -570
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +0 -509
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +0 -12
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +0 -108
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +0 -96
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +0 -3646
- package/skills_ref/pptx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +0 -116
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +0 -42
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +0 -50
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +0 -49
- package/skills_ref/pptx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +0 -33
- package/skills_ref/pptx/scripts/office/schemas/mce/mc.xsd +0 -75
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2010.xsd +0 -560
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2012.xsd +0 -67
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-2018.xsd +0 -14
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +0 -20
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +0 -13
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +0 -4
- package/skills_ref/pptx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +0 -8
- package/skills_ref/pptx/scripts/office/soffice.py +0 -183
- package/skills_ref/pptx/scripts/office/unpack.py +0 -132
- package/skills_ref/pptx/scripts/office/validate.py +0 -111
- package/skills_ref/pptx/scripts/office/validators/__init__.py +0 -15
- package/skills_ref/pptx/scripts/office/validators/base.py +0 -847
- package/skills_ref/pptx/scripts/office/validators/docx.py +0 -446
- package/skills_ref/pptx/scripts/office/validators/pptx.py +0 -275
- package/skills_ref/pptx/scripts/office/validators/redlining.py +0 -247
- package/skills_ref/pptx/scripts/thumbnail.py +0 -289
- package/skills_ref/property-based-testing/.claude-plugin/plugin.json +0 -9
- package/skills_ref/property-based-testing/README.md +0 -47
- package/skills_ref/property-based-testing/skills/property-based-testing/README.md +0 -88
- package/skills_ref/property-based-testing/skills/property-based-testing/SKILL.md +0 -123
- package/skills_ref/property-based-testing/skills/property-based-testing/references/design.md +0 -191
- package/skills_ref/property-based-testing/skills/property-based-testing/references/generating.md +0 -204
- package/skills_ref/property-based-testing/skills/property-based-testing/references/interpreting-failures.md +0 -239
- package/skills_ref/property-based-testing/skills/property-based-testing/references/libraries.md +0 -130
- package/skills_ref/property-based-testing/skills/property-based-testing/references/refactoring.md +0 -181
- package/skills_ref/property-based-testing/skills/property-based-testing/references/reviewing.md +0 -209
- package/skills_ref/property-based-testing/skills/property-based-testing/references/strategies.md +0 -124
- package/skills_ref/react-best-practices/AGENTS.md +0 -2934
- package/skills_ref/react-best-practices/README.md +0 -123
- package/skills_ref/react-best-practices/SKILL.md +0 -136
- package/skills_ref/react-best-practices/metadata.json +0 -15
- package/skills_ref/react-best-practices/rules/_sections.md +0 -46
- package/skills_ref/react-best-practices/rules/_template.md +0 -28
- package/skills_ref/react-best-practices/rules/advanced-event-handler-refs.md +0 -55
- package/skills_ref/react-best-practices/rules/advanced-init-once.md +0 -42
- package/skills_ref/react-best-practices/rules/advanced-use-latest.md +0 -39
- package/skills_ref/react-best-practices/rules/async-api-routes.md +0 -38
- package/skills_ref/react-best-practices/rules/async-defer-await.md +0 -80
- package/skills_ref/react-best-practices/rules/async-dependencies.md +0 -51
- package/skills_ref/react-best-practices/rules/async-parallel.md +0 -28
- package/skills_ref/react-best-practices/rules/async-suspense-boundaries.md +0 -99
- package/skills_ref/react-best-practices/rules/bundle-barrel-imports.md +0 -59
- package/skills_ref/react-best-practices/rules/bundle-conditional.md +0 -31
- package/skills_ref/react-best-practices/rules/bundle-defer-third-party.md +0 -49
- package/skills_ref/react-best-practices/rules/bundle-dynamic-imports.md +0 -35
- package/skills_ref/react-best-practices/rules/bundle-preload.md +0 -50
- package/skills_ref/react-best-practices/rules/client-event-listeners.md +0 -74
- package/skills_ref/react-best-practices/rules/client-localstorage-schema.md +0 -71
- package/skills_ref/react-best-practices/rules/client-passive-event-listeners.md +0 -48
- package/skills_ref/react-best-practices/rules/client-swr-dedup.md +0 -56
- package/skills_ref/react-best-practices/rules/js-batch-dom-css.md +0 -107
- package/skills_ref/react-best-practices/rules/js-cache-function-results.md +0 -80
- package/skills_ref/react-best-practices/rules/js-cache-property-access.md +0 -28
- package/skills_ref/react-best-practices/rules/js-cache-storage.md +0 -70
- package/skills_ref/react-best-practices/rules/js-combine-iterations.md +0 -32
- package/skills_ref/react-best-practices/rules/js-early-exit.md +0 -50
- package/skills_ref/react-best-practices/rules/js-hoist-regexp.md +0 -45
- package/skills_ref/react-best-practices/rules/js-index-maps.md +0 -37
- package/skills_ref/react-best-practices/rules/js-length-check-first.md +0 -49
- package/skills_ref/react-best-practices/rules/js-min-max-loop.md +0 -82
- package/skills_ref/react-best-practices/rules/js-set-map-lookups.md +0 -24
- package/skills_ref/react-best-practices/rules/js-tosorted-immutable.md +0 -57
- package/skills_ref/react-best-practices/rules/rendering-activity.md +0 -26
- package/skills_ref/react-best-practices/rules/rendering-animate-svg-wrapper.md +0 -47
- package/skills_ref/react-best-practices/rules/rendering-conditional-render.md +0 -40
- package/skills_ref/react-best-practices/rules/rendering-content-visibility.md +0 -38
- package/skills_ref/react-best-practices/rules/rendering-hoist-jsx.md +0 -46
- package/skills_ref/react-best-practices/rules/rendering-hydration-no-flicker.md +0 -82
- package/skills_ref/react-best-practices/rules/rendering-hydration-suppress-warning.md +0 -30
- package/skills_ref/react-best-practices/rules/rendering-svg-precision.md +0 -28
- package/skills_ref/react-best-practices/rules/rendering-usetransition-loading.md +0 -75
- package/skills_ref/react-best-practices/rules/rerender-defer-reads.md +0 -39
- package/skills_ref/react-best-practices/rules/rerender-dependencies.md +0 -45
- package/skills_ref/react-best-practices/rules/rerender-derived-state-no-effect.md +0 -40
- package/skills_ref/react-best-practices/rules/rerender-derived-state.md +0 -29
- package/skills_ref/react-best-practices/rules/rerender-functional-setstate.md +0 -74
- package/skills_ref/react-best-practices/rules/rerender-lazy-state-init.md +0 -58
- package/skills_ref/react-best-practices/rules/rerender-memo-with-default-value.md +0 -38
- package/skills_ref/react-best-practices/rules/rerender-memo.md +0 -44
- package/skills_ref/react-best-practices/rules/rerender-move-effect-to-event.md +0 -45
- package/skills_ref/react-best-practices/rules/rerender-simple-expression-in-memo.md +0 -35
- package/skills_ref/react-best-practices/rules/rerender-transitions.md +0 -40
- package/skills_ref/react-best-practices/rules/rerender-use-ref-transient-values.md +0 -73
- package/skills_ref/react-best-practices/rules/server-after-nonblocking.md +0 -73
- package/skills_ref/react-best-practices/rules/server-auth-actions.md +0 -96
- package/skills_ref/react-best-practices/rules/server-cache-lru.md +0 -41
- package/skills_ref/react-best-practices/rules/server-cache-react.md +0 -76
- package/skills_ref/react-best-practices/rules/server-dedup-props.md +0 -65
- package/skills_ref/react-best-practices/rules/server-parallel-fetching.md +0 -83
- package/skills_ref/react-best-practices/rules/server-serialization.md +0 -38
- package/skills_ref/receiving-code-review/SKILL.md +0 -213
- package/skills_ref/registry.json +0 -1493
- package/skills_ref/render-deploy/SKILL.md +0 -462
- package/skills_ref/requesting-code-review/SKILL.md +0 -105
- package/skills_ref/requesting-code-review/code-reviewer.md +0 -146
- package/skills_ref/screen-capture/SKILL.md +0 -162
- package/skills_ref/security-best-practices/LICENSE.txt +0 -201
- package/skills_ref/security-best-practices/SKILL.md +0 -86
- package/skills_ref/security-best-practices/agents/openai.yaml +0 -4
- package/skills_ref/security-best-practices/references/golang-general-backend-security.md +0 -826
- package/skills_ref/security-best-practices/references/javascript-express-web-server-security.md +0 -1158
- package/skills_ref/security-best-practices/references/javascript-general-web-frontend-security.md +0 -747
- package/skills_ref/security-best-practices/references/javascript-jquery-web-frontend-security.md +0 -678
- package/skills_ref/security-best-practices/references/javascript-typescript-nextjs-web-server-security.md +0 -1144
- package/skills_ref/security-best-practices/references/javascript-typescript-react-web-frontend-security.md +0 -990
- package/skills_ref/security-best-practices/references/javascript-typescript-vue-web-frontend-security.md +0 -791
- package/skills_ref/security-best-practices/references/python-django-web-server-security.md +0 -882
- package/skills_ref/security-best-practices/references/python-fastapi-web-server-security.md +0 -1036
- package/skills_ref/security-best-practices/references/python-flask-web-server-security.md +0 -705
- package/skills_ref/security-ownership-map/LICENSE.txt +0 -201
- package/skills_ref/security-ownership-map/SKILL.md +0 -206
- package/skills_ref/security-ownership-map/agents/openai.yaml +0 -4
- package/skills_ref/security-ownership-map/references/neo4j-import.md +0 -60
- package/skills_ref/security-ownership-map/scripts/build_ownership_map.py +0 -956
- package/skills_ref/security-ownership-map/scripts/community_maintainers.py +0 -544
- package/skills_ref/security-ownership-map/scripts/query_ownership.py +0 -483
- package/skills_ref/security-ownership-map/scripts/run_ownership_map.py +0 -200
- package/skills_ref/security-threat-model/LICENSE.txt +0 -201
- package/skills_ref/security-threat-model/SKILL.md +0 -81
- package/skills_ref/security-threat-model/agents/openai.yaml +0 -4
- package/skills_ref/security-threat-model/references/prompt-template.md +0 -255
- package/skills_ref/security-threat-model/references/security-controls-and-assets.md +0 -32
- package/skills_ref/sentry/SKILL.md +0 -123
- package/skills_ref/skill-creator/SKILL.md +0 -372
- package/skills_ref/sora/SKILL.md +0 -153
- package/skills_ref/speech/SKILL.md +0 -144
- package/skills_ref/spotify-player/SKILL.md +0 -64
- package/skills_ref/static-analysis/.claude-plugin/plugin.json +0 -8
- package/skills_ref/static-analysis/README.md +0 -65
- package/skills_ref/static-analysis/agents/semgrep-scanner.md +0 -71
- package/skills_ref/static-analysis/agents/semgrep-triager.md +0 -107
- package/skills_ref/static-analysis/skills/codeql/SKILL.md +0 -119
- package/skills_ref/static-analysis/skills/codeql/references/diagnostic-query-templates.md +0 -339
- package/skills_ref/static-analysis/skills/codeql/references/language-details.md +0 -207
- package/skills_ref/static-analysis/skills/codeql/references/performance-tuning.md +0 -111
- package/skills_ref/static-analysis/skills/codeql/references/ruleset-catalog.md +0 -63
- package/skills_ref/static-analysis/skills/codeql/references/threat-models.md +0 -44
- package/skills_ref/static-analysis/skills/codeql/workflows/build-database.md +0 -669
- package/skills_ref/static-analysis/skills/codeql/workflows/create-data-extensions.md +0 -536
- package/skills_ref/static-analysis/skills/codeql/workflows/run-analysis.md +0 -436
- package/skills_ref/static-analysis/skills/sarif-parsing/SKILL.md +0 -479
- package/skills_ref/static-analysis/skills/sarif-parsing/resources/jq-queries.md +0 -162
- package/skills_ref/static-analysis/skills/sarif-parsing/resources/sarif_helpers.py +0 -331
- package/skills_ref/static-analysis/skills/semgrep/SKILL.md +0 -431
- package/skills_ref/static-analysis/skills/semgrep/references/rulesets.md +0 -162
- package/skills_ref/static-analysis/skills/semgrep/references/scanner-task-prompt.md +0 -102
- package/skills_ref/static-analysis/skills/semgrep/references/triage-task-prompt.md +0 -122
- package/skills_ref/static-analysis/skills/semgrep/scripts/merge_triaged_sarif.py +0 -252
- package/skills_ref/summarize/SKILL.md +0 -87
- package/skills_ref/tdd/SKILL.md +0 -371
- package/skills_ref/tdd/testing-anti-patterns.md +0 -299
- package/skills_ref/telegram-send/SKILL.md +0 -99
- package/skills_ref/terraform/README.md +0 -105
- package/skills_ref/terraform/code-generation/.claude-plugin/plugin.json +0 -30
- package/skills_ref/terraform/code-generation/skills/azure-verified-modules/SKILL.md +0 -613
- package/skills_ref/terraform/code-generation/skills/terraform-style-guide/SKILL.md +0 -353
- package/skills_ref/terraform/code-generation/skills/terraform-test/SKILL.md +0 -1669
- package/skills_ref/terraform/module-generation/.claude-plugin/plugin.json +0 -30
- package/skills_ref/terraform/module-generation/skills/refactor-module/SKILL.md +0 -538
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/SKILL.md +0 -468
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/api-monitoring.md +0 -543
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/component-blocks.md +0 -476
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/deployment-blocks.md +0 -391
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/examples.md +0 -1529
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/linked-stacks.md +0 -187
- package/skills_ref/terraform/module-generation/skills/terraform-stacks/references/troubleshooting.md +0 -671
- package/skills_ref/terraform/provider-development/.claude-plugin/plugin.json +0 -13
- package/skills_ref/terraform/provider-development/skills/new-terraform-provider/SKILL.md +0 -25
- package/skills_ref/terraform/provider-development/skills/new-terraform-provider/assets/main.go +0 -40
- package/skills_ref/terraform/provider-development/skills/provider-actions/SKILL.md +0 -478
- package/skills_ref/terraform/provider-development/skills/provider-resources/SKILL.md +0 -599
- package/skills_ref/terraform/provider-development/skills/run-acceptance-tests/SKILL.md +0 -41
- package/skills_ref/theme-factory/LICENSE.txt +0 -202
- package/skills_ref/theme-factory/SKILL.md +0 -59
- package/skills_ref/theme-factory/theme-showcase.pdf +0 -0
- package/skills_ref/theme-factory/themes/arctic-frost.md +0 -19
- package/skills_ref/theme-factory/themes/botanical-garden.md +0 -19
- package/skills_ref/theme-factory/themes/desert-rose.md +0 -19
- package/skills_ref/theme-factory/themes/forest-canopy.md +0 -19
- package/skills_ref/theme-factory/themes/golden-hour.md +0 -19
- package/skills_ref/theme-factory/themes/midnight-galaxy.md +0 -19
- package/skills_ref/theme-factory/themes/modern-minimalist.md +0 -19
- package/skills_ref/theme-factory/themes/ocean-depths.md +0 -19
- package/skills_ref/theme-factory/themes/sunset-boulevard.md +0 -19
- package/skills_ref/theme-factory/themes/tech-innovation.md +0 -19
- package/skills_ref/things-mac/SKILL.md +0 -86
- package/skills_ref/tmux/SKILL.md +0 -153
- package/skills_ref/transcribe/SKILL.md +0 -81
- package/skills_ref/trello/SKILL.md +0 -95
- package/skills_ref/tts/SKILL.md +0 -99
- package/skills_ref/vercel-deploy/SKILL.md +0 -115
- package/skills_ref/video-downloader/SKILL.md +0 -99
- package/skills_ref/video-downloader/scripts/download_video.py +0 -145
- package/skills_ref/video-frames/SKILL.md +0 -46
- package/skills_ref/vision-click/SKILL.md +0 -128
- package/skills_ref/weather/SKILL.md +0 -112
- package/skills_ref/web-artifacts-builder/LICENSE.txt +0 -202
- package/skills_ref/web-artifacts-builder/SKILL.md +0 -74
- package/skills_ref/web-artifacts-builder/scripts/bundle-artifact.sh +0 -54
- package/skills_ref/web-artifacts-builder/scripts/init-artifact.sh +0 -322
- package/skills_ref/web-artifacts-builder/scripts/shadcn-components.tar.gz +0 -0
- package/skills_ref/web-perf/SKILL.md +0 -193
- package/skills_ref/web-routing/SKILL.md +0 -26
- package/skills_ref/whatsapp/SKILL.md +0 -255
- package/skills_ref/whatsapp/assets/agent-app-integration-example.json +0 -35
- package/skills_ref/whatsapp/assets/databases-example.json +0 -11
- package/skills_ref/whatsapp/assets/function-decide-route-interactive-buttons.json +0 -6
- package/skills_ref/whatsapp/assets/functions-example.json +0 -5
- package/skills_ref/whatsapp/assets/workflow-agent-simple.json +0 -31
- package/skills_ref/whatsapp/assets/workflow-api-template-wait-agent.json +0 -59
- package/skills_ref/whatsapp/assets/workflow-customer-support-intake-agent.json +0 -56
- package/skills_ref/whatsapp/assets/workflow-decision.json +0 -83
- package/skills_ref/whatsapp/assets/workflow-interactive-buttons-decide-ai.json +0 -89
- package/skills_ref/whatsapp/assets/workflow-interactive-buttons-decide-function.json +0 -88
- package/skills_ref/whatsapp/assets/workflow-linear.json +0 -53
- package/skills_ref/whatsapp/package.json +0 -10
- package/skills_ref/whatsapp/references/app-integrations.md +0 -89
- package/skills_ref/whatsapp/references/databases-reference.md +0 -21
- package/skills_ref/whatsapp/references/execution-context.md +0 -42
- package/skills_ref/whatsapp/references/function-contracts.md +0 -55
- package/skills_ref/whatsapp/references/functions-payloads.md +0 -87
- package/skills_ref/whatsapp/references/functions-reference.md +0 -133
- package/skills_ref/whatsapp/references/graph-contract.md +0 -145
- package/skills_ref/whatsapp/references/node-types.md +0 -430
- package/skills_ref/whatsapp/references/triggers.md +0 -20
- package/skills_ref/whatsapp/references/workflow-overview.md +0 -22
- package/skills_ref/whatsapp/references/workflow-reference.md +0 -123
- package/skills_ref/whatsapp/scripts/configure-prop.js +0 -113
- package/skills_ref/whatsapp/scripts/create-connect-token.js +0 -38
- package/skills_ref/whatsapp/scripts/create-function.js +0 -64
- package/skills_ref/whatsapp/scripts/create-integration.js +0 -137
- package/skills_ref/whatsapp/scripts/create-row.js +0 -47
- package/skills_ref/whatsapp/scripts/create-trigger.js +0 -88
- package/skills_ref/whatsapp/scripts/create-workflow.js +0 -85
- package/skills_ref/whatsapp/scripts/delete-integration.js +0 -44
- package/skills_ref/whatsapp/scripts/delete-row.js +0 -49
- package/skills_ref/whatsapp/scripts/delete-trigger.js +0 -44
- package/skills_ref/whatsapp/scripts/deploy-function.js +0 -47
- package/skills_ref/whatsapp/scripts/edit-graph.js +0 -289
- package/skills_ref/whatsapp/scripts/get-action-schema.js +0 -44
- package/skills_ref/whatsapp/scripts/get-context-value.js +0 -80
- package/skills_ref/whatsapp/scripts/get-execution-event.js +0 -55
- package/skills_ref/whatsapp/scripts/get-execution.js +0 -44
- package/skills_ref/whatsapp/scripts/get-function.js +0 -43
- package/skills_ref/whatsapp/scripts/get-graph.js +0 -85
- package/skills_ref/whatsapp/scripts/get-table.js +0 -45
- package/skills_ref/whatsapp/scripts/get-workflow.js +0 -44
- package/skills_ref/whatsapp/scripts/invoke-function.js +0 -60
- package/skills_ref/whatsapp/scripts/lib/databases/args.js +0 -87
- package/skills_ref/whatsapp/scripts/lib/databases/filters.js +0 -30
- package/skills_ref/whatsapp/scripts/lib/databases/kapso-api.js +0 -70
- package/skills_ref/whatsapp/scripts/lib/functions/args.js +0 -55
- package/skills_ref/whatsapp/scripts/lib/functions/kapso-api.js +0 -70
- package/skills_ref/whatsapp/scripts/lib/workflows/args.js +0 -53
- package/skills_ref/whatsapp/scripts/lib/workflows/kapso-api.js +0 -123
- package/skills_ref/whatsapp/scripts/lib/workflows/result.js +0 -16
- package/skills_ref/whatsapp/scripts/list-accounts.js +0 -62
- package/skills_ref/whatsapp/scripts/list-apps.js +0 -42
- package/skills_ref/whatsapp/scripts/list-execution-events.js +0 -61
- package/skills_ref/whatsapp/scripts/list-executions.js +0 -53
- package/skills_ref/whatsapp/scripts/list-function-invocations.js +0 -53
- package/skills_ref/whatsapp/scripts/list-functions.js +0 -41
- package/skills_ref/whatsapp/scripts/list-integrations.js +0 -41
- package/skills_ref/whatsapp/scripts/list-provider-models.js +0 -48
- package/skills_ref/whatsapp/scripts/list-tables.js +0 -41
- package/skills_ref/whatsapp/scripts/list-triggers.js +0 -44
- package/skills_ref/whatsapp/scripts/list-whatsapp-phone-numbers.js +0 -56
- package/skills_ref/whatsapp/scripts/list-workflows.js +0 -44
- package/skills_ref/whatsapp/scripts/openapi-explore.mjs +0 -1273
- package/skills_ref/whatsapp/scripts/query-rows.js +0 -71
- package/skills_ref/whatsapp/scripts/reload-props.js +0 -110
- package/skills_ref/whatsapp/scripts/resume-execution.js +0 -75
- package/skills_ref/whatsapp/scripts/search-actions.js +0 -64
- package/skills_ref/whatsapp/scripts/update-execution-status.js +0 -51
- package/skills_ref/whatsapp/scripts/update-function.js +0 -65
- package/skills_ref/whatsapp/scripts/update-graph.js +0 -154
- package/skills_ref/whatsapp/scripts/update-integration.js +0 -82
- package/skills_ref/whatsapp/scripts/update-row.js +0 -51
- package/skills_ref/whatsapp/scripts/update-trigger.js +0 -60
- package/skills_ref/whatsapp/scripts/update-workflow-settings.js +0 -67
- package/skills_ref/whatsapp/scripts/upsert-row.js +0 -64
- package/skills_ref/whatsapp/scripts/validate-graph.js +0 -293
- package/skills_ref/whatsapp/scripts/variables-delete.js +0 -37
- package/skills_ref/whatsapp/scripts/variables-list.js +0 -55
- package/skills_ref/whatsapp/scripts/variables-set.js +0 -39
- package/skills_ref/writing-plans/SKILL.md +0 -116
- package/skills_ref/xlsx/LICENSE.txt +0 -30
- package/skills_ref/xlsx/SKILL.md +0 -292
- package/skills_ref/xlsx/scripts/office/helpers/__init__.py +0 -0
- package/skills_ref/xlsx/scripts/office/helpers/merge_runs.py +0 -199
- package/skills_ref/xlsx/scripts/office/helpers/simplify_redlines.py +0 -197
- package/skills_ref/xlsx/scripts/office/pack.py +0 -159
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chart.xsd +0 -1499
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-chartDrawing.xsd +0 -146
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-diagram.xsd +0 -1085
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-lockedCanvas.xsd +0 -11
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-main.xsd +0 -3081
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-picture.xsd +0 -23
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-spreadsheetDrawing.xsd +0 -185
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/dml-wordprocessingDrawing.xsd +0 -287
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/pml.xsd +0 -1676
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-additionalCharacteristics.xsd +0 -28
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-bibliography.xsd +0 -144
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-commonSimpleTypes.xsd +0 -174
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlDataProperties.xsd +0 -25
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-customXmlSchemaProperties.xsd +0 -18
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesCustom.xsd +0 -59
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesExtended.xsd +0 -56
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-documentPropertiesVariantTypes.xsd +0 -195
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-math.xsd +0 -582
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/shared-relationshipReference.xsd +0 -25
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/sml.xsd +0 -4439
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-main.xsd +0 -570
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-officeDrawing.xsd +0 -509
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-presentationDrawing.xsd +0 -12
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-spreadsheetDrawing.xsd +0 -108
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/vml-wordprocessingDrawing.xsd +0 -96
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/wml.xsd +0 -3646
- package/skills_ref/xlsx/scripts/office/schemas/ISO-IEC29500-4_2016/xml.xsd +0 -116
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-contentTypes.xsd +0 -42
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-coreProperties.xsd +0 -50
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-digSig.xsd +0 -49
- package/skills_ref/xlsx/scripts/office/schemas/ecma/fouth-edition/opc-relationships.xsd +0 -33
- package/skills_ref/xlsx/scripts/office/schemas/mce/mc.xsd +0 -75
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2010.xsd +0 -560
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2012.xsd +0 -67
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-2018.xsd +0 -14
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-cex-2018.xsd +0 -20
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-cid-2016.xsd +0 -13
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-sdtdatahash-2020.xsd +0 -4
- package/skills_ref/xlsx/scripts/office/schemas/microsoft/wml-symex-2015.xsd +0 -8
- package/skills_ref/xlsx/scripts/office/soffice.py +0 -183
- package/skills_ref/xlsx/scripts/office/unpack.py +0 -132
- package/skills_ref/xlsx/scripts/office/validate.py +0 -111
- package/skills_ref/xlsx/scripts/office/validators/__init__.py +0 -15
- package/skills_ref/xlsx/scripts/office/validators/base.py +0 -847
- package/skills_ref/xlsx/scripts/office/validators/docx.py +0 -446
- package/skills_ref/xlsx/scripts/office/validators/pptx.py +0 -275
- package/skills_ref/xlsx/scripts/office/validators/redlining.py +0 -247
- package/skills_ref/xlsx/scripts/recalc.py +0 -184
- package/skills_ref/xurl/SKILL.md +0 -461
|
@@ -1,382 +0,0 @@
|
|
|
1
|
-
# Usage Examples
|
|
2
|
-
|
|
3
|
-
This document provides practical examples for both methods of adding evaluations to HuggingFace model cards.
|
|
4
|
-
|
|
5
|
-
## Table of Contents
|
|
6
|
-
1. [Setup](#setup)
|
|
7
|
-
2. [Method 1: Extract from README](#method-1-extract-from-readme)
|
|
8
|
-
3. [Method 2: Import from Artificial Analysis](#method-2-import-from-artificial-analysis)
|
|
9
|
-
4. [Standalone vs Integrated](#standalone-vs-integrated)
|
|
10
|
-
5. [Common Workflows](#common-workflows)
|
|
11
|
-
|
|
12
|
-
## Setup
|
|
13
|
-
|
|
14
|
-
### Initial Configuration
|
|
15
|
-
|
|
16
|
-
```bash
|
|
17
|
-
# Navigate to skill directory
|
|
18
|
-
cd hf_evaluation_skill
|
|
19
|
-
|
|
20
|
-
# Install dependencies
|
|
21
|
-
uv add huggingface_hub python-dotenv pyyaml requests
|
|
22
|
-
|
|
23
|
-
# Configure environment variables
|
|
24
|
-
cp examples/.env.example .env
|
|
25
|
-
# Edit .env with your tokens
|
|
26
|
-
```
|
|
27
|
-
|
|
28
|
-
Your `.env` file should contain:
|
|
29
|
-
```env
|
|
30
|
-
HF_TOKEN=hf_your_write_token_here
|
|
31
|
-
AA_API_KEY=aa_your_api_key_here # Optional for AA imports
|
|
32
|
-
```
|
|
33
|
-
|
|
34
|
-
### Verify Installation
|
|
35
|
-
|
|
36
|
-
```bash
|
|
37
|
-
cd scripts
|
|
38
|
-
python3 test_extraction.py
|
|
39
|
-
```
|
|
40
|
-
|
|
41
|
-
## Method 1: Extract from README
|
|
42
|
-
|
|
43
|
-
Extract evaluation tables from your model's existing README.
|
|
44
|
-
|
|
45
|
-
### Basic Extraction
|
|
46
|
-
|
|
47
|
-
```bash
|
|
48
|
-
# Preview what will be extracted (dry run)
|
|
49
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
50
|
-
--repo-id "meta-llama/Llama-3.3-70B-Instruct" \
|
|
51
|
-
--dry-run
|
|
52
|
-
```
|
|
53
|
-
|
|
54
|
-
### Apply Extraction to Your Model
|
|
55
|
-
|
|
56
|
-
```bash
|
|
57
|
-
# Extract and update model card directly
|
|
58
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
59
|
-
--repo-id "your-username/your-model-7b"
|
|
60
|
-
```
|
|
61
|
-
|
|
62
|
-
### Custom Task and Dataset Names
|
|
63
|
-
|
|
64
|
-
```bash
|
|
65
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
66
|
-
--repo-id "your-username/your-model-7b" \
|
|
67
|
-
--task-type "text-generation" \
|
|
68
|
-
--dataset-name "Standard Benchmarks" \
|
|
69
|
-
--dataset-type "llm_benchmarks"
|
|
70
|
-
```
|
|
71
|
-
|
|
72
|
-
### Create Pull Request (for models you don't own)
|
|
73
|
-
|
|
74
|
-
```bash
|
|
75
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
76
|
-
--repo-id "organization/community-model" \
|
|
77
|
-
--create-pr
|
|
78
|
-
```
|
|
79
|
-
|
|
80
|
-
### Example README Format
|
|
81
|
-
|
|
82
|
-
Your model README should contain tables like:
|
|
83
|
-
|
|
84
|
-
```markdown
|
|
85
|
-
## Evaluation Results
|
|
86
|
-
|
|
87
|
-
| Benchmark | Score |
|
|
88
|
-
|---------------|-------|
|
|
89
|
-
| MMLU | 85.2 |
|
|
90
|
-
| HumanEval | 72.5 |
|
|
91
|
-
| GSM8K | 91.3 |
|
|
92
|
-
| HellaSwag | 88.9 |
|
|
93
|
-
```
|
|
94
|
-
|
|
95
|
-
## Method 2: Import from Artificial Analysis
|
|
96
|
-
|
|
97
|
-
Fetch benchmark scores directly from Artificial Analysis API.
|
|
98
|
-
|
|
99
|
-
### Integrated Approach (Recommended)
|
|
100
|
-
|
|
101
|
-
```bash
|
|
102
|
-
# Import scores for Claude Sonnet 4
|
|
103
|
-
python3 scripts/evaluation_manager.py import-aa \
|
|
104
|
-
--creator-slug "anthropic" \
|
|
105
|
-
--model-name "claude-sonnet-4" \
|
|
106
|
-
--repo-id "your-username/claude-mirror"
|
|
107
|
-
```
|
|
108
|
-
|
|
109
|
-
### With Pull Request
|
|
110
|
-
|
|
111
|
-
```bash
|
|
112
|
-
# Create PR instead of direct commit
|
|
113
|
-
python3 scripts/evaluation_manager.py import-aa \
|
|
114
|
-
--creator-slug "openai" \
|
|
115
|
-
--model-name "gpt-4" \
|
|
116
|
-
--repo-id "your-username/gpt-4-mirror" \
|
|
117
|
-
--create-pr
|
|
118
|
-
```
|
|
119
|
-
|
|
120
|
-
### Standalone Script
|
|
121
|
-
|
|
122
|
-
For simple, one-off imports, use the standalone script:
|
|
123
|
-
|
|
124
|
-
```bash
|
|
125
|
-
# Navigate to examples directory
|
|
126
|
-
cd examples
|
|
127
|
-
|
|
128
|
-
# Run standalone script
|
|
129
|
-
AA_API_KEY="your-key" HF_TOKEN="your-token" \
|
|
130
|
-
python3 artificial_analysis_to_hub.py \
|
|
131
|
-
--creator-slug "anthropic" \
|
|
132
|
-
--model-name "claude-sonnet-4" \
|
|
133
|
-
--repo-id "your-username/your-repo"
|
|
134
|
-
```
|
|
135
|
-
|
|
136
|
-
### Finding Creator Slug and Model Name
|
|
137
|
-
|
|
138
|
-
1. Visit [Artificial Analysis](https://artificialanalysis.ai/)
|
|
139
|
-
2. Navigate to the model you want to import
|
|
140
|
-
3. The URL format is: `https://artificialanalysis.ai/models/{creator-slug}/{model-name}`
|
|
141
|
-
4. Or check their [API documentation](https://artificialanalysis.ai/api)
|
|
142
|
-
|
|
143
|
-
Common examples:
|
|
144
|
-
- Anthropic: `--creator-slug "anthropic" --model-name "claude-sonnet-4"`
|
|
145
|
-
- OpenAI: `--creator-slug "openai" --model-name "gpt-4-turbo"`
|
|
146
|
-
- Meta: `--creator-slug "meta" --model-name "llama-3-70b"`
|
|
147
|
-
|
|
148
|
-
## Standalone vs Integrated
|
|
149
|
-
|
|
150
|
-
### Standalone Script Features
|
|
151
|
-
- ✓ Simple, single-purpose
|
|
152
|
-
- ✓ Can run via `uv run` from URL
|
|
153
|
-
- ✓ Minimal dependencies
|
|
154
|
-
- ✗ No README extraction
|
|
155
|
-
- ✗ No validation
|
|
156
|
-
- ✗ No dry-run mode
|
|
157
|
-
|
|
158
|
-
**Use when:** You only need AA imports and want a simple script.
|
|
159
|
-
|
|
160
|
-
### Integrated Script Features
|
|
161
|
-
- ✓ Both README extraction AND AA import
|
|
162
|
-
- ✓ Validation and show commands
|
|
163
|
-
- ✓ Dry-run preview mode
|
|
164
|
-
- ✓ Better error handling
|
|
165
|
-
- ✓ Merge with existing evaluations
|
|
166
|
-
- ✓ More flexible options
|
|
167
|
-
|
|
168
|
-
**Use when:** You want full evaluation management capabilities.
|
|
169
|
-
|
|
170
|
-
## Common Workflows
|
|
171
|
-
|
|
172
|
-
### Workflow 1: New Model with README Tables
|
|
173
|
-
|
|
174
|
-
You've just created a model with evaluation tables in the README.
|
|
175
|
-
|
|
176
|
-
```bash
|
|
177
|
-
# Step 1: Preview extraction
|
|
178
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
179
|
-
--repo-id "your-username/new-model-7b" \
|
|
180
|
-
--dry-run
|
|
181
|
-
|
|
182
|
-
# Step 2: Apply if it looks good
|
|
183
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
184
|
-
--repo-id "your-username/new-model-7b"
|
|
185
|
-
|
|
186
|
-
# Step 3: Validate
|
|
187
|
-
python3 scripts/evaluation_manager.py validate \
|
|
188
|
-
--repo-id "your-username/new-model-7b"
|
|
189
|
-
|
|
190
|
-
# Step 4: View results
|
|
191
|
-
python3 scripts/evaluation_manager.py show \
|
|
192
|
-
--repo-id "your-username/new-model-7b"
|
|
193
|
-
```
|
|
194
|
-
|
|
195
|
-
### Workflow 2: Model Benchmarked on AA
|
|
196
|
-
|
|
197
|
-
Your model appears on Artificial Analysis with fresh benchmarks.
|
|
198
|
-
|
|
199
|
-
```bash
|
|
200
|
-
# Import scores and create PR for review
|
|
201
|
-
python3 scripts/evaluation_manager.py import-aa \
|
|
202
|
-
--creator-slug "your-org" \
|
|
203
|
-
--model-name "your-model" \
|
|
204
|
-
--repo-id "your-org/your-model-hf" \
|
|
205
|
-
--create-pr
|
|
206
|
-
```
|
|
207
|
-
|
|
208
|
-
### Workflow 3: Combine Both Methods
|
|
209
|
-
|
|
210
|
-
You have README tables AND AA scores.
|
|
211
|
-
|
|
212
|
-
```bash
|
|
213
|
-
# Step 1: Extract from README
|
|
214
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
215
|
-
--repo-id "your-username/hybrid-model"
|
|
216
|
-
|
|
217
|
-
# Step 2: Import from AA (will merge with existing)
|
|
218
|
-
python3 scripts/evaluation_manager.py import-aa \
|
|
219
|
-
--creator-slug "your-org" \
|
|
220
|
-
--model-name "hybrid-model" \
|
|
221
|
-
--repo-id "your-username/hybrid-model"
|
|
222
|
-
|
|
223
|
-
# Step 3: View combined results
|
|
224
|
-
python3 scripts/evaluation_manager.py show \
|
|
225
|
-
--repo-id "your-username/hybrid-model"
|
|
226
|
-
```
|
|
227
|
-
|
|
228
|
-
### Workflow 4: Contributing to Community Models
|
|
229
|
-
|
|
230
|
-
Help improve community models by adding missing evaluations.
|
|
231
|
-
|
|
232
|
-
```bash
|
|
233
|
-
# Find a model with evaluations in README but no model-index
|
|
234
|
-
# Example: community/awesome-7b
|
|
235
|
-
|
|
236
|
-
# Create PR with extracted evaluations
|
|
237
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
238
|
-
--repo-id "community/awesome-7b" \
|
|
239
|
-
--create-pr
|
|
240
|
-
|
|
241
|
-
# Hugging Face will notify the repository owner
|
|
242
|
-
# They can review and merge your PR
|
|
243
|
-
```
|
|
244
|
-
|
|
245
|
-
### Workflow 5: Batch Processing
|
|
246
|
-
|
|
247
|
-
Update multiple models at once.
|
|
248
|
-
|
|
249
|
-
```bash
|
|
250
|
-
# Create a list of repos
|
|
251
|
-
cat > models.txt << EOF
|
|
252
|
-
your-org/model-1-7b
|
|
253
|
-
your-org/model-2-13b
|
|
254
|
-
your-org/model-3-70b
|
|
255
|
-
EOF
|
|
256
|
-
|
|
257
|
-
# Process each
|
|
258
|
-
while read repo_id; do
|
|
259
|
-
echo "Processing $repo_id..."
|
|
260
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
261
|
-
--repo-id "$repo_id"
|
|
262
|
-
done < models.txt
|
|
263
|
-
```
|
|
264
|
-
|
|
265
|
-
### Workflow 6: Automated Updates (CI/CD)
|
|
266
|
-
|
|
267
|
-
Set up automatic evaluation updates using GitHub Actions.
|
|
268
|
-
|
|
269
|
-
```yaml
|
|
270
|
-
# .github/workflows/update-evals.yml
|
|
271
|
-
name: Update Evaluations Weekly
|
|
272
|
-
on:
|
|
273
|
-
schedule:
|
|
274
|
-
- cron: '0 0 * * 0' # Every Sunday
|
|
275
|
-
workflow_dispatch: # Manual trigger
|
|
276
|
-
|
|
277
|
-
jobs:
|
|
278
|
-
update:
|
|
279
|
-
runs-on: ubuntu-latest
|
|
280
|
-
steps:
|
|
281
|
-
- uses: actions/checkout@v4
|
|
282
|
-
|
|
283
|
-
- name: Set up Python
|
|
284
|
-
uses: actions/setup-python@v4
|
|
285
|
-
with:
|
|
286
|
-
python-version: '3.13'
|
|
287
|
-
|
|
288
|
-
- name: Install dependencies
|
|
289
|
-
run: |
|
|
290
|
-
pip install huggingface-hub python-dotenv pyyaml requests
|
|
291
|
-
|
|
292
|
-
- name: Update from Artificial Analysis
|
|
293
|
-
env:
|
|
294
|
-
AA_API_KEY: ${{ secrets.AA_API_KEY }}
|
|
295
|
-
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
|
296
|
-
run: |
|
|
297
|
-
python scripts/evaluation_manager.py import-aa \
|
|
298
|
-
--creator-slug "${{ vars.AA_CREATOR_SLUG }}" \
|
|
299
|
-
--model-name "${{ vars.AA_MODEL_NAME }}" \
|
|
300
|
-
--repo-id "${{ github.repository }}" \
|
|
301
|
-
--create-pr
|
|
302
|
-
```
|
|
303
|
-
|
|
304
|
-
## Verification and Validation
|
|
305
|
-
|
|
306
|
-
### Check Current Evaluations
|
|
307
|
-
|
|
308
|
-
```bash
|
|
309
|
-
python3 scripts/evaluation_manager.py show \
|
|
310
|
-
--repo-id "your-username/your-model"
|
|
311
|
-
```
|
|
312
|
-
|
|
313
|
-
### Validate Format
|
|
314
|
-
|
|
315
|
-
```bash
|
|
316
|
-
python3 scripts/evaluation_manager.py validate \
|
|
317
|
-
--repo-id "your-username/your-model"
|
|
318
|
-
```
|
|
319
|
-
|
|
320
|
-
### View in the Hugging Face UI
|
|
321
|
-
|
|
322
|
-
After updating, visit:
|
|
323
|
-
```
|
|
324
|
-
https://huggingface.co/your-username/your-model
|
|
325
|
-
```
|
|
326
|
-
|
|
327
|
-
The evaluation widget should display your scores automatically.
|
|
328
|
-
|
|
329
|
-
## Troubleshooting Examples
|
|
330
|
-
|
|
331
|
-
### Problem: No tables found
|
|
332
|
-
|
|
333
|
-
```bash
|
|
334
|
-
# Check what tables exist in your README
|
|
335
|
-
python3 scripts/evaluation_manager.py extract-readme \
|
|
336
|
-
--repo-id "your-username/your-model" \
|
|
337
|
-
--dry-run
|
|
338
|
-
|
|
339
|
-
# If no output, ensure your README has markdown tables with numeric scores
|
|
340
|
-
```
|
|
341
|
-
|
|
342
|
-
### Problem: AA model not found
|
|
343
|
-
|
|
344
|
-
```bash
|
|
345
|
-
# Verify the creator and model slugs
|
|
346
|
-
# Check the AA website URL or API directly
|
|
347
|
-
curl -H "x-api-key: $AA_API_KEY" \
|
|
348
|
-
https://artificialanalysis.ai/api/v2/data/llms/models | jq
|
|
349
|
-
```
|
|
350
|
-
|
|
351
|
-
### Problem: Token permission error
|
|
352
|
-
|
|
353
|
-
```bash
|
|
354
|
-
# Verify your token has write access
|
|
355
|
-
# Generate a new token at: https://huggingface.co/settings/tokens
|
|
356
|
-
# Ensure "Write" scope is enabled
|
|
357
|
-
```
|
|
358
|
-
|
|
359
|
-
## Tips and Best Practices
|
|
360
|
-
|
|
361
|
-
1. **Always dry-run first**: Use `--dry-run` to preview changes
|
|
362
|
-
2. **Use PRs for others' repos**: Always use `--create-pr` for repositories you don't own
|
|
363
|
-
3. **Validate after updates**: Run `validate` to ensure proper formatting
|
|
364
|
-
4. **Keep evaluations current**: Set up automated updates for AA scores
|
|
365
|
-
5. **Document sources**: The tool automatically adds source attribution
|
|
366
|
-
6. **Check the UI**: Always verify the evaluation widget displays correctly
|
|
367
|
-
|
|
368
|
-
## Getting Help
|
|
369
|
-
|
|
370
|
-
```bash
|
|
371
|
-
# General help
|
|
372
|
-
python3 scripts/evaluation_manager.py --help
|
|
373
|
-
|
|
374
|
-
# Command-specific help
|
|
375
|
-
python3 scripts/evaluation_manager.py extract-readme --help
|
|
376
|
-
python3 scripts/evaluation_manager.py import-aa --help
|
|
377
|
-
```
|
|
378
|
-
|
|
379
|
-
For issues or questions, consult:
|
|
380
|
-
- `../SKILL.md` - Complete documentation
|
|
381
|
-
- `../README.md` - Troubleshooting guide
|
|
382
|
-
- `../QUICKSTART.md` - Quick start guide
|
|
@@ -1,141 +0,0 @@
|
|
|
1
|
-
# /// script
|
|
2
|
-
# requires-python = ">=3.13"
|
|
3
|
-
# dependencies = [
|
|
4
|
-
# "huggingface-hub>=1.1.4",
|
|
5
|
-
# "python-dotenv>=1.2.1",
|
|
6
|
-
# "pyyaml>=6.0.3",
|
|
7
|
-
# "requests>=2.32.5",
|
|
8
|
-
# ]
|
|
9
|
-
# ///
|
|
10
|
-
|
|
11
|
-
"""
|
|
12
|
-
Add Artificial Analysis evaluations to a Hugging Face model card.
|
|
13
|
-
|
|
14
|
-
NOTE: This is a standalone reference script. For integrated functionality
|
|
15
|
-
with additional features (README extraction, validation, etc.), use:
|
|
16
|
-
../scripts/evaluation_manager.py import-aa [options]
|
|
17
|
-
|
|
18
|
-
STANDALONE USAGE:
|
|
19
|
-
AA_API_KEY="<your-api-key>" HF_TOKEN="<your-huggingface-token>" \
|
|
20
|
-
python artificial_analysis_to_hub.py \
|
|
21
|
-
--creator-slug <artificial-analysis-creator-slug> \
|
|
22
|
-
--model-name <artificial-analysis-model-name> \
|
|
23
|
-
--repo-id <huggingface-repo-id>
|
|
24
|
-
|
|
25
|
-
INTEGRATED USAGE (Recommended):
|
|
26
|
-
python ../scripts/evaluation_manager.py import-aa \
|
|
27
|
-
--creator-slug <creator-slug> \
|
|
28
|
-
--model-name <model-name> \
|
|
29
|
-
--repo-id <repo-id> \
|
|
30
|
-
[--create-pr]
|
|
31
|
-
"""
|
|
32
|
-
|
|
33
|
-
import argparse
|
|
34
|
-
import os
|
|
35
|
-
|
|
36
|
-
import requests
|
|
37
|
-
import dotenv
|
|
38
|
-
from huggingface_hub import ModelCard
|
|
39
|
-
|
|
40
|
-
dotenv.load_dotenv()
|
|
41
|
-
|
|
42
|
-
API_KEY = os.getenv("AA_API_KEY")
|
|
43
|
-
HF_TOKEN = os.getenv("HF_TOKEN")
|
|
44
|
-
URL = "https://artificialanalysis.ai/api/v2/data/llms/models"
|
|
45
|
-
HEADERS = {"x-api-key": API_KEY}
|
|
46
|
-
|
|
47
|
-
if not API_KEY:
|
|
48
|
-
raise ValueError("AA_API_KEY is not set")
|
|
49
|
-
if not HF_TOKEN:
|
|
50
|
-
raise ValueError("HF_TOKEN is not set")
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
def get_model_evaluations_data(creator_slug, model_name):
|
|
54
|
-
response = requests.get(URL, headers=HEADERS)
|
|
55
|
-
response_data = response.json()["data"]
|
|
56
|
-
for model in response_data:
|
|
57
|
-
if (
|
|
58
|
-
model["model_creator"]["slug"] == creator_slug
|
|
59
|
-
and model["slug"] == model_name
|
|
60
|
-
):
|
|
61
|
-
return model
|
|
62
|
-
raise ValueError(f"Model {model_name} not found")
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
def aa_evaluations_to_model_index(
|
|
66
|
-
model,
|
|
67
|
-
dataset_name="Artificial Analysis Benchmarks",
|
|
68
|
-
dataset_type="artificial_analysis",
|
|
69
|
-
task_type="evaluation",
|
|
70
|
-
):
|
|
71
|
-
if not model:
|
|
72
|
-
raise ValueError("Model data is required")
|
|
73
|
-
|
|
74
|
-
model_name = model.get("name", model.get("slug", "unknown-model"))
|
|
75
|
-
evaluations = model.get("evaluations", {})
|
|
76
|
-
|
|
77
|
-
metrics = []
|
|
78
|
-
for key, value in evaluations.items():
|
|
79
|
-
metrics.append(
|
|
80
|
-
{
|
|
81
|
-
"name": key.replace("_", " ").title(),
|
|
82
|
-
"type": key,
|
|
83
|
-
"value": value,
|
|
84
|
-
}
|
|
85
|
-
)
|
|
86
|
-
|
|
87
|
-
model_index = [
|
|
88
|
-
{
|
|
89
|
-
"name": model_name,
|
|
90
|
-
"results": [
|
|
91
|
-
{
|
|
92
|
-
"task": {"type": task_type},
|
|
93
|
-
"dataset": {"name": dataset_name, "type": dataset_type},
|
|
94
|
-
"metrics": metrics,
|
|
95
|
-
"source": {
|
|
96
|
-
"name": "Artificial Analysis API",
|
|
97
|
-
"url": "https://artificialanalysis.ai",
|
|
98
|
-
},
|
|
99
|
-
}
|
|
100
|
-
],
|
|
101
|
-
}
|
|
102
|
-
]
|
|
103
|
-
|
|
104
|
-
return model_index
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
def main():
|
|
108
|
-
parser = argparse.ArgumentParser()
|
|
109
|
-
parser.add_argument("--creator-slug", type=str, required=True)
|
|
110
|
-
parser.add_argument("--model-name", type=str, required=True)
|
|
111
|
-
parser.add_argument("--repo-id", type=str, required=True)
|
|
112
|
-
args = parser.parse_args()
|
|
113
|
-
|
|
114
|
-
aa_evaluations_data = get_model_evaluations_data(
|
|
115
|
-
creator_slug=args.creator_slug, model_name=args.model_name
|
|
116
|
-
)
|
|
117
|
-
|
|
118
|
-
model_index = aa_evaluations_to_model_index(model=aa_evaluations_data)
|
|
119
|
-
|
|
120
|
-
card = ModelCard.load(args.repo_id)
|
|
121
|
-
card.data["model-index"] = model_index
|
|
122
|
-
|
|
123
|
-
commit_message = (
|
|
124
|
-
f"Add Artificial Analysis evaluations for {args.model_name}"
|
|
125
|
-
)
|
|
126
|
-
commit_description = (
|
|
127
|
-
f"This commit adds the Artificial Analysis evaluations for the {args.model_name} model to this repository. "
|
|
128
|
-
"To see the scores, visit the [Artificial Analysis](https://artificialanalysis.ai) website."
|
|
129
|
-
)
|
|
130
|
-
|
|
131
|
-
card.push_to_hub(
|
|
132
|
-
args.repo_id,
|
|
133
|
-
token=HF_TOKEN,
|
|
134
|
-
commit_message=commit_message,
|
|
135
|
-
commit_description=commit_description,
|
|
136
|
-
create_pr=True,
|
|
137
|
-
)
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
if __name__ == "__main__":
|
|
141
|
-
main()
|
|
@@ -1,135 +0,0 @@
|
|
|
1
|
-
# Example Evaluation Table Formats
|
|
2
|
-
|
|
3
|
-
This file shows various formats of evaluation tables that can be extracted from model README files.
|
|
4
|
-
|
|
5
|
-
## Format 1: Benchmarks as Rows (Most Common)
|
|
6
|
-
|
|
7
|
-
```markdown
|
|
8
|
-
| Benchmark | Score |
|
|
9
|
-
|-----------|-------|
|
|
10
|
-
| MMLU | 85.2 |
|
|
11
|
-
| HumanEval | 72.5 |
|
|
12
|
-
| GSM8K | 91.3 |
|
|
13
|
-
| HellaSwag | 88.9 |
|
|
14
|
-
```
|
|
15
|
-
|
|
16
|
-
## Format 2: Multiple Metric Columns
|
|
17
|
-
|
|
18
|
-
```markdown
|
|
19
|
-
| Benchmark | Accuracy | F1 Score |
|
|
20
|
-
|-----------|----------|----------|
|
|
21
|
-
| MMLU | 85.2 | 0.84 |
|
|
22
|
-
| GSM8K | 91.3 | 0.91 |
|
|
23
|
-
| DROP | 78.5 | 0.77 |
|
|
24
|
-
```
|
|
25
|
-
|
|
26
|
-
## Format 3: Benchmarks as Columns
|
|
27
|
-
|
|
28
|
-
```markdown
|
|
29
|
-
| MMLU | HumanEval | GSM8K | HellaSwag |
|
|
30
|
-
|------|-----------|-------|-----------|
|
|
31
|
-
| 85.2 | 72.5 | 91.3 | 88.9 |
|
|
32
|
-
```
|
|
33
|
-
|
|
34
|
-
## Format 4: Percentage Values
|
|
35
|
-
|
|
36
|
-
```markdown
|
|
37
|
-
| Benchmark | Score |
|
|
38
|
-
|---------------|----------|
|
|
39
|
-
| MMLU | 85.2% |
|
|
40
|
-
| HumanEval | 72.5% |
|
|
41
|
-
| GSM8K | 91.3% |
|
|
42
|
-
| TruthfulQA | 68.7% |
|
|
43
|
-
```
|
|
44
|
-
|
|
45
|
-
## Format 5: Mixed Format with Categories
|
|
46
|
-
|
|
47
|
-
```markdown
|
|
48
|
-
### Reasoning
|
|
49
|
-
|
|
50
|
-
| Benchmark | Score |
|
|
51
|
-
|-----------|-------|
|
|
52
|
-
| MMLU | 85.2 |
|
|
53
|
-
| BBH | 82.4 |
|
|
54
|
-
| GPQA | 71.3 |
|
|
55
|
-
|
|
56
|
-
### Coding
|
|
57
|
-
|
|
58
|
-
| Benchmark | Score |
|
|
59
|
-
|-----------|-------|
|
|
60
|
-
| HumanEval | 72.5 |
|
|
61
|
-
| MBPP | 78.9 |
|
|
62
|
-
|
|
63
|
-
### Math
|
|
64
|
-
|
|
65
|
-
| Benchmark | Score |
|
|
66
|
-
|-----------|-------|
|
|
67
|
-
| GSM8K | 91.3 |
|
|
68
|
-
| MATH | 65.8 |
|
|
69
|
-
```
|
|
70
|
-
|
|
71
|
-
## Format 6: With Additional Columns
|
|
72
|
-
|
|
73
|
-
```markdown
|
|
74
|
-
| Benchmark | Score | Rank | Notes |
|
|
75
|
-
|-----------|-------|------|--------------------|
|
|
76
|
-
| MMLU | 85.2 | #5 | 5-shot |
|
|
77
|
-
| HumanEval | 72.5 | #8 | pass@1 |
|
|
78
|
-
| GSM8K | 91.3 | #3 | 8-shot, maj@1 |
|
|
79
|
-
```
|
|
80
|
-
|
|
81
|
-
## How the Extractor Works
|
|
82
|
-
|
|
83
|
-
The script will:
|
|
84
|
-
1. Find all markdown tables in the README
|
|
85
|
-
2. Identify which tables contain evaluation results
|
|
86
|
-
3. Parse the table structure (rows vs columns)
|
|
87
|
-
4. Extract numeric values as scores
|
|
88
|
-
5. Convert to model-index YAML format
|
|
89
|
-
|
|
90
|
-
## Tips for README Authors
|
|
91
|
-
|
|
92
|
-
To ensure your evaluation tables are properly extracted:
|
|
93
|
-
|
|
94
|
-
1. **Use clear headers**: Include "Benchmark", "Score", or similar terms
|
|
95
|
-
2. **Keep it simple**: Stick to benchmark name + score columns
|
|
96
|
-
3. **Use standard formats**: Follow markdown table syntax
|
|
97
|
-
4. **Include numeric values**: Ensure scores are parseable numbers
|
|
98
|
-
5. **Be consistent**: Use the same format across multiple tables
|
|
99
|
-
|
|
100
|
-
## Example Complete README Section
|
|
101
|
-
|
|
102
|
-
```markdown
|
|
103
|
-
# Model Card for MyModel-7B
|
|
104
|
-
|
|
105
|
-
## Evaluation Results
|
|
106
|
-
|
|
107
|
-
Our model was evaluated on several standard benchmarks:
|
|
108
|
-
|
|
109
|
-
| Benchmark | Score |
|
|
110
|
-
|---------------|-------|
|
|
111
|
-
| MMLU | 85.2 |
|
|
112
|
-
| HumanEval | 72.5 |
|
|
113
|
-
| GSM8K | 91.3 |
|
|
114
|
-
| HellaSwag | 88.9 |
|
|
115
|
-
| ARC-Challenge | 81.7 |
|
|
116
|
-
| TruthfulQA | 68.7 |
|
|
117
|
-
|
|
118
|
-
### Detailed Results
|
|
119
|
-
|
|
120
|
-
For more detailed results and methodology, see our [paper](link).
|
|
121
|
-
```
|
|
122
|
-
|
|
123
|
-
## Running the Extractor
|
|
124
|
-
|
|
125
|
-
```bash
|
|
126
|
-
# Extract from this example
|
|
127
|
-
python scripts/evaluation_manager.py extract-readme \
|
|
128
|
-
--repo-id "your-username/your-model" \
|
|
129
|
-
--dry-run
|
|
130
|
-
|
|
131
|
-
# Apply to your model card
|
|
132
|
-
python scripts/evaluation_manager.py extract-readme \
|
|
133
|
-
--repo-id "your-username/your-model" \
|
|
134
|
-
--task-type "text-generation"
|
|
135
|
-
```
|
|
@@ -1,50 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"MMLU": {
|
|
3
|
-
"type": "mmlu",
|
|
4
|
-
"name": "Massive Multitask Language Understanding"
|
|
5
|
-
},
|
|
6
|
-
"HumanEval": {
|
|
7
|
-
"type": "humaneval",
|
|
8
|
-
"name": "Code Generation (HumanEval)"
|
|
9
|
-
},
|
|
10
|
-
"GSM8K": {
|
|
11
|
-
"type": "gsm8k",
|
|
12
|
-
"name": "Grade School Math"
|
|
13
|
-
},
|
|
14
|
-
"HellaSwag": {
|
|
15
|
-
"type": "hellaswag",
|
|
16
|
-
"name": "HellaSwag Common Sense"
|
|
17
|
-
},
|
|
18
|
-
"ARC-C": {
|
|
19
|
-
"type": "arc_challenge",
|
|
20
|
-
"name": "ARC Challenge"
|
|
21
|
-
},
|
|
22
|
-
"ARC-E": {
|
|
23
|
-
"type": "arc_easy",
|
|
24
|
-
"name": "ARC Easy"
|
|
25
|
-
},
|
|
26
|
-
"Winogrande": {
|
|
27
|
-
"type": "winogrande",
|
|
28
|
-
"name": "Winogrande"
|
|
29
|
-
},
|
|
30
|
-
"TruthfulQA": {
|
|
31
|
-
"type": "truthfulqa",
|
|
32
|
-
"name": "TruthfulQA"
|
|
33
|
-
},
|
|
34
|
-
"GPQA": {
|
|
35
|
-
"type": "gpqa",
|
|
36
|
-
"name": "Graduate-Level Google-Proof Q&A"
|
|
37
|
-
},
|
|
38
|
-
"DROP": {
|
|
39
|
-
"type": "drop",
|
|
40
|
-
"name": "Discrete Reasoning Over Paragraphs"
|
|
41
|
-
},
|
|
42
|
-
"BBH": {
|
|
43
|
-
"type": "bbh",
|
|
44
|
-
"name": "Big Bench Hard"
|
|
45
|
-
},
|
|
46
|
-
"MATH": {
|
|
47
|
-
"type": "math",
|
|
48
|
-
"name": "MATH Dataset"
|
|
49
|
-
}
|
|
50
|
-
}
|