@synsci/cli-darwin-x64 1.1.49
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/skills/accelerate/SKILL.md +332 -0
- package/bin/skills/accelerate/references/custom-plugins.md +453 -0
- package/bin/skills/accelerate/references/megatron-integration.md +489 -0
- package/bin/skills/accelerate/references/performance.md +525 -0
- package/bin/skills/audiocraft/SKILL.md +564 -0
- package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
- package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
- package/bin/skills/autogpt/SKILL.md +403 -0
- package/bin/skills/autogpt/references/advanced-usage.md +535 -0
- package/bin/skills/autogpt/references/troubleshooting.md +420 -0
- package/bin/skills/awq/SKILL.md +310 -0
- package/bin/skills/awq/references/advanced-usage.md +324 -0
- package/bin/skills/awq/references/troubleshooting.md +344 -0
- package/bin/skills/axolotl/SKILL.md +158 -0
- package/bin/skills/axolotl/references/api.md +5548 -0
- package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
- package/bin/skills/axolotl/references/index.md +15 -0
- package/bin/skills/axolotl/references/other.md +3563 -0
- package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
- package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
- package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
- package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
- package/bin/skills/bitsandbytes/SKILL.md +411 -0
- package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
- package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
- package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
- package/bin/skills/blip-2/SKILL.md +564 -0
- package/bin/skills/blip-2/references/advanced-usage.md +680 -0
- package/bin/skills/blip-2/references/troubleshooting.md +526 -0
- package/bin/skills/chroma/SKILL.md +406 -0
- package/bin/skills/chroma/references/integration.md +38 -0
- package/bin/skills/clip/SKILL.md +253 -0
- package/bin/skills/clip/references/applications.md +207 -0
- package/bin/skills/constitutional-ai/SKILL.md +290 -0
- package/bin/skills/crewai/SKILL.md +498 -0
- package/bin/skills/crewai/references/flows.md +438 -0
- package/bin/skills/crewai/references/tools.md +429 -0
- package/bin/skills/crewai/references/troubleshooting.md +480 -0
- package/bin/skills/deepspeed/SKILL.md +141 -0
- package/bin/skills/deepspeed/references/08.md +17 -0
- package/bin/skills/deepspeed/references/09.md +173 -0
- package/bin/skills/deepspeed/references/2020.md +378 -0
- package/bin/skills/deepspeed/references/2023.md +279 -0
- package/bin/skills/deepspeed/references/assets.md +179 -0
- package/bin/skills/deepspeed/references/index.md +35 -0
- package/bin/skills/deepspeed/references/mii.md +118 -0
- package/bin/skills/deepspeed/references/other.md +1191 -0
- package/bin/skills/deepspeed/references/tutorials.md +6554 -0
- package/bin/skills/dspy/SKILL.md +590 -0
- package/bin/skills/dspy/references/examples.md +663 -0
- package/bin/skills/dspy/references/modules.md +475 -0
- package/bin/skills/dspy/references/optimizers.md +566 -0
- package/bin/skills/faiss/SKILL.md +221 -0
- package/bin/skills/faiss/references/index_types.md +280 -0
- package/bin/skills/flash-attention/SKILL.md +367 -0
- package/bin/skills/flash-attention/references/benchmarks.md +215 -0
- package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
- package/bin/skills/gguf/SKILL.md +427 -0
- package/bin/skills/gguf/references/advanced-usage.md +504 -0
- package/bin/skills/gguf/references/troubleshooting.md +442 -0
- package/bin/skills/gptq/SKILL.md +450 -0
- package/bin/skills/gptq/references/calibration.md +337 -0
- package/bin/skills/gptq/references/integration.md +129 -0
- package/bin/skills/gptq/references/troubleshooting.md +95 -0
- package/bin/skills/grpo-rl-training/README.md +97 -0
- package/bin/skills/grpo-rl-training/SKILL.md +572 -0
- package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
- package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
- package/bin/skills/guidance/SKILL.md +572 -0
- package/bin/skills/guidance/references/backends.md +554 -0
- package/bin/skills/guidance/references/constraints.md +674 -0
- package/bin/skills/guidance/references/examples.md +767 -0
- package/bin/skills/hqq/SKILL.md +445 -0
- package/bin/skills/hqq/references/advanced-usage.md +528 -0
- package/bin/skills/hqq/references/troubleshooting.md +503 -0
- package/bin/skills/hugging-face-cli/SKILL.md +191 -0
- package/bin/skills/hugging-face-cli/references/commands.md +954 -0
- package/bin/skills/hugging-face-cli/references/examples.md +374 -0
- package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
- package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
- package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
- package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
- package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
- package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
- package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
- package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
- package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
- package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
- package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
- package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
- package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
- package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
- package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
- package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
- package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
- package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
- package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
- package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
- package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
- package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
- package/bin/skills/hugging-face-jobs/index.html +216 -0
- package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
- package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
- package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
- package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
- package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
- package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
- package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
- package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
- package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
- package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
- package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
- package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
- package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
- package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
- package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
- package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
- package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
- package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
- package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
- package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
- package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
- package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
- package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
- package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
- package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
- package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
- package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
- package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
- package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
- package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
- package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
- package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
- package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
- package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
- package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
- package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
- package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
- package/bin/skills/instructor/SKILL.md +740 -0
- package/bin/skills/instructor/references/examples.md +107 -0
- package/bin/skills/instructor/references/providers.md +70 -0
- package/bin/skills/instructor/references/validation.md +606 -0
- package/bin/skills/knowledge-distillation/SKILL.md +458 -0
- package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
- package/bin/skills/lambda-labs/SKILL.md +545 -0
- package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
- package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
- package/bin/skills/langchain/SKILL.md +480 -0
- package/bin/skills/langchain/references/agents.md +499 -0
- package/bin/skills/langchain/references/integration.md +562 -0
- package/bin/skills/langchain/references/rag.md +600 -0
- package/bin/skills/langsmith/SKILL.md +422 -0
- package/bin/skills/langsmith/references/advanced-usage.md +548 -0
- package/bin/skills/langsmith/references/troubleshooting.md +537 -0
- package/bin/skills/litgpt/SKILL.md +469 -0
- package/bin/skills/litgpt/references/custom-models.md +568 -0
- package/bin/skills/litgpt/references/distributed-training.md +451 -0
- package/bin/skills/litgpt/references/supported-models.md +336 -0
- package/bin/skills/litgpt/references/training-recipes.md +619 -0
- package/bin/skills/llama-cpp/SKILL.md +258 -0
- package/bin/skills/llama-cpp/references/optimization.md +89 -0
- package/bin/skills/llama-cpp/references/quantization.md +213 -0
- package/bin/skills/llama-cpp/references/server.md +125 -0
- package/bin/skills/llama-factory/SKILL.md +80 -0
- package/bin/skills/llama-factory/references/_images.md +23 -0
- package/bin/skills/llama-factory/references/advanced.md +1055 -0
- package/bin/skills/llama-factory/references/getting_started.md +349 -0
- package/bin/skills/llama-factory/references/index.md +19 -0
- package/bin/skills/llama-factory/references/other.md +31 -0
- package/bin/skills/llamaguard/SKILL.md +337 -0
- package/bin/skills/llamaindex/SKILL.md +569 -0
- package/bin/skills/llamaindex/references/agents.md +83 -0
- package/bin/skills/llamaindex/references/data_connectors.md +108 -0
- package/bin/skills/llamaindex/references/query_engines.md +406 -0
- package/bin/skills/llava/SKILL.md +304 -0
- package/bin/skills/llava/references/training.md +197 -0
- package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
- package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
- package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
- package/bin/skills/long-context/SKILL.md +536 -0
- package/bin/skills/long-context/references/extension_methods.md +468 -0
- package/bin/skills/long-context/references/fine_tuning.md +611 -0
- package/bin/skills/long-context/references/rope.md +402 -0
- package/bin/skills/mamba/SKILL.md +260 -0
- package/bin/skills/mamba/references/architecture-details.md +206 -0
- package/bin/skills/mamba/references/benchmarks.md +255 -0
- package/bin/skills/mamba/references/training-guide.md +388 -0
- package/bin/skills/megatron-core/SKILL.md +366 -0
- package/bin/skills/megatron-core/references/benchmarks.md +249 -0
- package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
- package/bin/skills/megatron-core/references/production-examples.md +473 -0
- package/bin/skills/megatron-core/references/training-recipes.md +547 -0
- package/bin/skills/miles/SKILL.md +315 -0
- package/bin/skills/miles/references/api-reference.md +141 -0
- package/bin/skills/miles/references/troubleshooting.md +352 -0
- package/bin/skills/mlflow/SKILL.md +704 -0
- package/bin/skills/mlflow/references/deployment.md +744 -0
- package/bin/skills/mlflow/references/model-registry.md +770 -0
- package/bin/skills/mlflow/references/tracking.md +680 -0
- package/bin/skills/modal/SKILL.md +341 -0
- package/bin/skills/modal/references/advanced-usage.md +503 -0
- package/bin/skills/modal/references/troubleshooting.md +494 -0
- package/bin/skills/model-merging/SKILL.md +539 -0
- package/bin/skills/model-merging/references/evaluation.md +462 -0
- package/bin/skills/model-merging/references/examples.md +428 -0
- package/bin/skills/model-merging/references/methods.md +352 -0
- package/bin/skills/model-pruning/SKILL.md +495 -0
- package/bin/skills/model-pruning/references/wanda.md +347 -0
- package/bin/skills/moe-training/SKILL.md +526 -0
- package/bin/skills/moe-training/references/architectures.md +432 -0
- package/bin/skills/moe-training/references/inference.md +348 -0
- package/bin/skills/moe-training/references/training.md +425 -0
- package/bin/skills/nanogpt/SKILL.md +290 -0
- package/bin/skills/nanogpt/references/architecture.md +382 -0
- package/bin/skills/nanogpt/references/data.md +476 -0
- package/bin/skills/nanogpt/references/training.md +564 -0
- package/bin/skills/nemo-curator/SKILL.md +383 -0
- package/bin/skills/nemo-curator/references/deduplication.md +87 -0
- package/bin/skills/nemo-curator/references/filtering.md +102 -0
- package/bin/skills/nemo-evaluator/SKILL.md +494 -0
- package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
- package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
- package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
- package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
- package/bin/skills/nemo-guardrails/SKILL.md +297 -0
- package/bin/skills/nnsight/SKILL.md +436 -0
- package/bin/skills/nnsight/references/README.md +78 -0
- package/bin/skills/nnsight/references/api.md +344 -0
- package/bin/skills/nnsight/references/tutorials.md +300 -0
- package/bin/skills/openrlhf/SKILL.md +249 -0
- package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
- package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
- package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
- package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
- package/bin/skills/outlines/SKILL.md +652 -0
- package/bin/skills/outlines/references/backends.md +615 -0
- package/bin/skills/outlines/references/examples.md +773 -0
- package/bin/skills/outlines/references/json_generation.md +652 -0
- package/bin/skills/peft/SKILL.md +431 -0
- package/bin/skills/peft/references/advanced-usage.md +514 -0
- package/bin/skills/peft/references/troubleshooting.md +480 -0
- package/bin/skills/phoenix/SKILL.md +475 -0
- package/bin/skills/phoenix/references/advanced-usage.md +619 -0
- package/bin/skills/phoenix/references/troubleshooting.md +538 -0
- package/bin/skills/pinecone/SKILL.md +358 -0
- package/bin/skills/pinecone/references/deployment.md +181 -0
- package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
- package/bin/skills/pytorch-fsdp/references/index.md +7 -0
- package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
- package/bin/skills/pytorch-lightning/SKILL.md +346 -0
- package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
- package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
- package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
- package/bin/skills/pyvene/SKILL.md +473 -0
- package/bin/skills/pyvene/references/README.md +73 -0
- package/bin/skills/pyvene/references/api.md +383 -0
- package/bin/skills/pyvene/references/tutorials.md +376 -0
- package/bin/skills/qdrant/SKILL.md +493 -0
- package/bin/skills/qdrant/references/advanced-usage.md +648 -0
- package/bin/skills/qdrant/references/troubleshooting.md +631 -0
- package/bin/skills/ray-data/SKILL.md +326 -0
- package/bin/skills/ray-data/references/integration.md +82 -0
- package/bin/skills/ray-data/references/transformations.md +83 -0
- package/bin/skills/ray-train/SKILL.md +406 -0
- package/bin/skills/ray-train/references/multi-node.md +628 -0
- package/bin/skills/rwkv/SKILL.md +260 -0
- package/bin/skills/rwkv/references/architecture-details.md +344 -0
- package/bin/skills/rwkv/references/rwkv7.md +386 -0
- package/bin/skills/rwkv/references/state-management.md +369 -0
- package/bin/skills/saelens/SKILL.md +386 -0
- package/bin/skills/saelens/references/README.md +70 -0
- package/bin/skills/saelens/references/api.md +333 -0
- package/bin/skills/saelens/references/tutorials.md +318 -0
- package/bin/skills/segment-anything/SKILL.md +500 -0
- package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
- package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
- package/bin/skills/sentence-transformers/SKILL.md +255 -0
- package/bin/skills/sentence-transformers/references/models.md +123 -0
- package/bin/skills/sentencepiece/SKILL.md +235 -0
- package/bin/skills/sentencepiece/references/algorithms.md +200 -0
- package/bin/skills/sentencepiece/references/training.md +304 -0
- package/bin/skills/sglang/SKILL.md +442 -0
- package/bin/skills/sglang/references/deployment.md +490 -0
- package/bin/skills/sglang/references/radix-attention.md +413 -0
- package/bin/skills/sglang/references/structured-generation.md +541 -0
- package/bin/skills/simpo/SKILL.md +219 -0
- package/bin/skills/simpo/references/datasets.md +478 -0
- package/bin/skills/simpo/references/hyperparameters.md +452 -0
- package/bin/skills/simpo/references/loss-functions.md +350 -0
- package/bin/skills/skypilot/SKILL.md +509 -0
- package/bin/skills/skypilot/references/advanced-usage.md +491 -0
- package/bin/skills/skypilot/references/troubleshooting.md +570 -0
- package/bin/skills/slime/SKILL.md +464 -0
- package/bin/skills/slime/references/api-reference.md +392 -0
- package/bin/skills/slime/references/troubleshooting.md +386 -0
- package/bin/skills/speculative-decoding/SKILL.md +467 -0
- package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
- package/bin/skills/speculative-decoding/references/medusa.md +350 -0
- package/bin/skills/stable-diffusion/SKILL.md +519 -0
- package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
- package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
- package/bin/skills/tensorboard/SKILL.md +629 -0
- package/bin/skills/tensorboard/references/integrations.md +638 -0
- package/bin/skills/tensorboard/references/profiling.md +545 -0
- package/bin/skills/tensorboard/references/visualization.md +620 -0
- package/bin/skills/tensorrt-llm/SKILL.md +187 -0
- package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
- package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
- package/bin/skills/tensorrt-llm/references/serving.md +470 -0
- package/bin/skills/tinker/SKILL.md +362 -0
- package/bin/skills/tinker/references/api-reference.md +168 -0
- package/bin/skills/tinker/references/getting-started.md +157 -0
- package/bin/skills/tinker/references/loss-functions.md +163 -0
- package/bin/skills/tinker/references/models-and-lora.md +139 -0
- package/bin/skills/tinker/references/recipes.md +280 -0
- package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
- package/bin/skills/tinker/references/rendering.md +243 -0
- package/bin/skills/tinker/references/supervised-learning.md +232 -0
- package/bin/skills/tinker-training-cost/SKILL.md +187 -0
- package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
- package/bin/skills/torchforge/SKILL.md +433 -0
- package/bin/skills/torchforge/references/api-reference.md +327 -0
- package/bin/skills/torchforge/references/troubleshooting.md +409 -0
- package/bin/skills/torchtitan/SKILL.md +358 -0
- package/bin/skills/torchtitan/references/checkpoint.md +181 -0
- package/bin/skills/torchtitan/references/custom-models.md +258 -0
- package/bin/skills/torchtitan/references/float8.md +133 -0
- package/bin/skills/torchtitan/references/fsdp.md +126 -0
- package/bin/skills/transformer-lens/SKILL.md +346 -0
- package/bin/skills/transformer-lens/references/README.md +54 -0
- package/bin/skills/transformer-lens/references/api.md +362 -0
- package/bin/skills/transformer-lens/references/tutorials.md +339 -0
- package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
- package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
- package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
- package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
- package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
- package/bin/skills/unsloth/SKILL.md +80 -0
- package/bin/skills/unsloth/references/index.md +7 -0
- package/bin/skills/unsloth/references/llms-full.md +16799 -0
- package/bin/skills/unsloth/references/llms-txt.md +12044 -0
- package/bin/skills/unsloth/references/llms.md +82 -0
- package/bin/skills/verl/SKILL.md +391 -0
- package/bin/skills/verl/references/api-reference.md +301 -0
- package/bin/skills/verl/references/troubleshooting.md +391 -0
- package/bin/skills/vllm/SKILL.md +364 -0
- package/bin/skills/vllm/references/optimization.md +226 -0
- package/bin/skills/vllm/references/quantization.md +284 -0
- package/bin/skills/vllm/references/server-deployment.md +255 -0
- package/bin/skills/vllm/references/troubleshooting.md +447 -0
- package/bin/skills/weights-and-biases/SKILL.md +590 -0
- package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
- package/bin/skills/weights-and-biases/references/integrations.md +700 -0
- package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
- package/bin/skills/whisper/SKILL.md +317 -0
- package/bin/skills/whisper/references/languages.md +189 -0
- package/bin/synsc +0 -0
- package/package.json +10 -0
|
@@ -0,0 +1,319 @@
|
|
|
1
|
+
---
|
|
2
|
+
title: {{TITLE}}
|
|
3
|
+
authors: {{AUTHORS}}
|
|
4
|
+
date: {{DATE}}
|
|
5
|
+
arxiv:
|
|
6
|
+
tags: [machine-learning, ai]
|
|
7
|
+
layout: modern
|
|
8
|
+
---
|
|
9
|
+
|
|
10
|
+
<div class="header">
|
|
11
|
+
|
|
12
|
+
# {{TITLE}}
|
|
13
|
+
|
|
14
|
+
<div class="authors">
|
|
15
|
+
{{AUTHORS}}
|
|
16
|
+
</div>
|
|
17
|
+
|
|
18
|
+
<div class="date">
|
|
19
|
+
{{DATE}}
|
|
20
|
+
</div>
|
|
21
|
+
|
|
22
|
+
<div class="links">
|
|
23
|
+
[arXiv](#) · [PDF](#) · [Code](#) · [Demo](#)
|
|
24
|
+
</div>
|
|
25
|
+
|
|
26
|
+
</div>
|
|
27
|
+
|
|
28
|
+
---
|
|
29
|
+
|
|
30
|
+
## Abstract
|
|
31
|
+
|
|
32
|
+
<div class="abstract">
|
|
33
|
+
|
|
34
|
+
{{ABSTRACT}}
|
|
35
|
+
|
|
36
|
+
</div>
|
|
37
|
+
|
|
38
|
+
---
|
|
39
|
+
|
|
40
|
+
## Introduction
|
|
41
|
+
|
|
42
|
+
Modern research requires clear, accessible communication. This template provides a clean, web-friendly format inspired by Distill and modern scientific publications.
|
|
43
|
+
|
|
44
|
+
<div class="key-insight">
|
|
45
|
+
💡 **Key Insight**: Present your main contribution upfront to engage readers immediately.
|
|
46
|
+
</div>
|
|
47
|
+
|
|
48
|
+
### Why This Matters
|
|
49
|
+
|
|
50
|
+
Explain the significance of your work in plain language. What real-world problems does it solve?
|
|
51
|
+
|
|
52
|
+
### Our Approach
|
|
53
|
+
|
|
54
|
+
Summarize your methodology at a high level before diving into details.
|
|
55
|
+
|
|
56
|
+
---
|
|
57
|
+
|
|
58
|
+
## Background
|
|
59
|
+
|
|
60
|
+
<div class="definition">
|
|
61
|
+
**Definition**: Clearly define key terms and concepts early in the paper.
|
|
62
|
+
</div>
|
|
63
|
+
|
|
64
|
+
Provide context necessary to understand your contribution without overwhelming readers with details.
|
|
65
|
+
|
|
66
|
+
### Problem Statement
|
|
67
|
+
|
|
68
|
+
Formally state the problem you're addressing.
|
|
69
|
+
|
|
70
|
+
### Challenges
|
|
71
|
+
|
|
72
|
+
What makes this problem difficult?
|
|
73
|
+
|
|
74
|
+
1. **Challenge 1**: Description
|
|
75
|
+
2. **Challenge 2**: Description
|
|
76
|
+
3. **Challenge 3**: Description
|
|
77
|
+
|
|
78
|
+
---
|
|
79
|
+
|
|
80
|
+
## Method
|
|
81
|
+
|
|
82
|
+
Present your approach with clear visual aids and intuitive explanations.
|
|
83
|
+
|
|
84
|
+
<div class="figure">
|
|
85
|
+
|
|
86
|
+
```
|
|
87
|
+
[Diagram of your architecture goes here]
|
|
88
|
+
```
|
|
89
|
+
|
|
90
|
+
**Figure 1**: Overview of the proposed method. Caption explains the key components.
|
|
91
|
+
|
|
92
|
+
</div>
|
|
93
|
+
|
|
94
|
+
### Model Architecture
|
|
95
|
+
|
|
96
|
+
Describe your model systematically:
|
|
97
|
+
|
|
98
|
+
```python
|
|
99
|
+
# Pseudocode example
|
|
100
|
+
class YourModel:
|
|
101
|
+
    def __init__(self):
|
|
102
|
+
        self.encoder = Encoder()
|
|
103
|
+
        self.decoder = Decoder()
|
|
104
|
+
|
|
105
|
+
    def forward(self, x):
|
|
106
|
+
        z = self.encoder(x)
|
|
107
|
+
        output = self.decoder(z)
|
|
108
|
+
        return output
|
|
109
|
+
```
|
|
110
|
+
|
|
111
|
+
### Training Strategy
|
|
112
|
+
|
|
113
|
+
Explain how you train the model, including:
|
|
114
|
+
|
|
115
|
+
- **Objective Function**: Mathematical formulation
|
|
116
|
+
- **Optimization**: Algorithm and hyperparameters
|
|
117
|
+
- **Regularization**: Techniques to prevent overfitting
|
|
118
|
+
|
|
119
|
+
---
|
|
120
|
+
|
|
121
|
+
## Experiments
|
|
122
|
+
|
|
123
|
+
### Setup
|
|
124
|
+
|
|
125
|
+
<div class="experiment-details">
|
|
126
|
+
|
|
127
|
+
| Component | Configuration |
|
|
128
|
+
|-----------|--------------|
|
|
129
|
+
| **Dataset** | Name, Size, Split |
|
|
130
|
+
| **Hardware** | GPU Type, RAM |
|
|
131
|
+
| **Framework** | PyTorch 2.0, Transformers |
|
|
132
|
+
| **Training Time** | Hours/Days |
|
|
133
|
+
|
|
134
|
+
</div>
|
|
135
|
+
|
|
136
|
+
### Results
|
|
137
|
+
|
|
138
|
+
Present results clearly with tables and visualizations.
|
|
139
|
+
|
|
140
|
+
<div class="results-table">
|
|
141
|
+
|
|
142
|
+
| Model | Accuracy | F1 Score | Params | Speed |
|
|
143
|
+
|-------|----------|----------|--------|-------|
|
|
144
|
+
| Baseline | 85.2% | 0.84 | 100M | 100 tok/s |
|
|
145
|
+
| **Ours** | **92.1%** | **0.91** | 120M | 95 tok/s |
|
|
146
|
+
| SOTA | 90.5% | 0.89 | 300M | 60 tok/s |
|
|
147
|
+
|
|
148
|
+
</div>
|
|
149
|
+
|
|
150
|
+
<div class="insight">
|
|
151
|
+
🔍 **Observation**: Our method outperforms the prior SOTA (92.1% vs. 90.5% accuracy) while using fewer parameters (120M vs. 300M).
|
|
152
|
+
</div>
|
|
153
|
+
|
|
154
|
+
### Analysis
|
|
155
|
+
|
|
156
|
+
Deep dive into what the results reveal:
|
|
157
|
+
|
|
158
|
+
1. **Performance**: How does your method compare?
|
|
159
|
+
2. **Efficiency**: What are the computational costs?
|
|
160
|
+
3. **Robustness**: How does it perform across different scenarios?
|
|
161
|
+
|
|
162
|
+
---
|
|
163
|
+
|
|
164
|
+
## Ablation Study
|
|
165
|
+
|
|
166
|
+
Systematically evaluate each component's contribution.
|
|
167
|
+
|
|
168
|
+
<div class="ablation-results">
|
|
169
|
+
|
|
170
|
+
| Configuration | Score | Δ |
|
|
171
|
+
|---------------|-------|---|
|
|
172
|
+
| Full Model | 92.1% | - |
|
|
173
|
+
| - Component A | 89.3% | -2.8% |
|
|
174
|
+
| - Component B | 90.1% | -2.0% |
|
|
175
|
+
| - Component C | 91.5% | -0.6% |
|
|
176
|
+
|
|
177
|
+
</div>
|
|
178
|
+
|
|
179
|
+
**Conclusion**: All components contribute meaningfully, with Component A being most critical.
|
|
180
|
+
|
|
181
|
+
---
|
|
182
|
+
|
|
183
|
+
## Discussion
|
|
184
|
+
|
|
185
|
+
### What We Learned
|
|
186
|
+
|
|
187
|
+
Synthesize insights from your experiments.
|
|
188
|
+
|
|
189
|
+
### Limitations
|
|
190
|
+
|
|
191
|
+
<div class="limitations">
|
|
192
|
+
|
|
193
|
+
⚠️ **Current Limitations**:
|
|
194
|
+
|
|
195
|
+
1. Performance on domain X is limited
|
|
196
|
+
2. Computational requirements are high
|
|
197
|
+
3. Requires large training datasets
|
|
198
|
+
|
|
199
|
+
</div>
|
|
200
|
+
|
|
201
|
+
### Future Directions
|
|
202
|
+
|
|
203
|
+
Where should the community go next?
|
|
204
|
+
|
|
205
|
+
- **Direction 1**: Description
|
|
206
|
+
- **Direction 2**: Description
|
|
207
|
+
- **Direction 3**: Description
|
|
208
|
+
|
|
209
|
+
---
|
|
210
|
+
|
|
211
|
+
## Related Work
|
|
212
|
+
|
|
213
|
+
Compare and contrast with existing methods.
|
|
214
|
+
|
|
215
|
+
### Prior Approaches
|
|
216
|
+
|
|
217
|
+
| Method | Year | Key Idea | Limitation |
|
|
218
|
+
|--------|------|----------|------------|
|
|
219
|
+
| Method A | 2020 | Approach 1 | Issue X |
|
|
220
|
+
| Method B | 2021 | Approach 2 | Issue Y |
|
|
221
|
+
| Method C | 2023 | Approach 3 | Issue Z |
|
|
222
|
+
|
|
223
|
+
### How We Differ
|
|
224
|
+
|
|
225
|
+
Clearly articulate what's novel about your work.
|
|
226
|
+
|
|
227
|
+
---
|
|
228
|
+
|
|
229
|
+
## Conclusion
|
|
230
|
+
|
|
231
|
+
<div class="conclusion">
|
|
232
|
+
|
|
233
|
+
We presented **{{TITLE}}**, which achieves:
|
|
234
|
+
|
|
235
|
+
1. ✅ **Main contribution 1**
|
|
236
|
+
2. ✅ **Main contribution 2**
|
|
237
|
+
3. ✅ **Main contribution 3**
|
|
238
|
+
|
|
239
|
+
Our results demonstrate [key finding], opening new directions for [future work].
|
|
240
|
+
|
|
241
|
+
</div>
|
|
242
|
+
|
|
243
|
+
---
|
|
244
|
+
|
|
245
|
+
## Reproducibility
|
|
246
|
+
|
|
247
|
+
<div class="reproducibility">
|
|
248
|
+
|
|
249
|
+
### Code & Data
|
|
250
|
+
|
|
251
|
+
- **Code**: [github.com/username/repo](#)
|
|
252
|
+
- **Models**: [huggingface.co/username/model](#)
|
|
253
|
+
- **Datasets**: [huggingface.co/datasets/username/dataset](#)
|
|
254
|
+
- **Demo**: [huggingface.co/spaces/username/demo](#)
|
|
255
|
+
|
|
256
|
+
### Citation
|
|
257
|
+
|
|
258
|
+
```bibtex
|
|
259
|
+
@article{yourpaper2025,
|
|
260
|
+
title={{{{TITLE}}}},
|
|
261
|
+
author={{{{AUTHORS}}}},
|
|
262
|
+
year={2025},
|
|
263
|
+
journal={arXiv preprint}
|
|
264
|
+
}
|
|
265
|
+
```
|
|
266
|
+
|
|
267
|
+
</div>
|
|
268
|
+
|
|
269
|
+
---
|
|
270
|
+
|
|
271
|
+
## Acknowledgments
|
|
272
|
+
|
|
273
|
+
Thank funding agencies, collaborators, and computing resources that made this work possible.
|
|
274
|
+
|
|
275
|
+
---
|
|
276
|
+
|
|
277
|
+
<div class="appendix">
|
|
278
|
+
|
|
279
|
+
## Appendix
|
|
280
|
+
|
|
281
|
+
### A. Additional Results
|
|
282
|
+
|
|
283
|
+
Supplementary experiments and extended results.
|
|
284
|
+
|
|
285
|
+
### B. Hyperparameters
|
|
286
|
+
|
|
287
|
+
Complete training configuration:
|
|
288
|
+
|
|
289
|
+
```yaml
|
|
290
|
+
learning_rate: 1e-4
|
|
291
|
+
batch_size: 32
|
|
292
|
+
epochs: 100
|
|
293
|
+
optimizer: AdamW
|
|
294
|
+
scheduler: cosine
|
|
295
|
+
warmup_steps: 1000
|
|
296
|
+
```
|
|
297
|
+
|
|
298
|
+
### C. Dataset Details
|
|
299
|
+
|
|
300
|
+
Detailed information about datasets used.
|
|
301
|
+
|
|
302
|
+
</div>
|
|
303
|
+
|
|
304
|
+
---
|
|
305
|
+
|
|
306
|
+
<style>
|
|
307
|
+
.header { text-align: center; margin-bottom: 2em; }
|
|
308
|
+
.authors { font-size: 1.2em; margin: 0.5em 0; }
|
|
309
|
+
.date { color: #666; margin: 0.5em 0; }
|
|
310
|
+
.links { margin-top: 1em; }
|
|
311
|
+
.abstract { background: #f5f5f5; padding: 1.5em; border-radius: 8px; margin: 1em 0; }
|
|
312
|
+
.key-insight, .insight { background: #e8f4f8; border-left: 4px solid #2196F3; padding: 1em; margin: 1em 0; }
|
|
313
|
+
.definition { background: #fff3e0; border-left: 4px solid #ff9800; padding: 1em; margin: 1em 0; }
|
|
314
|
+
.limitations { background: #ffebee; border-left: 4px solid #f44336; padding: 1em; margin: 1em 0; }
|
|
315
|
+
.conclusion { background: #e8f5e9; border-left: 4px solid #4caf50; padding: 1.5em; margin: 1em 0; }
|
|
316
|
+
.figure { text-align: center; margin: 2em 0; }
|
|
317
|
+
.experiment-details, .results-table, .ablation-results { margin: 1em 0; }
|
|
318
|
+
.reproducibility { background: #f5f5f5; padding: 1.5em; border-radius: 8px; margin: 2em 0; }
|
|
319
|
+
</style>
|
|
@@ -0,0 +1,201 @@
|
|
|
1
|
+
---
|
|
2
|
+
title: {{TITLE}}
|
|
3
|
+
authors: {{AUTHORS}}
|
|
4
|
+
date: {{DATE}}
|
|
5
|
+
arxiv:
|
|
6
|
+
tags: [machine-learning, deep-learning]
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
# {{TITLE}}
|
|
10
|
+
|
|
11
|
+
**{{AUTHORS}}**
|
|
12
|
+
|
|
13
|
+
*{{DATE}}*
|
|
14
|
+
|
|
15
|
+
---
|
|
16
|
+
|
|
17
|
+
## Abstract
|
|
18
|
+
|
|
19
|
+
{{ABSTRACT}}
|
|
20
|
+
|
|
21
|
+
---
|
|
22
|
+
|
|
23
|
+
## 1. Introduction
|
|
24
|
+
|
|
25
|
+
Provide background and motivation for your research. Explain:
|
|
26
|
+
- What problem are you addressing?
|
|
27
|
+
- Why is it important?
|
|
28
|
+
- What is novel about your approach?
|
|
29
|
+
|
|
30
|
+
### 1.1 Motivation
|
|
31
|
+
|
|
32
|
+
Describe the real-world context and importance of the problem.
|
|
33
|
+
|
|
34
|
+
### 1.2 Contributions
|
|
35
|
+
|
|
36
|
+
List the main contributions of your work:
|
|
37
|
+
1. First contribution
|
|
38
|
+
2. Second contribution
|
|
39
|
+
3. Third contribution
|
|
40
|
+
|
|
41
|
+
---
|
|
42
|
+
|
|
43
|
+
## 2. Related Work
|
|
44
|
+
|
|
45
|
+
Survey previous research relevant to your work. Organize by:
|
|
46
|
+
- Different approaches to the problem
|
|
47
|
+
- Complementary methods
|
|
48
|
+
- Alternative solutions
|
|
49
|
+
|
|
50
|
+
### 2.1 Previous Approaches
|
|
51
|
+
|
|
52
|
+
Discuss earlier methods and their limitations.
|
|
53
|
+
|
|
54
|
+
### 2.2 Recent Advances
|
|
55
|
+
|
|
56
|
+
Highlight recent developments in the field.
|
|
57
|
+
|
|
58
|
+
---
|
|
59
|
+
|
|
60
|
+
## 3. Background
|
|
61
|
+
|
|
62
|
+
Provide necessary technical background for understanding your work.
|
|
63
|
+
|
|
64
|
+
### 3.1 Problem Formulation
|
|
65
|
+
|
|
66
|
+
Formally define the problem you're solving.
|
|
67
|
+
|
|
68
|
+
### 3.2 Preliminaries
|
|
69
|
+
|
|
70
|
+
Introduce key concepts, notation, and terminology.
|
|
71
|
+
|
|
72
|
+
---
|
|
73
|
+
|
|
74
|
+
## 4. Methodology
|
|
75
|
+
|
|
76
|
+
Describe your approach in detail.
|
|
77
|
+
|
|
78
|
+
### 4.1 Overview
|
|
79
|
+
|
|
80
|
+
Provide a high-level description of your method.
|
|
81
|
+
|
|
82
|
+
### 4.2 Model Architecture
|
|
83
|
+
|
|
84
|
+
Detail the technical components of your system.
|
|
85
|
+
|
|
86
|
+
### 4.3 Training Procedure
|
|
87
|
+
|
|
88
|
+
Explain how the model is trained.
|
|
89
|
+
|
|
90
|
+
### 4.4 Implementation Details
|
|
91
|
+
|
|
92
|
+
Provide reproducibility information:
|
|
93
|
+
- Hyperparameters
|
|
94
|
+
- Hardware requirements
|
|
95
|
+
- Software dependencies
|
|
96
|
+
|
|
97
|
+
---
|
|
98
|
+
|
|
99
|
+
## 5. Experiments
|
|
100
|
+
|
|
101
|
+
Present your experimental setup and results.
|
|
102
|
+
|
|
103
|
+
### 5.1 Datasets
|
|
104
|
+
|
|
105
|
+
Describe the datasets used for evaluation.
|
|
106
|
+
|
|
107
|
+
### 5.2 Evaluation Metrics
|
|
108
|
+
|
|
109
|
+
Define the metrics used to assess performance.
|
|
110
|
+
|
|
111
|
+
### 5.3 Baselines
|
|
112
|
+
|
|
113
|
+
List comparison methods.
|
|
114
|
+
|
|
115
|
+
### 5.4 Experimental Setup
|
|
116
|
+
|
|
117
|
+
Detail the experimental configuration.
|
|
118
|
+
|
|
119
|
+
---
|
|
120
|
+
|
|
121
|
+
## 6. Results
|
|
122
|
+
|
|
123
|
+
Present and analyze your findings.
|
|
124
|
+
|
|
125
|
+
### 6.1 Main Results
|
|
126
|
+
|
|
127
|
+
Report primary experimental results.
|
|
128
|
+
|
|
129
|
+
| Model | Dataset | Metric | Score |
|
|
130
|
+
|-------|---------|--------|-------|
|
|
131
|
+
| Baseline | Dataset A | Accuracy | 0.85 |
|
|
132
|
+
| Ours | Dataset A | Accuracy | 0.92 |
|
|
133
|
+
|
|
134
|
+
### 6.2 Ablation Studies
|
|
135
|
+
|
|
136
|
+
Analyze the contribution of different components.
|
|
137
|
+
|
|
138
|
+
### 6.3 Qualitative Analysis
|
|
139
|
+
|
|
140
|
+
Provide examples and case studies.
|
|
141
|
+
|
|
142
|
+
---
|
|
143
|
+
|
|
144
|
+
## 7. Discussion
|
|
145
|
+
|
|
146
|
+
Interpret your results and discuss implications.
|
|
147
|
+
|
|
148
|
+
### 7.1 Analysis
|
|
149
|
+
|
|
150
|
+
What do the results tell us?
|
|
151
|
+
|
|
152
|
+
### 7.2 Limitations
|
|
153
|
+
|
|
154
|
+
Acknowledge limitations of your approach.
|
|
155
|
+
|
|
156
|
+
### 7.3 Broader Impact
|
|
157
|
+
|
|
158
|
+
Discuss societal implications and potential applications.
|
|
159
|
+
|
|
160
|
+
---
|
|
161
|
+
|
|
162
|
+
## 8. Conclusion
|
|
163
|
+
|
|
164
|
+
Summarize your work and contributions.
|
|
165
|
+
|
|
166
|
+
### 8.1 Summary
|
|
167
|
+
|
|
168
|
+
Recap the main findings.
|
|
169
|
+
|
|
170
|
+
### 8.2 Future Work
|
|
171
|
+
|
|
172
|
+
Suggest directions for future research.
|
|
173
|
+
|
|
174
|
+
---
|
|
175
|
+
|
|
176
|
+
## Acknowledgments
|
|
177
|
+
|
|
178
|
+
Thank collaborators, funding sources, and computational resources.
|
|
179
|
+
|
|
180
|
+
---
|
|
181
|
+
|
|
182
|
+
## References
|
|
183
|
+
|
|
184
|
+
1. Author A, et al. "Paper Title." Conference/Journal, Year.
|
|
185
|
+
2. Author B, et al. "Another Paper." Conference/Journal, Year.
|
|
186
|
+
|
|
187
|
+
---
|
|
188
|
+
|
|
189
|
+
## Appendix
|
|
190
|
+
|
|
191
|
+
### A. Additional Experiments
|
|
192
|
+
|
|
193
|
+
Supplementary experimental results.
|
|
194
|
+
|
|
195
|
+
### B. Implementation Details
|
|
196
|
+
|
|
197
|
+
Code snippets and configuration details.
|
|
198
|
+
|
|
199
|
+
### C. Hyperparameters
|
|
200
|
+
|
|
201
|
+
Complete list of hyperparameters used.
|
|
@@ -0,0 +1,115 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: hugging-face-tool-builder
|
|
3
|
+
description: Use this skill when the user wants to build tools/scripts or achieve a task where using data from the Hugging Face API would help. This is especially useful when chaining or combining API calls or the task will be repeated/automated. This Skill creates a reusable script to fetch, enrich or process data.
|
|
4
|
+
version: 1.0.0
|
|
5
|
+
author: Synthetic Sciences
|
|
6
|
+
license: MIT
|
|
7
|
+
tags: [Hugging Face, Tools, Agents, MCP]
|
|
8
|
+
dependencies: [huggingface-hub, transformers]
|
|
9
|
+
---
|
|
10
|
+
|
|
11
|
+
# Hugging Face API Tool Builder
|
|
12
|
+
|
|
13
|
+
Your purpose is now to create reusable command line scripts and utilities for using the Hugging Face API, allowing chaining, piping and intermediate processing where helpful. You can access the API directly, as well as use the `hf` command line tool. Model and Dataset cards can be accessed from repositories directly.
|
|
14
|
+
|
|
15
|
+
## Script Rules
|
|
16
|
+
|
|
17
|
+
Make sure to follow these rules:
|
|
18
|
+
- Scripts must take a `--help` command line argument to describe their inputs and outputs
|
|
19
|
+
- Non-destructive scripts should be tested before handing over to the User
|
|
20
|
+
- Shell scripts are preferred, but use Python or TSX if complexity or user need requires it.
|
|
21
|
+
- IMPORTANT: Use the `HF_TOKEN` environment variable as an Authorization header. For example: `curl -H "Authorization: Bearer ${HF_TOKEN}" https://huggingface.co/api/`. This provides higher rate limits and appropriate authorization for data access.
|
|
22
|
+
- Investigate the shape of the API results before committing to a final design; make use of piping and chaining where composability would be an advantage - prefer simple solutions where possible.
|
|
23
|
+
- Share usage examples once complete.
|
|
24
|
+
|
|
25
|
+
Be sure to confirm User preferences where there are questions or clarifications needed.
|
|
26
|
+
|
|
27
|
+
## Sample Scripts
|
|
28
|
+
|
|
29
|
+
Paths below are relative to this skill directory.
|
|
30
|
+
|
|
31
|
+
Reference examples:
|
|
32
|
+
- `references/hf_model_papers_auth.sh` — uses `HF_TOKEN` automatically and chains trending → model metadata → model card parsing with fallbacks; it demonstrates multi-step API usage plus auth hygiene for gated/private content.
|
|
33
|
+
- `references/find_models_by_paper.sh` — optional `HF_TOKEN` usage via `--token`, consistent authenticated search, and a retry path when arXiv-prefixed searches are too narrow; it shows resilient query strategy and clear user-facing help.
|
|
34
|
+
- `references/hf_model_card_frontmatter.sh` — uses the `hf` CLI to download model cards, extracts YAML frontmatter, and emits NDJSON summaries (license, pipeline tag, tags, gated prompt flag) for easy filtering.
|
|
35
|
+
|
|
36
|
+
Baseline examples (ultra-simple, minimal logic, raw JSON output with `HF_TOKEN` header):
|
|
37
|
+
- `references/baseline_hf_api.sh` — bash
|
|
38
|
+
- `references/baseline_hf_api.py` — python
|
|
39
|
+
- `references/baseline_hf_api.tsx` — typescript executable
|
|
40
|
+
|
|
41
|
+
Composable utility (stdin → NDJSON):
|
|
42
|
+
- `references/hf_enrich_models.sh` — reads model IDs from stdin, fetches metadata per ID, emits one JSON object per line for streaming pipelines.
|
|
43
|
+
|
|
44
|
+
Composability through piping (shell-friendly JSON output):
|
|
45
|
+
- `references/baseline_hf_api.sh 25 | jq -r '.[].id' | references/hf_enrich_models.sh | jq -s 'sort_by(.downloads) | reverse | .[:10]'`
|
|
46
|
+
- `references/baseline_hf_api.sh 50 | jq '[.[] | {id, downloads}] | sort_by(.downloads) | reverse | .[:10]'`
|
|
47
|
+
- `printf '%s\n' openai/gpt-oss-120b meta-llama/Meta-Llama-3.1-8B | references/hf_model_card_frontmatter.sh | jq -s 'map({id, license, has_extra_gated_prompt})'`
|
|
48
|
+
|
|
49
|
+
## High Level Endpoints
|
|
50
|
+
|
|
51
|
+
The following are the main API endpoints available at `https://huggingface.co`
|
|
52
|
+
|
|
53
|
+
```
|
|
54
|
+
/api/datasets
|
|
55
|
+
/api/models
|
|
56
|
+
/api/spaces
|
|
57
|
+
/api/collections
|
|
58
|
+
/api/daily_papers
|
|
59
|
+
/api/notifications
|
|
60
|
+
/api/settings
|
|
61
|
+
/api/whoami-v2
|
|
62
|
+
/api/trending
|
|
63
|
+
/oauth/userinfo
|
|
64
|
+
```
|
|
65
|
+
|
|
66
|
+
## Accessing the API
|
|
67
|
+
|
|
68
|
+
The API is documented with the OpenAPI standard at `https://huggingface.co/.well-known/openapi.json`.
|
|
69
|
+
|
|
70
|
+
**IMPORTANT:** DO NOT ATTEMPT to read `https://huggingface.co/.well-known/openapi.json` directly as it is too large to process.
|
|
71
|
+
|
|
72
|
+
**IMPORTANT:** Use `jq` to query and extract relevant parts. For example:
|
|
73
|
+
|
|
74
|
+
Command to Get All 160 Endpoints
|
|
75
|
+
|
|
76
|
+
```bash
|
|
77
|
+
curl -s "https://huggingface.co/.well-known/openapi.json" | jq '.paths | keys | sort'
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
Model Search Endpoint Details
|
|
81
|
+
|
|
82
|
+
```bash
|
|
83
|
+
curl -s "https://huggingface.co/.well-known/openapi.json" | jq '.paths["/api/models"]'
|
|
84
|
+
```
|
|
85
|
+
|
|
86
|
+
You can also query endpoints to see the shape of the data. When doing so constrain results to low numbers to make them easy to process, yet representative.
|
|
87
|
+
|
|
88
|
+
## Using the HF command line tool
|
|
89
|
+
|
|
90
|
+
The `hf` command line tool gives you further access to Hugging Face repository content and infrastructure.
|
|
91
|
+
|
|
92
|
+
```bash
|
|
93
|
+
❯ hf --help
|
|
94
|
+
Usage: hf [OPTIONS] COMMAND [ARGS]...
|
|
95
|
+
|
|
96
|
+
Hugging Face Hub CLI
|
|
97
|
+
|
|
98
|
+
Options:
|
|
99
|
+
--help Show this message and exit.
|
|
100
|
+
|
|
101
|
+
Commands:
|
|
102
|
+
auth Manage authentication (login, logout, etc.).
|
|
103
|
+
cache Manage local cache directory.
|
|
104
|
+
download Download files from the Hub.
|
|
105
|
+
endpoints Manage Hugging Face Inference Endpoints.
|
|
106
|
+
env Print information about the environment.
|
|
107
|
+
jobs Run and manage Jobs on the Hub.
|
|
108
|
+
repo Manage repos on the Hub.
|
|
109
|
+
repo-files Manage files in a repo on the Hub.
|
|
110
|
+
upload Upload a file or a folder to the Hub.
|
|
111
|
+
upload-large-folder Upload a large folder to the Hub.
|
|
112
|
+
version Print information about the hf version.
|
|
113
|
+
```
|
|
114
|
+
|
|
115
|
+
The `hf` CLI command has replaced the now deprecated `huggingface-cli` command.
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
Ultra-simple Hugging Face API example (Python).
|
|
4
|
+
|
|
5
|
+
Fetches a small list of models from the HF API and prints raw JSON.
|
|
6
|
+
Uses HF_TOKEN for auth if the environment variable is set.
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
import os
|
|
12
|
+
import sys
|
|
13
|
+
import urllib.request
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
def show_help() -> None:
    """Print usage, arguments, description, and examples to stdout.

    The text documents the single optional positional argument and its
    default so that ``--help`` fully describes the script's inputs and
    outputs.
    """
    print(
        """Ultra-simple Hugging Face API example (Python)

Usage:
  baseline_hf_api.py [limit]
  baseline_hf_api.py --help

Arguments:
  limit   Number of models to fetch; digits only (default: 3)

Description:
  Fetches a small list of models from the HF API and prints raw JSON.
  Uses HF_TOKEN for auth if the environment variable is set.

Examples:
  baseline_hf_api.py
  baseline_hf_api.py 5
  HF_TOKEN=your_token baseline_hf_api.py 10
"""
    )
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
def main() -> int:
    """Fetch a short model list from the Hugging Face API and print it.

    Reads an optional ``limit`` from ``sys.argv[1]`` (default ``"3"``) and
    the optional ``HF_TOKEN`` environment variable, which is sent as a
    Bearer token when set. The raw response body is written to stdout.

    Returns:
        0 on success or after printing help; 1 when ``limit`` is not a
        plain decimal number or when the request fails.
    """
    # Local import keeps this block self-contained; URLError is also the
    # base class of HTTPError, so one handler covers both.
    from urllib.error import URLError

    if len(sys.argv) > 1 and sys.argv[1] == "--help":
        show_help()
        return 0

    limit = sys.argv[1] if len(sys.argv) > 1 else "3"
    # str.isdigit() alone also accepts non-ASCII digits (superscripts,
    # Arabic-Indic numerals, ...) that cannot be placed in the query string,
    # so require ASCII as well.
    if not (limit.isascii() and limit.isdigit()):
        print("Error: limit must be a number", file=sys.stderr)
        return 1

    token = os.getenv("HF_TOKEN")
    headers = {"Authorization": f"Bearer {token}"} if token else {}
    url = f"https://huggingface.co/api/models?limit={limit}"

    req = urllib.request.Request(url, headers=headers)
    try:
        with urllib.request.urlopen(req) as resp:
            body = resp.read().decode("utf-8")
    except URLError as err:
        # Report HTTP/network failures as a normal CLI error, not a traceback.
        print(f"Error: request failed: {err}", file=sys.stderr)
        return 1

    sys.stdout.write(body)
    return 0


if __name__ == "__main__":
    raise SystemExit(main())
|