@synsci/cli-darwin-x64 1.1.49
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/skills/accelerate/SKILL.md +332 -0
- package/bin/skills/accelerate/references/custom-plugins.md +453 -0
- package/bin/skills/accelerate/references/megatron-integration.md +489 -0
- package/bin/skills/accelerate/references/performance.md +525 -0
- package/bin/skills/audiocraft/SKILL.md +564 -0
- package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
- package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
- package/bin/skills/autogpt/SKILL.md +403 -0
- package/bin/skills/autogpt/references/advanced-usage.md +535 -0
- package/bin/skills/autogpt/references/troubleshooting.md +420 -0
- package/bin/skills/awq/SKILL.md +310 -0
- package/bin/skills/awq/references/advanced-usage.md +324 -0
- package/bin/skills/awq/references/troubleshooting.md +344 -0
- package/bin/skills/axolotl/SKILL.md +158 -0
- package/bin/skills/axolotl/references/api.md +5548 -0
- package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
- package/bin/skills/axolotl/references/index.md +15 -0
- package/bin/skills/axolotl/references/other.md +3563 -0
- package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
- package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
- package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
- package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
- package/bin/skills/bitsandbytes/SKILL.md +411 -0
- package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
- package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
- package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
- package/bin/skills/blip-2/SKILL.md +564 -0
- package/bin/skills/blip-2/references/advanced-usage.md +680 -0
- package/bin/skills/blip-2/references/troubleshooting.md +526 -0
- package/bin/skills/chroma/SKILL.md +406 -0
- package/bin/skills/chroma/references/integration.md +38 -0
- package/bin/skills/clip/SKILL.md +253 -0
- package/bin/skills/clip/references/applications.md +207 -0
- package/bin/skills/constitutional-ai/SKILL.md +290 -0
- package/bin/skills/crewai/SKILL.md +498 -0
- package/bin/skills/crewai/references/flows.md +438 -0
- package/bin/skills/crewai/references/tools.md +429 -0
- package/bin/skills/crewai/references/troubleshooting.md +480 -0
- package/bin/skills/deepspeed/SKILL.md +141 -0
- package/bin/skills/deepspeed/references/08.md +17 -0
- package/bin/skills/deepspeed/references/09.md +173 -0
- package/bin/skills/deepspeed/references/2020.md +378 -0
- package/bin/skills/deepspeed/references/2023.md +279 -0
- package/bin/skills/deepspeed/references/assets.md +179 -0
- package/bin/skills/deepspeed/references/index.md +35 -0
- package/bin/skills/deepspeed/references/mii.md +118 -0
- package/bin/skills/deepspeed/references/other.md +1191 -0
- package/bin/skills/deepspeed/references/tutorials.md +6554 -0
- package/bin/skills/dspy/SKILL.md +590 -0
- package/bin/skills/dspy/references/examples.md +663 -0
- package/bin/skills/dspy/references/modules.md +475 -0
- package/bin/skills/dspy/references/optimizers.md +566 -0
- package/bin/skills/faiss/SKILL.md +221 -0
- package/bin/skills/faiss/references/index_types.md +280 -0
- package/bin/skills/flash-attention/SKILL.md +367 -0
- package/bin/skills/flash-attention/references/benchmarks.md +215 -0
- package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
- package/bin/skills/gguf/SKILL.md +427 -0
- package/bin/skills/gguf/references/advanced-usage.md +504 -0
- package/bin/skills/gguf/references/troubleshooting.md +442 -0
- package/bin/skills/gptq/SKILL.md +450 -0
- package/bin/skills/gptq/references/calibration.md +337 -0
- package/bin/skills/gptq/references/integration.md +129 -0
- package/bin/skills/gptq/references/troubleshooting.md +95 -0
- package/bin/skills/grpo-rl-training/README.md +97 -0
- package/bin/skills/grpo-rl-training/SKILL.md +572 -0
- package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
- package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
- package/bin/skills/guidance/SKILL.md +572 -0
- package/bin/skills/guidance/references/backends.md +554 -0
- package/bin/skills/guidance/references/constraints.md +674 -0
- package/bin/skills/guidance/references/examples.md +767 -0
- package/bin/skills/hqq/SKILL.md +445 -0
- package/bin/skills/hqq/references/advanced-usage.md +528 -0
- package/bin/skills/hqq/references/troubleshooting.md +503 -0
- package/bin/skills/hugging-face-cli/SKILL.md +191 -0
- package/bin/skills/hugging-face-cli/references/commands.md +954 -0
- package/bin/skills/hugging-face-cli/references/examples.md +374 -0
- package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
- package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
- package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
- package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
- package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
- package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
- package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
- package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
- package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
- package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
- package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
- package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
- package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
- package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
- package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
- package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
- package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
- package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
- package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
- package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
- package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
- package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
- package/bin/skills/hugging-face-jobs/index.html +216 -0
- package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
- package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
- package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
- package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
- package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
- package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
- package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
- package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
- package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
- package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
- package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
- package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
- package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
- package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
- package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
- package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
- package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
- package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
- package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
- package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
- package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
- package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
- package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
- package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
- package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
- package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
- package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
- package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
- package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
- package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
- package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
- package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
- package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
- package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
- package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
- package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
- package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
- package/bin/skills/instructor/SKILL.md +740 -0
- package/bin/skills/instructor/references/examples.md +107 -0
- package/bin/skills/instructor/references/providers.md +70 -0
- package/bin/skills/instructor/references/validation.md +606 -0
- package/bin/skills/knowledge-distillation/SKILL.md +458 -0
- package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
- package/bin/skills/lambda-labs/SKILL.md +545 -0
- package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
- package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
- package/bin/skills/langchain/SKILL.md +480 -0
- package/bin/skills/langchain/references/agents.md +499 -0
- package/bin/skills/langchain/references/integration.md +562 -0
- package/bin/skills/langchain/references/rag.md +600 -0
- package/bin/skills/langsmith/SKILL.md +422 -0
- package/bin/skills/langsmith/references/advanced-usage.md +548 -0
- package/bin/skills/langsmith/references/troubleshooting.md +537 -0
- package/bin/skills/litgpt/SKILL.md +469 -0
- package/bin/skills/litgpt/references/custom-models.md +568 -0
- package/bin/skills/litgpt/references/distributed-training.md +451 -0
- package/bin/skills/litgpt/references/supported-models.md +336 -0
- package/bin/skills/litgpt/references/training-recipes.md +619 -0
- package/bin/skills/llama-cpp/SKILL.md +258 -0
- package/bin/skills/llama-cpp/references/optimization.md +89 -0
- package/bin/skills/llama-cpp/references/quantization.md +213 -0
- package/bin/skills/llama-cpp/references/server.md +125 -0
- package/bin/skills/llama-factory/SKILL.md +80 -0
- package/bin/skills/llama-factory/references/_images.md +23 -0
- package/bin/skills/llama-factory/references/advanced.md +1055 -0
- package/bin/skills/llama-factory/references/getting_started.md +349 -0
- package/bin/skills/llama-factory/references/index.md +19 -0
- package/bin/skills/llama-factory/references/other.md +31 -0
- package/bin/skills/llamaguard/SKILL.md +337 -0
- package/bin/skills/llamaindex/SKILL.md +569 -0
- package/bin/skills/llamaindex/references/agents.md +83 -0
- package/bin/skills/llamaindex/references/data_connectors.md +108 -0
- package/bin/skills/llamaindex/references/query_engines.md +406 -0
- package/bin/skills/llava/SKILL.md +304 -0
- package/bin/skills/llava/references/training.md +197 -0
- package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
- package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
- package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
- package/bin/skills/long-context/SKILL.md +536 -0
- package/bin/skills/long-context/references/extension_methods.md +468 -0
- package/bin/skills/long-context/references/fine_tuning.md +611 -0
- package/bin/skills/long-context/references/rope.md +402 -0
- package/bin/skills/mamba/SKILL.md +260 -0
- package/bin/skills/mamba/references/architecture-details.md +206 -0
- package/bin/skills/mamba/references/benchmarks.md +255 -0
- package/bin/skills/mamba/references/training-guide.md +388 -0
- package/bin/skills/megatron-core/SKILL.md +366 -0
- package/bin/skills/megatron-core/references/benchmarks.md +249 -0
- package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
- package/bin/skills/megatron-core/references/production-examples.md +473 -0
- package/bin/skills/megatron-core/references/training-recipes.md +547 -0
- package/bin/skills/miles/SKILL.md +315 -0
- package/bin/skills/miles/references/api-reference.md +141 -0
- package/bin/skills/miles/references/troubleshooting.md +352 -0
- package/bin/skills/mlflow/SKILL.md +704 -0
- package/bin/skills/mlflow/references/deployment.md +744 -0
- package/bin/skills/mlflow/references/model-registry.md +770 -0
- package/bin/skills/mlflow/references/tracking.md +680 -0
- package/bin/skills/modal/SKILL.md +341 -0
- package/bin/skills/modal/references/advanced-usage.md +503 -0
- package/bin/skills/modal/references/troubleshooting.md +494 -0
- package/bin/skills/model-merging/SKILL.md +539 -0
- package/bin/skills/model-merging/references/evaluation.md +462 -0
- package/bin/skills/model-merging/references/examples.md +428 -0
- package/bin/skills/model-merging/references/methods.md +352 -0
- package/bin/skills/model-pruning/SKILL.md +495 -0
- package/bin/skills/model-pruning/references/wanda.md +347 -0
- package/bin/skills/moe-training/SKILL.md +526 -0
- package/bin/skills/moe-training/references/architectures.md +432 -0
- package/bin/skills/moe-training/references/inference.md +348 -0
- package/bin/skills/moe-training/references/training.md +425 -0
- package/bin/skills/nanogpt/SKILL.md +290 -0
- package/bin/skills/nanogpt/references/architecture.md +382 -0
- package/bin/skills/nanogpt/references/data.md +476 -0
- package/bin/skills/nanogpt/references/training.md +564 -0
- package/bin/skills/nemo-curator/SKILL.md +383 -0
- package/bin/skills/nemo-curator/references/deduplication.md +87 -0
- package/bin/skills/nemo-curator/references/filtering.md +102 -0
- package/bin/skills/nemo-evaluator/SKILL.md +494 -0
- package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
- package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
- package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
- package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
- package/bin/skills/nemo-guardrails/SKILL.md +297 -0
- package/bin/skills/nnsight/SKILL.md +436 -0
- package/bin/skills/nnsight/references/README.md +78 -0
- package/bin/skills/nnsight/references/api.md +344 -0
- package/bin/skills/nnsight/references/tutorials.md +300 -0
- package/bin/skills/openrlhf/SKILL.md +249 -0
- package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
- package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
- package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
- package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
- package/bin/skills/outlines/SKILL.md +652 -0
- package/bin/skills/outlines/references/backends.md +615 -0
- package/bin/skills/outlines/references/examples.md +773 -0
- package/bin/skills/outlines/references/json_generation.md +652 -0
- package/bin/skills/peft/SKILL.md +431 -0
- package/bin/skills/peft/references/advanced-usage.md +514 -0
- package/bin/skills/peft/references/troubleshooting.md +480 -0
- package/bin/skills/phoenix/SKILL.md +475 -0
- package/bin/skills/phoenix/references/advanced-usage.md +619 -0
- package/bin/skills/phoenix/references/troubleshooting.md +538 -0
- package/bin/skills/pinecone/SKILL.md +358 -0
- package/bin/skills/pinecone/references/deployment.md +181 -0
- package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
- package/bin/skills/pytorch-fsdp/references/index.md +7 -0
- package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
- package/bin/skills/pytorch-lightning/SKILL.md +346 -0
- package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
- package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
- package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
- package/bin/skills/pyvene/SKILL.md +473 -0
- package/bin/skills/pyvene/references/README.md +73 -0
- package/bin/skills/pyvene/references/api.md +383 -0
- package/bin/skills/pyvene/references/tutorials.md +376 -0
- package/bin/skills/qdrant/SKILL.md +493 -0
- package/bin/skills/qdrant/references/advanced-usage.md +648 -0
- package/bin/skills/qdrant/references/troubleshooting.md +631 -0
- package/bin/skills/ray-data/SKILL.md +326 -0
- package/bin/skills/ray-data/references/integration.md +82 -0
- package/bin/skills/ray-data/references/transformations.md +83 -0
- package/bin/skills/ray-train/SKILL.md +406 -0
- package/bin/skills/ray-train/references/multi-node.md +628 -0
- package/bin/skills/rwkv/SKILL.md +260 -0
- package/bin/skills/rwkv/references/architecture-details.md +344 -0
- package/bin/skills/rwkv/references/rwkv7.md +386 -0
- package/bin/skills/rwkv/references/state-management.md +369 -0
- package/bin/skills/saelens/SKILL.md +386 -0
- package/bin/skills/saelens/references/README.md +70 -0
- package/bin/skills/saelens/references/api.md +333 -0
- package/bin/skills/saelens/references/tutorials.md +318 -0
- package/bin/skills/segment-anything/SKILL.md +500 -0
- package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
- package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
- package/bin/skills/sentence-transformers/SKILL.md +255 -0
- package/bin/skills/sentence-transformers/references/models.md +123 -0
- package/bin/skills/sentencepiece/SKILL.md +235 -0
- package/bin/skills/sentencepiece/references/algorithms.md +200 -0
- package/bin/skills/sentencepiece/references/training.md +304 -0
- package/bin/skills/sglang/SKILL.md +442 -0
- package/bin/skills/sglang/references/deployment.md +490 -0
- package/bin/skills/sglang/references/radix-attention.md +413 -0
- package/bin/skills/sglang/references/structured-generation.md +541 -0
- package/bin/skills/simpo/SKILL.md +219 -0
- package/bin/skills/simpo/references/datasets.md +478 -0
- package/bin/skills/simpo/references/hyperparameters.md +452 -0
- package/bin/skills/simpo/references/loss-functions.md +350 -0
- package/bin/skills/skypilot/SKILL.md +509 -0
- package/bin/skills/skypilot/references/advanced-usage.md +491 -0
- package/bin/skills/skypilot/references/troubleshooting.md +570 -0
- package/bin/skills/slime/SKILL.md +464 -0
- package/bin/skills/slime/references/api-reference.md +392 -0
- package/bin/skills/slime/references/troubleshooting.md +386 -0
- package/bin/skills/speculative-decoding/SKILL.md +467 -0
- package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
- package/bin/skills/speculative-decoding/references/medusa.md +350 -0
- package/bin/skills/stable-diffusion/SKILL.md +519 -0
- package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
- package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
- package/bin/skills/tensorboard/SKILL.md +629 -0
- package/bin/skills/tensorboard/references/integrations.md +638 -0
- package/bin/skills/tensorboard/references/profiling.md +545 -0
- package/bin/skills/tensorboard/references/visualization.md +620 -0
- package/bin/skills/tensorrt-llm/SKILL.md +187 -0
- package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
- package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
- package/bin/skills/tensorrt-llm/references/serving.md +470 -0
- package/bin/skills/tinker/SKILL.md +362 -0
- package/bin/skills/tinker/references/api-reference.md +168 -0
- package/bin/skills/tinker/references/getting-started.md +157 -0
- package/bin/skills/tinker/references/loss-functions.md +163 -0
- package/bin/skills/tinker/references/models-and-lora.md +139 -0
- package/bin/skills/tinker/references/recipes.md +280 -0
- package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
- package/bin/skills/tinker/references/rendering.md +243 -0
- package/bin/skills/tinker/references/supervised-learning.md +232 -0
- package/bin/skills/tinker-training-cost/SKILL.md +187 -0
- package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
- package/bin/skills/torchforge/SKILL.md +433 -0
- package/bin/skills/torchforge/references/api-reference.md +327 -0
- package/bin/skills/torchforge/references/troubleshooting.md +409 -0
- package/bin/skills/torchtitan/SKILL.md +358 -0
- package/bin/skills/torchtitan/references/checkpoint.md +181 -0
- package/bin/skills/torchtitan/references/custom-models.md +258 -0
- package/bin/skills/torchtitan/references/float8.md +133 -0
- package/bin/skills/torchtitan/references/fsdp.md +126 -0
- package/bin/skills/transformer-lens/SKILL.md +346 -0
- package/bin/skills/transformer-lens/references/README.md +54 -0
- package/bin/skills/transformer-lens/references/api.md +362 -0
- package/bin/skills/transformer-lens/references/tutorials.md +339 -0
- package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
- package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
- package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
- package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
- package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
- package/bin/skills/unsloth/SKILL.md +80 -0
- package/bin/skills/unsloth/references/index.md +7 -0
- package/bin/skills/unsloth/references/llms-full.md +16799 -0
- package/bin/skills/unsloth/references/llms-txt.md +12044 -0
- package/bin/skills/unsloth/references/llms.md +82 -0
- package/bin/skills/verl/SKILL.md +391 -0
- package/bin/skills/verl/references/api-reference.md +301 -0
- package/bin/skills/verl/references/troubleshooting.md +391 -0
- package/bin/skills/vllm/SKILL.md +364 -0
- package/bin/skills/vllm/references/optimization.md +226 -0
- package/bin/skills/vllm/references/quantization.md +284 -0
- package/bin/skills/vllm/references/server-deployment.md +255 -0
- package/bin/skills/vllm/references/troubleshooting.md +447 -0
- package/bin/skills/weights-and-biases/SKILL.md +590 -0
- package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
- package/bin/skills/weights-and-biases/references/integrations.md +700 -0
- package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
- package/bin/skills/whisper/SKILL.md +317 -0
- package/bin/skills/whisper/references/languages.md +189 -0
- package/bin/synsc +0 -0
- package/package.json +10 -0
|
@@ -0,0 +1,341 @@
|
|
|
1
|
+
---
|
|
2
|
+
name: modal-serverless-gpu
|
|
3
|
+
description: Serverless GPU cloud platform for running ML workloads. Use when you need on-demand GPU access without infrastructure management, deploying ML models as APIs, or running batch jobs with automatic scaling.
|
|
4
|
+
version: 1.0.0
|
|
5
|
+
author: Synthetic Sciences
|
|
6
|
+
license: MIT
|
|
7
|
+
tags: [Infrastructure, Serverless, GPU, Cloud, Deployment, Modal]
|
|
8
|
+
dependencies: [modal>=0.73.82]
|
|
9
|
+
---
|
|
10
|
+
|
|
11
|
+
# Modal Serverless GPU
|
|
12
|
+
|
|
13
|
+
Comprehensive guide to running ML workloads on Modal's serverless GPU cloud platform.
|
|
14
|
+
|
|
15
|
+
## When to use Modal
|
|
16
|
+
|
|
17
|
+
**Use Modal when:**
|
|
18
|
+
- Running GPU-intensive ML workloads without managing infrastructure
|
|
19
|
+
- Deploying ML models as auto-scaling APIs
|
|
20
|
+
- Running batch processing jobs (training, inference, data processing)
|
|
21
|
+
- Needing pay-per-second GPU pricing without idle costs
|
|
22
|
+
- Prototyping ML applications quickly
|
|
23
|
+
- Running scheduled jobs (cron-like workloads)
|
|
24
|
+
|
|
25
|
+
**Key features:**
|
|
26
|
+
- **Serverless GPUs**: T4, L4, A10G, L40S, A100, H100, H200, B200 on-demand
|
|
27
|
+
- **Python-native**: Define infrastructure in Python code, no YAML
|
|
28
|
+
- **Auto-scaling**: Scale to zero, scale to 100+ GPUs instantly
|
|
29
|
+
- **Sub-second cold starts**: Rust-based infrastructure for fast container launches
|
|
30
|
+
- **Container caching**: Image layers cached for rapid iteration
|
|
31
|
+
- **Web endpoints**: Deploy functions as REST APIs with zero-downtime updates
|
|
32
|
+
|
|
33
|
+
**Use alternatives instead:**
|
|
34
|
+
- **RunPod**: For longer-running pods with persistent state
|
|
35
|
+
- **Lambda Labs**: For reserved GPU instances
|
|
36
|
+
- **SkyPilot**: For multi-cloud orchestration and cost optimization
|
|
37
|
+
- **Kubernetes**: For complex multi-service architectures
|
|
38
|
+
|
|
39
|
+
## Quick start
|
|
40
|
+
|
|
41
|
+
### Installation
|
|
42
|
+
|
|
43
|
+
```bash
|
|
44
|
+
pip install modal
|
|
45
|
+
modal setup # Opens browser for authentication
|
|
46
|
+
```
|
|
47
|
+
|
|
48
|
+
### Hello World with GPU
|
|
49
|
+
|
|
50
|
+
```python
|
|
51
|
+
import modal
|
|
52
|
+
|
|
53
|
+
app = modal.App("hello-gpu")
|
|
54
|
+
|
|
55
|
+
@app.function(gpu="T4")
|
|
56
|
+
def gpu_info():
|
|
57
|
+
import subprocess
|
|
58
|
+
return subprocess.run(["nvidia-smi"], capture_output=True, text=True).stdout
|
|
59
|
+
|
|
60
|
+
@app.local_entrypoint()
|
|
61
|
+
def main():
|
|
62
|
+
print(gpu_info.remote())
|
|
63
|
+
```
|
|
64
|
+
|
|
65
|
+
Run: `modal run hello_gpu.py`
|
|
66
|
+
|
|
67
|
+
### Basic inference endpoint
|
|
68
|
+
|
|
69
|
+
```python
|
|
70
|
+
import modal
|
|
71
|
+
|
|
72
|
+
app = modal.App("text-generation")
|
|
73
|
+
image = modal.Image.debian_slim().pip_install("transformers", "torch", "accelerate")
|
|
74
|
+
|
|
75
|
+
@app.cls(gpu="A10G", image=image)
|
|
76
|
+
class TextGenerator:
|
|
77
|
+
@modal.enter()
|
|
78
|
+
def load_model(self):
|
|
79
|
+
from transformers import pipeline
|
|
80
|
+
self.pipe = pipeline("text-generation", model="gpt2", device=0)
|
|
81
|
+
|
|
82
|
+
@modal.method()
|
|
83
|
+
def generate(self, prompt: str) -> str:
|
|
84
|
+
return self.pipe(prompt, max_length=100)[0]["generated_text"]
|
|
85
|
+
|
|
86
|
+
@app.local_entrypoint()
|
|
87
|
+
def main():
|
|
88
|
+
print(TextGenerator().generate.remote("Hello, world"))
|
|
89
|
+
```
|
|
90
|
+
|
|
91
|
+
## Core concepts
|
|
92
|
+
|
|
93
|
+
### Key components
|
|
94
|
+
|
|
95
|
+
| Component | Purpose |
|
|
96
|
+
|-----------|---------|
|
|
97
|
+
| `App` | Container for functions and resources |
|
|
98
|
+
| `Function` | Serverless function with compute specs |
|
|
99
|
+
| `Cls` | Class-based functions with lifecycle hooks |
|
|
100
|
+
| `Image` | Container image definition |
|
|
101
|
+
| `Volume` | Persistent storage for models/data |
|
|
102
|
+
| `Secret` | Secure credential storage |
|
|
103
|
+
|
|
104
|
+
### Execution modes
|
|
105
|
+
|
|
106
|
+
| Command | Description |
|
|
107
|
+
|---------|-------------|
|
|
108
|
+
| `modal run script.py` | Execute and exit |
|
|
109
|
+
| `modal serve script.py` | Development with live reload |
|
|
110
|
+
| `modal deploy script.py` | Persistent cloud deployment |
|
|
111
|
+
|
|
112
|
+
## GPU configuration
|
|
113
|
+
|
|
114
|
+
### Available GPUs
|
|
115
|
+
|
|
116
|
+
| GPU | VRAM | Best For |
|
|
117
|
+
|-----|------|----------|
|
|
118
|
+
| `T4` | 16GB | Budget inference, small models |
|
|
119
|
+
| `L4` | 24GB | Inference, Ada Lovelace arch |
|
|
120
|
+
| `A10G` | 24GB | Training/inference, 3.3x faster than T4 |
|
|
121
|
+
| `L40S` | 48GB | Recommended for inference (best cost/perf) |
|
|
122
|
+
| `A100-40GB` | 40GB | Large model training |
|
|
123
|
+
| `A100-80GB` | 80GB | Very large models |
|
|
124
|
+
| `H100` | 80GB | Fastest, FP8 + Transformer Engine |
|
|
125
|
+
| `H200` | 141GB | H100 requests may be auto-upgraded to H200; 4.8TB/s memory bandwidth |
|
|
126
|
+
| `B200` | Latest | Blackwell architecture |
|
|
127
|
+
|
|
128
|
+
### GPU specification patterns
|
|
129
|
+
|
|
130
|
+
```python
|
|
131
|
+
# Single GPU
|
|
132
|
+
@app.function(gpu="A100")
|
|
133
|
+
|
|
134
|
+
# Specific memory variant
|
|
135
|
+
@app.function(gpu="A100-80GB")
|
|
136
|
+
|
|
137
|
+
# Multiple GPUs (up to 8)
|
|
138
|
+
@app.function(gpu="H100:4")
|
|
139
|
+
|
|
140
|
+
# GPU with fallbacks
|
|
141
|
+
@app.function(gpu=["H100", "A100", "L40S"])
|
|
142
|
+
|
|
143
|
+
# Any available GPU
|
|
144
|
+
@app.function(gpu="any")
|
|
145
|
+
```
|
|
146
|
+
|
|
147
|
+
## Container images
|
|
148
|
+
|
|
149
|
+
```python
|
|
150
|
+
# Basic image with pip
|
|
151
|
+
image = modal.Image.debian_slim(python_version="3.11").pip_install(
|
|
152
|
+
"torch==2.1.0", "transformers==4.36.0", "accelerate"
|
|
153
|
+
)
|
|
154
|
+
|
|
155
|
+
# From CUDA base
|
|
156
|
+
image = modal.Image.from_registry(
|
|
157
|
+
"nvidia/cuda:12.1.0-cudnn8-devel-ubuntu22.04",
|
|
158
|
+
add_python="3.11"
|
|
159
|
+
).pip_install("torch", "transformers")
|
|
160
|
+
|
|
161
|
+
# With system packages
|
|
162
|
+
image = modal.Image.debian_slim().apt_install("git", "ffmpeg").pip_install("openai-whisper")
|
|
163
|
+
```
|
|
164
|
+
|
|
165
|
+
## Persistent storage
|
|
166
|
+
|
|
167
|
+
```python
|
|
168
|
+
volume = modal.Volume.from_name("model-cache", create_if_missing=True)
|
|
169
|
+
|
|
170
|
+
@app.function(gpu="A10G", volumes={"/models": volume})
|
|
171
|
+
def load_model():
|
|
172
|
+
import os
|
|
173
|
+
model_path = "/models/llama-7b"
|
|
174
|
+
if not os.path.exists(model_path):
|
|
175
|
+
model = download_model()
|
|
176
|
+
model.save_pretrained(model_path)
|
|
177
|
+
volume.commit() # Persist changes
|
|
178
|
+
return load_from_path(model_path)
|
|
179
|
+
```
|
|
180
|
+
|
|
181
|
+
## Web endpoints
|
|
182
|
+
|
|
183
|
+
### FastAPI endpoint decorator
|
|
184
|
+
|
|
185
|
+
```python
|
|
186
|
+
@app.function()
|
|
187
|
+
@modal.fastapi_endpoint(method="POST")
|
|
188
|
+
def predict(text: str) -> dict:
|
|
189
|
+
return {"result": model.predict(text)}
|
|
190
|
+
```
|
|
191
|
+
|
|
192
|
+
### Full ASGI app
|
|
193
|
+
|
|
194
|
+
```python
|
|
195
|
+
from fastapi import FastAPI
|
|
196
|
+
web_app = FastAPI()
|
|
197
|
+
|
|
198
|
+
@web_app.post("/predict")
|
|
199
|
+
async def predict(text: str):
|
|
200
|
+
return {"result": await model.predict.remote.aio(text)}
|
|
201
|
+
|
|
202
|
+
@app.function()
|
|
203
|
+
@modal.asgi_app()
|
|
204
|
+
def fastapi_app():
|
|
205
|
+
return web_app
|
|
206
|
+
```
|
|
207
|
+
|
|
208
|
+
### Web endpoint types
|
|
209
|
+
|
|
210
|
+
| Decorator | Use Case |
|
|
211
|
+
|-----------|----------|
|
|
212
|
+
| `@modal.fastapi_endpoint()` | Simple function → API |
|
|
213
|
+
| `@modal.asgi_app()` | Full FastAPI/Starlette apps |
|
|
214
|
+
| `@modal.wsgi_app()` | Django/Flask apps |
|
|
215
|
+
| `@modal.web_server(port)` | Arbitrary HTTP servers |
|
|
216
|
+
|
|
217
|
+
## Dynamic batching
|
|
218
|
+
|
|
219
|
+
```python
|
|
220
|
+
@app.function()
|
|
221
|
+
@modal.batched(max_batch_size=32, wait_ms=100)
|
|
222
|
+
async def batch_predict(inputs: list[str]) -> list[dict]:
|
|
223
|
+
# Inputs automatically batched
|
|
224
|
+
return model.batch_predict(inputs)
|
|
225
|
+
```
|
|
226
|
+
|
|
227
|
+
## Secrets management
|
|
228
|
+
|
|
229
|
+
```bash
|
|
230
|
+
# Create secret
|
|
231
|
+
modal secret create huggingface HF_TOKEN=hf_xxx
|
|
232
|
+
```
|
|
233
|
+
|
|
234
|
+
```python
|
|
235
|
+
@app.function(secrets=[modal.Secret.from_name("huggingface")])
|
|
236
|
+
def download_model():
|
|
237
|
+
import os
|
|
238
|
+
token = os.environ["HF_TOKEN"]
|
|
239
|
+
```
|
|
240
|
+
|
|
241
|
+
## Scheduling
|
|
242
|
+
|
|
243
|
+
```python
|
|
244
|
+
@app.function(schedule=modal.Cron("0 0 * * *")) # Daily midnight
|
|
245
|
+
def daily_job():
|
|
246
|
+
pass
|
|
247
|
+
|
|
248
|
+
@app.function(schedule=modal.Period(hours=1))
|
|
249
|
+
def hourly_job():
|
|
250
|
+
pass
|
|
251
|
+
```
|
|
252
|
+
|
|
253
|
+
## Performance optimization
|
|
254
|
+
|
|
255
|
+
### Cold start mitigation
|
|
256
|
+
|
|
257
|
+
```python
|
|
258
|
+
@app.function(
|
|
259
|
+
scaledown_window=300, # Keep warm 5 min (formerly container_idle_timeout)
|
|
260
|
+
allow_concurrent_inputs=10, # Handle concurrent requests (newer Modal versions: use the @modal.concurrent(max_inputs=10) decorator instead)
|
|
261
|
+
)
|
|
262
|
+
def inference():
|
|
263
|
+
pass
|
|
264
|
+
```
|
|
265
|
+
|
|
266
|
+
### Model loading best practices
|
|
267
|
+
|
|
268
|
+
```python
|
|
269
|
+
@app.cls(gpu="A100")
|
|
270
|
+
class Model:
|
|
271
|
+
@modal.enter() # Run once at container start
|
|
272
|
+
def load(self):
|
|
273
|
+
self.model = load_model() # Load during warm-up
|
|
274
|
+
|
|
275
|
+
@modal.method()
|
|
276
|
+
def predict(self, x):
|
|
277
|
+
return self.model(x)
|
|
278
|
+
```
|
|
279
|
+
|
|
280
|
+
## Parallel processing
|
|
281
|
+
|
|
282
|
+
```python
|
|
283
|
+
@app.function()
|
|
284
|
+
def process_item(item):
|
|
285
|
+
return expensive_computation(item)
|
|
286
|
+
|
|
287
|
+
@app.function()
|
|
288
|
+
def run_parallel():
|
|
289
|
+
items = list(range(1000))
|
|
290
|
+
# Fan out to parallel containers
|
|
291
|
+
results = list(process_item.map(items))
|
|
292
|
+
return results
|
|
293
|
+
```
|
|
294
|
+
|
|
295
|
+
## Common configuration
|
|
296
|
+
|
|
297
|
+
```python
|
|
298
|
+
@app.function(
|
|
299
|
+
gpu="A100",
|
|
300
|
+
memory=32768, # 32GB RAM
|
|
301
|
+
cpu=4, # 4 CPU cores
|
|
302
|
+
timeout=3600, # 1 hour max
|
|
303
|
+
scaledown_window=120, # Keep warm 2 min (formerly container_idle_timeout)
|
|
304
|
+
retries=3, # Retry on failure
|
|
305
|
+
max_containers=10, # Max concurrent containers (formerly concurrency_limit)
|
|
306
|
+
)
|
|
307
|
+
def my_function():
|
|
308
|
+
pass
|
|
309
|
+
```
|
|
310
|
+
|
|
311
|
+
## Debugging
|
|
312
|
+
|
|
313
|
+
```python
|
|
314
|
+
# Test locally
|
|
315
|
+
if __name__ == "__main__":
|
|
316
|
+
result = my_function.local()
|
|
317
|
+
|
|
318
|
+
# View logs
|
|
319
|
+
# modal app logs my-app
|
|
320
|
+
```
|
|
321
|
+
|
|
322
|
+
## Common issues
|
|
323
|
+
|
|
324
|
+
| Issue | Solution |
|
|
325
|
+
|-------|----------|
|
|
326
|
+
| Cold start latency | Increase `scaledown_window` (formerly `container_idle_timeout`), load models in `@modal.enter()` |
|
|
327
|
+
| GPU OOM | Use larger GPU (`A100-80GB`), enable gradient checkpointing |
|
|
328
|
+
| Image build fails | Pin dependency versions, check CUDA compatibility |
|
|
329
|
+
| Timeout errors | Increase `timeout`, add checkpointing |
|
|
330
|
+
|
|
331
|
+
## References
|
|
332
|
+
|
|
333
|
+
- **[Advanced Usage](references/advanced-usage.md)** - Multi-GPU, distributed training, cost optimization
|
|
334
|
+
- **[Troubleshooting](references/troubleshooting.md)** - Common issues and solutions
|
|
335
|
+
|
|
336
|
+
## Resources
|
|
337
|
+
|
|
338
|
+
- **Documentation**: https://modal.com/docs
|
|
339
|
+
- **Examples**: https://github.com/modal-labs/modal-examples
|
|
340
|
+
- **Pricing**: https://modal.com/pricing
|
|
341
|
+
- **Discord**: https://discord.gg/modal
|