@synsci/cli-darwin-x64 1.1.49
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/skills/accelerate/SKILL.md +332 -0
- package/bin/skills/accelerate/references/custom-plugins.md +453 -0
- package/bin/skills/accelerate/references/megatron-integration.md +489 -0
- package/bin/skills/accelerate/references/performance.md +525 -0
- package/bin/skills/audiocraft/SKILL.md +564 -0
- package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
- package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
- package/bin/skills/autogpt/SKILL.md +403 -0
- package/bin/skills/autogpt/references/advanced-usage.md +535 -0
- package/bin/skills/autogpt/references/troubleshooting.md +420 -0
- package/bin/skills/awq/SKILL.md +310 -0
- package/bin/skills/awq/references/advanced-usage.md +324 -0
- package/bin/skills/awq/references/troubleshooting.md +344 -0
- package/bin/skills/axolotl/SKILL.md +158 -0
- package/bin/skills/axolotl/references/api.md +5548 -0
- package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
- package/bin/skills/axolotl/references/index.md +15 -0
- package/bin/skills/axolotl/references/other.md +3563 -0
- package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
- package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
- package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
- package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
- package/bin/skills/bitsandbytes/SKILL.md +411 -0
- package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
- package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
- package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
- package/bin/skills/blip-2/SKILL.md +564 -0
- package/bin/skills/blip-2/references/advanced-usage.md +680 -0
- package/bin/skills/blip-2/references/troubleshooting.md +526 -0
- package/bin/skills/chroma/SKILL.md +406 -0
- package/bin/skills/chroma/references/integration.md +38 -0
- package/bin/skills/clip/SKILL.md +253 -0
- package/bin/skills/clip/references/applications.md +207 -0
- package/bin/skills/constitutional-ai/SKILL.md +290 -0
- package/bin/skills/crewai/SKILL.md +498 -0
- package/bin/skills/crewai/references/flows.md +438 -0
- package/bin/skills/crewai/references/tools.md +429 -0
- package/bin/skills/crewai/references/troubleshooting.md +480 -0
- package/bin/skills/deepspeed/SKILL.md +141 -0
- package/bin/skills/deepspeed/references/08.md +17 -0
- package/bin/skills/deepspeed/references/09.md +173 -0
- package/bin/skills/deepspeed/references/2020.md +378 -0
- package/bin/skills/deepspeed/references/2023.md +279 -0
- package/bin/skills/deepspeed/references/assets.md +179 -0
- package/bin/skills/deepspeed/references/index.md +35 -0
- package/bin/skills/deepspeed/references/mii.md +118 -0
- package/bin/skills/deepspeed/references/other.md +1191 -0
- package/bin/skills/deepspeed/references/tutorials.md +6554 -0
- package/bin/skills/dspy/SKILL.md +590 -0
- package/bin/skills/dspy/references/examples.md +663 -0
- package/bin/skills/dspy/references/modules.md +475 -0
- package/bin/skills/dspy/references/optimizers.md +566 -0
- package/bin/skills/faiss/SKILL.md +221 -0
- package/bin/skills/faiss/references/index_types.md +280 -0
- package/bin/skills/flash-attention/SKILL.md +367 -0
- package/bin/skills/flash-attention/references/benchmarks.md +215 -0
- package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
- package/bin/skills/gguf/SKILL.md +427 -0
- package/bin/skills/gguf/references/advanced-usage.md +504 -0
- package/bin/skills/gguf/references/troubleshooting.md +442 -0
- package/bin/skills/gptq/SKILL.md +450 -0
- package/bin/skills/gptq/references/calibration.md +337 -0
- package/bin/skills/gptq/references/integration.md +129 -0
- package/bin/skills/gptq/references/troubleshooting.md +95 -0
- package/bin/skills/grpo-rl-training/README.md +97 -0
- package/bin/skills/grpo-rl-training/SKILL.md +572 -0
- package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
- package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
- package/bin/skills/guidance/SKILL.md +572 -0
- package/bin/skills/guidance/references/backends.md +554 -0
- package/bin/skills/guidance/references/constraints.md +674 -0
- package/bin/skills/guidance/references/examples.md +767 -0
- package/bin/skills/hqq/SKILL.md +445 -0
- package/bin/skills/hqq/references/advanced-usage.md +528 -0
- package/bin/skills/hqq/references/troubleshooting.md +503 -0
- package/bin/skills/hugging-face-cli/SKILL.md +191 -0
- package/bin/skills/hugging-face-cli/references/commands.md +954 -0
- package/bin/skills/hugging-face-cli/references/examples.md +374 -0
- package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
- package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
- package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
- package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
- package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
- package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
- package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
- package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
- package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
- package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
- package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
- package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
- package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
- package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
- package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
- package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
- package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
- package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
- package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
- package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
- package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
- package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
- package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
- package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
- package/bin/skills/hugging-face-jobs/index.html +216 -0
- package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
- package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
- package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
- package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
- package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
- package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
- package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
- package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
- package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
- package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
- package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
- package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
- package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
- package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
- package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
- package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
- package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
- package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
- package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
- package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
- package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
- package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
- package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
- package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
- package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
- package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
- package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
- package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
- package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
- package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
- package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
- package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
- package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
- package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
- package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
- package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
- package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
- package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
- package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
- package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
- package/bin/skills/instructor/SKILL.md +740 -0
- package/bin/skills/instructor/references/examples.md +107 -0
- package/bin/skills/instructor/references/providers.md +70 -0
- package/bin/skills/instructor/references/validation.md +606 -0
- package/bin/skills/knowledge-distillation/SKILL.md +458 -0
- package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
- package/bin/skills/lambda-labs/SKILL.md +545 -0
- package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
- package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
- package/bin/skills/langchain/SKILL.md +480 -0
- package/bin/skills/langchain/references/agents.md +499 -0
- package/bin/skills/langchain/references/integration.md +562 -0
- package/bin/skills/langchain/references/rag.md +600 -0
- package/bin/skills/langsmith/SKILL.md +422 -0
- package/bin/skills/langsmith/references/advanced-usage.md +548 -0
- package/bin/skills/langsmith/references/troubleshooting.md +537 -0
- package/bin/skills/litgpt/SKILL.md +469 -0
- package/bin/skills/litgpt/references/custom-models.md +568 -0
- package/bin/skills/litgpt/references/distributed-training.md +451 -0
- package/bin/skills/litgpt/references/supported-models.md +336 -0
- package/bin/skills/litgpt/references/training-recipes.md +619 -0
- package/bin/skills/llama-cpp/SKILL.md +258 -0
- package/bin/skills/llama-cpp/references/optimization.md +89 -0
- package/bin/skills/llama-cpp/references/quantization.md +213 -0
- package/bin/skills/llama-cpp/references/server.md +125 -0
- package/bin/skills/llama-factory/SKILL.md +80 -0
- package/bin/skills/llama-factory/references/_images.md +23 -0
- package/bin/skills/llama-factory/references/advanced.md +1055 -0
- package/bin/skills/llama-factory/references/getting_started.md +349 -0
- package/bin/skills/llama-factory/references/index.md +19 -0
- package/bin/skills/llama-factory/references/other.md +31 -0
- package/bin/skills/llamaguard/SKILL.md +337 -0
- package/bin/skills/llamaindex/SKILL.md +569 -0
- package/bin/skills/llamaindex/references/agents.md +83 -0
- package/bin/skills/llamaindex/references/data_connectors.md +108 -0
- package/bin/skills/llamaindex/references/query_engines.md +406 -0
- package/bin/skills/llava/SKILL.md +304 -0
- package/bin/skills/llava/references/training.md +197 -0
- package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
- package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
- package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
- package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
- package/bin/skills/long-context/SKILL.md +536 -0
- package/bin/skills/long-context/references/extension_methods.md +468 -0
- package/bin/skills/long-context/references/fine_tuning.md +611 -0
- package/bin/skills/long-context/references/rope.md +402 -0
- package/bin/skills/mamba/SKILL.md +260 -0
- package/bin/skills/mamba/references/architecture-details.md +206 -0
- package/bin/skills/mamba/references/benchmarks.md +255 -0
- package/bin/skills/mamba/references/training-guide.md +388 -0
- package/bin/skills/megatron-core/SKILL.md +366 -0
- package/bin/skills/megatron-core/references/benchmarks.md +249 -0
- package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
- package/bin/skills/megatron-core/references/production-examples.md +473 -0
- package/bin/skills/megatron-core/references/training-recipes.md +547 -0
- package/bin/skills/miles/SKILL.md +315 -0
- package/bin/skills/miles/references/api-reference.md +141 -0
- package/bin/skills/miles/references/troubleshooting.md +352 -0
- package/bin/skills/mlflow/SKILL.md +704 -0
- package/bin/skills/mlflow/references/deployment.md +744 -0
- package/bin/skills/mlflow/references/model-registry.md +770 -0
- package/bin/skills/mlflow/references/tracking.md +680 -0
- package/bin/skills/modal/SKILL.md +341 -0
- package/bin/skills/modal/references/advanced-usage.md +503 -0
- package/bin/skills/modal/references/troubleshooting.md +494 -0
- package/bin/skills/model-merging/SKILL.md +539 -0
- package/bin/skills/model-merging/references/evaluation.md +462 -0
- package/bin/skills/model-merging/references/examples.md +428 -0
- package/bin/skills/model-merging/references/methods.md +352 -0
- package/bin/skills/model-pruning/SKILL.md +495 -0
- package/bin/skills/model-pruning/references/wanda.md +347 -0
- package/bin/skills/moe-training/SKILL.md +526 -0
- package/bin/skills/moe-training/references/architectures.md +432 -0
- package/bin/skills/moe-training/references/inference.md +348 -0
- package/bin/skills/moe-training/references/training.md +425 -0
- package/bin/skills/nanogpt/SKILL.md +290 -0
- package/bin/skills/nanogpt/references/architecture.md +382 -0
- package/bin/skills/nanogpt/references/data.md +476 -0
- package/bin/skills/nanogpt/references/training.md +564 -0
- package/bin/skills/nemo-curator/SKILL.md +383 -0
- package/bin/skills/nemo-curator/references/deduplication.md +87 -0
- package/bin/skills/nemo-curator/references/filtering.md +102 -0
- package/bin/skills/nemo-evaluator/SKILL.md +494 -0
- package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
- package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
- package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
- package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
- package/bin/skills/nemo-guardrails/SKILL.md +297 -0
- package/bin/skills/nnsight/SKILL.md +436 -0
- package/bin/skills/nnsight/references/README.md +78 -0
- package/bin/skills/nnsight/references/api.md +344 -0
- package/bin/skills/nnsight/references/tutorials.md +300 -0
- package/bin/skills/openrlhf/SKILL.md +249 -0
- package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
- package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
- package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
- package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
- package/bin/skills/outlines/SKILL.md +652 -0
- package/bin/skills/outlines/references/backends.md +615 -0
- package/bin/skills/outlines/references/examples.md +773 -0
- package/bin/skills/outlines/references/json_generation.md +652 -0
- package/bin/skills/peft/SKILL.md +431 -0
- package/bin/skills/peft/references/advanced-usage.md +514 -0
- package/bin/skills/peft/references/troubleshooting.md +480 -0
- package/bin/skills/phoenix/SKILL.md +475 -0
- package/bin/skills/phoenix/references/advanced-usage.md +619 -0
- package/bin/skills/phoenix/references/troubleshooting.md +538 -0
- package/bin/skills/pinecone/SKILL.md +358 -0
- package/bin/skills/pinecone/references/deployment.md +181 -0
- package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
- package/bin/skills/pytorch-fsdp/references/index.md +7 -0
- package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
- package/bin/skills/pytorch-lightning/SKILL.md +346 -0
- package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
- package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
- package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
- package/bin/skills/pyvene/SKILL.md +473 -0
- package/bin/skills/pyvene/references/README.md +73 -0
- package/bin/skills/pyvene/references/api.md +383 -0
- package/bin/skills/pyvene/references/tutorials.md +376 -0
- package/bin/skills/qdrant/SKILL.md +493 -0
- package/bin/skills/qdrant/references/advanced-usage.md +648 -0
- package/bin/skills/qdrant/references/troubleshooting.md +631 -0
- package/bin/skills/ray-data/SKILL.md +326 -0
- package/bin/skills/ray-data/references/integration.md +82 -0
- package/bin/skills/ray-data/references/transformations.md +83 -0
- package/bin/skills/ray-train/SKILL.md +406 -0
- package/bin/skills/ray-train/references/multi-node.md +628 -0
- package/bin/skills/rwkv/SKILL.md +260 -0
- package/bin/skills/rwkv/references/architecture-details.md +344 -0
- package/bin/skills/rwkv/references/rwkv7.md +386 -0
- package/bin/skills/rwkv/references/state-management.md +369 -0
- package/bin/skills/saelens/SKILL.md +386 -0
- package/bin/skills/saelens/references/README.md +70 -0
- package/bin/skills/saelens/references/api.md +333 -0
- package/bin/skills/saelens/references/tutorials.md +318 -0
- package/bin/skills/segment-anything/SKILL.md +500 -0
- package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
- package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
- package/bin/skills/sentence-transformers/SKILL.md +255 -0
- package/bin/skills/sentence-transformers/references/models.md +123 -0
- package/bin/skills/sentencepiece/SKILL.md +235 -0
- package/bin/skills/sentencepiece/references/algorithms.md +200 -0
- package/bin/skills/sentencepiece/references/training.md +304 -0
- package/bin/skills/sglang/SKILL.md +442 -0
- package/bin/skills/sglang/references/deployment.md +490 -0
- package/bin/skills/sglang/references/radix-attention.md +413 -0
- package/bin/skills/sglang/references/structured-generation.md +541 -0
- package/bin/skills/simpo/SKILL.md +219 -0
- package/bin/skills/simpo/references/datasets.md +478 -0
- package/bin/skills/simpo/references/hyperparameters.md +452 -0
- package/bin/skills/simpo/references/loss-functions.md +350 -0
- package/bin/skills/skypilot/SKILL.md +509 -0
- package/bin/skills/skypilot/references/advanced-usage.md +491 -0
- package/bin/skills/skypilot/references/troubleshooting.md +570 -0
- package/bin/skills/slime/SKILL.md +464 -0
- package/bin/skills/slime/references/api-reference.md +392 -0
- package/bin/skills/slime/references/troubleshooting.md +386 -0
- package/bin/skills/speculative-decoding/SKILL.md +467 -0
- package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
- package/bin/skills/speculative-decoding/references/medusa.md +350 -0
- package/bin/skills/stable-diffusion/SKILL.md +519 -0
- package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
- package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
- package/bin/skills/tensorboard/SKILL.md +629 -0
- package/bin/skills/tensorboard/references/integrations.md +638 -0
- package/bin/skills/tensorboard/references/profiling.md +545 -0
- package/bin/skills/tensorboard/references/visualization.md +620 -0
- package/bin/skills/tensorrt-llm/SKILL.md +187 -0
- package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
- package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
- package/bin/skills/tensorrt-llm/references/serving.md +470 -0
- package/bin/skills/tinker/SKILL.md +362 -0
- package/bin/skills/tinker/references/api-reference.md +168 -0
- package/bin/skills/tinker/references/getting-started.md +157 -0
- package/bin/skills/tinker/references/loss-functions.md +163 -0
- package/bin/skills/tinker/references/models-and-lora.md +139 -0
- package/bin/skills/tinker/references/recipes.md +280 -0
- package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
- package/bin/skills/tinker/references/rendering.md +243 -0
- package/bin/skills/tinker/references/supervised-learning.md +232 -0
- package/bin/skills/tinker-training-cost/SKILL.md +187 -0
- package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
- package/bin/skills/torchforge/SKILL.md +433 -0
- package/bin/skills/torchforge/references/api-reference.md +327 -0
- package/bin/skills/torchforge/references/troubleshooting.md +409 -0
- package/bin/skills/torchtitan/SKILL.md +358 -0
- package/bin/skills/torchtitan/references/checkpoint.md +181 -0
- package/bin/skills/torchtitan/references/custom-models.md +258 -0
- package/bin/skills/torchtitan/references/float8.md +133 -0
- package/bin/skills/torchtitan/references/fsdp.md +126 -0
- package/bin/skills/transformer-lens/SKILL.md +346 -0
- package/bin/skills/transformer-lens/references/README.md +54 -0
- package/bin/skills/transformer-lens/references/api.md +362 -0
- package/bin/skills/transformer-lens/references/tutorials.md +339 -0
- package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
- package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
- package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
- package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
- package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
- package/bin/skills/unsloth/SKILL.md +80 -0
- package/bin/skills/unsloth/references/index.md +7 -0
- package/bin/skills/unsloth/references/llms-full.md +16799 -0
- package/bin/skills/unsloth/references/llms-txt.md +12044 -0
- package/bin/skills/unsloth/references/llms.md +82 -0
- package/bin/skills/verl/SKILL.md +391 -0
- package/bin/skills/verl/references/api-reference.md +301 -0
- package/bin/skills/verl/references/troubleshooting.md +391 -0
- package/bin/skills/vllm/SKILL.md +364 -0
- package/bin/skills/vllm/references/optimization.md +226 -0
- package/bin/skills/vllm/references/quantization.md +284 -0
- package/bin/skills/vllm/references/server-deployment.md +255 -0
- package/bin/skills/vllm/references/troubleshooting.md +447 -0
- package/bin/skills/weights-and-biases/SKILL.md +590 -0
- package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
- package/bin/skills/weights-and-biases/references/integrations.md +700 -0
- package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
- package/bin/skills/whisper/SKILL.md +317 -0
- package/bin/skills/whisper/references/languages.md +189 -0
- package/bin/synsc +0 -0
- package/package.json +10 -0
|
@@ -0,0 +1,394 @@
|
|
|
1
|
+
# Common Issues and Troubleshooting
|
|
2
|
+
|
|
3
|
+
Solutions to frequently encountered problems with BigCode Evaluation Harness.
|
|
4
|
+
|
|
5
|
+
## Installation Issues
|
|
6
|
+
|
|
7
|
+
### Issue: PyTorch Version Conflicts
|
|
8
|
+
|
|
9
|
+
**Symptom**: Import errors or CUDA incompatibility after installation.
|
|
10
|
+
|
|
11
|
+
**Solution**: Install PyTorch separately BEFORE installing the harness:
|
|
12
|
+
```bash
|
|
13
|
+
# Check your CUDA version
|
|
14
|
+
nvidia-smi
|
|
15
|
+
|
|
16
|
+
# Install matching PyTorch (example for CUDA 11.8)
|
|
17
|
+
pip install torch --index-url https://download.pytorch.org/whl/cu118
|
|
18
|
+
|
|
19
|
+
# Then install harness
|
|
20
|
+
pip install -e .
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
### Issue: DS-1000 Specific Requirements
|
|
24
|
+
|
|
25
|
+
**Symptom**: Errors when running DS-1000 benchmark.
|
|
26
|
+
|
|
27
|
+
**Solution**: DS-1000 requires Python 3.7.10 specifically:
|
|
28
|
+
```bash
|
|
29
|
+
# Create conda environment
|
|
30
|
+
conda create -n ds1000 python=3.7.10
|
|
31
|
+
conda activate ds1000
|
|
32
|
+
|
|
33
|
+
# Install specific dependencies
|
|
34
|
+
pip install -e ".[ds1000]"
|
|
35
|
+
pip install torch==1.12.1+cu116 --extra-index-url https://download.pytorch.org/whl/cu116
|
|
36
|
+
|
|
37
|
+
# Set environment variables
|
|
38
|
+
export TF_CPP_MIN_LOG_LEVEL=3
|
|
39
|
+
export TF_FORCE_GPU_ALLOW_GROWTH=true
|
|
40
|
+
```
|
|
41
|
+
|
|
42
|
+
### Issue: HuggingFace Authentication
|
|
43
|
+
|
|
44
|
+
**Symptom**: `401 Unauthorized` when accessing gated models/datasets.
|
|
45
|
+
|
|
46
|
+
**Solution**:
|
|
47
|
+
```bash
|
|
48
|
+
# Login to HuggingFace
|
|
49
|
+
huggingface-cli login
|
|
50
|
+
|
|
51
|
+
# Use auth token in command
|
|
52
|
+
accelerate launch main.py \
|
|
53
|
+
--model meta-llama/CodeLlama-7b-hf \
|
|
54
|
+
--use_auth_token \
|
|
55
|
+
...
|
|
56
|
+
```
|
|
57
|
+
|
|
58
|
+
## Memory Issues
|
|
59
|
+
|
|
60
|
+
### Issue: CUDA Out of Memory
|
|
61
|
+
|
|
62
|
+
**Symptom**: `torch.cuda.OutOfMemoryError: CUDA out of memory`
|
|
63
|
+
|
|
64
|
+
**Solutions**:
|
|
65
|
+
|
|
66
|
+
1. **Use quantization**:
|
|
67
|
+
```bash
|
|
68
|
+
# 8-bit quantization (saves ~50% memory)
|
|
69
|
+
accelerate launch main.py \
|
|
70
|
+
--model bigcode/starcoder2-15b \
|
|
71
|
+
--load_in_8bit \
|
|
72
|
+
...
|
|
73
|
+
|
|
74
|
+
# 4-bit quantization (saves ~75% memory)
|
|
75
|
+
accelerate launch main.py \
|
|
76
|
+
--model bigcode/starcoder2-15b \
|
|
77
|
+
--load_in_4bit \
|
|
78
|
+
...
|
|
79
|
+
```
|
|
80
|
+
|
|
81
|
+
2. **Reduce batch size**:
|
|
82
|
+
```bash
|
|
83
|
+
--batch_size 1
|
|
84
|
+
```
|
|
85
|
+
|
|
86
|
+
3. **Set memory limits**:
|
|
87
|
+
```bash
|
|
88
|
+
--max_memory_per_gpu "20GiB"
|
|
89
|
+
# OR
|
|
90
|
+
--max_memory_per_gpu auto
|
|
91
|
+
```
|
|
92
|
+
|
|
93
|
+
4. **Use half precision**:
|
|
94
|
+
```bash
|
|
95
|
+
--precision fp16
|
|
96
|
+
# OR
|
|
97
|
+
--precision bf16
|
|
98
|
+
```
|
|
99
|
+
|
|
100
|
+
### Issue: Running Out of RAM During Evaluation
|
|
101
|
+
|
|
102
|
+
**Symptom**: Process killed, system becomes unresponsive.
|
|
103
|
+
|
|
104
|
+
**Solution**: Reduce the number of samples held in memory at once:
|
|
105
|
+
```bash
|
|
106
|
+
# Save intermediate results
|
|
107
|
+
--save_every_k_tasks 10
|
|
108
|
+
|
|
109
|
+
# Evaluate subset at a time
|
|
110
|
+
--limit 50 --limit_start 0
|
|
111
|
+
# Then
|
|
112
|
+
--limit 50 --limit_start 50
|
|
113
|
+
```
|
|
114
|
+
|
|
115
|
+
## Execution Issues
|
|
116
|
+
|
|
117
|
+
### Issue: Code Execution Not Allowed
|
|
118
|
+
|
|
119
|
+
**Symptom**: Error about code execution being disabled.
|
|
120
|
+
|
|
121
|
+
**Solution**: Add the execution flag:
|
|
122
|
+
```bash
|
|
123
|
+
accelerate launch main.py \
|
|
124
|
+
--model ... \
|
|
125
|
+
--tasks humaneval \
|
|
126
|
+
--allow_code_execution # Required for unit test benchmarks
|
|
127
|
+
```
|
|
128
|
+
|
|
129
|
+
### Issue: Execution Timeout/Hang
|
|
130
|
+
|
|
131
|
+
**Symptom**: Evaluation hangs indefinitely or times out.
|
|
132
|
+
|
|
133
|
+
**Solutions**:
|
|
134
|
+
|
|
135
|
+
1. **Use Docker for isolation**:
|
|
136
|
+
```bash
|
|
137
|
+
# Generate without execution
|
|
138
|
+
accelerate launch main.py \
|
|
139
|
+
--model ... \
|
|
140
|
+
--tasks humaneval \
|
|
141
|
+
--generation_only \
|
|
142
|
+
--save_generations \
|
|
143
|
+
--save_generations_path generations.json
|
|
144
|
+
|
|
145
|
+
# Evaluate in Docker (the `evaluation-harness` image must already be built or pulled and tagged locally)
|
|
146
|
+
docker run -v "$(pwd)/generations.json:/app/generations.json:ro" \
|
|
147
|
+
-it evaluation-harness python3 main.py \
|
|
148
|
+
--tasks humaneval \
|
|
149
|
+
--load_generations_path /app/generations.json \
|
|
150
|
+
--allow_code_execution
|
|
151
|
+
```
|
|
152
|
+
|
|
153
|
+
2. **Use subsets for debugging**:
|
|
154
|
+
```bash
|
|
155
|
+
--limit 10 # Only evaluate first 10 problems
|
|
156
|
+
```
|
|
157
|
+
|
|
158
|
+
### Issue: MultiPL-E Language Runtime Errors
|
|
159
|
+
|
|
160
|
+
**Symptom**: Errors executing code in non-Python languages.
|
|
161
|
+
|
|
162
|
+
**Solution**: Use the MultiPL-E specific Docker image:
|
|
163
|
+
```bash
|
|
164
|
+
docker pull ghcr.io/bigcode-project/evaluation-harness-multiple
|
|
165
|
+
docker run -it ghcr.io/bigcode-project/evaluation-harness-multiple ...
|
|
166
|
+
```
|
|
167
|
+
|
|
168
|
+
## Result Discrepancies
|
|
169
|
+
|
|
170
|
+
### Issue: Results Don't Match Paper/Leaderboard
|
|
171
|
+
|
|
172
|
+
**Symptom**: Your pass@k scores differ from reported values.
|
|
173
|
+
|
|
174
|
+
**Common causes and fixes**:
|
|
175
|
+
|
|
176
|
+
1. **Wrong n_samples**:
|
|
177
|
+
```bash
|
|
178
|
+
# For accurate pass@k estimation, use n_samples >= 200
|
|
179
|
+
--n_samples 200
|
|
180
|
+
```
|
|
181
|
+
|
|
182
|
+
2. **Wrong temperature**:
|
|
183
|
+
```bash
|
|
184
|
+
# Papers often use different temperatures
|
|
185
|
+
# For pass@1: temperature 0.2 (near-greedy)
|
|
186
|
+
# For pass@10, pass@100: temperature 0.8 (more sampling)
|
|
187
|
+
--temperature 0.8
|
|
188
|
+
```
|
|
189
|
+
|
|
190
|
+
3. **Task name mismatch**:
|
|
191
|
+
```bash
|
|
192
|
+
# Use exact task names
|
|
193
|
+
--tasks humaneval # Correct
|
|
194
|
+
--tasks human_eval # Wrong
|
|
195
|
+
--tasks HumanEval # Wrong
|
|
196
|
+
```
|
|
197
|
+
|
|
198
|
+
4. **Prompting differences**:
|
|
199
|
+
```bash
|
|
200
|
+
# Some models need instruction formatting
|
|
201
|
+
--instruction_tokens "<s>[INST],</s>,[/INST]"
|
|
202
|
+
|
|
203
|
+
# Or specific prompt types for HumanEvalPack
|
|
204
|
+
--prompt instruct
|
|
205
|
+
```
|
|
206
|
+
|
|
207
|
+
5. **Postprocessing differences**:
|
|
208
|
+
```bash
|
|
209
|
+
# Enable/disable postprocessing
|
|
210
|
+
--postprocess True # Default
|
|
211
|
+
```
|
|
212
|
+
|
|
213
|
+
### Issue: Inconsistent Results Across Runs
|
|
214
|
+
|
|
215
|
+
**Symptom**: Different scores each time you run.
|
|
216
|
+
|
|
217
|
+
**Solution**: For reproducibility:
|
|
218
|
+
```bash
|
|
219
|
+
# Use greedy decoding for deterministic results
|
|
220
|
+
--do_sample False
|
|
221
|
+
--temperature 0.0
|
|
222
|
+
|
|
223
|
+
# OR set seeds (if using sampling)
|
|
224
|
+
# Note: Sampling inherently has variance
|
|
225
|
+
# Use high n_samples to reduce noise
|
|
226
|
+
--n_samples 200
|
|
227
|
+
```
|
|
228
|
+
|
|
229
|
+
## Model Loading Issues
|
|
230
|
+
|
|
231
|
+
### Issue: Model with Custom Code
|
|
232
|
+
|
|
233
|
+
**Symptom**: `ValueError: ... requires you to execute the configuration file`
|
|
234
|
+
|
|
235
|
+
**Solution**:
|
|
236
|
+
```bash
|
|
237
|
+
--trust_remote_code
|
|
238
|
+
```
|
|
239
|
+
|
|
240
|
+
### Issue: Private/Gated Model Access
|
|
241
|
+
|
|
242
|
+
**Symptom**: `401 Unauthorized` or `403 Forbidden`
|
|
243
|
+
|
|
244
|
+
**Solution**:
|
|
245
|
+
```bash
|
|
246
|
+
# First login
|
|
247
|
+
huggingface-cli login
|
|
248
|
+
|
|
249
|
+
# Then use auth token
|
|
250
|
+
--use_auth_token
|
|
251
|
+
```
|
|
252
|
+
|
|
253
|
+
### Issue: PEFT/LoRA Adapter Loading
|
|
254
|
+
|
|
255
|
+
**Symptom**: Can't load fine-tuned adapter.
|
|
256
|
+
|
|
257
|
+
**Solution**:
|
|
258
|
+
```bash
|
|
259
|
+
--model base-model-name \
|
|
260
|
+
--peft_model path/to/adapter
|
|
261
|
+
```
|
|
262
|
+
|
|
263
|
+
### Issue: Seq2Seq Model Not Generating
|
|
264
|
+
|
|
265
|
+
**Symptom**: Empty or truncated outputs with encoder-decoder models.
|
|
266
|
+
|
|
267
|
+
**Solution**:
|
|
268
|
+
```bash
|
|
269
|
+
--modeltype seq2seq
|
|
270
|
+
```
|
|
271
|
+
|
|
272
|
+
## Task-Specific Issues
|
|
273
|
+
|
|
274
|
+
### Issue: Low MBPP Scores with Instruction Models
|
|
275
|
+
|
|
276
|
+
**Symptom**: Instruction-tuned models score poorly on MBPP.
|
|
277
|
+
|
|
278
|
+
**Solution**: MBPP prompts are plain text, not instruction format. Consider:
|
|
279
|
+
1. Using `instruct-humaneval` for instruction models
|
|
280
|
+
2. Creating custom instruction-formatted prompts
|
|
281
|
+
|
|
282
|
+
### Issue: APPS Taking Too Long
|
|
283
|
+
|
|
284
|
+
**Symptom**: APPS evaluation runs for hours.
|
|
285
|
+
|
|
286
|
+
**Solutions**:
|
|
287
|
+
```bash
|
|
288
|
+
# Use subset
|
|
289
|
+
--limit 100
|
|
290
|
+
|
|
291
|
+
# Reduce samples
|
|
292
|
+
--n_samples 10
|
|
293
|
+
|
|
294
|
+
# Use introductory level only
|
|
295
|
+
--tasks apps-introductory
|
|
296
|
+
```
|
|
297
|
+
|
|
298
|
+
### Issue: GSM8K Wrong max_length
|
|
299
|
+
|
|
300
|
+
**Symptom**: Truncated outputs, low scores on math tasks.
|
|
301
|
+
|
|
302
|
+
**Solution**: GSM8K needs longer context for 8-shot prompts:
|
|
303
|
+
```bash
|
|
304
|
+
--max_length_generation 2048 # Not default 512
|
|
305
|
+
```
|
|
306
|
+
|
|
307
|
+
## Docker Issues
|
|
308
|
+
|
|
309
|
+
### Issue: Docker Image Pull Fails
|
|
310
|
+
|
|
311
|
+
**Symptom**: `Error response from daemon: manifest unknown`
|
|
312
|
+
|
|
313
|
+
**Solution**: Build locally:
|
|
314
|
+
```bash
|
|
315
|
+
# Clone repo
|
|
316
|
+
git clone https://github.com/bigcode-project/bigcode-evaluation-harness.git
|
|
317
|
+
cd bigcode-evaluation-harness
|
|
318
|
+
|
|
319
|
+
# Build image
|
|
320
|
+
sudo make DOCKERFILE=Dockerfile all
|
|
321
|
+
|
|
322
|
+
# For MultiPL-E
|
|
323
|
+
sudo make DOCKERFILE=Dockerfile-multiple all
|
|
324
|
+
```
|
|
325
|
+
|
|
326
|
+
### Issue: Docker Can't Access GPU
|
|
327
|
+
|
|
328
|
+
**Symptom**: No GPU available inside container.
|
|
329
|
+
|
|
330
|
+
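**Solution**: Install the NVIDIA Container Toolkit on the host (it supersedes the deprecated `nvidia-docker` wrapper), then pass `--gpus all` to `docker run`: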
|
|
331
|
+
```bash
|
|
332
|
+
docker run --gpus all -it evaluation-harness ...
|
|
333
|
+
```
|
|
334
|
+
|
|
335
|
+
## Debugging Tips
|
|
336
|
+
|
|
337
|
+
### Enable Verbose Output
|
|
338
|
+
|
|
339
|
+
```bash
|
|
340
|
+
# Check what's being generated
|
|
341
|
+
--save_generations
|
|
342
|
+
--save_references
|
|
343
|
+
|
|
344
|
+
# Inspect a few samples
|
|
345
|
+
--limit 5
|
|
346
|
+
```
|
|
347
|
+
|
|
348
|
+
### Test Reference Solutions
|
|
349
|
+
|
|
350
|
+
```bash
|
|
351
|
+
# Verify test cases pass with ground truth
|
|
352
|
+
--check_references
|
|
353
|
+
```
|
|
354
|
+
|
|
355
|
+
### Inspect Intermediate Results
|
|
356
|
+
|
|
357
|
+
```bash
|
|
358
|
+
# Save progress periodically
|
|
359
|
+
--save_every_k_tasks 10
|
|
360
|
+
--save_generations_path intermediate_generations.json
|
|
361
|
+
```
|
|
362
|
+
|
|
363
|
+
### Common Debug Workflow
|
|
364
|
+
|
|
365
|
+
```bash
|
|
366
|
+
# 1. Test with tiny subset
|
|
367
|
+
accelerate launch main.py \
|
|
368
|
+
--model your-model \
|
|
369
|
+
--tasks humaneval \
|
|
370
|
+
--limit 3 \
|
|
371
|
+
--n_samples 1 \
|
|
372
|
+
--save_generations \
|
|
373
|
+
--allow_code_execution
|
|
374
|
+
|
|
375
|
+
# 2. Inspect generations
|
|
376
|
+
cat generations.json | python -m json.tool | head -100
|
|
377
|
+
|
|
378
|
+
# 3. If looks good, scale up
|
|
379
|
+
accelerate launch main.py \
|
|
380
|
+
--model your-model \
|
|
381
|
+
--tasks humaneval \
|
|
382
|
+
--n_samples 200 \
|
|
383
|
+
--allow_code_execution
|
|
384
|
+
```
|
|
385
|
+
|
|
386
|
+
## Getting Help
|
|
387
|
+
|
|
388
|
+
1. **Check existing issues**: https://github.com/bigcode-project/bigcode-evaluation-harness/issues
|
|
389
|
+
2. **Search closed issues**: They often contain solutions
|
|
390
|
+
3. **Open new issue** with:
|
|
391
|
+
- Full command used
|
|
392
|
+
- Error message
|
|
393
|
+
- Environment details (Python version, PyTorch version, GPU)
|
|
394
|
+
- Model being evaluated
|