npm - @synsci/cli-darwin-arm64 - Versions diffs - 1.1.49 - Mend

@synsci/cli-darwin-arm64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (373) hide show

package/bin/skills/accelerate/SKILL.md +332 -0
package/bin/skills/accelerate/references/custom-plugins.md +453 -0
package/bin/skills/accelerate/references/megatron-integration.md +489 -0
package/bin/skills/accelerate/references/performance.md +525 -0
package/bin/skills/audiocraft/SKILL.md +564 -0
package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
package/bin/skills/autogpt/SKILL.md +403 -0
package/bin/skills/autogpt/references/advanced-usage.md +535 -0
package/bin/skills/autogpt/references/troubleshooting.md +420 -0
package/bin/skills/awq/SKILL.md +310 -0
package/bin/skills/awq/references/advanced-usage.md +324 -0
package/bin/skills/awq/references/troubleshooting.md +344 -0
package/bin/skills/axolotl/SKILL.md +158 -0
package/bin/skills/axolotl/references/api.md +5548 -0
package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
package/bin/skills/axolotl/references/index.md +15 -0
package/bin/skills/axolotl/references/other.md +3563 -0
package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
package/bin/skills/bitsandbytes/SKILL.md +411 -0
package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
package/bin/skills/blip-2/SKILL.md +564 -0
package/bin/skills/blip-2/references/advanced-usage.md +680 -0
package/bin/skills/blip-2/references/troubleshooting.md +526 -0
package/bin/skills/chroma/SKILL.md +406 -0
package/bin/skills/chroma/references/integration.md +38 -0
package/bin/skills/clip/SKILL.md +253 -0
package/bin/skills/clip/references/applications.md +207 -0
package/bin/skills/constitutional-ai/SKILL.md +290 -0
package/bin/skills/crewai/SKILL.md +498 -0
package/bin/skills/crewai/references/flows.md +438 -0
package/bin/skills/crewai/references/tools.md +429 -0
package/bin/skills/crewai/references/troubleshooting.md +480 -0
package/bin/skills/deepspeed/SKILL.md +141 -0
package/bin/skills/deepspeed/references/08.md +17 -0
package/bin/skills/deepspeed/references/09.md +173 -0
package/bin/skills/deepspeed/references/2020.md +378 -0
package/bin/skills/deepspeed/references/2023.md +279 -0
package/bin/skills/deepspeed/references/assets.md +179 -0
package/bin/skills/deepspeed/references/index.md +35 -0
package/bin/skills/deepspeed/references/mii.md +118 -0
package/bin/skills/deepspeed/references/other.md +1191 -0
package/bin/skills/deepspeed/references/tutorials.md +6554 -0
package/bin/skills/dspy/SKILL.md +590 -0
package/bin/skills/dspy/references/examples.md +663 -0
package/bin/skills/dspy/references/modules.md +475 -0
package/bin/skills/dspy/references/optimizers.md +566 -0
package/bin/skills/faiss/SKILL.md +221 -0
package/bin/skills/faiss/references/index_types.md +280 -0
package/bin/skills/flash-attention/SKILL.md +367 -0
package/bin/skills/flash-attention/references/benchmarks.md +215 -0
package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
package/bin/skills/gguf/SKILL.md +427 -0
package/bin/skills/gguf/references/advanced-usage.md +504 -0
package/bin/skills/gguf/references/troubleshooting.md +442 -0
package/bin/skills/gptq/SKILL.md +450 -0
package/bin/skills/gptq/references/calibration.md +337 -0
package/bin/skills/gptq/references/integration.md +129 -0
package/bin/skills/gptq/references/troubleshooting.md +95 -0
package/bin/skills/grpo-rl-training/README.md +97 -0
package/bin/skills/grpo-rl-training/SKILL.md +572 -0
package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
package/bin/skills/guidance/SKILL.md +572 -0
package/bin/skills/guidance/references/backends.md +554 -0
package/bin/skills/guidance/references/constraints.md +674 -0
package/bin/skills/guidance/references/examples.md +767 -0
package/bin/skills/hqq/SKILL.md +445 -0
package/bin/skills/hqq/references/advanced-usage.md +528 -0
package/bin/skills/hqq/references/troubleshooting.md +503 -0
package/bin/skills/hugging-face-cli/SKILL.md +191 -0
package/bin/skills/hugging-face-cli/references/commands.md +954 -0
package/bin/skills/hugging-face-cli/references/examples.md +374 -0
package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
package/bin/skills/hugging-face-jobs/index.html +216 -0
package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
package/bin/skills/instructor/SKILL.md +740 -0
package/bin/skills/instructor/references/examples.md +107 -0
package/bin/skills/instructor/references/providers.md +70 -0
package/bin/skills/instructor/references/validation.md +606 -0
package/bin/skills/knowledge-distillation/SKILL.md +458 -0
package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
package/bin/skills/lambda-labs/SKILL.md +545 -0
package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
package/bin/skills/langchain/SKILL.md +480 -0
package/bin/skills/langchain/references/agents.md +499 -0
package/bin/skills/langchain/references/integration.md +562 -0
package/bin/skills/langchain/references/rag.md +600 -0
package/bin/skills/langsmith/SKILL.md +422 -0
package/bin/skills/langsmith/references/advanced-usage.md +548 -0
package/bin/skills/langsmith/references/troubleshooting.md +537 -0
package/bin/skills/litgpt/SKILL.md +469 -0
package/bin/skills/litgpt/references/custom-models.md +568 -0
package/bin/skills/litgpt/references/distributed-training.md +451 -0
package/bin/skills/litgpt/references/supported-models.md +336 -0
package/bin/skills/litgpt/references/training-recipes.md +619 -0
package/bin/skills/llama-cpp/SKILL.md +258 -0
package/bin/skills/llama-cpp/references/optimization.md +89 -0
package/bin/skills/llama-cpp/references/quantization.md +213 -0
package/bin/skills/llama-cpp/references/server.md +125 -0
package/bin/skills/llama-factory/SKILL.md +80 -0
package/bin/skills/llama-factory/references/_images.md +23 -0
package/bin/skills/llama-factory/references/advanced.md +1055 -0
package/bin/skills/llama-factory/references/getting_started.md +349 -0
package/bin/skills/llama-factory/references/index.md +19 -0
package/bin/skills/llama-factory/references/other.md +31 -0
package/bin/skills/llamaguard/SKILL.md +337 -0
package/bin/skills/llamaindex/SKILL.md +569 -0
package/bin/skills/llamaindex/references/agents.md +83 -0
package/bin/skills/llamaindex/references/data_connectors.md +108 -0
package/bin/skills/llamaindex/references/query_engines.md +406 -0
package/bin/skills/llava/SKILL.md +304 -0
package/bin/skills/llava/references/training.md +197 -0
package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
package/bin/skills/long-context/SKILL.md +536 -0
package/bin/skills/long-context/references/extension_methods.md +468 -0
package/bin/skills/long-context/references/fine_tuning.md +611 -0
package/bin/skills/long-context/references/rope.md +402 -0
package/bin/skills/mamba/SKILL.md +260 -0
package/bin/skills/mamba/references/architecture-details.md +206 -0
package/bin/skills/mamba/references/benchmarks.md +255 -0
package/bin/skills/mamba/references/training-guide.md +388 -0
package/bin/skills/megatron-core/SKILL.md +366 -0
package/bin/skills/megatron-core/references/benchmarks.md +249 -0
package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
package/bin/skills/megatron-core/references/production-examples.md +473 -0
package/bin/skills/megatron-core/references/training-recipes.md +547 -0
package/bin/skills/miles/SKILL.md +315 -0
package/bin/skills/miles/references/api-reference.md +141 -0
package/bin/skills/miles/references/troubleshooting.md +352 -0
package/bin/skills/mlflow/SKILL.md +704 -0
package/bin/skills/mlflow/references/deployment.md +744 -0
package/bin/skills/mlflow/references/model-registry.md +770 -0
package/bin/skills/mlflow/references/tracking.md +680 -0
package/bin/skills/modal/SKILL.md +341 -0
package/bin/skills/modal/references/advanced-usage.md +503 -0
package/bin/skills/modal/references/troubleshooting.md +494 -0
package/bin/skills/model-merging/SKILL.md +539 -0
package/bin/skills/model-merging/references/evaluation.md +462 -0
package/bin/skills/model-merging/references/examples.md +428 -0
package/bin/skills/model-merging/references/methods.md +352 -0
package/bin/skills/model-pruning/SKILL.md +495 -0
package/bin/skills/model-pruning/references/wanda.md +347 -0
package/bin/skills/moe-training/SKILL.md +526 -0
package/bin/skills/moe-training/references/architectures.md +432 -0
package/bin/skills/moe-training/references/inference.md +348 -0
package/bin/skills/moe-training/references/training.md +425 -0
package/bin/skills/nanogpt/SKILL.md +290 -0
package/bin/skills/nanogpt/references/architecture.md +382 -0
package/bin/skills/nanogpt/references/data.md +476 -0
package/bin/skills/nanogpt/references/training.md +564 -0
package/bin/skills/nemo-curator/SKILL.md +383 -0
package/bin/skills/nemo-curator/references/deduplication.md +87 -0
package/bin/skills/nemo-curator/references/filtering.md +102 -0
package/bin/skills/nemo-evaluator/SKILL.md +494 -0
package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
package/bin/skills/nemo-guardrails/SKILL.md +297 -0
package/bin/skills/nnsight/SKILL.md +436 -0
package/bin/skills/nnsight/references/README.md +78 -0
package/bin/skills/nnsight/references/api.md +344 -0
package/bin/skills/nnsight/references/tutorials.md +300 -0
package/bin/skills/openrlhf/SKILL.md +249 -0
package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
package/bin/skills/outlines/SKILL.md +652 -0
package/bin/skills/outlines/references/backends.md +615 -0
package/bin/skills/outlines/references/examples.md +773 -0
package/bin/skills/outlines/references/json_generation.md +652 -0
package/bin/skills/peft/SKILL.md +431 -0
package/bin/skills/peft/references/advanced-usage.md +514 -0
package/bin/skills/peft/references/troubleshooting.md +480 -0
package/bin/skills/phoenix/SKILL.md +475 -0
package/bin/skills/phoenix/references/advanced-usage.md +619 -0
package/bin/skills/phoenix/references/troubleshooting.md +538 -0
package/bin/skills/pinecone/SKILL.md +358 -0
package/bin/skills/pinecone/references/deployment.md +181 -0
package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
package/bin/skills/pytorch-fsdp/references/index.md +7 -0
package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
package/bin/skills/pytorch-lightning/SKILL.md +346 -0
package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
package/bin/skills/pyvene/SKILL.md +473 -0
package/bin/skills/pyvene/references/README.md +73 -0
package/bin/skills/pyvene/references/api.md +383 -0
package/bin/skills/pyvene/references/tutorials.md +376 -0
package/bin/skills/qdrant/SKILL.md +493 -0
package/bin/skills/qdrant/references/advanced-usage.md +648 -0
package/bin/skills/qdrant/references/troubleshooting.md +631 -0
package/bin/skills/ray-data/SKILL.md +326 -0
package/bin/skills/ray-data/references/integration.md +82 -0
package/bin/skills/ray-data/references/transformations.md +83 -0
package/bin/skills/ray-train/SKILL.md +406 -0
package/bin/skills/ray-train/references/multi-node.md +628 -0
package/bin/skills/rwkv/SKILL.md +260 -0
package/bin/skills/rwkv/references/architecture-details.md +344 -0
package/bin/skills/rwkv/references/rwkv7.md +386 -0
package/bin/skills/rwkv/references/state-management.md +369 -0
package/bin/skills/saelens/SKILL.md +386 -0
package/bin/skills/saelens/references/README.md +70 -0
package/bin/skills/saelens/references/api.md +333 -0
package/bin/skills/saelens/references/tutorials.md +318 -0
package/bin/skills/segment-anything/SKILL.md +500 -0
package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
package/bin/skills/sentence-transformers/SKILL.md +255 -0
package/bin/skills/sentence-transformers/references/models.md +123 -0
package/bin/skills/sentencepiece/SKILL.md +235 -0
package/bin/skills/sentencepiece/references/algorithms.md +200 -0
package/bin/skills/sentencepiece/references/training.md +304 -0
package/bin/skills/sglang/SKILL.md +442 -0
package/bin/skills/sglang/references/deployment.md +490 -0
package/bin/skills/sglang/references/radix-attention.md +413 -0
package/bin/skills/sglang/references/structured-generation.md +541 -0
package/bin/skills/simpo/SKILL.md +219 -0
package/bin/skills/simpo/references/datasets.md +478 -0
package/bin/skills/simpo/references/hyperparameters.md +452 -0
package/bin/skills/simpo/references/loss-functions.md +350 -0
package/bin/skills/skypilot/SKILL.md +509 -0
package/bin/skills/skypilot/references/advanced-usage.md +491 -0
package/bin/skills/skypilot/references/troubleshooting.md +570 -0
package/bin/skills/slime/SKILL.md +464 -0
package/bin/skills/slime/references/api-reference.md +392 -0
package/bin/skills/slime/references/troubleshooting.md +386 -0
package/bin/skills/speculative-decoding/SKILL.md +467 -0
package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
package/bin/skills/speculative-decoding/references/medusa.md +350 -0
package/bin/skills/stable-diffusion/SKILL.md +519 -0
package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
package/bin/skills/tensorboard/SKILL.md +629 -0
package/bin/skills/tensorboard/references/integrations.md +638 -0
package/bin/skills/tensorboard/references/profiling.md +545 -0
package/bin/skills/tensorboard/references/visualization.md +620 -0
package/bin/skills/tensorrt-llm/SKILL.md +187 -0
package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
package/bin/skills/tensorrt-llm/references/serving.md +470 -0
package/bin/skills/tinker/SKILL.md +362 -0
package/bin/skills/tinker/references/api-reference.md +168 -0
package/bin/skills/tinker/references/getting-started.md +157 -0
package/bin/skills/tinker/references/loss-functions.md +163 -0
package/bin/skills/tinker/references/models-and-lora.md +139 -0
package/bin/skills/tinker/references/recipes.md +280 -0
package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
package/bin/skills/tinker/references/rendering.md +243 -0
package/bin/skills/tinker/references/supervised-learning.md +232 -0
package/bin/skills/tinker-training-cost/SKILL.md +187 -0
package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
package/bin/skills/torchforge/SKILL.md +433 -0
package/bin/skills/torchforge/references/api-reference.md +327 -0
package/bin/skills/torchforge/references/troubleshooting.md +409 -0
package/bin/skills/torchtitan/SKILL.md +358 -0
package/bin/skills/torchtitan/references/checkpoint.md +181 -0
package/bin/skills/torchtitan/references/custom-models.md +258 -0
package/bin/skills/torchtitan/references/float8.md +133 -0
package/bin/skills/torchtitan/references/fsdp.md +126 -0
package/bin/skills/transformer-lens/SKILL.md +346 -0
package/bin/skills/transformer-lens/references/README.md +54 -0
package/bin/skills/transformer-lens/references/api.md +362 -0
package/bin/skills/transformer-lens/references/tutorials.md +339 -0
package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
package/bin/skills/unsloth/SKILL.md +80 -0
package/bin/skills/unsloth/references/index.md +7 -0
package/bin/skills/unsloth/references/llms-full.md +16799 -0
package/bin/skills/unsloth/references/llms-txt.md +12044 -0
package/bin/skills/unsloth/references/llms.md +82 -0
package/bin/skills/verl/SKILL.md +391 -0
package/bin/skills/verl/references/api-reference.md +301 -0
package/bin/skills/verl/references/troubleshooting.md +391 -0
package/bin/skills/vllm/SKILL.md +364 -0
package/bin/skills/vllm/references/optimization.md +226 -0
package/bin/skills/vllm/references/quantization.md +284 -0
package/bin/skills/vllm/references/server-deployment.md +255 -0
package/bin/skills/vllm/references/troubleshooting.md +447 -0
package/bin/skills/weights-and-biases/SKILL.md +590 -0
package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
package/bin/skills/weights-and-biases/references/integrations.md +700 -0
package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
package/bin/skills/whisper/SKILL.md +317 -0
package/bin/skills/whisper/references/languages.md +189 -0
package/bin/synsc +0 -0
package/package.json +10 -0

package/bin/skills/litgpt/references/training-recipes.md ADDED Viewed

@@ -0,0 +1,619 @@
+# Training Recipes
+Complete hyperparameter configurations for LoRA, QLoRA, and full fine-tuning across different model sizes.
+## Overview
+LitGPT provides optimized training configurations in `config_hub/finetune/` for various model architectures and fine-tuning methods.
+**Key Configuration Files**:
+- `config_hub/finetune/*/lora.yaml` - LoRA fine-tuning
+- `config_hub/finetune/*/qlora.yaml` - 4-bit quantized LoRA
+- `config_hub/finetune/*/full.yaml` - Full fine-tuning
+## LoRA Fine-tuning Recipes
+### TinyLlama 1.1B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 8
+lr_warmup_steps: 10
+epochs: 3
+max_seq_length: 512
+# LoRA specific
+lora_r: 8
+lora_alpha: 16
+lora_dropout: 0.05
+```
+**Command**:
+```bash
+litgpt finetune_lora TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
+  --data JSON \
+  --data.json_path data/alpaca_sample.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 8 \
+  --train.lr_warmup_steps 10 \
+  --train.epochs 3 \
+  --train.max_seq_length 512 \
+  --lora_r 8 \
+  --lora_alpha 16
+```
+**Memory**: ~4GB VRAM
+**Time**: ~30 minutes on RTX 3090
+### Llama 2 7B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+# LoRA specific
+lora_r: 8
+lora_alpha: 16
+lora_dropout: 0.05
+```
+**Command**:
+```bash
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 2 \
+  --train.lr_warmup_steps 10 \
+  --train.epochs 4 \
+  --lora_r 8 \
+  --lora_alpha 16
+```
+**Memory**: ~16GB VRAM
+**Gradient Accumulation**: 4 steps (8 / 2)
+**Time**: ~6 hours on A100
+### Llama 3 8B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 1
+lr_warmup_steps: 10
+epochs: 2
+max_seq_length: 512
+# LoRA specific
+lora_r: 8
+lora_alpha: 16
+lora_dropout: 0.05
+```
+**Command**:
+```bash
+litgpt finetune_lora meta-llama/Meta-Llama-3-8B \
+  --data JSON \
+  --data.json_path data/custom_dataset.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 1 \
+  --train.lr_warmup_steps 10 \
+  --train.epochs 2 \
+  --lora_r 8
+```
+**Memory**: ~20GB VRAM
+**Gradient Accumulation**: 8 steps
+**Time**: ~8 hours on A100
+### Mistral 7B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+```
+**Command**:
+```bash
+litgpt finetune_lora mistralai/Mistral-7B-v0.1 \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 2 \
+  --train.epochs 4 \
+  --lora_r 8
+```
+**Memory**: ~16GB VRAM
+### Phi-2 LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 4
+lr_warmup_steps: 10
+epochs: 1
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+```
+**Command**:
+```bash
+litgpt finetune_lora microsoft/phi-2 \
+  --data JSON \
+  --data.json_path data/alpaca_sample.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 4 \
+  --train.epochs 1 \
+  --lora_r 8
+```
+**Memory**: ~8GB VRAM
+**Time**: ~20 minutes on RTX 3090
+### Falcon 7B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 1
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+```
+**Command**:
+```bash
+litgpt finetune_lora tiiuae/falcon-7b \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 1 \
+  --train.epochs 4 \
+  --lora_r 8
+```
+**Memory**: ~18GB VRAM
+### Gemma 7B LoRA
+**Configuration**:
+```yaml
+global_batch_size: 6
+micro_batch_size: 1
+lr_warmup_steps: 200
+epochs: 2
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+```
+**Command**:
+```bash
+litgpt finetune_lora google/gemma-7b \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 6 \
+  --train.micro_batch_size 1 \
+  --train.lr_warmup_steps 200 \
+  --train.epochs 2 \
+  --lora_r 8
+```
+**Memory**: ~18GB VRAM
+**Note**: Longer warmup (200 steps) for stability
+## QLoRA Fine-tuning Recipes
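+QLoRA stores the frozen base-model weights in 4-bit precision (`bnb.nf4`), cutting weight memory by up to ~75% relative to 16-bit weights. Total VRAM savings are smaller, because activations, LoRA parameters, and optimizer state are not quantized.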
+### TinyLlama 1.1B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 8
+lr_warmup_steps: 10
+epochs: 3
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Command**:
+```bash
+litgpt finetune_lora TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
+  --quantize bnb.nf4 \
+  --data JSON \
+  --data.json_path data/alpaca_sample.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 8 \
+  --train.epochs 3 \
+  --lora_r 8
+```
+**Memory**: ~2GB VRAM (~50% less than the ~4GB LoRA recipe)
+### Llama 2 7B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+min_lr: 6.0e-5
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Command**:
+```bash
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --quantize bnb.nf4 \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 2 \
+  --train.epochs 4 \
+  --lora_r 8
+```
+**Memory**: ~6GB VRAM (consumer GPU friendly)
+### Llama 3 8B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 10
+epochs: 2
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Command**:
+```bash
+litgpt finetune_lora meta-llama/Meta-Llama-3-8B \
+  --quantize bnb.nf4 \
+  --data JSON \
+  --data.json_path data/custom_dataset.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 2 \
+  --train.epochs 2 \
+  --lora_r 8
+```
+**Memory**: ~8GB VRAM
+### Mistral 7B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Memory**: ~6GB VRAM
+### Phi-2 QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 4
+lr_warmup_steps: 10
+epochs: 1
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Memory**: ~3GB VRAM
+### Falcon 7B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 1
+lr_warmup_steps: 10
+epochs: 4
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Memory**: ~6GB VRAM
+### Gemma 2B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 6
+micro_batch_size: 2
+lr_warmup_steps: 200
+epochs: 2
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Memory**: ~3GB VRAM
+### Gemma 7B QLoRA
+**Configuration**:
+```yaml
+global_batch_size: 6
+micro_batch_size: 1
+lr_warmup_steps: 200
+epochs: 2
+max_seq_length: 512
+lora_r: 8
+lora_alpha: 16
+quantize: "bnb.nf4"
+```
+**Memory**: ~6GB VRAM
+## Full Fine-tuning Recipes
+Full fine-tuning updates all model parameters (requires more memory).
+### TinyLlama 1.1B Full
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 2
+lr_warmup_steps: 100
+epochs: 3
+max_seq_length: 512
+learning_rate: 5e-5
+```
+**Command**:
+```bash
+litgpt finetune_full TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 2 \
+  --train.lr_warmup_steps 100 \
+  --train.epochs 3 \
+  --train.learning_rate 5e-5
+```
+**Memory**: ~12GB VRAM
+**Time**: ~4 hours on A100
+### Phi-2 Full
+**Configuration**:
+```yaml
+global_batch_size: 8
+micro_batch_size: 1
+lr_warmup_steps: 100
+epochs: 2
+max_seq_length: 512
+learning_rate: 3e-5
+```
+**Command**:
+```bash
+litgpt finetune_full microsoft/phi-2 \
+  --data JSON \
+  --data.json_path data/alpaca.json \
+  --train.global_batch_size 8 \
+  --train.micro_batch_size 1 \
+  --train.epochs 2 \
+  --train.learning_rate 3e-5
+```
+**Memory**: ~24GB VRAM
+## Common Hyperparameter Patterns
+### Learning Rates
+| Model Size | LoRA LR | Full Fine-tune LR |
+|------------|---------|-------------------|
+| <2B | 3e-4 | 5e-5 |
+| 2-10B | 1e-4 | 3e-5 |
+| 10-70B | 5e-5 | 1e-5 |
+### LoRA Rank (r)
+- **r=8**: Default, good balance (recommended)
+- **r=16**: More capacity, 2× trainable params
+- **r=32**: Maximum capacity, slower training
+- **r=4**: Minimal, fastest training
+**Rule of thumb**: Start with r=8, increase if underfitting.
+### Batch Sizes
+| GPU VRAM | Micro Batch | Global Batch |
+|----------|-------------|--------------|
+| 8GB | 1 | 8 |
+| 16GB | 2 | 8-16 |
+| 40GB | 4 | 16-32 |
+| 80GB | 8 | 32-64 |
+### Warmup Steps
+- **Small models (<2B)**: 10-50 steps
+- **Medium models (2-10B)**: 100-200 steps
+- **Large models (>10B)**: 200-500 steps
+### Epochs
+- **Instruction tuning**: 1-3 epochs
+- **Domain adaptation**: 3-5 epochs
+- **Small datasets (<10K examples)**: 5-10 epochs
+## Advanced Configurations
+### Custom Learning Rate Schedule
+```bash
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --train.learning_rate 3e-4 \
+  --train.lr_warmup_steps 100 \
+  --train.min_lr 3e-6 \
+  --train.lr_decay_iters 10000
+```
+### Gradient Accumulation
+```bash
+# Simulate global_batch_size=128 on a 16GB GPU
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --train.global_batch_size 128 \
+  --train.micro_batch_size 2
+# Accumulates over 64 steps (128 / 2)
+```
+### Mixed Precision
+```bash
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --precision bf16-mixed  # BF16 mixed precision
+# or
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --precision 16-mixed  # FP16 mixed precision
+```
+### Longer Context
+```bash
+litgpt finetune_lora meta-llama/Llama-3.1-8B \
+  --train.max_seq_length 8192 \
+  --train.micro_batch_size 1  # Reduce batch for memory
+```
+## Memory Optimization
+### Out of Memory? Try These
+1. **Enable quantization**:
+   ```bash
+   --quantize bnb.nf4  # 4-bit QLoRA
+   ```
+2. **Reduce batch size**:
+   ```bash
+   --train.micro_batch_size 1
+   ```
+3. **Lower LoRA rank**:
+   ```bash
+   --lora_r 4  # Instead of 8
+   ```
+4. **Use FSDP** (multi-GPU):
+   ```bash
+   litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+     --devices 4  # Use 4 GPUs with FSDP
+   ```
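+5. **Gradient accumulation** (keep the effective batch size while shrinking each micro-batch):
+   ```bash
+   --train.global_batch_size 16 \
+   --train.micro_batch_size 1  # Accumulates over 16 steps (16 / 1)
+   ```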
+## Data Format
+LitGPT expects JSON data in instruction format:
+```json
+[
+  {
+    "instruction": "What is the capital of France?",
+    "input": "",
+    "output": "The capital of France is Paris."
+  },
+  {
+    "instruction": "Translate to Spanish:",
+    "input": "Hello world",
+    "output": "Hola mundo"
+  }
+]
+```
+**Load custom data**:
+```bash
+litgpt finetune_lora meta-llama/Llama-2-7b-hf \
+  --data JSON \
+  --data.json_path data/my_dataset.json \
+  --data.val_split_fraction 0.1  # 10% validation
+```
+## Merge and Deploy
+After fine-tuning, merge LoRA weights:
+```bash
+litgpt merge_lora checkpoints/meta-llama/Llama-2-7b-hf/final_lora.pth
+```
+Generate with merged model:
+```bash
+litgpt generate checkpoints/meta-llama/Llama-2-7b-hf-merged/ \
+  --prompt "What is machine learning?"
+```
+Or serve via API:
+```bash
+litgpt serve checkpoints/meta-llama/Llama-2-7b-hf-merged/
+```
+## References
+- Configuration hub: `config_hub/finetune/`
+- Fine-tuning tutorial: `tutorials/finetune_*.md`
+- Memory guide: `tutorials/oom.md`