@synsci/cli-darwin-arm64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,619 @@
1
+ # Training Recipes
2
+
3
+ Complete hyperparameter configurations for LoRA, QLoRA, and full fine-tuning across different model sizes.
4
+
5
+ ## Overview
6
+
7
+ LitGPT provides optimized training configurations in `config_hub/finetune/` for various model architectures and fine-tuning methods.
8
+
9
+ **Key Configuration Files**:
10
+ - `config_hub/finetune/*/lora.yaml` - LoRA fine-tuning
11
+ - `config_hub/finetune/*/qlora.yaml` - 4-bit quantized LoRA
12
+ - `config_hub/finetune/*/full.yaml` - Full fine-tuning
13
+
14
+ ## LoRA Fine-tuning Recipes
15
+
16
+ ### TinyLlama 1.1B LoRA
17
+
18
+ **Configuration**:
19
+ ```yaml
20
+ global_batch_size: 8
21
+ micro_batch_size: 8
22
+ lr_warmup_steps: 10
23
+ epochs: 3
24
+ max_seq_length: 512
25
+
26
+ # LoRA specific
27
+ lora_r: 8
28
+ lora_alpha: 16
29
+ lora_dropout: 0.05
30
+ ```
31
+
32
+ **Command**:
33
+ ```bash
34
+ litgpt finetune_lora TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
35
+ --data JSON \
36
+ --data.json_path data/alpaca_sample.json \
37
+ --train.global_batch_size 8 \
38
+ --train.micro_batch_size 8 \
39
+ --train.lr_warmup_steps 10 \
40
+ --train.epochs 3 \
41
+ --train.max_seq_length 512 \
42
+ --lora_r 8 \
43
+ --lora_alpha 16
44
+ ```
45
+
46
+ **Memory**: ~4GB VRAM
47
+ **Time**: ~30 minutes on RTX 3090
48
+
49
+ ### Llama 2 7B LoRA
50
+
51
+ **Configuration**:
52
+ ```yaml
53
+ global_batch_size: 8
54
+ micro_batch_size: 2
55
+ lr_warmup_steps: 10
56
+ epochs: 4
57
+ max_seq_length: 512
58
+
59
+ # LoRA specific
60
+ lora_r: 8
61
+ lora_alpha: 16
62
+ lora_dropout: 0.05
63
+ ```
64
+
65
+ **Command**:
66
+ ```bash
67
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
68
+ --data JSON \
69
+ --data.json_path data/alpaca.json \
70
+ --train.global_batch_size 8 \
71
+ --train.micro_batch_size 2 \
72
+ --train.lr_warmup_steps 10 \
73
+ --train.epochs 4 \
74
+ --lora_r 8 \
75
+ --lora_alpha 16
76
+ ```
77
+
78
+ **Memory**: ~16GB VRAM
79
+ **Gradient Accumulation**: 4 steps (8 / 2)
80
+ **Time**: ~6 hours on A100
81
+
82
+ ### Llama 3 8B LoRA
83
+
84
+ **Configuration**:
85
+ ```yaml
86
+ global_batch_size: 8
87
+ micro_batch_size: 1
88
+ lr_warmup_steps: 10
89
+ epochs: 2
90
+ max_seq_length: 512
91
+
92
+ # LoRA specific
93
+ lora_r: 8
94
+ lora_alpha: 16
95
+ lora_dropout: 0.05
96
+ ```
97
+
98
+ **Command**:
99
+ ```bash
100
+ litgpt finetune_lora meta-llama/Meta-Llama-3-8B \
101
+ --data JSON \
102
+ --data.json_path data/custom_dataset.json \
103
+ --train.global_batch_size 8 \
104
+ --train.micro_batch_size 1 \
105
+ --train.lr_warmup_steps 10 \
106
+ --train.epochs 2 \
107
+ --lora_r 8
108
+ ```
109
+
110
+ **Memory**: ~20GB VRAM
111
+ **Gradient Accumulation**: 8 steps (8 / 1)
112
+ **Time**: ~8 hours on A100
113
+
114
+ ### Mistral 7B LoRA
115
+
116
+ **Configuration**:
117
+ ```yaml
118
+ global_batch_size: 8
119
+ micro_batch_size: 2
120
+ lr_warmup_steps: 10
121
+ epochs: 4
122
+ max_seq_length: 512
123
+
124
+ lora_r: 8
125
+ lora_alpha: 16
126
+ ```
127
+
128
+ **Command**:
129
+ ```bash
130
+ litgpt finetune_lora mistralai/Mistral-7B-v0.1 \
131
+ --data JSON \
132
+ --data.json_path data/alpaca.json \
133
+ --train.global_batch_size 8 \
134
+ --train.micro_batch_size 2 \
135
+ --train.epochs 4 \
136
+ --lora_r 8
137
+ ```
138
+
139
+ **Memory**: ~16GB VRAM
140
+
141
+ ### Phi-2 LoRA
142
+
143
+ **Configuration**:
144
+ ```yaml
145
+ global_batch_size: 8
146
+ micro_batch_size: 4
147
+ lr_warmup_steps: 10
148
+ epochs: 1
149
+ max_seq_length: 512
150
+
151
+ lora_r: 8
152
+ lora_alpha: 16
153
+ ```
154
+
155
+ **Command**:
156
+ ```bash
157
+ litgpt finetune_lora microsoft/phi-2 \
158
+ --data JSON \
159
+ --data.json_path data/alpaca_sample.json \
160
+ --train.global_batch_size 8 \
161
+ --train.micro_batch_size 4 \
162
+ --train.epochs 1 \
163
+ --lora_r 8
164
+ ```
165
+
166
+ **Memory**: ~8GB VRAM
167
+ **Time**: ~20 minutes on RTX 3090
168
+
169
+ ### Falcon 7B LoRA
170
+
171
+ **Configuration**:
172
+ ```yaml
173
+ global_batch_size: 8
174
+ micro_batch_size: 1
175
+ lr_warmup_steps: 10
176
+ epochs: 4
177
+ max_seq_length: 512
178
+
179
+ lora_r: 8
180
+ lora_alpha: 16
181
+ ```
182
+
183
+ **Command**:
184
+ ```bash
185
+ litgpt finetune_lora tiiuae/falcon-7b \
186
+ --data JSON \
187
+ --data.json_path data/alpaca.json \
188
+ --train.global_batch_size 8 \
189
+ --train.micro_batch_size 1 \
190
+ --train.epochs 4 \
191
+ --lora_r 8
192
+ ```
193
+
194
+ **Memory**: ~18GB VRAM
195
+
196
+ ### Gemma 7B LoRA
197
+
198
+ **Configuration**:
199
+ ```yaml
200
+ global_batch_size: 6
201
+ micro_batch_size: 1
202
+ lr_warmup_steps: 200
203
+ epochs: 2
204
+ max_seq_length: 512
205
+
206
+ lora_r: 8
207
+ lora_alpha: 16
208
+ ```
209
+
210
+ **Command**:
211
+ ```bash
212
+ litgpt finetune_lora google/gemma-7b \
213
+ --data JSON \
214
+ --data.json_path data/alpaca.json \
215
+ --train.global_batch_size 6 \
216
+ --train.micro_batch_size 1 \
217
+ --train.lr_warmup_steps 200 \
218
+ --train.epochs 2 \
219
+ --lora_r 8
220
+ ```
221
+
222
+ **Memory**: ~18GB VRAM
223
+ **Note**: Longer warmup (200 steps) for stability
224
+
225
+ ## QLoRA Fine-tuning Recipes
226
+
227
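+ QLoRA loads the frozen base model weights in 4-bit precision, cutting weight memory by ~75% relative to 16-bit. Total VRAM savings are smaller (roughly 50-60% in the recipes below) because activations, LoRA adapters, and optimizer state are not quantized.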
228
+
229
+ ### TinyLlama 1.1B QLoRA
230
+
231
+ **Configuration**:
232
+ ```yaml
233
+ global_batch_size: 8
234
+ micro_batch_size: 8
235
+ lr_warmup_steps: 10
236
+ epochs: 3
237
+ max_seq_length: 512
238
+
239
+ lora_r: 8
240
+ lora_alpha: 16
241
+ quantize: "bnb.nf4"
242
+ ```
243
+
244
+ **Command**:
245
+ ```bash
246
+ litgpt finetune_lora TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
247
+ --quantize bnb.nf4 \
248
+ --data JSON \
249
+ --data.json_path data/alpaca_sample.json \
250
+ --train.global_batch_size 8 \
251
+ --train.micro_batch_size 8 \
252
+ --train.epochs 3 \
253
+ --lora_r 8
254
+ ```
255
+
256
+ **Memory**: ~2GB VRAM (75% reduction)
257
+
258
+ ### Llama 2 7B QLoRA
259
+
260
+ **Configuration**:
261
+ ```yaml
262
+ global_batch_size: 8
263
+ micro_batch_size: 2
264
+ lr_warmup_steps: 10
265
+ epochs: 4
266
+ max_seq_length: 512
267
+ min_lr: 6.0e-5
268
+
269
+ lora_r: 8
270
+ lora_alpha: 16
271
+ quantize: "bnb.nf4"
272
+ ```
273
+
274
+ **Command**:
275
+ ```bash
276
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
277
+ --quantize bnb.nf4 \
278
+ --data JSON \
279
+ --data.json_path data/alpaca.json \
280
+ --train.global_batch_size 8 \
281
+ --train.micro_batch_size 2 \
282
+ --train.epochs 4 \
283
+ --lora_r 8
284
+ ```
285
+
286
+ **Memory**: ~6GB VRAM (consumer GPU friendly)
287
+
288
+ ### Llama 3 8B QLoRA
289
+
290
+ **Configuration**:
291
+ ```yaml
292
+ global_batch_size: 8
293
+ micro_batch_size: 2
294
+ lr_warmup_steps: 10
295
+ epochs: 2
296
+ max_seq_length: 512
297
+
298
+ lora_r: 8
299
+ lora_alpha: 16
300
+ quantize: "bnb.nf4"
301
+ ```
302
+
303
+ **Command**:
304
+ ```bash
305
+ litgpt finetune_lora meta-llama/Meta-Llama-3-8B \
306
+ --quantize bnb.nf4 \
307
+ --data JSON \
308
+ --data.json_path data/custom_dataset.json \
309
+ --train.global_batch_size 8 \
310
+ --train.micro_batch_size 2 \
311
+ --train.epochs 2 \
312
+ --lora_r 8
313
+ ```
314
+
315
+ **Memory**: ~8GB VRAM
316
+
317
+ ### Mistral 7B QLoRA
318
+
319
+ **Configuration**:
320
+ ```yaml
321
+ global_batch_size: 8
322
+ micro_batch_size: 2
323
+ lr_warmup_steps: 10
324
+ epochs: 4
325
+ max_seq_length: 512
326
+
327
+ lora_r: 8
328
+ lora_alpha: 16
329
+ quantize: "bnb.nf4"
330
+ ```
331
+
332
+ **Memory**: ~6GB VRAM
333
+
334
+ ### Phi-2 QLoRA
335
+
336
+ **Configuration**:
337
+ ```yaml
338
+ global_batch_size: 8
339
+ micro_batch_size: 4
340
+ lr_warmup_steps: 10
341
+ epochs: 1
342
+ max_seq_length: 512
343
+
344
+ lora_r: 8
345
+ lora_alpha: 16
346
+ quantize: "bnb.nf4"
347
+ ```
348
+
349
+ **Memory**: ~3GB VRAM
350
+
351
+ ### Falcon 7B QLoRA
352
+
353
+ **Configuration**:
354
+ ```yaml
355
+ global_batch_size: 8
356
+ micro_batch_size: 1
357
+ lr_warmup_steps: 10
358
+ epochs: 4
359
+ max_seq_length: 512
360
+
361
+ lora_r: 8
362
+ lora_alpha: 16
363
+ quantize: "bnb.nf4"
364
+ ```
365
+
366
+ **Memory**: ~6GB VRAM
367
+
368
+ ### Gemma 2B QLoRA
369
+
370
+ **Configuration**:
371
+ ```yaml
372
+ global_batch_size: 6
373
+ micro_batch_size: 2
374
+ lr_warmup_steps: 200
375
+ epochs: 2
376
+ max_seq_length: 512
377
+
378
+ lora_r: 8
379
+ lora_alpha: 16
380
+ quantize: "bnb.nf4"
381
+ ```
382
+
383
+ **Memory**: ~3GB VRAM
384
+
385
+ ### Gemma 7B QLoRA
386
+
387
+ **Configuration**:
388
+ ```yaml
389
+ global_batch_size: 6
390
+ micro_batch_size: 1
391
+ lr_warmup_steps: 200
392
+ epochs: 2
393
+ max_seq_length: 512
394
+
395
+ lora_r: 8
396
+ lora_alpha: 16
397
+ quantize: "bnb.nf4"
398
+ ```
399
+
400
+ **Memory**: ~6GB VRAM
401
+
402
+ ## Full Fine-tuning Recipes
403
+
404
+ Full fine-tuning updates all model parameters (requires more memory).
405
+
406
+ ### TinyLlama 1.1B Full
407
+
408
+ **Configuration**:
409
+ ```yaml
410
+ global_batch_size: 8
411
+ micro_batch_size: 2
412
+ lr_warmup_steps: 100
413
+ epochs: 3
414
+ max_seq_length: 512
415
+ learning_rate: 5e-5
416
+ ```
417
+
418
+ **Command**:
419
+ ```bash
420
+ litgpt finetune_full TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T \
421
+ --data JSON \
422
+ --data.json_path data/alpaca.json \
423
+ --train.global_batch_size 8 \
424
+ --train.micro_batch_size 2 \
425
+ --train.lr_warmup_steps 100 \
426
+ --train.epochs 3 \
427
+ --train.learning_rate 5e-5
428
+ ```
429
+
430
+ **Memory**: ~12GB VRAM
431
+ **Time**: ~4 hours on A100
432
+
433
+ ### Phi-2 Full
434
+
435
+ **Configuration**:
436
+ ```yaml
437
+ global_batch_size: 8
438
+ micro_batch_size: 1
439
+ lr_warmup_steps: 100
440
+ epochs: 2
441
+ max_seq_length: 512
442
+ learning_rate: 3e-5
443
+ ```
444
+
445
+ **Command**:
446
+ ```bash
447
+ litgpt finetune_full microsoft/phi-2 \
448
+ --data JSON \
449
+ --data.json_path data/alpaca.json \
450
+ --train.global_batch_size 8 \
451
+ --train.micro_batch_size 1 \
452
+ --train.epochs 2 \
453
+ --train.learning_rate 3e-5
454
+ ```
455
+
456
+ **Memory**: ~24GB VRAM
457
+
458
+ ## Common Hyperparameter Patterns
459
+
460
+ ### Learning Rates
461
+
462
+ | Model Size | LoRA LR | Full Fine-tune LR |
463
+ |------------|---------|-------------------|
464
+ | <2B | 3e-4 | 5e-5 |
465
+ | 2-10B | 1e-4 | 3e-5 |
466
+ | 10-70B | 5e-5 | 1e-5 |
467
+
468
+ ### LoRA Rank (r)
469
+
470
+ - **r=8**: Default, good balance (recommended)
471
+ - **r=16**: More capacity, 2× trainable params
472
+ - **r=32**: Maximum capacity, slower training
473
+ - **r=4**: Minimal, fastest training
474
+
475
+ **Rule of thumb**: Start with r=8, increase if underfitting.
476
+
477
+ ### Batch Sizes
478
+
479
+ | GPU VRAM | Micro Batch | Global Batch |
480
+ |----------|-------------|--------------|
481
+ | 8GB | 1 | 8 |
482
+ | 16GB | 2 | 8-16 |
483
+ | 40GB | 4 | 16-32 |
484
+ | 80GB | 8 | 32-64 |
485
+
486
+ ### Warmup Steps
487
+
488
+ - **Small models (<2B)**: 10-50 steps
489
+ - **Medium models (2-10B)**: 100-200 steps
490
+ - **Large models (>10B)**: 200-500 steps
491
+
492
+ ### Epochs
493
+
494
+ - **Instruction tuning**: 1-3 epochs
495
+ - **Domain adaptation**: 3-5 epochs
496
+ - **Small datasets (<10K examples)**: 5-10 epochs
497
+
498
+ ## Advanced Configurations
499
+
500
+ ### Custom Learning Rate Schedule
501
+
502
+ ```bash
503
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
504
+ --train.learning_rate 3e-4 \
505
+ --train.lr_warmup_steps 100 \
506
+ --train.min_lr 3e-6 \
507
+ --train.lr_decay_iters 10000
508
+ ```
509
+
510
+ ### Gradient Accumulation
511
+
512
+ ```bash
513
+ # Simulate global_batch_size=128 on a single 16GB GPU
514
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
515
+ --train.global_batch_size 128 \
516
+ --train.micro_batch_size 2
517
+ # Accumulates over 64 steps (128 / 2)
518
+ ```
519
+
520
+ ### Mixed Precision
521
+
522
+ ```bash
523
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
524
+ --precision bf16-mixed # BF16 mixed precision
525
+ # or
526
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf --precision 16-mixed # FP16 mixed precision
527
+ ```
528
+
529
+ ### Longer Context
530
+
531
+ ```bash
532
+ litgpt finetune_lora meta-llama/Llama-3.1-8B \
533
+ --train.max_seq_length 8192 \
534
+ --train.micro_batch_size 1 # Reduce batch for memory
535
+ ```
536
+
537
+ ## Memory Optimization
538
+
539
+ ### Out of Memory? Try These
540
+
541
+ 1. **Enable quantization**:
542
+ ```bash
543
+ --quantize bnb.nf4 # 4-bit QLoRA
544
+ ```
545
+
546
+ 2. **Reduce batch size**:
547
+ ```bash
548
+ --train.micro_batch_size 1
549
+ ```
550
+
551
+ 3. **Lower LoRA rank**:
552
+ ```bash
553
+ --lora_r 4 # Instead of 8
554
+ ```
555
+
556
+ 4. **Use FSDP** (multi-GPU):
557
+ ```bash
558
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
559
+ --devices 4 # Use 4 GPUs with FSDP
560
+ ```
561
+
562
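+ 5. **Use gradient accumulation** (keep the effective batch size with a smaller micro batch):
563
+ ```bash
564
+ --train.global_batch_size 16 --train.micro_batch_size 1 # 16 accumulation steps on one GPU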
565
+ ```
566
+
567
+ ## Data Format
568
+
569
+ LitGPT expects JSON data in instruction format:
570
+
571
+ ```json
572
+ [
573
+ {
574
+ "instruction": "What is the capital of France?",
575
+ "input": "",
576
+ "output": "The capital of France is Paris."
577
+ },
578
+ {
579
+ "instruction": "Translate to Spanish:",
580
+ "input": "Hello world",
581
+ "output": "Hola mundo"
582
+ }
583
+ ]
584
+ ```
585
+
586
+ **Load custom data**:
587
+ ```bash
588
+ litgpt finetune_lora meta-llama/Llama-2-7b-hf \
589
+ --data JSON \
590
+ --data.json_path data/my_dataset.json \
591
+ --data.val_split_fraction 0.1 # 10% validation
592
+ ```
593
+
594
+ ## Merge and Deploy
595
+
596
+ After fine-tuning, merge LoRA weights:
597
+
598
+ ```bash
599
+ litgpt merge_lora checkpoints/meta-llama/Llama-2-7b-hf/final_lora.pth
600
+ ```
601
+
602
+ Generate with merged model:
603
+
604
+ ```bash
605
+ litgpt generate checkpoints/meta-llama/Llama-2-7b-hf-merged/ \
606
+ --prompt "What is machine learning?"
607
+ ```
608
+
609
+ Or serve via API:
610
+
611
+ ```bash
612
+ litgpt serve checkpoints/meta-llama/Llama-2-7b-hf-merged/
613
+ ```
614
+
615
+ ## References
616
+
617
+ - Configuration hub: `config_hub/finetune/`
618
+ - Fine-tuning tutorial: `tutorials/finetune_*.md`
619
+ - Memory guide: `tutorials/oom.md`