@synsci/cli-darwin-x64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,452 @@
1
+ # Hyperparameters
2
+
3
+ Complete guide to SimPO hyperparameter selection and tuning.
4
+
5
+ ## Overview
6
+
7
+ Key hyperparameters in SimPO:
8
+ 1. **Learning Rate** - Most critical
9
+ 2. **Beta (β)** - Reward scaling
10
+ 3. **Gamma-Beta Ratio (γ/β)** - Target margin
11
+ 4. **SFT Weight** - Regularization strength
12
+
13
+ ## Learning Rate
14
+
15
+ ### Recommended Ranges
16
+
17
+ **By model size**:
18
+ | Model Size | Learning Rate | Notes |
19
+ |------------|---------------|-------|
20
+ | 1B-3B | 5e-7 to 1e-6 | Higher end safe |
21
+ | 7B-8B | 3e-7 to 5e-7 | **Standard** |
22
+ | 13B-30B | 1e-7 to 3e-7 | Lower for stability |
23
+ | 70B+ | 5e-8 to 1e-7 | Very conservative |
24
+
25
+ **By task type**:
26
+ | Task | Learning Rate | Reason |
27
+ |------|---------------|--------|
28
+ | General chat | 5e-7 | Standard |
29
+ | Code generation | 3e-7 | **Precise reasoning** |
30
+ | Math reasoning | 3e-7 | **Careful optimization** |
31
+ | Creative writing | 1e-6 | More aggressive OK |
32
+
33
+ ### Why Learning Rate Matters
34
+
35
+ **Too high** (> 1e-6 for 7B):
36
+ - Loss divergence
37
+ - Catastrophic forgetting
38
+ - Unstable training
39
+
40
+ **Too low** (< 1e-7 for 7B):
41
+ - Very slow convergence
42
+ - May not finish in time
43
+ - Undertraining
44
+
45
+ **Optimal** (3e-7 to 5e-7 for 7B):
46
+ - Stable convergence
47
+ - Good final performance
48
+ - Efficient training
49
+
50
+ ### Config Examples
51
+
52
+ **Mistral 7B (general)**:
53
+ ```yaml
54
+ learning_rate: 5e-7
55
+ num_train_epochs: 1
56
+ warmup_ratio: 0.1
57
+ lr_scheduler_type: cosine
58
+ ```
59
+
60
+ **Llama 3 8B (reasoning)**:
61
+ ```yaml
62
+ learning_rate: 3e-7
63
+ num_train_epochs: 1
64
+ warmup_ratio: 0.1
65
+ lr_scheduler_type: cosine
66
+ ```
67
+
68
+ **Gemma 2 9B (creative)**:
69
+ ```yaml
70
+ learning_rate: 1e-6
71
+ num_train_epochs: 1
72
+ warmup_ratio: 0.1
73
+ lr_scheduler_type: linear
74
+ ```
75
+
76
+ ## Beta (β)
77
+
78
+ ### Recommended Values
79
+
80
+ **Range**: 2.0 to 10.0 (much higher than DPO's 0.01-0.1)
81
+
82
+ **By preference strength**:
83
+ | Beta | Preference Strength | Use Case |
84
+ |------|-------------------|----------|
85
+ | 1.0-2.0 | Weak | Subtle preferences |
86
+ | 2.0-5.0 | **Standard** | General alignment |
87
+ | 5.0-10.0 | Strong | Clear preferences |
88
+
89
+ **Default**: 2.0 to 2.5
90
+
91
+ ### Why Beta Matters
92
+
93
+ **Low beta** (< 2.0):
94
+ - Weak reward signal
95
+ - Slow preference learning
96
+ - May underfit
97
+
98
+ **High beta** (> 10.0):
99
+ - Very strong reward signal
100
+ - Risk of overfitting
101
+ - May ignore weak preferences
102
+
103
+ **Optimal** (2.0-5.0):
104
+ - Balanced reward scaling
105
+ - Stable training
106
+ - Good generalization
107
+
108
+ ### Interaction with Gamma
109
+
110
+ **Beta and gamma together**:
111
+ ```
112
+ Target margin in reward space = gamma
113
+ Target margin on the log-probability ratio (before scaling by beta) = gamma / beta = gamma_beta_ratio
114
+ ```
115
+
116
+ **Example**:
117
+ ```yaml
118
+ beta: 2.0
119
+ gamma_beta_ratio: 0.5
120
+ # Effective gamma = 2.0 * 0.5 = 1.0
121
+ ```
122
+
123
+ ### Config Examples
124
+
125
+ **Weak preferences**:
126
+ ```yaml
127
+ beta: 2.0
128
+ gamma_beta_ratio: 0.3 # Small margin
129
+ ```
130
+
131
+ **Standard**:
132
+ ```yaml
133
+ beta: 2.5
134
+ gamma_beta_ratio: 0.5 # Default
135
+ ```
136
+
137
+ **Strong preferences**:
138
+ ```yaml
139
+ beta: 5.0
140
+ gamma_beta_ratio: 0.7 # Larger margin
141
+ ```
142
+
143
+ ## Gamma-Beta Ratio (γ/β)
144
+
145
+ ### Recommended Values
146
+
147
+ **Range**: 0.0 to 1.0
148
+
149
+ **By scenario**:
150
+ | Ratio | Margin | Use Case |
151
+ |-------|--------|----------|
152
+ | 0.0-0.3 | Small | Weak preference data |
153
+ | 0.4-0.6 | **Standard** | General use |
154
+ | 0.7-1.0 | Large | Very clear preferences |
155
+
156
+ **Default**: 0.5
157
+
158
+ ### Why Gamma Matters
159
+
160
+ **Low ratio** (γ/β < 0.3):
161
+ - Small target margin
162
+ - Less aggressive alignment
163
+ - More conservative
164
+
165
+ **High ratio** (γ/β > 0.7):
166
+ - Large target margin
167
+ - Stronger alignment
168
+ - More aggressive
169
+
170
+ **Optimal ratio** (γ/β of 0.4-0.6):
171
+ - Balanced margin
172
+ - Stable training
173
+ - Good alignment
174
+
175
+ ### Mathematical Meaning
176
+
177
+ **In loss function**:
178
+ ```python
179
+ logits = pi_logratios - gamma_beta_ratio
180
+ loss = -log(sigmoid(beta * logits))
181
+ ```
182
+
183
+ **Interpretation**:
184
+ - gamma_beta_ratio shifts the decision boundary
185
+ - Higher ratio = requires larger log prob difference
186
+ - Controls how "clear" preferences must be
187
+
188
+ ### Config Examples
189
+
190
+ **Noisy preferences**:
191
+ ```yaml
192
+ gamma_beta_ratio: 0.3 # Smaller margin, more tolerant
193
+ ```
194
+
195
+ **Standard**:
196
+ ```yaml
197
+ gamma_beta_ratio: 0.5 # Default
198
+ ```
199
+
200
+ **High-quality preferences**:
201
+ ```yaml
202
+ gamma_beta_ratio: 0.8 # Larger margin, stricter
203
+ ```
204
+
205
+ ## SFT Weight
206
+
207
+ ### Recommended Values
208
+
209
+ **Range**: 0.0 to 1.0
210
+
211
+ **By model type**:
212
+ | Model Type | SFT Weight | Reason |
213
+ |------------|-----------|--------|
214
+ | Base model | 0.0 | No instruction-tuned capabilities to preserve |
215
+ | **Instruct model** | 0.05-0.1 | Preserve instruction following |
216
+ | Chat model | 0.1-0.2 | Preserve conversational skills |
217
+
218
+ **Default**: 0.0 (no SFT regularization)
219
+
220
+ ### Why SFT Weight Matters
221
+
222
+ **Zero SFT** (0.0):
223
+ - Pure preference optimization
224
+ - May forget capabilities
225
+ - Standard for base models
226
+
227
+ **Low SFT** (0.05-0.1):
228
+ - Balanced approach
229
+ - **Recommended for instruct models**
230
+ - Slight capability preservation
231
+
232
+ **High SFT** (> 0.2):
233
+ - Strong capability preservation
234
+ - Weaker preference alignment
235
+ - May reduce alignment gains
236
+
237
+ ### Trade-off
238
+
239
+ ```
240
+ Total Loss = SimPO Loss + (sft_weight * SFT Loss)
241
+ ```
242
+
243
+ **Example**:
244
+ ```yaml
245
+ sft_weight: 0.1
246
+ # Total = SimPO loss + 0.1 * SFT loss (the SFT term is added on top, not a 90/10 split)
247
+ ```
248
+
249
+ ### Config Examples
250
+
251
+ **Base model (no SFT)**:
252
+ ```yaml
253
+ model_name_or_path: mistralai/Mistral-7B-v0.1
254
+ sft_weight: 0.0
255
+ ```
256
+
257
+ **Instruct model (light SFT)**:
258
+ ```yaml
259
+ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
260
+ sft_weight: 0.1
261
+ ```
262
+
263
+ **Chat model (moderate SFT)**:
264
+ ```yaml
265
+ model_name_or_path: HuggingFaceH4/zephyr-7b-beta
266
+ sft_weight: 0.2
267
+ ```
268
+
269
+ ## Model-Size-Specific Recommendations
270
+
271
+ ### 7B Models (e.g., Mistral 7B)
272
+
273
+ **Standard config**:
274
+ ```yaml
275
+ learning_rate: 5e-7
276
+ beta: 2.0
277
+ gamma_beta_ratio: 0.5
278
+ sft_weight: 0.0 # 0.1 if instruct model
279
+ num_train_epochs: 1
280
+ per_device_train_batch_size: 2
281
+ gradient_accumulation_steps: 4
282
+ ```
283
+
284
+ ### 8B-13B Models
285
+
286
+ **Standard config**:
287
+ ```yaml
288
+ learning_rate: 3e-7
289
+ beta: 2.5
290
+ gamma_beta_ratio: 0.5
291
+ sft_weight: 0.1 # If instruct
292
+ num_train_epochs: 1
293
+ per_device_train_batch_size: 1
294
+ gradient_accumulation_steps: 8
295
+ ```
296
+
297
+ ### 70B Models
298
+
299
+ **Standard config**:
300
+ ```yaml
301
+ learning_rate: 1e-7
302
+ beta: 2.0
303
+ gamma_beta_ratio: 0.5
304
+ sft_weight: 0.05
305
+ num_train_epochs: 1
306
+ per_device_train_batch_size: 1
307
+ gradient_accumulation_steps: 16
308
+ ```
309
+
310
+ ## Batch Size & Gradient Accumulation
311
+
312
+ ### Effective Batch Size
313
+
314
+ ```
315
+ Effective Batch Size = per_device_batch_size * num_gpus * grad_accum_steps
316
+ ```
317
+
318
+ **Recommended effective batch sizes**:
319
+ - 7B: 128-256
320
+ - 13B: 64-128
321
+ - 70B: 32-64
322
+
323
+ ### Config Examples
324
+
325
+ **Single GPU (A100 40GB)**:
326
+ ```yaml
327
+ per_device_train_batch_size: 1
328
+ gradient_accumulation_steps: 128 # Effective batch = 128
329
+ ```
330
+
331
+ **4 GPUs (A100 40GB)**:
332
+ ```yaml
333
+ per_device_train_batch_size: 2
334
+ gradient_accumulation_steps: 16 # Effective batch = 2*4*16 = 128
335
+ ```
336
+
337
+ **8 GPUs (A100 80GB)**:
338
+ ```yaml
339
+ per_device_train_batch_size: 2
340
+ gradient_accumulation_steps: 8 # Effective batch = 2*8*8 = 128
341
+ ```
342
+
343
+ ## Loss Type
344
+
345
+ ### Sigmoid vs Hinge
346
+
347
+ **Sigmoid** (default, recommended):
348
+ ```yaml
349
+ loss_type: sigmoid
350
+ label_smoothing: 0.0
351
+ ```
352
+
353
+ **Hinge** (experimental):
354
+ ```yaml
355
+ loss_type: hinge
356
+ # No label smoothing for hinge
357
+ ```
358
+
359
+ **When to use hinge**:
360
+ - Margin-based tasks
361
+ - SVM-style optimization
362
+ - Experimental purposes
363
+
364
+ **Generally**: Stick with sigmoid
365
+
366
+ ## Tuning Guide
367
+
368
+ ### Step 1: Start with Defaults
369
+
370
+ ```yaml
371
+ learning_rate: 5e-7 # For 7B
372
+ beta: 2.0
373
+ gamma_beta_ratio: 0.5
374
+ sft_weight: 0.0 # 0.1 if instruct
375
+ loss_type: sigmoid
376
+ ```
377
+
378
+ ### Step 2: Monitor Training
379
+
380
+ **Check every 100 steps**:
381
+ - Loss curve (should decrease smoothly)
382
+ - Reward margin (should increase)
383
+ - Chosen/rejected logps (should separate)
384
+
385
+ ### Step 3: Adjust if Needed
386
+
387
+ **If loss diverges**:
388
+ ```yaml
389
+ learning_rate: 3e-7 # Reduce from 5e-7
390
+ beta: 1.0 # Reduce from 2.0
391
+ ```
392
+
393
+ **If loss plateaus early**:
394
+ ```yaml
395
+ learning_rate: 1e-6 # Increase from 5e-7
396
+ beta: 5.0 # Increase from 2.0
397
+ ```
398
+
399
+ **If model forgets**:
400
+ ```yaml
401
+ sft_weight: 0.2 # Increase from 0.0
402
+ ```
403
+
404
+ ## Complete Example Configs
405
+
406
+ ### Mistral 7B Base (Standard)
407
+
408
+ ```yaml
409
+ model_name_or_path: mistralai/Mistral-7B-v0.1
410
+ dataset_mixer:
411
+ HuggingFaceH4/ultrafeedback_binarized: 1.0
412
+
413
+ learning_rate: 5e-7
414
+ beta: 2.0
415
+ gamma_beta_ratio: 0.5
416
+ loss_type: sigmoid
417
+ sft_weight: 0.0
418
+
419
+ num_train_epochs: 1
420
+ per_device_train_batch_size: 2
421
+ gradient_accumulation_steps: 4
422
+ warmup_ratio: 0.1
423
+ lr_scheduler_type: cosine
424
+
425
+ bf16: true
426
+ gradient_checkpointing: true
427
+ ```
428
+
429
+ ### Llama 3 8B Instruct (Reasoning)
430
+
431
+ ```yaml
432
+ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
433
+ dataset_mixer:
434
+ argilla/distilabel-math-preference-dpo: 1.0
435
+
436
+ learning_rate: 3e-7
437
+ beta: 5.0
438
+ gamma_beta_ratio: 0.7
439
+ loss_type: sigmoid
440
+ sft_weight: 0.1
441
+
442
+ num_train_epochs: 1
443
+ per_device_train_batch_size: 1
444
+ gradient_accumulation_steps: 16
445
+ warmup_ratio: 0.1
446
+ lr_scheduler_type: cosine
447
+ ```
448
+
449
+ ## References
450
+
451
+ - SimPO paper: https://arxiv.org/abs/2405.14734
452
+ - Alignment Handbook: https://github.com/huggingface/alignment-handbook