@synsci/cli-darwin-x64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,590 @@
1
+ ---
2
+ name: weights-and-biases
3
+ description: Track ML experiments with automatic logging, visualize training in real-time, optimize hyperparameters with sweeps, and manage model registry with W&B - collaborative MLOps platform
4
+ version: 1.0.0
5
+ author: Synthetic Sciences
6
+ license: MIT
7
+ tags: [MLOps, Weights And Biases, WandB, Experiment Tracking, Hyperparameter Tuning, Model Registry, Collaboration, Real-Time Visualization, PyTorch, TensorFlow, HuggingFace]
8
+ dependencies: [wandb]
9
+ ---
10
+
11
+ # Weights & Biases: ML Experiment Tracking & MLOps
12
+
13
+ ## When to Use This Skill
14
+
15
+ Use Weights & Biases (W&B) when you need to:
16
+ - **Track ML experiments** with automatic metric logging
17
+ - **Visualize training** in real-time dashboards
18
+ - **Compare runs** across hyperparameters and configurations
19
+ - **Optimize hyperparameters** with automated sweeps
20
+ - **Manage model registry** with versioning and lineage
21
+ - **Collaborate on ML projects** with team workspaces
22
+ - **Track artifacts** (datasets, models, code) with lineage
23
+
24
+ **Users**: 200,000+ ML practitioners | **GitHub Stars**: 10.5k+ | **Integrations**: 100+
25
+
26
+ ## Installation
27
+
28
+ ```bash
29
+ # Install W&B
30
+ pip install wandb
31
+
32
+ # Login (prompts for your existing API key and stores it locally)
33
+ wandb login
34
+
35
+ # Or provide the API key via an environment variable
36
+ export WANDB_API_KEY=your_api_key_here
37
+ ```
38
+
39
+ ## Quick Start
40
+
41
+ ### Basic Experiment Tracking
42
+
43
+ ```python
44
+ import wandb
45
+
46
+ # Initialize a run
47
+ run = wandb.init(
48
+ project="my-project",
49
+ config={
50
+ "learning_rate": 0.001,
51
+ "epochs": 10,
52
+ "batch_size": 32,
53
+ "architecture": "ResNet50"
54
+ }
55
+ )
56
+
57
+ # Training loop
58
+ for epoch in range(run.config.epochs):
59
+ # Your training code
60
+ train_loss, train_acc = train_epoch()
60
+ val_loss, val_acc = validate()
62
+
63
+ # Log metrics
64
+ wandb.log({
65
+ "epoch": epoch,
66
+ "train/loss": train_loss,
67
+ "val/loss": val_loss,
68
+ "train/accuracy": train_acc,
69
+ "val/accuracy": val_acc
70
+ })
71
+
72
+ # Finish the run
73
+ wandb.finish()
74
+ ```
75
+
76
+ ### With PyTorch
77
+
78
+ ```python
79
+ import torch
80
+ import wandb
81
+
82
+ # Initialize
83
+ wandb.init(project="pytorch-demo", config={
84
+ "lr": 0.001,
85
+ "epochs": 10
86
+ })
87
+
88
+ # Access config
89
+ config = wandb.config
90
+
91
+ # Training loop
92
+ for epoch in range(config.epochs):
93
+ for batch_idx, (data, target) in enumerate(train_loader):
94
+ # Forward pass
95
+ output = model(data)
96
+ loss = criterion(output, target)
97
+
98
+ # Backward pass
99
+ optimizer.zero_grad()
100
+ loss.backward()
101
+ optimizer.step()
102
+
103
+ # Log every 100 batches
104
+ if batch_idx % 100 == 0:
105
+ wandb.log({
106
+ "loss": loss.item(),
107
+ "epoch": epoch,
108
+ "batch": batch_idx
109
+ })
110
+
111
+ # Save model
112
+ torch.save(model.state_dict(), "model.pth")
113
+ wandb.save("model.pth") # Upload to W&B
114
+
115
+ wandb.finish()
116
+ ```
117
+
118
+ ## Core Concepts
119
+
120
+ ### 1. Projects and Runs
121
+
122
+ - **Project**: A collection of related experiments
123
+ - **Run**: A single execution of your training script
124
+
125
+ ```python
126
+ # Create/use project
127
+ run = wandb.init(
128
+ project="image-classification",
129
+ name="resnet50-experiment-1", # Optional run name
130
+ tags=["baseline", "resnet"], # Organize with tags
131
+ notes="First baseline run" # Add notes
132
+ )
133
+
134
+ # Each run has unique ID
135
+ print(f"Run ID: {run.id}")
136
+ print(f"Run URL: {run.url}")
137
+ ```
138
+
139
+ ### 2. Configuration Tracking
140
+
141
+ Track hyperparameters automatically:
142
+
143
+ ```python
144
+ config = {
145
+ # Model architecture
146
+ "model": "ResNet50",
147
+ "pretrained": True,
148
+
149
+ # Training params
150
+ "learning_rate": 0.001,
151
+ "batch_size": 32,
152
+ "epochs": 50,
153
+ "optimizer": "Adam",
154
+
155
+ # Data params
156
+ "dataset": "ImageNet",
157
+ "augmentation": "standard"
158
+ }
159
+
160
+ wandb.init(project="my-project", config=config)
161
+
162
+ # Access config during training
163
+ lr = wandb.config.learning_rate
164
+ batch_size = wandb.config.batch_size
165
+ ```
166
+
167
+ ### 3. Metric Logging
168
+
169
+ ```python
170
+ # Log scalars
171
+ wandb.log({"loss": 0.5, "accuracy": 0.92})
172
+
173
+ # Log multiple metrics
174
+ wandb.log({
175
+ "train/loss": train_loss,
176
+ "train/accuracy": train_acc,
177
+ "val/loss": val_loss,
178
+ "val/accuracy": val_acc,
179
+ "learning_rate": current_lr,
180
+ "epoch": epoch
181
+ })
182
+
183
+ # Log at an explicit step (the step is the default x-axis value)
184
+ wandb.log({"loss": loss}, step=global_step)
185
+
186
+ # Log media (images, audio, video)
187
+ wandb.log({"examples": [wandb.Image(img) for img in images]})
188
+
189
+ # Log histograms
190
+ wandb.log({"gradients": wandb.Histogram(gradients)})
191
+
192
+ # Log tables
193
+ table = wandb.Table(columns=["id", "prediction", "ground_truth"])
194
+ wandb.log({"predictions": table})
195
+ ```
196
+
197
+ ### 4. Model Checkpointing
198
+
199
+ ```python
200
+ import torch
201
+ import wandb
202
+
203
+ # Save model checkpoint
204
+ checkpoint = {
205
+ 'epoch': epoch,
206
+ 'model_state_dict': model.state_dict(),
207
+ 'optimizer_state_dict': optimizer.state_dict(),
208
+ 'loss': loss,
209
+ }
210
+
211
+ torch.save(checkpoint, 'checkpoint.pth')
212
+
213
+ # Upload to W&B
214
+ wandb.save('checkpoint.pth')
215
+
216
+ # Or use Artifacts (recommended)
217
+ artifact = wandb.Artifact('model', type='model')
218
+ artifact.add_file('checkpoint.pth')
219
+ wandb.log_artifact(artifact)
220
+ ```
221
+
222
+ ## Hyperparameter Sweeps
223
+
224
+ Automatically search for optimal hyperparameters.
225
+
226
+ ### Define Sweep Configuration
227
+
228
+ ```python
229
+ sweep_config = {
230
+ 'method': 'bayes', # or 'grid', 'random'
231
+ 'metric': {
232
+ 'name': 'val/accuracy',
233
+ 'goal': 'maximize'
234
+ },
235
+ 'parameters': {
236
+ 'learning_rate': {
237
+ 'distribution': 'log_uniform_values',  # min/max are actual values; plain 'log_uniform' expects exponents
238
+ 'min': 1e-5,
239
+ 'max': 1e-1
240
+ },
241
+ 'batch_size': {
242
+ 'values': [16, 32, 64, 128]
243
+ },
244
+ 'optimizer': {
245
+ 'values': ['adam', 'sgd', 'rmsprop']
246
+ },
247
+ 'dropout': {
248
+ 'distribution': 'uniform',
249
+ 'min': 0.1,
250
+ 'max': 0.5
251
+ }
252
+ }
253
+ }
254
+
255
+ # Initialize sweep
256
+ sweep_id = wandb.sweep(sweep_config, project="my-project")
257
+ ```
258
+
259
+ ### Define Training Function
260
+
261
+ ```python
262
+ def train():
263
+ # Initialize run
264
+ run = wandb.init()
265
+
266
+ # Access sweep parameters
267
+ lr = wandb.config.learning_rate
268
+ batch_size = wandb.config.batch_size
269
+ optimizer_name = wandb.config.optimizer
270
+
271
+ # Build model with sweep config
272
+ model = build_model(wandb.config)
273
+ optimizer = get_optimizer(optimizer_name, lr)
274
+
275
+ # Training loop
276
+ for epoch in range(NUM_EPOCHS):
277
+ train_loss = train_epoch(model, optimizer, batch_size)
278
+ val_acc = validate(model)
279
+
280
+ # Log metrics
281
+ wandb.log({
282
+ "train/loss": train_loss,
283
+ "val/accuracy": val_acc
284
+ })
285
+
286
+ # Run sweep
287
+ wandb.agent(sweep_id, function=train, count=50) # Run 50 trials
288
+ ```
289
+
290
+ ### Sweep Strategies
291
+
292
+ ```python
293
+ # Grid search - exhaustive
294
+ sweep_config = {
295
+ 'method': 'grid',
296
+ 'parameters': {
297
+ 'lr': {'values': [0.001, 0.01, 0.1]},
298
+ 'batch_size': {'values': [16, 32, 64]}
299
+ }
300
+ }
301
+
302
+ # Random search
303
+ sweep_config = {
304
+ 'method': 'random',
305
+ 'parameters': {
306
+ 'lr': {'distribution': 'uniform', 'min': 0.0001, 'max': 0.1},
307
+ 'dropout': {'distribution': 'uniform', 'min': 0.1, 'max': 0.5}
308
+ }
309
+ }
310
+
311
+ # Bayesian optimization (recommended)
312
+ sweep_config = {
313
+ 'method': 'bayes',
314
+ 'metric': {'name': 'val/loss', 'goal': 'minimize'},
315
+ 'parameters': {
316
+ 'lr': {'distribution': 'log_uniform_values', 'min': 1e-5, 'max': 1e-1}
317
+ }
318
+ }
319
+ ```
320
+
321
+ ## Artifacts
322
+
323
+ Track datasets, models, and other files with lineage.
324
+
325
+ ### Log Artifacts
326
+
327
+ ```python
328
+ # Create artifact
329
+ artifact = wandb.Artifact(
330
+ name='training-dataset',
331
+ type='dataset',
332
+ description='ImageNet training split',
333
+ metadata={'size': '1.2M images', 'split': 'train'}
334
+ )
335
+
336
+ # Add files
337
+ artifact.add_file('data/train.csv')
338
+ artifact.add_dir('data/images/')
339
+
340
+ # Log artifact
341
+ wandb.log_artifact(artifact)
342
+ ```
343
+
344
+ ### Use Artifacts
345
+
346
+ ```python
347
+ # Download and use artifact
348
+ run = wandb.init(project="my-project")
349
+
350
+ # Download artifact
351
+ artifact = run.use_artifact('training-dataset:latest')
352
+ artifact_dir = artifact.download()
353
+
354
+ # Use the data
355
+ data = load_data(f"{artifact_dir}/train.csv")
356
+ ```
357
+
358
+ ### Model Registry
359
+
360
+ ```python
361
+ # Log model as artifact
362
+ model_artifact = wandb.Artifact(
363
+ name='resnet50-model',
364
+ type='model',
365
+ metadata={'architecture': 'ResNet50', 'accuracy': 0.95}
366
+ )
367
+
368
+ model_artifact.add_file('model.pth')
369
+ wandb.log_artifact(model_artifact, aliases=['best', 'production'])
370
+
371
+ # Link to model registry
372
+ run.link_artifact(model_artifact, 'model-registry/production-models')
373
+ ```
374
+
375
+ ## Integration Examples
376
+
377
+ ### HuggingFace Transformers
378
+
379
+ ```python
380
+ from transformers import Trainer, TrainingArguments
381
+ import wandb
382
+
383
+ # Initialize W&B
384
+ wandb.init(project="hf-transformers")
385
+
386
+ # Training arguments with W&B
387
+ training_args = TrainingArguments(
388
+ output_dir="./results",
389
+ report_to="wandb", # Enable W&B logging
390
+ run_name="bert-finetuning",
391
+ logging_steps=100,
392
+ save_steps=500
393
+ )
394
+
395
+ # Trainer automatically logs to W&B
396
+ trainer = Trainer(
397
+ model=model,
398
+ args=training_args,
399
+ train_dataset=train_dataset,
400
+ eval_dataset=eval_dataset
401
+ )
402
+
403
+ trainer.train()
404
+ ```
405
+
406
+ ### PyTorch Lightning
407
+
408
+ ```python
409
+ from pytorch_lightning import Trainer
410
+ from pytorch_lightning.loggers import WandbLogger
411
+ import wandb
412
+
413
+ # Create W&B logger
414
+ wandb_logger = WandbLogger(
415
+ project="lightning-demo",
416
+ log_model=True # Log model checkpoints
417
+ )
418
+
419
+ # Use with Trainer
420
+ trainer = Trainer(
421
+ logger=wandb_logger,
422
+ max_epochs=10
423
+ )
424
+
425
+ trainer.fit(model, datamodule=dm)
426
+ ```
427
+
428
+ ### Keras/TensorFlow
429
+
430
+ ```python
431
+ import wandb
432
+ from wandb.integration.keras import WandbCallback
433
+
434
+ # Initialize
435
+ wandb.init(project="keras-demo")
436
+
437
+ # Add callback
438
+ model.fit(
439
+ x_train, y_train,
440
+ validation_data=(x_val, y_val),
441
+ epochs=10,
442
+ callbacks=[WandbCallback()] # Auto-logs metrics
443
+ )
444
+ ```
445
+
446
+ ## Visualization & Analysis
447
+
448
+ ### Custom Charts
449
+
450
+ ```python
451
+ # Log custom visualizations
452
+ import matplotlib.pyplot as plt
453
+
454
+ fig, ax = plt.subplots()
455
+ ax.plot(x, y)
456
+ wandb.log({"custom_plot": wandb.Image(fig)})
457
+
458
+ # Log confusion matrix
459
+ wandb.log({"conf_mat": wandb.plot.confusion_matrix(
460
+ probs=None,
461
+ y_true=ground_truth,
462
+ preds=predictions,
463
+ class_names=class_names
464
+ )})
465
+ ```
466
+
467
+ ### Reports
468
+
469
+ Create shareable reports in the W&B UI:
470
+ - Combine runs, charts, and text
471
+ - Markdown support
472
+ - Embeddable visualizations
473
+ - Team collaboration
474
+
475
+ ## Best Practices
476
+
477
+ ### 1. Organize with Tags and Groups
478
+
479
+ ```python
480
+ wandb.init(
481
+ project="my-project",
482
+ tags=["baseline", "resnet50", "imagenet"],
483
+ group="resnet-experiments", # Group related runs
484
+ job_type="train" # Type of job
485
+ )
486
+ ```
487
+
488
+ ### 2. Log Everything Relevant
489
+
490
+ ```python
491
+ # Log system metrics
492
+ wandb.log({
493
+ "gpu/util": gpu_utilization,
494
+ "gpu/memory": gpu_memory_used,
495
+ "cpu/util": cpu_utilization
496
+ })
497
+
498
+ # Log code version
499
+ wandb.log({"git_commit": git_commit_hash})
500
+
501
+ # Log data splits
502
+ wandb.log({
503
+ "data/train_size": len(train_dataset),
504
+ "data/val_size": len(val_dataset)
505
+ })
506
+ ```
507
+
508
+ ### 3. Use Descriptive Names
509
+
510
+ ```python
511
+ # ✅ Good: Descriptive run names
512
+ wandb.init(
513
+ project="nlp-classification",
514
+ name="bert-base-lr0.001-bs32-epoch10"
515
+ )
516
+
517
+ # ❌ Bad: Generic names
518
+ wandb.init(project="nlp", name="run1")
519
+ ```
520
+
521
+ ### 4. Save Important Artifacts
522
+
523
+ ```python
524
+ # Save final model
525
+ artifact = wandb.Artifact('final-model', type='model')
526
+ artifact.add_file('model.pth')
527
+ wandb.log_artifact(artifact)
528
+
529
+ # Save predictions for analysis
530
+ predictions_table = wandb.Table(
531
+ columns=["id", "input", "prediction", "ground_truth"],
532
+ data=predictions_data
533
+ )
534
+ wandb.log({"predictions": predictions_table})
535
+ ```
536
+
537
+ ### 5. Use Offline Mode for Unstable Connections
538
+
539
+ ```python
540
+ import os
541
+
542
+ # Enable offline mode
543
+ os.environ["WANDB_MODE"] = "offline"
544
+
545
+ wandb.init(project="my-project")
546
+ # ... your code ...
547
+
548
+ # Sync later, once the connection is back (shell command, run from a terminal):
549
+ # wandb sync <run_directory>
550
+ ```
551
+
552
+ ## Team Collaboration
553
+
554
+ ### Share Runs
555
+
556
+ ```python
557
+ # Runs are automatically shareable via URL
558
+ run = wandb.init(project="team-project")
559
+ print(f"Share this URL: {run.url}")
560
+ ```
561
+
562
+ ### Team Projects
563
+
564
+ - Create team account at wandb.ai
565
+ - Add team members
566
+ - Set project visibility (private/public)
567
+ - Use team-level artifacts and model registry
568
+
569
+ ## Pricing
570
+
571
+ - **Free**: Unlimited public projects, 100GB storage
572
+ - **Academic**: Free for students/researchers
573
+ - **Teams**: $50/seat/month, private projects, unlimited storage
574
+ - **Enterprise**: Custom pricing, on-prem options
575
+
576
+ ## Resources
577
+
578
+ - **Documentation**: https://docs.wandb.ai
579
+ - **GitHub**: https://github.com/wandb/wandb (10.5k+ stars)
580
+ - **Examples**: https://github.com/wandb/examples
581
+ - **Community**: https://wandb.ai/community
582
+ - **Discord**: https://wandb.me/discord
583
+
584
+ ## See Also
585
+
586
+ - `references/sweeps.md` - Comprehensive hyperparameter optimization guide
587
+ - `references/artifacts.md` - Data and model versioning patterns
588
+ - `references/integrations.md` - Framework-specific examples
589
+
590
+