@synsci/cli-darwin-x64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,476 @@
1
+ # NanoGPT Data Preparation
2
+
3
+ ## Data Format
4
+
5
+ NanoGPT uses **binary token files** for efficient loading:
6
+
7
+ ```
8
+ dataset/
9
+ ├── train.bin # Training tokens (uint16 array)
10
+ ├── val.bin # Validation tokens (uint16 array)
11
+ └── meta.pkl # Metadata (vocab_size, mappings)
12
+ ```
13
+
14
+ **Why binary?**
15
+ - 100× faster than reading text files
16
+ - Memory-mapped loading (no RAM overhead)
17
+ - Simple format (just token IDs)
18
+
19
+ ## Character-Level Tokenization
20
+
21
+ ### Shakespeare Example
22
+
23
+ **Input text**:
24
+ ```
25
+ First Citizen:
26
+ Before we proceed any further, hear me speak.
27
+
28
+ All:
29
+ Speak, speak.
30
+ ```
31
+
32
+ **Character vocabulary** (65 total):
33
+ ```python
34
+ chars = ['\n', ' ', '!', '$', '&', "'", ',', '-', '.', '3', ':', ';', '?', 'A', 'B', ..., 'z']
35
+ stoi = {'\n': 0, ' ': 1, '!': 2, ...} # char → ID
36
+ itos = {0: '\n', 1: ' ', 2: '!', ...} # ID → char
37
+ ```
38
+
39
+ **Tokenization**:
40
+ ```python
41
+ text = "First Citizen:"
42
+ tokens = [18, 47, 56, 57, 58, 1, 15, 47, 58, 47, 64, 43, 52, 10]
43
+ # F=18, i=47, r=56, s=57, t=58, ' '=1, C=15, ...
44
+ ```
45
+
46
+ **Full preparation script**:
47
+
48
+ ```python
49
+ # data/shakespeare_char/prepare.py
50
+ import os
51
+ import requests
52
+ import pickle
53
+ import numpy as np
54
+
55
+ # Download Shakespeare dataset
56
+ input_file = 'input.txt'
57
+ if not os.path.exists(input_file):
58
+ url = 'https://raw.githubusercontent.com/karpathy/char-rnn/master/data/tinyshakespeare/input.txt'
59
+ with open(input_file, 'w') as f:
60
+ f.write(requests.get(url).text)
61
+
62
+ # Load text
63
+ with open(input_file, 'r') as f:
64
+ data = f.read()
65
+
66
+ print(f"Dataset size: {len(data):,} characters")
67
+
68
+ # Build vocabulary
69
+ chars = sorted(list(set(data)))
70
+ vocab_size = len(chars)
71
+ print(f"Vocabulary: {vocab_size} unique characters")
72
+ print(f"Characters: {''.join(chars[:20])}...")
73
+
74
+ # Create mappings
75
+ stoi = {ch: i for i, ch in enumerate(chars)}
76
+ itos = {i: ch for i, ch in enumerate(chars)}
77
+
78
+ # Encode full dataset
79
+ def encode(s):
80
+ return [stoi[c] for c in s]
81
+
82
+ def decode(l):
83
+ return ''.join([itos[i] for i in l])
84
+
85
+ # Split train/val (90/10)
86
+ n = len(data)
87
+ train_data = data[:int(n * 0.9)]
88
+ val_data = data[int(n * 0.9):]
89
+
90
+ # Tokenize
91
+ train_ids = encode(train_data)
92
+ val_ids = encode(val_data)
93
+
94
+ print(f"Train: {len(train_ids):,} tokens")
95
+ print(f"Val: {len(val_ids):,} tokens")
96
+
97
+ # Save as binary (uint16)
98
+ train_ids = np.array(train_ids, dtype=np.uint16)
99
+ val_ids = np.array(val_ids, dtype=np.uint16)
100
+
101
+ train_ids.tofile('train.bin')
102
+ val_ids.tofile('val.bin')
103
+
104
+ # Save metadata
105
+ meta = {
106
+ 'vocab_size': vocab_size,
107
+ 'itos': itos,
108
+ 'stoi': stoi,
109
+ }
110
+
111
+ with open('meta.pkl', 'wb') as f:
112
+ pickle.dump(meta, f)
113
+
114
+ print("Saved train.bin, val.bin, meta.pkl")
115
+ ```
116
+
117
+ **Output**:
118
+ ```
119
+ Dataset size: 1,115,394 characters
120
+ Vocabulary: 65 unique characters
121
+ Characters: !$&',-.3:;?ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz
122
+ Train: 1,003,854 tokens
123
+ Val: 111,540 tokens
124
+ Saved train.bin, val.bin, meta.pkl
125
+ ```
126
+
127
+ ### Custom Character Dataset
128
+
129
+ ```python
130
+ # For your own text dataset
131
+ text = open('my_data.txt', 'r').read()
132
+
133
+ # Build vocab
134
+ chars = sorted(list(set(text)))
135
+ vocab_size = len(chars)
136
+
137
+ # Create mappings
138
+ stoi = {ch: i for i, ch in enumerate(chars)}
139
+ itos = {i: ch for i, ch in enumerate(chars)}
140
+
141
+ # Encode
142
+ encode = lambda s: [stoi[c] for c in s]
143
+ decode = lambda l: ''.join([itos[i] for i in l])
144
+
145
+ # Split and save
146
+ data = np.array(encode(text), dtype=np.uint16)
147
+ n = len(data)
148
+ train = data[:int(n*0.9)]
149
+ val = data[int(n*0.9):]
150
+
151
+ train.tofile('data/custom/train.bin')
152
+ val.tofile('data/custom/val.bin')
153
+
154
+ # Save meta
155
+ with open('data/custom/meta.pkl', 'wb') as f:
156
+ pickle.dump({'vocab_size': vocab_size, 'itos': itos, 'stoi': stoi}, f)
157
+ ```
158
+
159
+ ## BPE (Byte Pair Encoding)
160
+
161
+ ### OpenWebText with GPT-2 Tokenizer
162
+
163
+ **BPE advantages**:
164
+ - Handles rare words better (subword units)
165
+ - Standard for GPT-2, GPT-3
166
+ - Vocabulary: 50,257 tokens
167
+
168
+ **Preparation script**:
169
+
170
+ ```python
171
+ # data/openwebtext/prepare.py
172
+ import os
173
+ import numpy as np
174
+ import tiktoken
175
+ from datasets import load_dataset
176
+ from tqdm import tqdm
177
+
178
+ # Number of workers for parallel processing
179
+ num_proc = 8
180
+ num_proc_load_dataset = num_proc
181
+
182
+ # Download OpenWebText dataset
183
+ dataset = load_dataset("openwebtext", num_proc=num_proc_load_dataset)
184
+
185
+ # Use GPT-2 tokenizer
186
+ enc = tiktoken.get_encoding("gpt2")
187
+
188
+ def process(example):
189
+ """Tokenize a single example."""
190
+ ids = enc.encode_ordinary(example['text']) # Tokenize
191
+ ids.append(enc.eot_token) # Add end-of-text token
192
+ out = {'ids': ids, 'len': len(ids)}
193
+ return out
194
+
195
+ # Tokenize entire dataset (parallel)
196
+ tokenized = dataset.map(
197
+ process,
198
+ remove_columns=['text'],
199
+ desc="Tokenizing",
200
+ num_proc=num_proc,
201
+ )
202
+
203
+ # Concatenate all into one big array
204
+ train_ids = np.concatenate([
205
+ np.array(sample['ids'], dtype=np.uint16)
206
+ for sample in tqdm(tokenized['train'], desc="Concatenating")
207
+ ])
208
+
209
+ print(f"Total tokens: {len(train_ids):,}") # ~9 billion tokens
210
+
211
+ # Save train.bin
212
+ train_ids.tofile(os.path.join(os.path.dirname(__file__), 'train.bin'))
213
+
214
+ # Create val.bin (sample from train)
215
+ # Take the first 5000 documents for validation (they also remain in train.bin, so val overlaps train)
216
+ val_ids = np.concatenate([
217
+ np.array(sample['ids'], dtype=np.uint16)
218
+ for sample in tokenized['train'][:5000]
219
+ ])
220
+ val_ids.tofile(os.path.join(os.path.dirname(__file__), 'val.bin'))
221
+
222
+ # Save metadata
223
+ import pickle
224
+ meta = {
225
+ 'vocab_size': enc.n_vocab,
226
+ 'eot_token': enc.eot_token,
227
+ }
228
+ with open(os.path.join(os.path.dirname(__file__), 'meta.pkl'), 'wb') as f:
229
+ pickle.dump(meta, f)
230
+
231
+ print(f"Train tokens: {len(train_ids):,}")
232
+ print(f"Val tokens: {len(val_ids):,}")
233
+ print(f"Vocab size: {enc.n_vocab:,}")
234
+ ```
235
+
236
+ **Output**:
237
+ ```
238
+ Total tokens: 9,035,582,198
239
+ Train tokens: 9,035,582,198
240
+ Val tokens: 4,123,676
241
+ Vocab size: 50,257
242
+ ```
243
+
244
+ **Time**: 1-2 hours on 8-core CPU
245
+
246
+ **Disk usage**:
247
+ - train.bin: ~18 GB (9B tokens × 2 bytes)
248
+ - val.bin: ~8 MB
249
+ - Original text: ~54 GB
250
+
251
+ ### BPE Tokenization Example
252
+
253
+ ```python
254
+ import tiktoken
255
+
256
+ enc = tiktoken.get_encoding("gpt2")
257
+
258
+ # Tokenize
259
+ text = "Hello world! This is a test."
260
+ tokens = enc.encode_ordinary(text)
261
+ print(tokens)
262
+ # [15496, 995, 0, 770, 318, 257, 1332, 13]
263
+
264
+ # Decode
265
+ decoded = enc.decode(tokens)
266
+ print(decoded)
267
+ # "Hello world! This is a test."
268
+
269
+ # Token → text
270
+ print([enc.decode([t]) for t in tokens])
271
+ # ['Hello', ' world', '!', ' This', ' is', ' a', ' test', '.']
272
+ ```
273
+
274
+ **Subword splitting**:
275
+ ```python
276
+ # Rare word "electroencephalography" is split
277
+ tokens = enc.encode_ordinary("electroencephalography")
278
+ print([enc.decode([t]) for t in tokens])
279
+ # ['elect', 'ro', 'ence', 'ph', 'al', 'ography']
280
+ ```
281
+
282
+ ## Data Loading
283
+
284
+ ### Memory-Mapped Loading (Efficient)
285
+
286
+ ```python
287
+ import numpy as np
288
+ import torch
289
+
290
+ # Load data (memory-mapped, no RAM overhead)
291
+ data_dir = 'data/shakespeare_char'
292
+ train_data = np.memmap(
293
+ os.path.join(data_dir, 'train.bin'),
294
+ dtype=np.uint16,
295
+ mode='r'
296
+ )
297
+
298
+ print(f"Loaded {len(train_data):,} tokens") # No actual read yet!
299
+
300
+ # Get batch (read on-demand)
301
+ def get_batch(split):
302
+ data = train_data if split == 'train' else val_data
303
+
304
+ # Random indices
305
+ ix = torch.randint(len(data) - block_size, (batch_size,))
306
+
307
+ # Extract sequences
308
+ x = torch.stack([torch.from_numpy(data[i:i+block_size].astype(np.int64)) for i in ix])
309
+ y = torch.stack([torch.from_numpy(data[i+1:i+1+block_size].astype(np.int64)) for i in ix])
310
+
311
+ # Move to GPU
312
+ x, y = x.to('cuda'), y.to('cuda')
313
+
314
+ return x, y
315
+
316
+ # Usage
317
+ X, Y = get_batch('train')
318
+ # X shape: (batch_size, block_size)
319
+ # Y shape: (batch_size, block_size)
320
+ ```
321
+
322
+ **Memory efficiency**:
323
+ - An 18 GB train.bin (OpenWebText, 9B tokens × 2 bytes) is opened with ~0 MB RAM
324
+ - Only batch data is loaded into memory
325
+
326
+ ### Data Loader (PyTorch)
327
+
328
+ ```python
329
+ from torch.utils.data import Dataset, DataLoader
330
+
331
+ class TokenDataset(Dataset):
332
+ def __init__(self, data_path, block_size):
333
+ self.data = np.memmap(data_path, dtype=np.uint16, mode='r')
334
+ self.block_size = block_size
335
+
336
+ def __len__(self):
337
+ return len(self.data) - self.block_size
338
+
339
+ def __getitem__(self, idx):
340
+ x = torch.from_numpy(self.data[idx:idx+self.block_size].astype(np.int64))
341
+ y = torch.from_numpy(self.data[idx+1:idx+1+self.block_size].astype(np.int64))
342
+ return x, y
343
+
344
+ # Create data loader
345
+ train_dataset = TokenDataset('data/shakespeare_char/train.bin', block_size=256)
346
+ train_loader = DataLoader(
347
+ train_dataset,
348
+ batch_size=64,
349
+ shuffle=True,
350
+ num_workers=4,
351
+ pin_memory=True
352
+ )
353
+
354
+ # Usage
355
+ for X, Y in train_loader:
356
+ X, Y = X.to('cuda'), Y.to('cuda')
357
+ # Train...
358
+ ```
359
+
360
+ ## Custom Datasets
361
+
362
+ ### Wikipedia
363
+
364
+ ```python
365
+ from datasets import load_dataset
366
+
367
+ # Load Wikipedia
368
+ dataset = load_dataset("wikipedia", "20220301.en", num_proc=8)
369
+
370
+ # Tokenize
371
+ enc = tiktoken.get_encoding("gpt2")
372
+
373
+ def tokenize(example):
374
+ ids = enc.encode_ordinary(example['text'])
375
+ return {'ids': ids, 'len': len(ids)}
376
+
377
+ tokenized = dataset.map(tokenize, num_proc=8, remove_columns=['text', 'title'])
378
+
379
+ # Save
380
+ train_ids = np.concatenate([np.array(x['ids'], dtype=np.uint16) for x in tokenized['train']])
381
+ train_ids.tofile('data/wikipedia/train.bin')
382
+ ```
383
+
384
+ ### Code (GitHub)
385
+
386
+ ```python
387
+ from datasets import load_dataset
388
+
389
+ # Load code dataset (The Stack)
390
+ dataset = load_dataset("bigcode/the-stack", data_dir="data/python", num_proc=8)
391
+
392
+ # Tokenize (same as above)
393
+ enc = tiktoken.get_encoding("gpt2")
394
+ # ... tokenize and save
395
+ ```
396
+
397
+ ### Custom Text Files
398
+
399
+ ```python
400
+ # Load custom text files
401
+ import glob
402
+
403
+ files = glob.glob('my_dataset/*.txt')
404
+ text = ''
405
+
406
+ for file in files:
407
+ with open(file, 'r') as f:
408
+ text += f.read() + '\n'
409
+
410
+ # Character-level
411
+ chars = sorted(list(set(text)))
412
+ stoi = {ch: i for i, ch in enumerate(chars)}
413
+ data = np.array([stoi[c] for c in text], dtype=np.uint16)
414
+
415
+ # Split and save
416
+ n = len(data)
417
+ train = data[:int(n*0.9)]
418
+ val = data[int(n*0.9):]
419
+
420
+ train.tofile('data/custom/train.bin')
421
+ val.tofile('data/custom/val.bin')
422
+
423
+ # Meta
424
+ with open('data/custom/meta.pkl', 'wb') as f:
425
+ pickle.dump({'vocab_size': len(chars), 'itos': {i: ch for i, ch in enumerate(chars)}, 'stoi': stoi}, f)
426
+ ```
427
+
428
+ ## Data Augmentation (Advanced)
429
+
430
+ ### Random Masking (BERT-style)
431
+
432
+ ```python
433
+ def random_mask(tokens, mask_prob=0.15):
434
+ """Randomly mask tokens for denoising objective."""
435
+ mask = torch.rand(tokens.shape) < mask_prob
436
+ tokens[mask] = mask_token_id
437
+ return tokens
438
+
439
+ # Usage in training
440
+ X, Y = get_batch('train')
441
+ X_masked = random_mask(X.clone())
442
+ logits, loss = model(X_masked, Y) # Predict the next-token targets Y from the masked input
443
+ ```
444
+
445
+ ### Document Shuffling
446
+
447
+ ```python
448
+ # Shuffle document order (not token order)
449
+ # Better generalization than sequential documents
450
+
451
+ import random
452
+
453
+ # Load documents
454
+ docs = dataset['train']
455
+ random.shuffle(docs)
456
+
457
+ # Concatenate shuffled
458
+ train_ids = np.concatenate([np.array(doc['ids'], dtype=np.uint16) for doc in docs])
459
+ ```
460
+
461
+ ## Benchmarks
462
+
463
+ | Dataset | Tokens | Vocab | Prep Time | Disk Size |
464
+ |---------|--------|-------|-----------|-----------|
465
+ | Shakespeare (char) | 1M | 65 | 1 sec | 2 MB |
466
+ | TinyStories | 250M | 50K | 5 min | 500 MB |
467
+ | OpenWebText | 9B | 50K | 90 min | 18 GB |
468
+ | The Pile | 300B | 50K | ~2 days | 600 GB |
469
+
470
+ ## Resources
471
+
472
+ - Data preparation scripts: https://github.com/karpathy/nanoGPT/tree/master/data
473
+ - Tiktoken (BPE tokenizer): https://github.com/openai/tiktoken
474
+ - HuggingFace datasets: https://huggingface.co/datasets
475
+ - OpenWebText: https://huggingface.co/datasets/Skylion007/openwebtext
476
+ - The Stack (code): https://huggingface.co/datasets/bigcode/the-stack