@synsci/cli-darwin-x64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,303 @@
1
+ # /// script
2
+ # requires-python = ">=3.10"
3
+ # dependencies = [
4
+ # "lighteval[accelerate,vllm]>=0.6.0",
5
+ # "torch>=2.0.0",
6
+ # "transformers>=4.40.0",
7
+ # "accelerate>=0.30.0",
8
+ # "vllm>=0.4.0",
9
+ # ]
10
+ # ///
11
+
12
+ """
13
+ Entry point script for running lighteval evaluations with vLLM backend via `hf jobs uv run`.
14
+
15
+ This script runs evaluations using vLLM for efficient GPU inference on custom HuggingFace models.
16
+ It is separate from inference provider scripts and evaluates models directly on the hardware.
17
+
18
+ Usage (standalone):
19
+ python lighteval_vllm_uv.py --model "meta-llama/Llama-3.2-1B" --tasks "leaderboard|mmlu|5"
20
+
21
+ Usage (via HF Jobs):
22
+ hf jobs uv run lighteval_vllm_uv.py \\
23
+ --flavor a10g-small \\
24
+ --secret HF_TOKEN=$HF_TOKEN \\
25
+ -- --model "meta-llama/Llama-3.2-1B" --tasks "leaderboard|mmlu|5"
26
+ """
27
+
28
+ from __future__ import annotations
29
+
30
+ import argparse
31
+ import os
32
+ import subprocess
33
+ import sys
34
+ from typing import Optional
35
+
36
+
37
def setup_environment() -> None:
    """Propagate ``HF_TOKEN`` to the other Hugging Face token variables.

    When ``HF_TOKEN`` is set to a non-empty value, it is copied into
    ``HUGGING_FACE_HUB_TOKEN`` and ``HF_HUB_TOKEN``. Values already present
    under those names are left untouched. Does nothing when ``HF_TOKEN`` is
    unset or empty.
    """
    token = os.environ.get("HF_TOKEN")
    if not token:
        return

    # setdefault keeps any value the caller exported explicitly.
    for alias in ("HUGGING_FACE_HUB_TOKEN", "HF_HUB_TOKEN"):
        os.environ.setdefault(alias, token)
43
+
44
+
45
def run_lighteval_vllm(
    model_id: str,
    tasks: str,
    output_dir: Optional[str] = None,
    max_samples: Optional[int] = None,
    batch_size: int = 1,
    tensor_parallel_size: int = 1,
    gpu_memory_utilization: float = 0.8,
    dtype: str = "auto",
    trust_remote_code: bool = False,
    use_chat_template: bool = False,
    system_prompt: Optional[str] = None,
) -> None:
    """
    Run lighteval with vLLM backend for efficient GPU inference.

    Assembles a ``lighteval vllm`` command line from the arguments, echoes it,
    and runs it as a child process.

    Args:
        model_id: HuggingFace model ID (e.g., "meta-llama/Llama-3.2-1B")
        tasks: Task specification (e.g., "leaderboard|mmlu|5" or "lighteval|hellaswag|0")
        output_dir: Directory for evaluation results
        max_samples: Limit number of samples per task; ``None`` omits the flag
        batch_size: Batch size for evaluation
        tensor_parallel_size: Number of GPUs for tensor parallelism
        gpu_memory_utilization: GPU memory fraction to use (0.0-1.0)
        dtype: Data type for model weights (auto, float16, bfloat16)
        trust_remote_code: Allow executing remote code from model repo
        use_chat_template: Apply chat template for conversational models
        system_prompt: System prompt for chat models

    Raises:
        SystemExit: With the child's exit code when the command exits non-zero.
    """
    import shlex  # local import: only needed to render the command for the log line

    setup_environment()

    # Build lighteval vllm command
    # NOTE(review): lighteval's documented CLI appears to take model settings
    # (dtype, tensor_parallel_size, ...) as a comma-separated model_args string
    # rather than separate flags -- confirm against the pinned lighteval version.
    cmd = [
        "lighteval",
        "vllm",
        model_id,
        tasks,
        "--batch-size", str(batch_size),
        "--tensor-parallel-size", str(tensor_parallel_size),
        "--gpu-memory-utilization", str(gpu_memory_utilization),
        "--dtype", dtype,
    ]

    if output_dir:
        cmd.extend(["--output-dir", output_dir])

    # Compare against None so that an explicit 0 is forwarded instead of being
    # silently dropped (which would run the evaluation without any limit).
    if max_samples is not None:
        cmd.extend(["--max-samples", str(max_samples)])

    if trust_remote_code:
        cmd.append("--trust-remote-code")

    if use_chat_template:
        cmd.append("--use-chat-template")

    if system_prompt:
        cmd.extend(["--system-prompt", system_prompt])

    # Task specs contain "|" and prompts contain spaces; shlex.join quotes them
    # so the echoed command is unambiguous and can be pasted into a shell.
    print(f"Running: {shlex.join(cmd)}")

    try:
        subprocess.run(cmd, check=True)
    except subprocess.CalledProcessError as exc:
        print(f"Evaluation failed with exit code {exc.returncode}", file=sys.stderr)
        sys.exit(exc.returncode)
    else:
        print("Evaluation complete.")
111
+
112
+
113
def run_lighteval_accelerate(
    model_id: str,
    tasks: str,
    output_dir: Optional[str] = None,
    max_samples: Optional[int] = None,
    batch_size: int = 1,
    dtype: str = "bfloat16",
    trust_remote_code: bool = False,
    use_chat_template: bool = False,
    system_prompt: Optional[str] = None,
) -> None:
    """
    Run lighteval with accelerate backend for multi-GPU distributed inference.

    Use this backend when vLLM is not available or for models not supported by vLLM.
    Assembles a ``lighteval accelerate`` command line from the arguments,
    echoes it, and runs it as a child process.

    Args:
        model_id: HuggingFace model ID
        tasks: Task specification
        output_dir: Directory for evaluation results
        max_samples: Limit number of samples per task; ``None`` omits the flag
        batch_size: Batch size for evaluation
        dtype: Data type for model weights
        trust_remote_code: Allow executing remote code
        use_chat_template: Apply chat template
        system_prompt: System prompt for chat models

    Raises:
        SystemExit: With the child's exit code when the command exits non-zero.
    """
    import shlex  # local import: only needed to render the command for the log line

    setup_environment()

    # Build lighteval accelerate command
    # NOTE(review): lighteval's documented CLI appears to take model settings
    # (e.g. dtype) as a comma-separated model_args string rather than separate
    # flags -- confirm against the pinned lighteval version.
    cmd = [
        "lighteval",
        "accelerate",
        model_id,
        tasks,
        "--batch-size", str(batch_size),
        "--dtype", dtype,
    ]

    if output_dir:
        cmd.extend(["--output-dir", output_dir])

    # Compare against None so that an explicit 0 is forwarded instead of being
    # silently dropped (which would run the evaluation without any limit).
    if max_samples is not None:
        cmd.extend(["--max-samples", str(max_samples)])

    if trust_remote_code:
        cmd.append("--trust-remote-code")

    if use_chat_template:
        cmd.append("--use-chat-template")

    if system_prompt:
        cmd.extend(["--system-prompt", system_prompt])

    # Task specs contain "|" and prompts contain spaces; shlex.join quotes them
    # so the echoed command is unambiguous and can be pasted into a shell.
    print(f"Running: {shlex.join(cmd)}")

    try:
        subprocess.run(cmd, check=True)
    except subprocess.CalledProcessError as exc:
        print(f"Evaluation failed with exit code {exc.returncode}", file=sys.stderr)
        sys.exit(exc.returncode)
    else:
        print("Evaluation complete.")
175
+
176
+
177
def main() -> None:
    """
    Command-line entry point for the lighteval runner.

    Parses the CLI options, then hands them to ``run_lighteval_vllm`` when
    ``--backend vllm`` is selected (the default) and to
    ``run_lighteval_accelerate`` otherwise. For the accelerate backend a
    ``--dtype`` of ``auto`` is replaced by ``bfloat16`` before dispatch.
    """
    # NOTE(review): this text is shown verbatim by RawDescriptionHelpFormatter.
    # The leading whitespace of these lines could not be recovered from the
    # flattened diff view -- confirm against the released script.
    usage_examples = """
Examples:
# Run MMLU evaluation with vLLM
python lighteval_vllm_uv.py --model meta-llama/Llama-3.2-1B --tasks "leaderboard|mmlu|5"

# Run with accelerate backend instead of vLLM
python lighteval_vllm_uv.py --model meta-llama/Llama-3.2-1B --tasks "leaderboard|mmlu|5" --backend accelerate

# Run with chat template for instruction-tuned models
python lighteval_vllm_uv.py --model meta-llama/Llama-3.2-1B-Instruct --tasks "leaderboard|mmlu|5" --use-chat-template

# Run with limited samples for testing
python lighteval_vllm_uv.py --model meta-llama/Llama-3.2-1B --tasks "leaderboard|mmlu|5" --max-samples 10

Task format:
Tasks use the format: "suite|task|num_fewshot"
- leaderboard|mmlu|5 (MMLU with 5-shot)
- lighteval|hellaswag|0 (HellaSwag zero-shot)
- leaderboard|gsm8k|5 (GSM8K with 5-shot)
- Multiple tasks: "leaderboard|mmlu|5,leaderboard|gsm8k|5"
"""

    cli = argparse.ArgumentParser(
        description="Run lighteval evaluations with vLLM or accelerate backend on custom HuggingFace models",
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog=usage_examples,
    )

    # One (flag, add_argument keyword arguments) entry per option, registered
    # in this order so the generated --help listing keeps the same ordering.
    option_table = [
        ("--model", {
            "required": True,
            "help": "HuggingFace model ID (e.g., meta-llama/Llama-3.2-1B)",
        }),
        ("--tasks", {
            "required": True,
            "help": "Task specification (e.g., 'leaderboard|mmlu|5')",
        }),
        ("--backend", {
            "choices": ["vllm", "accelerate"],
            "default": "vllm",
            "help": "Inference backend to use (default: vllm)",
        }),
        ("--output-dir", {
            "default": None,
            "help": "Directory for evaluation results",
        }),
        ("--max-samples", {
            "type": int,
            "default": None,
            "help": "Limit number of samples per task (useful for testing)",
        }),
        ("--batch-size", {
            "type": int,
            "default": 1,
            "help": "Batch size for evaluation (default: 1)",
        }),
        ("--tensor-parallel-size", {
            "type": int,
            "default": 1,
            "help": "Number of GPUs for tensor parallelism (vLLM only, default: 1)",
        }),
        ("--gpu-memory-utilization", {
            "type": float,
            "default": 0.8,
            "help": "GPU memory fraction to use (vLLM only, default: 0.8)",
        }),
        ("--dtype", {
            "default": "auto",
            "choices": ["auto", "float16", "bfloat16", "float32"],
            "help": "Data type for model weights (default: auto)",
        }),
        ("--trust-remote-code", {
            "action": "store_true",
            "help": "Allow executing remote code from model repository",
        }),
        ("--use-chat-template", {
            "action": "store_true",
            "help": "Apply chat template for instruction-tuned/chat models",
        }),
        ("--system-prompt", {
            "default": None,
            "help": "System prompt for chat models",
        }),
    ]
    for flag, spec in option_table:
        cli.add_argument(flag, **spec)

    opts = cli.parse_args()

    # Keyword arguments that both backend runners receive unchanged.
    shared_kwargs = {
        "model_id": opts.model,
        "tasks": opts.tasks,
        "output_dir": opts.output_dir,
        "max_samples": opts.max_samples,
        "batch_size": opts.batch_size,
        "trust_remote_code": opts.trust_remote_code,
        "use_chat_template": opts.use_chat_template,
        "system_prompt": opts.system_prompt,
    }

    if opts.backend != "vllm":
        # The accelerate path is never handed "auto"; it is mapped to bfloat16.
        accelerate_dtype = "bfloat16" if opts.dtype == "auto" else opts.dtype
        run_lighteval_accelerate(dtype=accelerate_dtype, **shared_kwargs)
        return

    run_lighteval_vllm(
        tensor_parallel_size=opts.tensor_parallel_size,
        gpu_memory_utilization=opts.gpu_memory_utilization,
        dtype=opts.dtype,
        **shared_kwargs,
    )


if __name__ == "__main__":
    main()
303
+
@@ -0,0 +1,98 @@
1
+ # /// script
2
+ # requires-python = ">=3.10"
3
+ # dependencies = [
4
+ # "huggingface-hub>=0.26.0",
5
+ # "python-dotenv>=1.2.1",
6
+ # ]
7
+ # ///
8
+
9
+ """
10
+ Submit evaluation jobs using the `hf jobs uv run` CLI.
11
+
12
+ This wrapper constructs the appropriate command to execute the local
13
+ `inspect_eval_uv.py` script on Hugging Face Jobs with the requested hardware.
14
+ """
15
+
16
+ import argparse
17
+ import os
18
+ import subprocess
19
+ import sys
20
+ from pathlib import Path
21
+ from typing import Optional
22
+
23
+ from huggingface_hub import get_token
24
+ from dotenv import load_dotenv
25
+
26
+ load_dotenv()
27
+
28
+
29
# Absolute path of the evaluation script expected to sit next to this file.
SCRIPT_PATH = Path(__file__).with_name("inspect_eval_uv.py").resolve()


def create_eval_job(
    model_id: str,
    task: str,
    hardware: str = "cpu-basic",
    hf_token: Optional[str] = None,
    limit: Optional[int] = None,
) -> None:
    """
    Submit an evaluation job using the Hugging Face Jobs CLI.

    Builds an ``hf jobs uv run`` command that runs ``SCRIPT_PATH`` with the
    requested hardware flavor and executes it as a subprocess. The command
    is echoed to stdout before it runs, with the token value masked.

    Args:
        model_id: Model ID forwarded to the script as ``--model``.
        task: Task name forwarded to the script as ``--task``.
        hardware: Value passed to ``--flavor``.
        hf_token: Token to use. Falls back to the ``HF_TOKEN`` environment
            variable and then to ``get_token()``.
        limit: When truthy, forwarded to the script as ``--limit``.

    Raises:
        ValueError: If no token can be resolved.
        FileNotFoundError: If ``SCRIPT_PATH`` does not exist.
        subprocess.CalledProcessError: If the ``hf`` command exits non-zero.
    """
    token = hf_token or os.getenv("HF_TOKEN") or get_token()
    if not token:
        raise ValueError("HF_TOKEN is required. Set it in environment or pass as argument.")

    if not SCRIPT_PATH.exists():
        raise FileNotFoundError(f"Script not found at {SCRIPT_PATH}")

    print(f"Preparing evaluation job for {model_id} on task {task} (hardware: {hardware})")

    # NOTE(review): the token is still passed on the command line, where other
    # local processes may be able to read it. Consider supplying it through
    # the environment instead -- confirm what `--secrets` accepts first.
    secret_arg = f"HF_TOKEN={token}"
    cmd = [
        "hf",
        "jobs",
        "uv",
        "run",
        str(SCRIPT_PATH),
        "--flavor",
        hardware,
        "--secrets",
        secret_arg,
        "--",
        "--model",
        model_id,
        "--task",
        task,
    ]

    if limit:
        cmd.extend(["--limit", str(limit)])

    # Mask the secret in the echoed command so the token never reaches
    # stdout or captured logs; the executed command itself is unchanged.
    printable = ["HF_TOKEN=***" if part == secret_arg else part for part in cmd]
    print("Executing:", " ".join(printable))

    try:
        subprocess.run(cmd, check=True)
    except subprocess.CalledProcessError:
        print("hf jobs command failed", file=sys.stderr)
        raise
78
+
79
+
80
def main() -> None:
    """
    Command-line entry point for submitting an evaluation job.

    Reads ``--model``, ``--task``, ``--hardware`` and ``--limit`` from the
    command line and forwards them to ``create_eval_job``.
    """
    cli = argparse.ArgumentParser(description="Run inspect-ai evaluations on Hugging Face Jobs")

    # The two mandatory options differ only in flag name and help text.
    mandatory_options = (
        ("--model", "Model ID (e.g. Qwen/Qwen3-0.6B)"),
        ("--task", "Inspect task (e.g. mmlu, gsm8k)"),
    )
    for flag, description in mandatory_options:
        cli.add_argument(flag, required=True, help=description)

    cli.add_argument(
        "--hardware",
        default="cpu-basic",
        help="Hardware flavor (e.g. t4-small, a10g-small)",
    )
    cli.add_argument(
        "--limit",
        type=int,
        default=None,
        help="Limit number of samples to evaluate",
    )

    opts = cli.parse_args()

    job_kwargs = {
        "model_id": opts.model,
        "task": opts.task,
        "hardware": opts.hardware,
        "limit": opts.limit,
    }
    create_eval_job(**job_kwargs)


if __name__ == "__main__":
    main()