@synsci/cli-darwin-x64 1.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (373) hide show
  1. package/bin/skills/accelerate/SKILL.md +332 -0
  2. package/bin/skills/accelerate/references/custom-plugins.md +453 -0
  3. package/bin/skills/accelerate/references/megatron-integration.md +489 -0
  4. package/bin/skills/accelerate/references/performance.md +525 -0
  5. package/bin/skills/audiocraft/SKILL.md +564 -0
  6. package/bin/skills/audiocraft/references/advanced-usage.md +666 -0
  7. package/bin/skills/audiocraft/references/troubleshooting.md +504 -0
  8. package/bin/skills/autogpt/SKILL.md +403 -0
  9. package/bin/skills/autogpt/references/advanced-usage.md +535 -0
  10. package/bin/skills/autogpt/references/troubleshooting.md +420 -0
  11. package/bin/skills/awq/SKILL.md +310 -0
  12. package/bin/skills/awq/references/advanced-usage.md +324 -0
  13. package/bin/skills/awq/references/troubleshooting.md +344 -0
  14. package/bin/skills/axolotl/SKILL.md +158 -0
  15. package/bin/skills/axolotl/references/api.md +5548 -0
  16. package/bin/skills/axolotl/references/dataset-formats.md +1029 -0
  17. package/bin/skills/axolotl/references/index.md +15 -0
  18. package/bin/skills/axolotl/references/other.md +3563 -0
  19. package/bin/skills/bigcode-evaluation-harness/SKILL.md +405 -0
  20. package/bin/skills/bigcode-evaluation-harness/references/benchmarks.md +393 -0
  21. package/bin/skills/bigcode-evaluation-harness/references/custom-tasks.md +424 -0
  22. package/bin/skills/bigcode-evaluation-harness/references/issues.md +394 -0
  23. package/bin/skills/bitsandbytes/SKILL.md +411 -0
  24. package/bin/skills/bitsandbytes/references/memory-optimization.md +521 -0
  25. package/bin/skills/bitsandbytes/references/qlora-training.md +521 -0
  26. package/bin/skills/bitsandbytes/references/quantization-formats.md +447 -0
  27. package/bin/skills/blip-2/SKILL.md +564 -0
  28. package/bin/skills/blip-2/references/advanced-usage.md +680 -0
  29. package/bin/skills/blip-2/references/troubleshooting.md +526 -0
  30. package/bin/skills/chroma/SKILL.md +406 -0
  31. package/bin/skills/chroma/references/integration.md +38 -0
  32. package/bin/skills/clip/SKILL.md +253 -0
  33. package/bin/skills/clip/references/applications.md +207 -0
  34. package/bin/skills/constitutional-ai/SKILL.md +290 -0
  35. package/bin/skills/crewai/SKILL.md +498 -0
  36. package/bin/skills/crewai/references/flows.md +438 -0
  37. package/bin/skills/crewai/references/tools.md +429 -0
  38. package/bin/skills/crewai/references/troubleshooting.md +480 -0
  39. package/bin/skills/deepspeed/SKILL.md +141 -0
  40. package/bin/skills/deepspeed/references/08.md +17 -0
  41. package/bin/skills/deepspeed/references/09.md +173 -0
  42. package/bin/skills/deepspeed/references/2020.md +378 -0
  43. package/bin/skills/deepspeed/references/2023.md +279 -0
  44. package/bin/skills/deepspeed/references/assets.md +179 -0
  45. package/bin/skills/deepspeed/references/index.md +35 -0
  46. package/bin/skills/deepspeed/references/mii.md +118 -0
  47. package/bin/skills/deepspeed/references/other.md +1191 -0
  48. package/bin/skills/deepspeed/references/tutorials.md +6554 -0
  49. package/bin/skills/dspy/SKILL.md +590 -0
  50. package/bin/skills/dspy/references/examples.md +663 -0
  51. package/bin/skills/dspy/references/modules.md +475 -0
  52. package/bin/skills/dspy/references/optimizers.md +566 -0
  53. package/bin/skills/faiss/SKILL.md +221 -0
  54. package/bin/skills/faiss/references/index_types.md +280 -0
  55. package/bin/skills/flash-attention/SKILL.md +367 -0
  56. package/bin/skills/flash-attention/references/benchmarks.md +215 -0
  57. package/bin/skills/flash-attention/references/transformers-integration.md +293 -0
  58. package/bin/skills/gguf/SKILL.md +427 -0
  59. package/bin/skills/gguf/references/advanced-usage.md +504 -0
  60. package/bin/skills/gguf/references/troubleshooting.md +442 -0
  61. package/bin/skills/gptq/SKILL.md +450 -0
  62. package/bin/skills/gptq/references/calibration.md +337 -0
  63. package/bin/skills/gptq/references/integration.md +129 -0
  64. package/bin/skills/gptq/references/troubleshooting.md +95 -0
  65. package/bin/skills/grpo-rl-training/README.md +97 -0
  66. package/bin/skills/grpo-rl-training/SKILL.md +572 -0
  67. package/bin/skills/grpo-rl-training/examples/reward_functions_library.py +393 -0
  68. package/bin/skills/grpo-rl-training/templates/basic_grpo_training.py +228 -0
  69. package/bin/skills/guidance/SKILL.md +572 -0
  70. package/bin/skills/guidance/references/backends.md +554 -0
  71. package/bin/skills/guidance/references/constraints.md +674 -0
  72. package/bin/skills/guidance/references/examples.md +767 -0
  73. package/bin/skills/hqq/SKILL.md +445 -0
  74. package/bin/skills/hqq/references/advanced-usage.md +528 -0
  75. package/bin/skills/hqq/references/troubleshooting.md +503 -0
  76. package/bin/skills/hugging-face-cli/SKILL.md +191 -0
  77. package/bin/skills/hugging-face-cli/references/commands.md +954 -0
  78. package/bin/skills/hugging-face-cli/references/examples.md +374 -0
  79. package/bin/skills/hugging-face-datasets/SKILL.md +547 -0
  80. package/bin/skills/hugging-face-datasets/examples/diverse_training_examples.json +239 -0
  81. package/bin/skills/hugging-face-datasets/examples/system_prompt_template.txt +196 -0
  82. package/bin/skills/hugging-face-datasets/examples/training_examples.json +176 -0
  83. package/bin/skills/hugging-face-datasets/scripts/dataset_manager.py +522 -0
  84. package/bin/skills/hugging-face-datasets/scripts/sql_manager.py +844 -0
  85. package/bin/skills/hugging-face-datasets/templates/chat.json +55 -0
  86. package/bin/skills/hugging-face-datasets/templates/classification.json +62 -0
  87. package/bin/skills/hugging-face-datasets/templates/completion.json +51 -0
  88. package/bin/skills/hugging-face-datasets/templates/custom.json +75 -0
  89. package/bin/skills/hugging-face-datasets/templates/qa.json +54 -0
  90. package/bin/skills/hugging-face-datasets/templates/tabular.json +81 -0
  91. package/bin/skills/hugging-face-evaluation/SKILL.md +656 -0
  92. package/bin/skills/hugging-face-evaluation/examples/USAGE_EXAMPLES.md +382 -0
  93. package/bin/skills/hugging-face-evaluation/examples/artificial_analysis_to_hub.py +141 -0
  94. package/bin/skills/hugging-face-evaluation/examples/example_readme_tables.md +135 -0
  95. package/bin/skills/hugging-face-evaluation/examples/metric_mapping.json +50 -0
  96. package/bin/skills/hugging-face-evaluation/requirements.txt +20 -0
  97. package/bin/skills/hugging-face-evaluation/scripts/evaluation_manager.py +1374 -0
  98. package/bin/skills/hugging-face-evaluation/scripts/inspect_eval_uv.py +104 -0
  99. package/bin/skills/hugging-face-evaluation/scripts/inspect_vllm_uv.py +317 -0
  100. package/bin/skills/hugging-face-evaluation/scripts/lighteval_vllm_uv.py +303 -0
  101. package/bin/skills/hugging-face-evaluation/scripts/run_eval_job.py +98 -0
  102. package/bin/skills/hugging-face-evaluation/scripts/run_vllm_eval_job.py +331 -0
  103. package/bin/skills/hugging-face-evaluation/scripts/test_extraction.py +206 -0
  104. package/bin/skills/hugging-face-jobs/SKILL.md +1041 -0
  105. package/bin/skills/hugging-face-jobs/index.html +216 -0
  106. package/bin/skills/hugging-face-jobs/references/hardware_guide.md +336 -0
  107. package/bin/skills/hugging-face-jobs/references/hub_saving.md +352 -0
  108. package/bin/skills/hugging-face-jobs/references/token_usage.md +546 -0
  109. package/bin/skills/hugging-face-jobs/references/troubleshooting.md +475 -0
  110. package/bin/skills/hugging-face-jobs/scripts/cot-self-instruct.py +718 -0
  111. package/bin/skills/hugging-face-jobs/scripts/finepdfs-stats.py +546 -0
  112. package/bin/skills/hugging-face-jobs/scripts/generate-responses.py +587 -0
  113. package/bin/skills/hugging-face-model-trainer/SKILL.md +711 -0
  114. package/bin/skills/hugging-face-model-trainer/references/gguf_conversion.md +296 -0
  115. package/bin/skills/hugging-face-model-trainer/references/hardware_guide.md +283 -0
  116. package/bin/skills/hugging-face-model-trainer/references/hub_saving.md +364 -0
  117. package/bin/skills/hugging-face-model-trainer/references/reliability_principles.md +371 -0
  118. package/bin/skills/hugging-face-model-trainer/references/trackio_guide.md +189 -0
  119. package/bin/skills/hugging-face-model-trainer/references/training_methods.md +150 -0
  120. package/bin/skills/hugging-face-model-trainer/references/training_patterns.md +203 -0
  121. package/bin/skills/hugging-face-model-trainer/references/troubleshooting.md +282 -0
  122. package/bin/skills/hugging-face-model-trainer/scripts/convert_to_gguf.py +424 -0
  123. package/bin/skills/hugging-face-model-trainer/scripts/dataset_inspector.py +417 -0
  124. package/bin/skills/hugging-face-model-trainer/scripts/estimate_cost.py +150 -0
  125. package/bin/skills/hugging-face-model-trainer/scripts/train_dpo_example.py +106 -0
  126. package/bin/skills/hugging-face-model-trainer/scripts/train_grpo_example.py +89 -0
  127. package/bin/skills/hugging-face-model-trainer/scripts/train_sft_example.py +122 -0
  128. package/bin/skills/hugging-face-paper-publisher/SKILL.md +627 -0
  129. package/bin/skills/hugging-face-paper-publisher/examples/example_usage.md +327 -0
  130. package/bin/skills/hugging-face-paper-publisher/references/quick_reference.md +216 -0
  131. package/bin/skills/hugging-face-paper-publisher/scripts/paper_manager.py +508 -0
  132. package/bin/skills/hugging-face-paper-publisher/templates/arxiv.md +299 -0
  133. package/bin/skills/hugging-face-paper-publisher/templates/ml-report.md +358 -0
  134. package/bin/skills/hugging-face-paper-publisher/templates/modern.md +319 -0
  135. package/bin/skills/hugging-face-paper-publisher/templates/standard.md +201 -0
  136. package/bin/skills/hugging-face-tool-builder/SKILL.md +115 -0
  137. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.py +57 -0
  138. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.sh +40 -0
  139. package/bin/skills/hugging-face-tool-builder/references/baseline_hf_api.tsx +57 -0
  140. package/bin/skills/hugging-face-tool-builder/references/find_models_by_paper.sh +230 -0
  141. package/bin/skills/hugging-face-tool-builder/references/hf_enrich_models.sh +96 -0
  142. package/bin/skills/hugging-face-tool-builder/references/hf_model_card_frontmatter.sh +188 -0
  143. package/bin/skills/hugging-face-tool-builder/references/hf_model_papers_auth.sh +171 -0
  144. package/bin/skills/hugging-face-trackio/SKILL.md +65 -0
  145. package/bin/skills/hugging-face-trackio/references/logging_metrics.md +206 -0
  146. package/bin/skills/hugging-face-trackio/references/retrieving_metrics.md +223 -0
  147. package/bin/skills/huggingface-tokenizers/SKILL.md +516 -0
  148. package/bin/skills/huggingface-tokenizers/references/algorithms.md +653 -0
  149. package/bin/skills/huggingface-tokenizers/references/integration.md +637 -0
  150. package/bin/skills/huggingface-tokenizers/references/pipeline.md +723 -0
  151. package/bin/skills/huggingface-tokenizers/references/training.md +565 -0
  152. package/bin/skills/instructor/SKILL.md +740 -0
  153. package/bin/skills/instructor/references/examples.md +107 -0
  154. package/bin/skills/instructor/references/providers.md +70 -0
  155. package/bin/skills/instructor/references/validation.md +606 -0
  156. package/bin/skills/knowledge-distillation/SKILL.md +458 -0
  157. package/bin/skills/knowledge-distillation/references/minillm.md +334 -0
  158. package/bin/skills/lambda-labs/SKILL.md +545 -0
  159. package/bin/skills/lambda-labs/references/advanced-usage.md +611 -0
  160. package/bin/skills/lambda-labs/references/troubleshooting.md +530 -0
  161. package/bin/skills/langchain/SKILL.md +480 -0
  162. package/bin/skills/langchain/references/agents.md +499 -0
  163. package/bin/skills/langchain/references/integration.md +562 -0
  164. package/bin/skills/langchain/references/rag.md +600 -0
  165. package/bin/skills/langsmith/SKILL.md +422 -0
  166. package/bin/skills/langsmith/references/advanced-usage.md +548 -0
  167. package/bin/skills/langsmith/references/troubleshooting.md +537 -0
  168. package/bin/skills/litgpt/SKILL.md +469 -0
  169. package/bin/skills/litgpt/references/custom-models.md +568 -0
  170. package/bin/skills/litgpt/references/distributed-training.md +451 -0
  171. package/bin/skills/litgpt/references/supported-models.md +336 -0
  172. package/bin/skills/litgpt/references/training-recipes.md +619 -0
  173. package/bin/skills/llama-cpp/SKILL.md +258 -0
  174. package/bin/skills/llama-cpp/references/optimization.md +89 -0
  175. package/bin/skills/llama-cpp/references/quantization.md +213 -0
  176. package/bin/skills/llama-cpp/references/server.md +125 -0
  177. package/bin/skills/llama-factory/SKILL.md +80 -0
  178. package/bin/skills/llama-factory/references/_images.md +23 -0
  179. package/bin/skills/llama-factory/references/advanced.md +1055 -0
  180. package/bin/skills/llama-factory/references/getting_started.md +349 -0
  181. package/bin/skills/llama-factory/references/index.md +19 -0
  182. package/bin/skills/llama-factory/references/other.md +31 -0
  183. package/bin/skills/llamaguard/SKILL.md +337 -0
  184. package/bin/skills/llamaindex/SKILL.md +569 -0
  185. package/bin/skills/llamaindex/references/agents.md +83 -0
  186. package/bin/skills/llamaindex/references/data_connectors.md +108 -0
  187. package/bin/skills/llamaindex/references/query_engines.md +406 -0
  188. package/bin/skills/llava/SKILL.md +304 -0
  189. package/bin/skills/llava/references/training.md +197 -0
  190. package/bin/skills/lm-evaluation-harness/SKILL.md +490 -0
  191. package/bin/skills/lm-evaluation-harness/references/api-evaluation.md +490 -0
  192. package/bin/skills/lm-evaluation-harness/references/benchmark-guide.md +488 -0
  193. package/bin/skills/lm-evaluation-harness/references/custom-tasks.md +602 -0
  194. package/bin/skills/lm-evaluation-harness/references/distributed-eval.md +519 -0
  195. package/bin/skills/long-context/SKILL.md +536 -0
  196. package/bin/skills/long-context/references/extension_methods.md +468 -0
  197. package/bin/skills/long-context/references/fine_tuning.md +611 -0
  198. package/bin/skills/long-context/references/rope.md +402 -0
  199. package/bin/skills/mamba/SKILL.md +260 -0
  200. package/bin/skills/mamba/references/architecture-details.md +206 -0
  201. package/bin/skills/mamba/references/benchmarks.md +255 -0
  202. package/bin/skills/mamba/references/training-guide.md +388 -0
  203. package/bin/skills/megatron-core/SKILL.md +366 -0
  204. package/bin/skills/megatron-core/references/benchmarks.md +249 -0
  205. package/bin/skills/megatron-core/references/parallelism-guide.md +404 -0
  206. package/bin/skills/megatron-core/references/production-examples.md +473 -0
  207. package/bin/skills/megatron-core/references/training-recipes.md +547 -0
  208. package/bin/skills/miles/SKILL.md +315 -0
  209. package/bin/skills/miles/references/api-reference.md +141 -0
  210. package/bin/skills/miles/references/troubleshooting.md +352 -0
  211. package/bin/skills/mlflow/SKILL.md +704 -0
  212. package/bin/skills/mlflow/references/deployment.md +744 -0
  213. package/bin/skills/mlflow/references/model-registry.md +770 -0
  214. package/bin/skills/mlflow/references/tracking.md +680 -0
  215. package/bin/skills/modal/SKILL.md +341 -0
  216. package/bin/skills/modal/references/advanced-usage.md +503 -0
  217. package/bin/skills/modal/references/troubleshooting.md +494 -0
  218. package/bin/skills/model-merging/SKILL.md +539 -0
  219. package/bin/skills/model-merging/references/evaluation.md +462 -0
  220. package/bin/skills/model-merging/references/examples.md +428 -0
  221. package/bin/skills/model-merging/references/methods.md +352 -0
  222. package/bin/skills/model-pruning/SKILL.md +495 -0
  223. package/bin/skills/model-pruning/references/wanda.md +347 -0
  224. package/bin/skills/moe-training/SKILL.md +526 -0
  225. package/bin/skills/moe-training/references/architectures.md +432 -0
  226. package/bin/skills/moe-training/references/inference.md +348 -0
  227. package/bin/skills/moe-training/references/training.md +425 -0
  228. package/bin/skills/nanogpt/SKILL.md +290 -0
  229. package/bin/skills/nanogpt/references/architecture.md +382 -0
  230. package/bin/skills/nanogpt/references/data.md +476 -0
  231. package/bin/skills/nanogpt/references/training.md +564 -0
  232. package/bin/skills/nemo-curator/SKILL.md +383 -0
  233. package/bin/skills/nemo-curator/references/deduplication.md +87 -0
  234. package/bin/skills/nemo-curator/references/filtering.md +102 -0
  235. package/bin/skills/nemo-evaluator/SKILL.md +494 -0
  236. package/bin/skills/nemo-evaluator/references/adapter-system.md +340 -0
  237. package/bin/skills/nemo-evaluator/references/configuration.md +447 -0
  238. package/bin/skills/nemo-evaluator/references/custom-benchmarks.md +315 -0
  239. package/bin/skills/nemo-evaluator/references/execution-backends.md +361 -0
  240. package/bin/skills/nemo-guardrails/SKILL.md +297 -0
  241. package/bin/skills/nnsight/SKILL.md +436 -0
  242. package/bin/skills/nnsight/references/README.md +78 -0
  243. package/bin/skills/nnsight/references/api.md +344 -0
  244. package/bin/skills/nnsight/references/tutorials.md +300 -0
  245. package/bin/skills/openrlhf/SKILL.md +249 -0
  246. package/bin/skills/openrlhf/references/algorithm-comparison.md +404 -0
  247. package/bin/skills/openrlhf/references/custom-rewards.md +530 -0
  248. package/bin/skills/openrlhf/references/hybrid-engine.md +287 -0
  249. package/bin/skills/openrlhf/references/multi-node-training.md +454 -0
  250. package/bin/skills/outlines/SKILL.md +652 -0
  251. package/bin/skills/outlines/references/backends.md +615 -0
  252. package/bin/skills/outlines/references/examples.md +773 -0
  253. package/bin/skills/outlines/references/json_generation.md +652 -0
  254. package/bin/skills/peft/SKILL.md +431 -0
  255. package/bin/skills/peft/references/advanced-usage.md +514 -0
  256. package/bin/skills/peft/references/troubleshooting.md +480 -0
  257. package/bin/skills/phoenix/SKILL.md +475 -0
  258. package/bin/skills/phoenix/references/advanced-usage.md +619 -0
  259. package/bin/skills/phoenix/references/troubleshooting.md +538 -0
  260. package/bin/skills/pinecone/SKILL.md +358 -0
  261. package/bin/skills/pinecone/references/deployment.md +181 -0
  262. package/bin/skills/pytorch-fsdp/SKILL.md +126 -0
  263. package/bin/skills/pytorch-fsdp/references/index.md +7 -0
  264. package/bin/skills/pytorch-fsdp/references/other.md +4249 -0
  265. package/bin/skills/pytorch-lightning/SKILL.md +346 -0
  266. package/bin/skills/pytorch-lightning/references/callbacks.md +436 -0
  267. package/bin/skills/pytorch-lightning/references/distributed.md +490 -0
  268. package/bin/skills/pytorch-lightning/references/hyperparameter-tuning.md +556 -0
  269. package/bin/skills/pyvene/SKILL.md +473 -0
  270. package/bin/skills/pyvene/references/README.md +73 -0
  271. package/bin/skills/pyvene/references/api.md +383 -0
  272. package/bin/skills/pyvene/references/tutorials.md +376 -0
  273. package/bin/skills/qdrant/SKILL.md +493 -0
  274. package/bin/skills/qdrant/references/advanced-usage.md +648 -0
  275. package/bin/skills/qdrant/references/troubleshooting.md +631 -0
  276. package/bin/skills/ray-data/SKILL.md +326 -0
  277. package/bin/skills/ray-data/references/integration.md +82 -0
  278. package/bin/skills/ray-data/references/transformations.md +83 -0
  279. package/bin/skills/ray-train/SKILL.md +406 -0
  280. package/bin/skills/ray-train/references/multi-node.md +628 -0
  281. package/bin/skills/rwkv/SKILL.md +260 -0
  282. package/bin/skills/rwkv/references/architecture-details.md +344 -0
  283. package/bin/skills/rwkv/references/rwkv7.md +386 -0
  284. package/bin/skills/rwkv/references/state-management.md +369 -0
  285. package/bin/skills/saelens/SKILL.md +386 -0
  286. package/bin/skills/saelens/references/README.md +70 -0
  287. package/bin/skills/saelens/references/api.md +333 -0
  288. package/bin/skills/saelens/references/tutorials.md +318 -0
  289. package/bin/skills/segment-anything/SKILL.md +500 -0
  290. package/bin/skills/segment-anything/references/advanced-usage.md +589 -0
  291. package/bin/skills/segment-anything/references/troubleshooting.md +484 -0
  292. package/bin/skills/sentence-transformers/SKILL.md +255 -0
  293. package/bin/skills/sentence-transformers/references/models.md +123 -0
  294. package/bin/skills/sentencepiece/SKILL.md +235 -0
  295. package/bin/skills/sentencepiece/references/algorithms.md +200 -0
  296. package/bin/skills/sentencepiece/references/training.md +304 -0
  297. package/bin/skills/sglang/SKILL.md +442 -0
  298. package/bin/skills/sglang/references/deployment.md +490 -0
  299. package/bin/skills/sglang/references/radix-attention.md +413 -0
  300. package/bin/skills/sglang/references/structured-generation.md +541 -0
  301. package/bin/skills/simpo/SKILL.md +219 -0
  302. package/bin/skills/simpo/references/datasets.md +478 -0
  303. package/bin/skills/simpo/references/hyperparameters.md +452 -0
  304. package/bin/skills/simpo/references/loss-functions.md +350 -0
  305. package/bin/skills/skypilot/SKILL.md +509 -0
  306. package/bin/skills/skypilot/references/advanced-usage.md +491 -0
  307. package/bin/skills/skypilot/references/troubleshooting.md +570 -0
  308. package/bin/skills/slime/SKILL.md +464 -0
  309. package/bin/skills/slime/references/api-reference.md +392 -0
  310. package/bin/skills/slime/references/troubleshooting.md +386 -0
  311. package/bin/skills/speculative-decoding/SKILL.md +467 -0
  312. package/bin/skills/speculative-decoding/references/lookahead.md +309 -0
  313. package/bin/skills/speculative-decoding/references/medusa.md +350 -0
  314. package/bin/skills/stable-diffusion/SKILL.md +519 -0
  315. package/bin/skills/stable-diffusion/references/advanced-usage.md +716 -0
  316. package/bin/skills/stable-diffusion/references/troubleshooting.md +555 -0
  317. package/bin/skills/tensorboard/SKILL.md +629 -0
  318. package/bin/skills/tensorboard/references/integrations.md +638 -0
  319. package/bin/skills/tensorboard/references/profiling.md +545 -0
  320. package/bin/skills/tensorboard/references/visualization.md +620 -0
  321. package/bin/skills/tensorrt-llm/SKILL.md +187 -0
  322. package/bin/skills/tensorrt-llm/references/multi-gpu.md +298 -0
  323. package/bin/skills/tensorrt-llm/references/optimization.md +242 -0
  324. package/bin/skills/tensorrt-llm/references/serving.md +470 -0
  325. package/bin/skills/tinker/SKILL.md +362 -0
  326. package/bin/skills/tinker/references/api-reference.md +168 -0
  327. package/bin/skills/tinker/references/getting-started.md +157 -0
  328. package/bin/skills/tinker/references/loss-functions.md +163 -0
  329. package/bin/skills/tinker/references/models-and-lora.md +139 -0
  330. package/bin/skills/tinker/references/recipes.md +280 -0
  331. package/bin/skills/tinker/references/reinforcement-learning.md +212 -0
  332. package/bin/skills/tinker/references/rendering.md +243 -0
  333. package/bin/skills/tinker/references/supervised-learning.md +232 -0
  334. package/bin/skills/tinker-training-cost/SKILL.md +187 -0
  335. package/bin/skills/tinker-training-cost/scripts/calculate_cost.py +123 -0
  336. package/bin/skills/torchforge/SKILL.md +433 -0
  337. package/bin/skills/torchforge/references/api-reference.md +327 -0
  338. package/bin/skills/torchforge/references/troubleshooting.md +409 -0
  339. package/bin/skills/torchtitan/SKILL.md +358 -0
  340. package/bin/skills/torchtitan/references/checkpoint.md +181 -0
  341. package/bin/skills/torchtitan/references/custom-models.md +258 -0
  342. package/bin/skills/torchtitan/references/float8.md +133 -0
  343. package/bin/skills/torchtitan/references/fsdp.md +126 -0
  344. package/bin/skills/transformer-lens/SKILL.md +346 -0
  345. package/bin/skills/transformer-lens/references/README.md +54 -0
  346. package/bin/skills/transformer-lens/references/api.md +362 -0
  347. package/bin/skills/transformer-lens/references/tutorials.md +339 -0
  348. package/bin/skills/trl-fine-tuning/SKILL.md +455 -0
  349. package/bin/skills/trl-fine-tuning/references/dpo-variants.md +227 -0
  350. package/bin/skills/trl-fine-tuning/references/online-rl.md +82 -0
  351. package/bin/skills/trl-fine-tuning/references/reward-modeling.md +122 -0
  352. package/bin/skills/trl-fine-tuning/references/sft-training.md +168 -0
  353. package/bin/skills/unsloth/SKILL.md +80 -0
  354. package/bin/skills/unsloth/references/index.md +7 -0
  355. package/bin/skills/unsloth/references/llms-full.md +16799 -0
  356. package/bin/skills/unsloth/references/llms-txt.md +12044 -0
  357. package/bin/skills/unsloth/references/llms.md +82 -0
  358. package/bin/skills/verl/SKILL.md +391 -0
  359. package/bin/skills/verl/references/api-reference.md +301 -0
  360. package/bin/skills/verl/references/troubleshooting.md +391 -0
  361. package/bin/skills/vllm/SKILL.md +364 -0
  362. package/bin/skills/vllm/references/optimization.md +226 -0
  363. package/bin/skills/vllm/references/quantization.md +284 -0
  364. package/bin/skills/vllm/references/server-deployment.md +255 -0
  365. package/bin/skills/vllm/references/troubleshooting.md +447 -0
  366. package/bin/skills/weights-and-biases/SKILL.md +590 -0
  367. package/bin/skills/weights-and-biases/references/artifacts.md +584 -0
  368. package/bin/skills/weights-and-biases/references/integrations.md +700 -0
  369. package/bin/skills/weights-and-biases/references/sweeps.md +847 -0
  370. package/bin/skills/whisper/SKILL.md +317 -0
  371. package/bin/skills/whisper/references/languages.md +189 -0
  372. package/bin/synsc +0 -0
  373. package/package.json +10 -0
@@ -0,0 +1,442 @@
1
+ ---
2
+ name: sglang
3
+ description: Fast structured generation and serving for LLMs with RadixAttention prefix caching. Use for JSON/regex outputs, constrained decoding, agentic workflows with tool calls, or when you need 5× faster inference than vLLM with prefix sharing. Powers 300,000+ GPUs at xAI, AMD, NVIDIA, and LinkedIn.
4
+ version: 1.0.0
5
+ author: Synthetic Sciences
6
+ license: MIT
7
+ tags: [Inference Serving, SGLang, Structured Generation, RadixAttention, Prefix Caching, Constrained Decoding, Agents, JSON Output, Fast Inference, Production Scale]
8
+ dependencies: [sglang, torch, transformers]
9
+ ---
10
+
11
+ # SGLang
12
+
13
+ High-performance serving framework for LLMs and VLMs with RadixAttention for automatic prefix caching.
14
+
15
+ ## When to use SGLang
16
+
17
+ **Use SGLang when:**
18
+ - Need structured outputs (JSON, regex, grammar)
19
+ - Building agents with repeated prefixes (system prompts, tools)
20
+ - Agentic workflows with function calling
21
+ - Multi-turn conversations with shared context
22
+ - Need faster JSON decoding (3× vs standard)
23
+
24
+ **Use vLLM instead when:**
25
+ - Simple text generation without structure
26
+ - Don't need prefix caching
27
+ - Want mature, widely-tested production system
28
+
29
+ **Use TensorRT-LLM instead when:**
30
+ - Need the lowest possible single-request latency (no batching needed)
31
+ - NVIDIA-only deployment
32
+ - Need FP8/INT4 quantization on H100
33
+
34
+ ## Quick start
35
+
36
+ ### Installation
37
+
38
+ ```bash
39
+ # pip install (recommended)
40
+ pip install "sglang[all]"
41
+
42
+ # With FlashInfer (faster, CUDA 11.8/12.1)
43
+ pip install "sglang[all]" && pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/
44
+
45
+ # From source
46
+ git clone https://github.com/sgl-project/sglang.git
47
+ cd sglang
48
+ pip install -e "python[all]"
49
+ ```
50
+
51
+ ### Launch server
52
+
53
+ ```bash
54
+ # Basic server (Llama 3-8B)
55
+ python -m sglang.launch_server \
56
+ --model-path meta-llama/Meta-Llama-3-8B-Instruct \
57
+ --port 30000
58
+
59
+ # With RadixAttention (automatic prefix caching)
60
+ python -m sglang.launch_server \
61
+ --model-path meta-llama/Meta-Llama-3-8B-Instruct \
62
+ --port 30000
63
+ # RadixAttention is enabled by default; pass --disable-radix-cache to turn it off
64
+
65
+ # Multi-GPU (tensor parallelism)
66
+ python -m sglang.launch_server \
67
+ --model-path meta-llama/Meta-Llama-3-70B-Instruct \
68
+ --tp 4 \
69
+ --port 30000
70
+ ```
71
+
72
+ ### Basic inference
73
+
74
+ ```python
75
+ import sglang as sgl
76
+
77
+ # Set backend
78
+ sgl.set_default_backend(sgl.RuntimeEndpoint("http://localhost:30000"))
79
+
80
+ # Simple generation
81
+ @sgl.function
82
+ def simple_gen(s, question):
83
+ s += "Q: " + question + "\n"
84
+ s += "A:" + sgl.gen("answer", max_tokens=100)
85
+
86
+ # Run
87
+ state = simple_gen.run(question="What is the capital of France?")
88
+ print(state["answer"])
89
+ # Output: "The capital of France is Paris."
90
+ ```
91
+
92
+ ### Structured JSON output
93
+
94
+ ```python
95
+ import sglang as sgl
96
+
97
+ @sgl.function
98
+ def extract_person(s, text):
99
+ s += f"Extract person information from: {text}\n"
100
+ s += "Output JSON:\n"
101
+
102
+ # Constrained JSON generation
103
+ s += sgl.gen(
104
+ "json_output",
105
+ max_tokens=200,
106
+ regex=r'\{"name": "[^"]+", "age": \d+, "occupation": "[^"]+"\}'
107
+ )
108
+
109
+ # Run
110
+ state = extract_person.run(
111
+ text="John Smith is a 35-year-old software engineer."
112
+ )
113
+ print(state["json_output"])
114
+ # Output: {"name": "John Smith", "age": 35, "occupation": "software engineer"}
115
+ ```
116
+
117
+ ## RadixAttention (Key Innovation)
118
+
119
+ **What it does**: Automatically caches and reuses common prefixes across requests.
120
+
121
+ **Performance**:
122
+ - **5× faster** for agentic workloads with shared system prompts
123
+ - **10× faster** for few-shot prompting with repeated examples
124
+ - **Zero configuration** - works automatically
125
+
126
+ **How it works**:
127
+ 1. Builds radix tree of all processed tokens
128
+ 2. Automatically detects shared prefixes
129
+ 3. Reuses KV cache for matching prefixes
130
+ 4. Only computes new tokens
131
+
132
+ **Example** (Agent with system prompt):
133
+
134
+ ```
135
+ Request 1: [SYSTEM_PROMPT] + "What's the weather?"
136
+ → Computes full prompt (1000 tokens)
137
+
138
+ Request 2: [SAME_SYSTEM_PROMPT] + "Book a flight"
139
+ → Reuses system prompt KV cache (998 tokens)
140
+ → Only computes 2 new tokens
141
+ → 5× faster!
142
+ ```
143
+
144
+ ## Structured generation patterns
145
+
146
+ ### JSON with schema
147
+
148
+ ```python
149
+ @sgl.function
150
+ def structured_extraction(s, article):
151
+ s += f"Article: {article}\n\n"
152
+ s += "Extract key information as JSON:\n"
153
+
154
+ # JSON schema constraint
155
+ schema = {
156
+ "type": "object",
157
+ "properties": {
158
+ "title": {"type": "string"},
159
+ "author": {"type": "string"},
160
+ "summary": {"type": "string"},
161
+ "sentiment": {"type": "string", "enum": ["positive", "negative", "neutral"]}
162
+ },
163
+ "required": ["title", "author", "summary", "sentiment"]
164
+ }
165
+
166
+ s += sgl.gen("info", max_tokens=300, json_schema=schema)
167
+
168
+ state = structured_extraction.run(article="...")
169
+ print(state["info"])
170
+ # Output: Valid JSON matching schema
171
+ ```
172
+
173
+ ### Regex-constrained generation
174
+
175
+ ```python
176
+ @sgl.function
177
+ def extract_email(s, text):
178
+ s += f"Extract email from: {text}\n"
179
+ s += "Email: "
180
+
181
+ # Email regex pattern
182
+ s += sgl.gen(
183
+ "email",
184
+ max_tokens=50,
185
+ regex=r'[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}'
186
+ )
187
+
188
+ state = extract_email.run(text="Contact john.doe@example.com for details")
189
+ print(state["email"])
190
+ # Output: "john.doe@example.com"
191
+ ```
192
+
193
+ ### Grammar-based generation
194
+
195
+ ```python
196
+ @sgl.function
197
+ def generate_code(s, description):
198
+ s += f"Generate Python code for: {description}\n"
199
+ s += "```python\n"
200
+
201
+ # EBNF grammar for Python
202
+ python_grammar = """
203
+ ?start: function_def
204
+ function_def: "def" NAME "(" [parameters] "):" suite
205
+ parameters: parameter ("," parameter)*
206
+ parameter: NAME
207
+ suite: simple_stmt | NEWLINE INDENT stmt+ DEDENT
208
+ """
209
+
210
+ s += sgl.gen("code", max_tokens=200, grammar=python_grammar)
211
+ s += "\n```"
212
+ ```
213
+
214
+ ## Agent workflows with function calling
215
+
216
+ ```python
217
+ import sglang as sgl
218
+
219
+ # Define tools
220
+ tools = [
221
+ {
222
+ "name": "get_weather",
223
+ "description": "Get weather for a location",
224
+ "parameters": {
225
+ "type": "object",
226
+ "properties": {
227
+ "location": {"type": "string"}
228
+ }
229
+ }
230
+ },
231
+ {
232
+ "name": "book_flight",
233
+ "description": "Book a flight",
234
+ "parameters": {
235
+ "type": "object",
236
+ "properties": {
237
+ "from": {"type": "string"},
238
+ "to": {"type": "string"},
239
+ "date": {"type": "string"}
240
+ }
241
+ }
242
+ }
243
+ ]
244
+
245
+ @sgl.function
246
+ def agent_workflow(s, user_query, tools):
247
+ # System prompt (cached with RadixAttention)
248
+ s += "You are a helpful assistant with access to tools.\n"
249
+ s += f"Available tools: {tools}\n\n"
250
+
251
+ # User query
252
+ s += f"User: {user_query}\n"
253
+ s += "Assistant: "
254
+
255
+ # Generate with function calling
256
+ s += sgl.gen(
257
+ "response",
258
+ max_tokens=200,
259
+ tools=tools, # SGLang handles tool call format
260
+ stop=["User:", "\n\n"]
261
+ )
262
+
263
+ # Multiple queries reuse system prompt
264
+ state1 = agent_workflow.run(
265
+ user_query="What's the weather in NYC?",
266
+ tools=tools
267
+ )
268
+ # First call: Computes full system prompt
269
+
270
+ state2 = agent_workflow.run(
271
+ user_query="Book a flight to LA",
272
+ tools=tools
273
+ )
274
+ # Second call: Reuses system prompt (5× faster)
275
+ ```
276
+
277
+ ## Performance benchmarks
278
+
279
+ ### RadixAttention speedup
280
+
281
+ **Few-shot prompting** (10 examples in prompt):
282
+ - vLLM: 2.5 sec/request
283
+ - SGLang: **0.25 sec/request** (10× faster)
284
+ - Throughput: 4× higher
285
+
286
+ **Agent workflows** (1000-token system prompt):
287
+ - vLLM: 1.8 sec/request
288
+ - SGLang: **0.35 sec/request** (5× faster)
289
+
290
+ **JSON decoding**:
291
+ - Standard: 45 tok/s
292
+ - SGLang: **135 tok/s** (3× faster)
293
+
294
+ ### Throughput (Llama 3-8B, A100)
295
+
296
+ | Workload | vLLM | SGLang | Speedup |
297
+ |----------|------|--------|---------|
298
+ | Simple generation | 2500 tok/s | 2800 tok/s | 1.12× |
299
+ | Few-shot (10 examples) | 500 tok/s | 5000 tok/s | 10× |
300
+ | Agent (tool calls) | 800 tok/s | 4000 tok/s | 5× |
301
+ | JSON output | 600 tok/s | 2400 tok/s | 4× |
302
+
303
+ ## Multi-turn conversations
304
+
305
+ ```python
306
+ @sgl.function
307
+ def multi_turn_chat(s, history, new_message):
308
+ # System prompt (always cached)
309
+ s += "You are a helpful AI assistant.\n\n"
310
+
311
+ # Conversation history (cached as it grows)
312
+ for msg in history:
313
+ s += f"{msg['role']}: {msg['content']}\n"
314
+
315
+ # New user message (only new part)
316
+ s += f"User: {new_message}\n"
317
+ s += "Assistant: "
318
+ s += sgl.gen("response", max_tokens=200)
319
+
320
+ # Turn 1
321
+ history = []
322
+ state = multi_turn_chat.run(history=history, new_message="Hi there!")
323
+ history.append({"role": "User", "content": "Hi there!"})
324
+ history.append({"role": "Assistant", "content": state["response"]})
325
+
326
+ # Turn 2 (reuses Turn 1 KV cache)
327
+ state = multi_turn_chat.run(history=history, new_message="What's 2+2?")
328
+ # Only computes new message (much faster!)
329
+
330
+ # Turn 3 (reuses Turn 1 + Turn 2 KV cache)
331
+ state = multi_turn_chat.run(history=history, new_message="Tell me a joke")
332
+ # Progressively faster as history grows
333
+ ```
334
+
335
+ ## Advanced features
336
+
337
+ ### Speculative decoding
338
+
339
+ ```bash
340
+ # Launch with draft model (2-3× faster)
341
+ python -m sglang.launch_server \
342
+ --model-path meta-llama/Meta-Llama-3-70B-Instruct \
343
+ --speculative-model meta-llama/Meta-Llama-3-8B-Instruct \
344
+ --speculative-num-steps 5
345
+ ```
346
+
347
+ ### Multi-modal (vision models)
348
+
349
+ ```python
350
+ @sgl.function
351
+ def describe_image(s, image_path):
352
+ s += sgl.image(image_path)
353
+ s += "Describe this image in detail: "
354
+ s += sgl.gen("description", max_tokens=200)
355
+
356
+ state = describe_image.run(image_path="photo.jpg")
357
+ print(state["description"])
358
+ ```
359
+
360
+ ### Batching and parallel requests
361
+
362
+ ```python
363
+ # Automatic batching (continuous batching)
364
+ states = sgl.run_batch(
365
+ [
366
+ simple_gen.bind(question="What is AI?"),
367
+ simple_gen.bind(question="What is ML?"),
368
+ simple_gen.bind(question="What is DL?"),
369
+ ]
370
+ )
371
+
372
+ # All 3 processed in single batch (efficient)
373
+ ```
374
+
375
+ ## OpenAI-compatible API
376
+
377
+ ```bash
378
+ # Start server with OpenAI API
379
+ python -m sglang.launch_server \
380
+ --model-path meta-llama/Meta-Llama-3-8B-Instruct \
381
+ --port 30000
382
+
383
+ # Use with OpenAI client
384
+ curl http://localhost:30000/v1/chat/completions \
385
+ -H "Content-Type: application/json" \
386
+ -d '{
387
+ "model": "default",
388
+ "messages": [
389
+ {"role": "system", "content": "You are helpful"},
390
+ {"role": "user", "content": "Hello"}
391
+ ],
392
+ "temperature": 0.7,
393
+ "max_tokens": 100
394
+ }'
395
+ ```
+
+ ```python
396
+ # Works with OpenAI Python SDK
397
+ from openai import OpenAI
398
+ client = OpenAI(base_url="http://localhost:30000/v1", api_key="EMPTY")
399
+
400
+ response = client.chat.completions.create(
401
+ model="default",
402
+ messages=[{"role": "user", "content": "Hello"}]
403
+ )
404
+ ```
405
+
406
+ ## Supported models
407
+
408
+ **Text models**:
409
+ - Llama 2, Llama 3, Llama 3.1, Llama 3.2
410
+ - Mistral, Mixtral
411
+ - Qwen, Qwen2, QwQ
412
+ - DeepSeek-V2, DeepSeek-V3
413
+ - Gemma, Phi-3
414
+
415
+ **Vision models**:
416
+ - LLaVA, LLaVA-OneVision
417
+ - Phi-3-Vision
418
+ - Qwen2-VL
419
+
420
+ **100+ models** from HuggingFace
421
+
422
+ ## Hardware support
423
+
424
+ - **NVIDIA**: A100, H100, L4, T4 (CUDA 11.8+)
425
+ - **AMD**: MI300, MI250 (ROCm 6.0+)
426
+ - **Intel**: Xeon with GPU (coming soon)
427
+ - **Apple**: M1/M2/M3 via MPS (experimental)
428
+
429
+ ## References
430
+
431
+ - **[Structured Generation Guide](references/structured-generation.md)** - JSON schemas, regex, grammars, validation
432
+ - **[RadixAttention Deep Dive](references/radix-attention.md)** - How it works, optimization, benchmarks
433
+ - **[Production Deployment](references/deployment.md)** - Multi-GPU, monitoring, autoscaling
434
+
435
+ ## Resources
436
+
437
+ - **GitHub**: https://github.com/sgl-project/sglang
438
+ - **Docs**: https://sgl-project.github.io/
439
+ - **Paper**: "SGLang: Efficient Execution of Structured Language Model Programs", which introduces RadixAttention (arXiv:2312.07104)
440
+ - **Discord**: https://discord.gg/sglang
441
+
442
+