PyPI - mlx-forge - Versions diffs - 0.2.0__tar.gz - Mend

mlx-forge 0.2.0__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (127)

mlx_forge-0.2.0/LICENSE +21 -0
mlx_forge-0.2.0/PKG-INFO +246 -0
mlx_forge-0.2.0/README.md +201 -0
mlx_forge-0.2.0/mlx_forge/__init__.py +456 -0
mlx_forge-0.2.0/mlx_forge/_version.py +1 -0
mlx_forge-0.2.0/mlx_forge/adapters/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/adapters/lora.py +287 -0
mlx_forge-0.2.0/mlx_forge/adapters/targeting.py +162 -0
mlx_forge-0.2.0/mlx_forge/cli/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/cli/data_cmd.py +220 -0
mlx_forge-0.2.0/mlx_forge/cli/generate_cmd.py +99 -0
mlx_forge-0.2.0/mlx_forge/cli/main.py +254 -0
mlx_forge-0.2.0/mlx_forge/cli/prepare_cmd.py +23 -0
mlx_forge-0.2.0/mlx_forge/cli/studio_cmd.py +21 -0
mlx_forge-0.2.0/mlx_forge/cli/train_cmd.py +11 -0
mlx_forge-0.2.0/mlx_forge/config.py +176 -0
mlx_forge-0.2.0/mlx_forge/data/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/data/backend.py +157 -0
mlx_forge-0.2.0/mlx_forge/data/batching.py +238 -0
mlx_forge-0.2.0/mlx_forge/data/catalog.py +370 -0
mlx_forge-0.2.0/mlx_forge/data/converter.py +204 -0
mlx_forge-0.2.0/mlx_forge/data/formats.py +191 -0
mlx_forge-0.2.0/mlx_forge/data/mixing.py +61 -0
mlx_forge-0.2.0/mlx_forge/data/packing.py +93 -0
mlx_forge-0.2.0/mlx_forge/data/preprocessing.py +198 -0
mlx_forge-0.2.0/mlx_forge/data/registry.py +221 -0
mlx_forge-0.2.0/mlx_forge/data/validate.py +227 -0
mlx_forge-0.2.0/mlx_forge/inference/__init__.py +1 -0
mlx_forge-0.2.0/mlx_forge/inference/cache.py +122 -0
mlx_forge-0.2.0/mlx_forge/inference/engine.py +232 -0
mlx_forge-0.2.0/mlx_forge/inference/sampling.py +88 -0
mlx_forge-0.2.0/mlx_forge/logging/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/logging/metrics.py +52 -0
mlx_forge-0.2.0/mlx_forge/losses/__init__.py +6 -0
mlx_forge-0.2.0/mlx_forge/losses/dpo.py +98 -0
mlx_forge-0.2.0/mlx_forge/losses/sft.py +77 -0
mlx_forge-0.2.0/mlx_forge/manifest.py +164 -0
mlx_forge-0.2.0/mlx_forge/models/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/models/_base/__init__.py +12 -0
mlx_forge-0.2.0/mlx_forge/models/_base/activations.py +25 -0
mlx_forge-0.2.0/mlx_forge/models/_base/args.py +38 -0
mlx_forge-0.2.0/mlx_forge/models/_base/attention.py +101 -0
mlx_forge-0.2.0/mlx_forge/models/_base/rope.py +276 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/__init__.py +4 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/gemma.py +352 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/llama.py +236 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/phi3.py +261 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/phi4.py +221 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/qwen2.py +221 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/qwen3.py +231 -0
mlx_forge-0.2.0/mlx_forge/models/architectures/qwen3_5.py +752 -0
mlx_forge-0.2.0/mlx_forge/models/loader.py +143 -0
mlx_forge-0.2.0/mlx_forge/models/memory.py +376 -0
mlx_forge-0.2.0/mlx_forge/models/quantize.py +39 -0
mlx_forge-0.2.0/mlx_forge/models/registry.py +108 -0
mlx_forge-0.2.0/mlx_forge/models/resolve.py +205 -0
mlx_forge-0.2.0/mlx_forge/recipes/__init__.py +5 -0
mlx_forge-0.2.0/mlx_forge/recipes/auto_config.py +104 -0
mlx_forge-0.2.0/mlx_forge/recipes/built_in/chat_sft.yaml +42 -0
mlx_forge-0.2.0/mlx_forge/recipes/built_in/instruction_sft.yaml +42 -0
mlx_forge-0.2.0/mlx_forge/recipes/built_in/preference_dpo.yaml +46 -0
mlx_forge-0.2.0/mlx_forge/recipes/built_in/writing_style.yaml +42 -0
mlx_forge-0.2.0/mlx_forge/recipes/registry.py +90 -0
mlx_forge-0.2.0/mlx_forge/studio/__init__.py +4 -0
mlx_forge-0.2.0/mlx_forge/studio/api/__init__.py +1 -0
mlx_forge-0.2.0/mlx_forge/studio/api/config_schema.py +152 -0
mlx_forge-0.2.0/mlx_forge/studio/api/data_library.py +76 -0
mlx_forge-0.2.0/mlx_forge/studio/api/datasets.py +44 -0
mlx_forge-0.2.0/mlx_forge/studio/api/inference.py +62 -0
mlx_forge-0.2.0/mlx_forge/studio/api/memory.py +58 -0
mlx_forge-0.2.0/mlx_forge/studio/api/models.py +46 -0
mlx_forge-0.2.0/mlx_forge/studio/api/queue.py +63 -0
mlx_forge-0.2.0/mlx_forge/studio/api/recipes.py +67 -0
mlx_forge-0.2.0/mlx_forge/studio/api/runs.py +73 -0
mlx_forge-0.2.0/mlx_forge/studio/api/training.py +48 -0
mlx_forge-0.2.0/mlx_forge/studio/frontend/assets/index-DfE9wCUu.js +46 -0
mlx_forge-0.2.0/mlx_forge/studio/frontend/assets/index-DoKRRrtV.css +1 -0
mlx_forge-0.2.0/mlx_forge/studio/frontend/index.html +14 -0
mlx_forge-0.2.0/mlx_forge/studio/server.py +210 -0
mlx_forge-0.2.0/mlx_forge/studio/services/__init__.py +1 -0
mlx_forge-0.2.0/mlx_forge/studio/services/data_library_service.py +46 -0
mlx_forge-0.2.0/mlx_forge/studio/services/dataset_service.py +73 -0
mlx_forge-0.2.0/mlx_forge/studio/services/memory_service.py +71 -0
mlx_forge-0.2.0/mlx_forge/studio/services/metrics_watcher.py +56 -0
mlx_forge-0.2.0/mlx_forge/studio/services/model_library_service.py +77 -0
mlx_forge-0.2.0/mlx_forge/studio/services/model_service.py +107 -0
mlx_forge-0.2.0/mlx_forge/studio/services/queue_service.py +178 -0
mlx_forge-0.2.0/mlx_forge/studio/services/recipe_service.py +47 -0
mlx_forge-0.2.0/mlx_forge/studio/services/run_service.py +242 -0
mlx_forge-0.2.0/mlx_forge/studio/services/training_service.py +113 -0
mlx_forge-0.2.0/mlx_forge/trainer/__init__.py +0 -0
mlx_forge-0.2.0/mlx_forge/trainer/callbacks.py +150 -0
mlx_forge-0.2.0/mlx_forge/trainer/checkpoint.py +187 -0
mlx_forge-0.2.0/mlx_forge/trainer/dpo_trainer.py +118 -0
mlx_forge-0.2.0/mlx_forge/trainer/optimizer.py +123 -0
mlx_forge-0.2.0/mlx_forge/trainer/state.py +20 -0
mlx_forge-0.2.0/mlx_forge/trainer/trainer.py +319 -0
mlx_forge-0.2.0/mlx_forge.egg-info/PKG-INFO +246 -0
mlx_forge-0.2.0/mlx_forge.egg-info/SOURCES.txt +125 -0
mlx_forge-0.2.0/mlx_forge.egg-info/dependency_links.txt +1 -0
mlx_forge-0.2.0/mlx_forge.egg-info/entry_points.txt +2 -0
mlx_forge-0.2.0/mlx_forge.egg-info/requires.txt +25 -0
mlx_forge-0.2.0/mlx_forge.egg-info/top_level.txt +1 -0
mlx_forge-0.2.0/pyproject.toml +85 -0
mlx_forge-0.2.0/setup.cfg +4 -0
mlx_forge-0.2.0/tests/test_adapters.py +203 -0
mlx_forge-0.2.0/tests/test_backend.py +278 -0
mlx_forge-0.2.0/tests/test_catalog.py +290 -0
mlx_forge-0.2.0/tests/test_config.py +246 -0
mlx_forge-0.2.0/tests/test_data.py +217 -0
mlx_forge-0.2.0/tests/test_data_validate.py +139 -0
mlx_forge-0.2.0/tests/test_integration.py +288 -0
mlx_forge-0.2.0/tests/test_labels.py +479 -0
mlx_forge-0.2.0/tests/test_m10_performance.py +667 -0
mlx_forge-0.2.0/tests/test_m11_studio.py +604 -0
mlx_forge-0.2.0/tests/test_m12_frontend.py +206 -0
mlx_forge-0.2.0/tests/test_m13_integration.py +708 -0
mlx_forge-0.2.0/tests/test_m9_foundation.py +711 -0
mlx_forge-0.2.0/tests/test_mixing.py +81 -0
mlx_forge-0.2.0/tests/test_model_loading.py +323 -0
mlx_forge-0.2.0/tests/test_qwen3_5.py +1019 -0
mlx_forge-0.2.0/tests/test_resolve.py +223 -0
mlx_forge-0.2.0/tests/test_trainer_infra.py +294 -0
mlx_forge-0.2.0/tests/test_v2_dpo.py +566 -0
mlx_forge-0.2.0/tests/test_v2_memory.py +212 -0
mlx_forge-0.2.0/tests/test_v2_recipes.py +170 -0
mlx_forge-0.2.0/tests/test_v2_studio.py +588 -0

mlx_forge-0.2.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Jiekai Wang
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

mlx_forge-0.2.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,246 @@
+Metadata-Version: 2.4
+Name: mlx-forge
+Version: 0.2.0
+Summary: Fine-tune, experiment with, and run LLMs locally on your Mac
+Author: Jiekai Wang
+License-Expression: MIT
+Project-URL: Repository, https://github.com/moyuan5989/mlx-forge
+Project-URL: Issues, https://github.com/moyuan5989/mlx-forge/issues
+Keywords: mlx,lora,fine-tuning,apple-silicon,llm,qlora,dpo
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: Intended Audience :: Science/Research
+Classifier: Operating System :: MacOS
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: mlx>=0.18.0
+Requires-Dist: pydantic>=2.0
+Requires-Dist: pyyaml>=6.0
+Requires-Dist: numpy>=1.24.0
+Requires-Dist: transformers>=4.35.0
+Requires-Dist: safetensors>=0.4.0
+Requires-Dist: huggingface-hub>=0.20.0
+Requires-Dist: datasets>=2.16.0
+Requires-Dist: fastapi>=0.104.0
+Requires-Dist: uvicorn[standard]>=0.24.0
+Requires-Dist: websockets>=12.0
+Provides-Extra: wandb
+Requires-Dist: wandb>=0.16.0; extra == "wandb"
+Provides-Extra: dev
+Requires-Dist: pytest>=7.0; extra == "dev"
+Requires-Dist: pytest-timeout>=2.0; extra == "dev"
+Requires-Dist: pytest-asyncio>=0.23.0; extra == "dev"
+Requires-Dist: pytest-cov>=4.1.0; extra == "dev"
+Requires-Dist: httpx>=0.25.0; extra == "dev"
+Requires-Dist: ruff>=0.4.0; extra == "dev"
+Provides-Extra: all
+Requires-Dist: mlx-forge[wandb]; extra == "all"
+Dynamic: license-file
+# MLX Forge
+**Fine-tune LLMs on your Mac with MLX. No cloud, no CUDA required.**
+[![PyPI](https://img.shields.io/pypi/v/mlx-forge)](https://pypi.org/project/mlx-forge/)
+[![Python](https://img.shields.io/pypi/pyversions/mlx-forge)](https://pypi.org/project/mlx-forge/)
+[![License](https://img.shields.io/badge/license-MIT-blue)](LICENSE)
+[![Tests](https://img.shields.io/github/actions/workflow/status/moyuan5989/mlx-forge/test.yml?label=tests)](https://github.com/moyuan5989/mlx-forge/actions)
+MLX Forge is a complete LLM fine-tuning toolkit that runs entirely on your Mac. Pick a model, upload your data, and start training — all from a browser-based UI. Supports LoRA, QLoRA, DPO, 18+ models, and 20+ curated datasets out of the box.
+```bash
+pip install mlx-forge
+mlx-forge studio
+```
+<p align="center">
+  <img src="assets/studio-new-training.png" alt="MLX Forge Studio — New Training" width="800">
+</p>
+## Why MLX Forge?
+- **One command to start** — `pip install mlx-forge && mlx-forge studio`.
+- **Browser-based Studio UI** — Guided training wizard, real-time loss charts, model library with memory estimates, interactive playground.
+- **Runs on Apple Silicon** — Built on [MLX](https://github.com/ml-explore/mlx). Your data stays on your machine.
+- **Production training features** — QLoRA (67% memory reduction), sequence packing (2-5x speedup), gradient checkpointing, DPO alignment, compiled training loop.
+## Quick Start
+### Studio UI (recommended)
+```bash
+mlx-forge studio
+# Opens at http://127.0.0.1:8741
+```
+Pick a recipe, choose a model, upload your data, and start training — all from the browser.
+### CLI
+```bash
+# Browse and download a dataset
+mlx-forge data catalog
+mlx-forge data download alpaca-cleaned --max-samples 5000
+# Train
+mlx-forge train --config train.yaml
+```
+Models are downloaded from Hugging Face on first run and cached locally. All subsequent runs work offline.
+## Studio UI
+<p align="center">
+  <img src="assets/studio-model-library.png" alt="MLX Forge Studio — Model Library" width="800">
+</p>
+- **New Training** — Guided wizard: pick a recipe (chat, instruction, DPO, writing style), choose a model, configure, and launch
+- **Model Library** — Browse 18+ models with memory estimates for your hardware
+- **Experiments** — Compare runs, view loss curves in real time
+- **Datasets** — Manage your training data
+- **Playground** — Chat with your fine-tuned models interactively
+## Supported Models
+18 curated models in the Studio library, all tested on Apple Silicon:
+| Architecture | Models | Sizes |
+|-------------|--------|-------|
+| Qwen | Qwen 2.5, Qwen 3, Qwen 3.5 | 0.5B - 8B |
+| Gemma | Gemma 2, Gemma 3 | 1B - 9B |
+| Llama | Llama 3.1 | 8B |
+| Phi | Phi-3 Mini, Phi-4 Mini | 3.8B |
+| DeepSeek | DeepSeek-R1-Distill (Qwen-based) | 1.5B - 7B |
+| Mistral | Mistral (uses Llama architecture) | 7B |
+Any Hugging Face model that uses a supported architecture will work — the table above lists only the curated models that have pre-computed memory estimates in Studio.
+## Features
+**Training**
+- LoRA and QLoRA (4-bit) fine-tuning with 67% memory reduction
+- DPO (Direct Preference Optimization) for alignment
+- Sequence packing for 2-5x speedup on short sequences
+- Gradient checkpointing for 40-60% memory savings
+- Compiled training loop with gradient accumulation
+- Cosine, linear, step, and exponential LR schedules with warmup
+- Resume from any checkpoint
+**Data**
+- 20+ curated datasets across 7 categories (general, code, math, conversation, reasoning, safety, domain)
+- Auto-detection of chat, completions, text, and preference formats
+- Multi-dataset mixing with weighted sampling
+- Data validation with train/val overlap detection
+## CLI Reference
+| Command | Description |
+|---------|-------------|
+| `mlx-forge studio` | Launch the Studio UI |
+| `mlx-forge train --config FILE` | Run LoRA/QLoRA/DPO training |
+| `mlx-forge generate --model MODEL` | Generate text or interactive chat |
+| `mlx-forge prepare --data FILE --model MODEL` | Pre-tokenize a dataset |
+| `mlx-forge data catalog` | Browse 20+ curated datasets |
+| `mlx-forge data download DATASET` | Download a dataset from the catalog |
+| `mlx-forge data import FILE --name NAME` | Import a local JSONL file |
+| `mlx-forge data validate FILE` | Validate JSONL data |
+| `mlx-forge data inspect NAME` | Preview dataset samples |
+| `mlx-forge data stats NAME` | Show dataset statistics |
+## Configuration
+```yaml
+schema_version: 1
+model:
+  path: "Qwen/Qwen3-0.6B"         # HF model ID or local path
+  quantization:                     # Optional: QLoRA (67% memory savings)
+    bits: 4
+    group_size: 64
+adapter:
+  preset: "attention-qv"           # attention-qv | attention-all | mlp | all-linear
+  rank: 16
+  scale: 32.0
+data:
+  train: "./train.jsonl"
+  valid: "./val.jsonl"
+  packing: false                    # Sequence packing (2-5x speedup)
+  max_seq_length: 2048
+training:
+  optimizer: adamw                  # adam | adamw | sgd | adafactor
+  learning_rate: 1.0e-5
+  num_iters: 1000
+  batch_size: 4
+  gradient_checkpointing: false     # 40-60% memory savings
+  # training_type: dpo              # For DPO training
+  # dpo_beta: 0.1
+runtime:
+  seed: 42
+```
+## Data Formats
+MLX Forge auto-detects four JSONL formats:
+**Chat** — Multi-turn conversations (loss on assistant turns only):
+```json
+{"messages": [{"role": "user", "content": "Hello"}, {"role": "assistant", "content": "Hi!"}]}
+```
+**Completions** — Prompt-completion pairs:
+```json
+{"prompt": "Translate to French: Hello", "completion": "Bonjour"}
+```
+**Text** — Raw text for continued pretraining:
+```json
+{"text": "The quick brown fox jumps over the lazy dog."}
+```
+**Preference** — For DPO alignment training:
+```json
+{"chosen": [{"role": "user", "content": "..."}, {"role": "assistant", "content": "good"}], "rejected": [{"role": "user", "content": "..."}, {"role": "assistant", "content": "bad"}]}
+```
+## Library API
+All CLI commands are backed by Python functions:
+```python
+from mlx_forge import prepare, train
+from mlx_forge.config import TrainingConfig
+# Train from a config file
+config = TrainingConfig.from_yaml("train.yaml")
+result = train(config=config)
+print(f"Best val loss: {result.best_val_loss:.4f}")
+```
+```python
+from mlx_forge import generate
+# Generate text with a fine-tuned adapter
+generate(
+    model="Qwen/Qwen3-0.6B",
+    adapter="~/.mlxforge/runs/my-run/checkpoints/best",
+    prompt="Explain quantum computing in simple terms.",
+)
+```
+## Contributing
+See [CONTRIBUTING.md](CONTRIBUTING.md) for development setup, coding standards, and how to submit changes.
+## License
+[MIT](LICENSE)

mlx_forge-0.2.0/README.md ADDED Viewed

@@ -0,0 +1,201 @@
+# MLX Forge
+**Fine-tune LLMs on your Mac with MLX. No cloud, no CUDA required.**
+[![PyPI](https://img.shields.io/pypi/v/mlx-forge)](https://pypi.org/project/mlx-forge/)
+[![Python](https://img.shields.io/pypi/pyversions/mlx-forge)](https://pypi.org/project/mlx-forge/)
+[![License](https://img.shields.io/badge/license-MIT-blue)](LICENSE)
+[![Tests](https://img.shields.io/github/actions/workflow/status/moyuan5989/mlx-forge/test.yml?label=tests)](https://github.com/moyuan5989/mlx-forge/actions)
+MLX Forge is a complete LLM fine-tuning toolkit that runs entirely on your Mac. Pick a model, upload your data, and start training — all from a browser-based UI. Supports LoRA, QLoRA, DPO, 18+ models, and 20+ curated datasets out of the box.
+```bash
+pip install mlx-forge
+mlx-forge studio
+```
+<p align="center">
+  <img src="assets/studio-new-training.png" alt="MLX Forge Studio — New Training" width="800">
+</p>
+## Why MLX Forge?
+- **One command to start** — `pip install mlx-forge && mlx-forge studio`.
+- **Browser-based Studio UI** — Guided training wizard, real-time loss charts, model library with memory estimates, interactive playground.
+- **Runs on Apple Silicon** — Built on [MLX](https://github.com/ml-explore/mlx). Your data stays on your machine.
+- **Production training features** — QLoRA (67% memory reduction), sequence packing (2-5x speedup), gradient checkpointing, DPO alignment, compiled training loop.
+## Quick Start
+### Studio UI (recommended)
+```bash
+mlx-forge studio
+# Opens at http://127.0.0.1:8741
+```
+Pick a recipe, choose a model, upload your data, and start training — all from the browser.
+### CLI
+```bash
+# Browse and download a dataset
+mlx-forge data catalog
+mlx-forge data download alpaca-cleaned --max-samples 5000
+# Train
+mlx-forge train --config train.yaml
+```
+Models are downloaded from Hugging Face on first run and cached locally. All subsequent runs work offline.
+## Studio UI
+<p align="center">
+  <img src="assets/studio-model-library.png" alt="MLX Forge Studio — Model Library" width="800">
+</p>
+- **New Training** — Guided wizard: pick a recipe (chat, instruction, DPO, writing style), choose a model, configure, and launch
+- **Model Library** — Browse 18+ models with memory estimates for your hardware
+- **Experiments** — Compare runs, view loss curves in real time
+- **Datasets** — Manage your training data
+- **Playground** — Chat with your fine-tuned models interactively
+## Supported Models
+18 curated models in the Studio library, all tested on Apple Silicon:
+| Architecture | Models | Sizes |
+|-------------|--------|-------|
+| Qwen | Qwen 2.5, Qwen 3, Qwen 3.5 | 0.5B - 8B |
+| Gemma | Gemma 2, Gemma 3 | 1B - 9B |
+| Llama | Llama 3.1 | 8B |
+| Phi | Phi-3 Mini, Phi-4 Mini | 3.8B |
+| DeepSeek | DeepSeek-R1-Distill (Qwen-based) | 1.5B - 7B |
+| Mistral | Mistral (uses Llama architecture) | 7B |
+Any Hugging Face model that uses a supported architecture will work — the table above lists only the curated models that have pre-computed memory estimates in Studio.
+## Features
+**Training**
+- LoRA and QLoRA (4-bit) fine-tuning with 67% memory reduction
+- DPO (Direct Preference Optimization) for alignment
+- Sequence packing for 2-5x speedup on short sequences
+- Gradient checkpointing for 40-60% memory savings
+- Compiled training loop with gradient accumulation
+- Cosine, linear, step, and exponential LR schedules with warmup
+- Resume from any checkpoint
+**Data**
+- 20+ curated datasets across 7 categories (general, code, math, conversation, reasoning, safety, domain)
+- Auto-detection of chat, completions, text, and preference formats
+- Multi-dataset mixing with weighted sampling
+- Data validation with train/val overlap detection
+## CLI Reference
+| Command | Description |
+|---------|-------------|
+| `mlx-forge studio` | Launch the Studio UI |
+| `mlx-forge train --config FILE` | Run LoRA/QLoRA/DPO training |
+| `mlx-forge generate --model MODEL` | Generate text or interactive chat |
+| `mlx-forge prepare --data FILE --model MODEL` | Pre-tokenize a dataset |
+| `mlx-forge data catalog` | Browse 20+ curated datasets |
+| `mlx-forge data download DATASET` | Download a dataset from the catalog |
+| `mlx-forge data import FILE --name NAME` | Import a local JSONL file |
+| `mlx-forge data validate FILE` | Validate JSONL data |
+| `mlx-forge data inspect NAME` | Preview dataset samples |
+| `mlx-forge data stats NAME` | Show dataset statistics |
+## Configuration
+```yaml
+schema_version: 1
+model:
+  path: "Qwen/Qwen3-0.6B"         # HF model ID or local path
+  quantization:                     # Optional: QLoRA (67% memory savings)
+    bits: 4
+    group_size: 64
+adapter:
+  preset: "attention-qv"           # attention-qv | attention-all | mlp | all-linear
+  rank: 16
+  scale: 32.0
+data:
+  train: "./train.jsonl"
+  valid: "./val.jsonl"
+  packing: false                    # Sequence packing (2-5x speedup)
+  max_seq_length: 2048
+training:
+  optimizer: adamw                  # adam | adamw | sgd | adafactor
+  learning_rate: 1.0e-5
+  num_iters: 1000
+  batch_size: 4
+  gradient_checkpointing: false     # 40-60% memory savings
+  # training_type: dpo              # For DPO training
+  # dpo_beta: 0.1
+runtime:
+  seed: 42
+```
+## Data Formats
+MLX Forge auto-detects four JSONL formats:
+**Chat** — Multi-turn conversations (loss on assistant turns only):
+```json
+{"messages": [{"role": "user", "content": "Hello"}, {"role": "assistant", "content": "Hi!"}]}
+```
+**Completions** — Prompt-completion pairs:
+```json
+{"prompt": "Translate to French: Hello", "completion": "Bonjour"}
+```
+**Text** — Raw text for continued pretraining:
+```json
+{"text": "The quick brown fox jumps over the lazy dog."}
+```
+**Preference** — For DPO alignment training:
+```json
+{"chosen": [{"role": "user", "content": "..."}, {"role": "assistant", "content": "good"}], "rejected": [{"role": "user", "content": "..."}, {"role": "assistant", "content": "bad"}]}
+```
+## Library API
+All CLI commands are backed by Python functions:
+```python
+from mlx_forge import prepare, train
+from mlx_forge.config import TrainingConfig
+# Train from a config file
+config = TrainingConfig.from_yaml("train.yaml")
+result = train(config=config)
+print(f"Best val loss: {result.best_val_loss:.4f}")
+```
+```python
+from mlx_forge import generate
+# Generate text with a fine-tuned adapter
+generate(
+    model="Qwen/Qwen3-0.6B",
+    adapter="~/.mlxforge/runs/my-run/checkpoints/best",
+    prompt="Explain quantum computing in simple terms.",
+)
+```
+## Contributing
+See [CONTRIBUTING.md](CONTRIBUTING.md) for development setup, coding standards, and how to submit changes.
+## License
+[MIT](LICENSE)