MakazhanAlpamys
diff --git a/.claude/settings.json b/.claude/settings.json
Lines changed: 4 additions & 1 deletion
diff --git a/.gitignore b/.gitignore
Lines changed: 3 additions & 0 deletions
diff --git a/README.md b/README.md
Lines changed: 58 additions & 2 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 3 additions & 0 deletions
diff --git a/soup_cli/cli.py b/soup_cli/cli.py
Lines changed: 3 additions & 1 deletion
@@ -13,12 +13,15 @@
       "Bash(git remote*)",
       "Bash(ruff check*)",
       "Bash(ruff format*)",
+      "Bash(python -m ruff*)",
       "Bash(pytest*)",
       "Bash(python -m pytest*)",
       "Bash(pip install*)",
       "Bash(pip list*)",
       "Bash(soup *)",
-      "Bash(python -m soup_cli*)"
+      "Bash(python -m soup_cli*)",
+      "Bash(cd /c/Users/tokmo/peder/Soup && python -m pytest*)",
+      "Bash(cd /c/Users/tokmo/peder/Soup && ruff check*)"
     ]
   }
 }
@@ -34,3 +34,6 @@ wandb/
 # Secrets
 .env
 *.key
+
+# Internal plan (not for repo)
+plan.md
@@ -86,6 +86,50 @@ training:
 output: ./output
 ```
 
+## DPO Training
+
+Train with preference data using Direct Preference Optimization:
+
+```yaml
+base: meta-llama/Llama-3.1-8B-Instruct
+task: dpo
+
+data:
+  train: ./data/preferences.jsonl
+  format: dpo
+
+training:
+  epochs: 3
+  dpo_beta: 0.1
+  lora:
+    r: 64
+    alpha: 16
+  quantization: 4bit
+```
+
+## Chat with your model
+
+```bash
+# Chat with a LoRA adapter (auto-detects base model)
+soup chat --model ./output
+
+# Specify base model explicitly
+soup chat --model ./output --base meta-llama/Llama-3.1-8B-Instruct
+
+# Adjust generation
+soup chat --model ./output --temperature 0.3 --max-tokens 256
+```
+
+## Push to HuggingFace
+
+```bash
+# Upload model to HF Hub
+soup push --model ./output --repo your-username/my-model
+
+# Make it private
+soup push --model ./output --repo your-username/my-model --private
+```
+
 ## Data Formats
 
 Soup supports these formats (auto-detected):
@@ -105,6 +149,11 @@ Soup supports these formats (auto-detected):
 {"messages": [{"role": "user", "content": "Hi"}, {"role": "assistant", "content": "Hello!"}]}
 ```
 
+**DPO (preference pairs):**
+```json
+{"prompt": "Explain gravity", "chosen": "Gravity is a force...", "rejected": "I don't know"}
+```
+
 ## Data Tools
 
 ```bash
@@ -121,12 +170,14 @@ soup data validate ./data/train.jsonl --format alpaca
 |---|---|
 | LoRA / QLoRA fine-tuning | ✅ |
 | SFT (Supervised Fine-Tune) | ✅ |
-| DPO (Direct Preference Optimization) | 🔜 |
+| DPO (Direct Preference Optimization) | ✅ |
 | Auto batch size | ✅ |
 | Auto GPU detection (CUDA/MPS/CPU) | ✅ |
 | Live terminal dashboard | ✅ |
-| Alpaca / ShareGPT / ChatML formats | ✅ |
+| Alpaca / ShareGPT / ChatML / DPO formats | ✅ |
 | HuggingFace datasets support | ✅ |
+| Interactive model chat | ✅ |
+| Push to HuggingFace Hub | ✅ |
 | Experiment tracking | 🔜 |
 | Web dashboard | 🔜 |
 | Cloud mode (BYOG) | 🔜 |
@@ -143,7 +194,12 @@ soup data validate ./data/train.jsonl --format alpaca
 git clone https://github.com/MakazhanAlpamys/Soup.git
 cd Soup
 pip install -e ".[dev]"
+
+# Run unit tests (fast, no GPU needed)
 pytest tests/ -v
+
+# Run smoke tests (downloads tiny model, runs real training)
+pytest tests/ -m smoke -v
 ```
 
 ## License
 
@@ -33,6 +33,7 @@ dependencies = [
     "datasets>=2.14.0",
     "bitsandbytes>=0.41.0",
     "accelerate>=0.25.0",
+    "huggingface-hub>=0.16.0",
 ]
 
 [project.optional-dependencies]
@@ -57,3 +58,5 @@ select = ["E", "F", "I", "N", "W"]
 
 [tool.pytest.ini_options]
 testpaths = ["tests"]
+markers = ["smoke: slow smoke tests that download models and run training (run with: pytest -m smoke)"]
+addopts = "-m 'not smoke'"
@@ -4,7 +4,7 @@
 from rich.console import Console
 
 from soup_cli import __version__
-from soup_cli.commands import data, init, train
+from soup_cli.commands import chat, data, init, push, train
 
 console = Console()
 
@@ -18,6 +18,8 @@
 # Register sub-commands
 app.command()(init.init)
 app.command()(train.train)
+app.command()(chat.chat)
+app.command()(push.push)
 app.add_typer(data.app, name="data", help="Dataset tools: inspect, convert, validate.")
Original file line number	Diff line number	Diff line change
`@@ -13,12 +13,15 @@`
`13`	`13`	`"Bash(git remote*)",`
`14`	`14`	`"Bash(ruff check*)",`
`15`	`15`	`"Bash(ruff format*)",`
	`16`	`+ "Bash(python -m ruff*)",`
`16`	`17`	`"Bash(pytest*)",`
`17`	`18`	`"Bash(python -m pytest*)",`
`18`	`19`	`"Bash(pip install*)",`
`19`	`20`	`"Bash(pip list*)",`
`20`	`21`	`"Bash(soup *)",`
`21`		`- "Bash(python -m soup_cli*)"`
	`22`	`+ "Bash(python -m soup_cli*)",`
	`23`	`+ "Bash(cd /c/Users/tokmo/peder/Soup && python -m pytest*)",`
	`24`	`+ "Bash(cd /c/Users/tokmo/peder/Soup && ruff check*)"`
`22`	`25`	`]`
`23`	`26`	`}`
`24`	`27`	`}`