From d9c1db2b874d12a60f489a3504393418b0b764cb Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Sat, 21 Mar 2026 02:08:02 +0100 Subject: [PATCH] feat: add (experimental) fine-tuning support with TRL (#9088) * feat: add fine-tuning endpoint Signed-off-by: Ettore Di Giacinto * feat(experimental): add fine-tuning endpoint and TRL support This changeset defines new GRPC signatues for Fine tuning backends, and add TRL backend as initial fine-tuning engine. This implementation also supports exporting to GGUF and automatically importing it to LocalAI after fine-tuning. Signed-off-by: Ettore Di Giacinto * commit TRL backend, stop by killing process Signed-off-by: Ettore Di Giacinto * move fine-tune to generic features Signed-off-by: Ettore Di Giacinto * add evals, reorder menu Signed-off-by: Ettore Di Giacinto * Fix tests Signed-off-by: Ettore Di Giacinto --------- Signed-off-by: Ettore Di Giacinto --- .agents/debugging-backends.md | 141 ++ .github/workflows/backend.yml | 39 + AGENTS.md | 1 + Makefile | 8 +- backend/backend.proto | 109 ++ backend/index.yaml | 51 + backend/python/trl/Makefile | 26 + backend/python/trl/backend.py | 860 ++++++++++ backend/python/trl/install.sh | 37 + backend/python/trl/requirements-cpu.txt | 9 + backend/python/trl/requirements-cublas12.txt | 9 + backend/python/trl/requirements-cublas13.txt | 9 + backend/python/trl/requirements.txt | 3 + backend/python/trl/reward_functions.py | 236 +++ backend/python/trl/run.sh | 10 + backend/python/trl/test.py | 58 + backend/python/trl/test.sh | 11 + core/cli/run.go | 8 + core/config/application_config.go | 14 + core/gallery/importers/local.go | 205 +++ core/gallery/importers/local_test.go | 148 ++ core/http/app.go | 11 + core/http/auth/features.go | 19 + core/http/auth/permissions.go | 8 +- .../endpoints/localai/agent_collections.go | 5 +- core/http/endpoints/localai/finetune.go | 362 ++++ core/http/react-ui/src/App.css | 75 +- .../src/components/LoadingSpinner.jsx | 16 +- 
core/http/react-ui/src/components/Sidebar.jsx | 208 ++- core/http/react-ui/src/pages/FineTune.jsx | 1525 +++++++++++++++++ core/http/react-ui/src/pages/Studio.jsx | 48 + core/http/react-ui/src/pages/Users.jsx | 35 +- core/http/react-ui/src/router.jsx | 5 + core/http/react-ui/src/utils/api.js | 19 + core/http/routes/auth.go | 7 +- core/http/routes/finetuning.go | 42 + core/http/routes/localai.go | 5 +- core/schema/finetune.go | 111 ++ core/services/agent_pool.go | 6 +- core/services/finetune.go | 700 ++++++++ docs/content/features/fine-tuning.md | 226 +++ go.mod | 12 +- go.sum | 24 + pkg/grpc/backend.go | 7 + pkg/grpc/base/base.go | 20 + pkg/grpc/client.go | 136 ++ pkg/grpc/embed.go | 62 + pkg/grpc/interface.go | 7 + pkg/grpc/server.go | 69 + 49 files changed, 5652 insertions(+), 110 deletions(-) create mode 100644 .agents/debugging-backends.md create mode 100644 backend/python/trl/Makefile create mode 100644 backend/python/trl/backend.py create mode 100644 backend/python/trl/install.sh create mode 100644 backend/python/trl/requirements-cpu.txt create mode 100644 backend/python/trl/requirements-cublas12.txt create mode 100644 backend/python/trl/requirements-cublas13.txt create mode 100644 backend/python/trl/requirements.txt create mode 100644 backend/python/trl/reward_functions.py create mode 100644 backend/python/trl/run.sh create mode 100644 backend/python/trl/test.py create mode 100644 backend/python/trl/test.sh create mode 100644 core/gallery/importers/local.go create mode 100644 core/gallery/importers/local_test.go create mode 100644 core/http/endpoints/localai/finetune.go create mode 100644 core/http/react-ui/src/pages/FineTune.jsx create mode 100644 core/http/react-ui/src/pages/Studio.jsx create mode 100644 core/http/routes/finetuning.go create mode 100644 core/schema/finetune.go create mode 100644 core/services/finetune.go create mode 100644 docs/content/features/fine-tuning.md diff --git a/.agents/debugging-backends.md b/.agents/debugging-backends.md new 
file mode 100644 index 000000000..e818753c2 --- /dev/null +++ b/.agents/debugging-backends.md @@ -0,0 +1,141 @@ +# Debugging and Rebuilding Backends + +When a backend fails at runtime (e.g. a gRPC method error, a Python import error, or a dependency conflict), use this guide to diagnose, fix, and rebuild. + +## Architecture Overview + +- **Source directory**: `backend/python//` (or `backend/go//`, `backend/cpp//`) +- **Installed directory**: `backends//` — this is what LocalAI actually runs. It is populated by `make backends/` which builds a Docker image, exports it, and installs it via `local-ai backends install`. +- **Virtual environment**: `backends//venv/` — the installed Python venv (for Python backends). The Python binary is at `backends//venv/bin/python`. + +Editing files in `backend/python//` does **not** affect the running backend until you rebuild with `make backends/`. + +## Diagnosing Failures + +### 1. Check the logs + +Backend gRPC processes log to LocalAI's stdout/stderr. Look for lines tagged with the backend's model ID: + +``` +GRPC stderr id="trl-finetune-127.0.0.1:37335" line="..." +``` + +Common error patterns: +- **"Method not implemented"** — the backend is missing a gRPC method that the Go side calls. The model loader (`pkg/model/initializers.go`) always calls `LoadModel` after `Health`; fine-tuning backends must implement it even as a no-op stub. +- **Python import errors / `AttributeError`** — usually a dependency version mismatch (e.g. `pyarrow` removing `PyExtensionType`). +- **"failed to load backend"** — the gRPC process crashed or never started. Check stderr lines for the traceback. + +### 2. 
Test the Python environment directly + +You can run the installed venv's Python to check imports without starting the full server: + +```bash +backends//venv/bin/python -c "import datasets; print(datasets.__version__)" +``` + +If `pip` is missing from the venv, bootstrap it: + +```bash +backends//venv/bin/python -m ensurepip +``` + +Then use `backends//venv/bin/python -m pip install ...` to test fixes in the installed venv before committing them to the source requirements. + +### 3. Check upstream dependency constraints + +When you hit a dependency conflict, check what the main library expects. For example, TRL's upstream `requirements.txt`: + +``` +https://github.com/huggingface/trl/blob/main/requirements.txt +``` + +Pin minimum versions in the backend's requirements files to match upstream. + +## Common Fixes + +### Missing gRPC methods + +If the Go side calls a method the backend doesn't implement (e.g. `LoadModel`), add a no-op stub in `backend.py`: + +```python +def LoadModel(self, request, context): + """No-op — actual loading happens elsewhere.""" + return backend_pb2.Result(success=True, message="OK") +``` + +The gRPC contract requires `LoadModel` to succeed for the model loader to return a usable client, even if the backend doesn't need upfront model loading. + +### Dependency version conflicts + +Python backends often break when a transitive dependency releases a breaking change (e.g. `pyarrow` removing `PyExtensionType`). Steps: + +1. Identify the broken import in the logs +2. Test in the installed venv: `backends//venv/bin/python -c "import "` +3. Check upstream requirements for version constraints +4. Update **all** requirements files in `backend/python//`: + - `requirements.txt` — base deps (grpcio, protobuf) + - `requirements-cpu.txt` — CPU-specific (includes PyTorch CPU index) + - `requirements-cublas12.txt` — CUDA 12 + - `requirements-cublas13.txt` — CUDA 13 +5. 
Rebuild: `make backends/` + +### PyTorch index conflicts (uv resolver) + +The Docker build uses `uv` for pip installs. When `--extra-index-url` points to the PyTorch wheel index, `uv` may refuse to fetch packages like `requests` from PyPI if it finds a different version on the PyTorch index first. Fix this by adding `--index-strategy=unsafe-first-match` to `install.sh`: + +```bash +EXTRA_PIP_INSTALL_FLAGS+=" --upgrade --index-strategy=unsafe-first-match" +installRequirements +``` + +Most Python backends already do this — check `backend/python/transformers/install.sh` or similar for reference. + +## Rebuilding + +### Rebuild a single backend + +```bash +make backends/ +``` + +This runs the Docker build (`Dockerfile.python`), exports the image to `backend-images/.tar`, and installs it into `backends//`. It also rebuilds the `local-ai` Go binary (without extra tags). + +**Important**: If you were previously running with `GO_TAGS=auth`, the `make backends/` step will overwrite your binary without that tag. Rebuild the Go binary afterward: + +```bash +GO_TAGS=auth make build +``` + +### Rebuild and restart + +After rebuilding a backend, you must restart LocalAI for it to pick up the new backend files. The backend gRPC process is spawned on demand when the model is first loaded. + +```bash +# Kill existing process +kill + +# Restart +./local-ai run --debug [your flags] +``` + +### Quick iteration (skip Docker rebuild) + +For fast iteration on a Python backend's `backend.py` without a full Docker rebuild, you can edit the installed copy directly: + +```bash +# Edit the installed copy +vim backends//backend.py + +# Restart LocalAI to respawn the gRPC process +``` + +This is useful for testing but **does not persist** — the next `make backends/` will overwrite it. Always commit fixes to the source in `backend/python//`. + +## Verification + +After fixing and rebuilding: + +1. 
Start LocalAI and confirm the backend registers: look for `Registering backend name=""` in the logs +2. Trigger the operation that failed (e.g. start a fine-tuning job) +3. Watch the GRPC stderr/stdout lines for the backend's model ID +4. Confirm no errors in the traceback diff --git a/.github/workflows/backend.yml b/.github/workflows/backend.yml index 50cc9b180..6842d7da1 100644 --- a/.github/workflows/backend.yml +++ b/.github/workflows/backend.yml @@ -118,6 +118,19 @@ jobs: dockerfile: "./backend/Dockerfile.python" context: "./" ubuntu-version: '2404' + - build-type: '' + cuda-major-version: "" + cuda-minor-version: "" + platforms: 'linux/amd64' + tag-latest: 'auto' + tag-suffix: '-cpu-trl' + runs-on: 'ubuntu-latest' + base-image: "ubuntu:24.04" + skip-drivers: 'true' + backend: "trl" + dockerfile: "./backend/Dockerfile.python" + context: "./" + ubuntu-version: '2404' - build-type: '' cuda-major-version: "" cuda-minor-version: "" @@ -366,6 +379,19 @@ jobs: dockerfile: "./backend/Dockerfile.python" context: "./" ubuntu-version: '2404' + - build-type: 'cublas' + cuda-major-version: "12" + cuda-minor-version: "8" + platforms: 'linux/amd64' + tag-latest: 'auto' + tag-suffix: '-gpu-nvidia-cuda-12-trl' + runs-on: 'ubuntu-latest' + base-image: "ubuntu:24.04" + skip-drivers: 'false' + backend: "trl" + dockerfile: "./backend/Dockerfile.python" + context: "./" + ubuntu-version: '2404' - build-type: 'cublas' cuda-major-version: "12" cuda-minor-version: "8" @@ -757,6 +783,19 @@ jobs: dockerfile: "./backend/Dockerfile.python" context: "./" ubuntu-version: '2404' + - build-type: 'cublas' + cuda-major-version: "13" + cuda-minor-version: "0" + platforms: 'linux/amd64' + tag-latest: 'auto' + tag-suffix: '-gpu-nvidia-cuda-13-trl' + runs-on: 'ubuntu-latest' + base-image: "ubuntu:24.04" + skip-drivers: 'false' + backend: "trl" + dockerfile: "./backend/Dockerfile.python" + context: "./" + ubuntu-version: '2404' - build-type: 'l4t' cuda-major-version: "13" cuda-minor-version: "0" 
diff --git a/AGENTS.md b/AGENTS.md index 41a89eab6..27785bf82 100644 --- a/AGENTS.md +++ b/AGENTS.md @@ -12,6 +12,7 @@ This file is an index to detailed topic guides in the `.agents/` directory. Read | [.agents/llama-cpp-backend.md](.agents/llama-cpp-backend.md) | Working on the llama.cpp backend — architecture, updating, tool call parsing | | [.agents/testing-mcp-apps.md](.agents/testing-mcp-apps.md) | Testing MCP Apps (interactive tool UIs) in the React UI | | [.agents/api-endpoints-and-auth.md](.agents/api-endpoints-and-auth.md) | Adding API endpoints, auth middleware, feature permissions, user access control | +| [.agents/debugging-backends.md](.agents/debugging-backends.md) | Debugging runtime backend failures, dependency conflicts, rebuilding backends | ## Quick Reference diff --git a/Makefile b/Makefile index c429097b6..e3c02e9c2 100644 --- a/Makefile +++ b/Makefile @@ -1,5 +1,5 @@ # Disable parallel execution for backend builds -.NOTPARALLEL: backends/diffusers backends/llama-cpp backends/outetts backends/piper backends/stablediffusion-ggml backends/whisper backends/faster-whisper backends/silero-vad backends/local-store backends/huggingface backends/rfdetr backends/kitten-tts backends/kokoro backends/chatterbox backends/llama-cpp-darwin backends/neutts build-darwin-python-backend build-darwin-go-backend backends/mlx backends/diffuser-darwin backends/mlx-vlm backends/mlx-audio backends/mlx-distributed backends/stablediffusion-ggml-darwin backends/vllm backends/vllm-omni backends/moonshine backends/pocket-tts backends/qwen-tts backends/faster-qwen3-tts backends/qwen-asr backends/nemo backends/voxcpm backends/whisperx backends/ace-step backends/acestep-cpp backends/fish-speech backends/voxtral backends/opus +.NOTPARALLEL: backends/diffusers backends/llama-cpp backends/outetts backends/piper backends/stablediffusion-ggml backends/whisper backends/faster-whisper backends/silero-vad backends/local-store backends/huggingface backends/rfdetr backends/kitten-tts 
backends/kokoro backends/chatterbox backends/llama-cpp-darwin backends/neutts build-darwin-python-backend build-darwin-go-backend backends/mlx backends/diffuser-darwin backends/mlx-vlm backends/mlx-audio backends/mlx-distributed backends/stablediffusion-ggml-darwin backends/vllm backends/vllm-omni backends/moonshine backends/pocket-tts backends/qwen-tts backends/faster-qwen3-tts backends/qwen-asr backends/nemo backends/voxcpm backends/whisperx backends/ace-step backends/acestep-cpp backends/fish-speech backends/voxtral backends/opus backends/trl GOCMD=go GOTEST=$(GOCMD) test @@ -421,6 +421,7 @@ prepare-test-extra: protogen-python $(MAKE) -C backend/python/voxcpm $(MAKE) -C backend/python/whisperx $(MAKE) -C backend/python/ace-step + $(MAKE) -C backend/python/trl test-extra: prepare-test-extra $(MAKE) -C backend/python/transformers test @@ -440,6 +441,7 @@ test-extra: prepare-test-extra $(MAKE) -C backend/python/voxcpm test $(MAKE) -C backend/python/whisperx test $(MAKE) -C backend/python/ace-step test + $(MAKE) -C backend/python/trl test DOCKER_IMAGE?=local-ai IMAGE_TYPE?=core @@ -572,6 +574,7 @@ BACKEND_VOXCPM = voxcpm|python|.|false|true BACKEND_WHISPERX = whisperx|python|.|false|true BACKEND_ACE_STEP = ace-step|python|.|false|true BACKEND_MLX_DISTRIBUTED = mlx-distributed|python|./|false|true +BACKEND_TRL = trl|python|.|false|true # Helper function to build docker image for a backend # Usage: $(call docker-build-backend,BACKEND_NAME,DOCKERFILE_TYPE,BUILD_CONTEXT,PROGRESS_FLAG,NEEDS_BACKEND_ARG) @@ -629,12 +632,13 @@ $(eval $(call generate-docker-build-target,$(BACKEND_WHISPERX))) $(eval $(call generate-docker-build-target,$(BACKEND_ACE_STEP))) $(eval $(call generate-docker-build-target,$(BACKEND_ACESTEP_CPP))) $(eval $(call generate-docker-build-target,$(BACKEND_MLX_DISTRIBUTED))) +$(eval $(call generate-docker-build-target,$(BACKEND_TRL))) # Pattern rule for docker-save targets docker-save-%: backend-images docker save local-ai-backend:$* -o 
backend-images/$*.tar -docker-build-backends: docker-build-llama-cpp docker-build-rerankers docker-build-vllm docker-build-vllm-omni docker-build-transformers docker-build-outetts docker-build-diffusers docker-build-kokoro docker-build-faster-whisper docker-build-coqui docker-build-chatterbox docker-build-vibevoice docker-build-moonshine docker-build-pocket-tts docker-build-qwen-tts docker-build-fish-speech docker-build-faster-qwen3-tts docker-build-qwen-asr docker-build-nemo docker-build-voxcpm docker-build-whisperx docker-build-ace-step docker-build-acestep-cpp docker-build-voxtral docker-build-mlx-distributed +docker-build-backends: docker-build-llama-cpp docker-build-rerankers docker-build-vllm docker-build-vllm-omni docker-build-transformers docker-build-outetts docker-build-diffusers docker-build-kokoro docker-build-faster-whisper docker-build-coqui docker-build-chatterbox docker-build-vibevoice docker-build-moonshine docker-build-pocket-tts docker-build-qwen-tts docker-build-fish-speech docker-build-faster-qwen3-tts docker-build-qwen-asr docker-build-nemo docker-build-voxcpm docker-build-whisperx docker-build-ace-step docker-build-acestep-cpp docker-build-voxtral docker-build-mlx-distributed docker-build-trl ######################################################## ### Mock Backend for E2E Tests diff --git a/backend/backend.proto b/backend/backend.proto index d8a0cd9fc..91497c523 100644 --- a/backend/backend.proto +++ b/backend/backend.proto @@ -39,6 +39,13 @@ service Backend { rpc AudioDecode(AudioDecodeRequest) returns (AudioDecodeResult) {} rpc ModelMetadata(ModelOptions) returns (ModelMetadataResponse) {} + + // Fine-tuning RPCs + rpc StartFineTune(FineTuneRequest) returns (FineTuneJobResult) {} + rpc FineTuneProgress(FineTuneProgressRequest) returns (stream FineTuneProgressUpdate) {} + rpc StopFineTune(FineTuneStopRequest) returns (Result) {} + rpc ListCheckpoints(ListCheckpointsRequest) returns (ListCheckpointsResponse) {} + rpc 
ExportModel(ExportModelRequest) returns (Result) {} } // Define the empty request @@ -528,3 +535,105 @@ message ModelMetadataResponse { string rendered_template = 2; // The rendered chat template with enable_thinking=true (empty if not applicable) ToolFormatMarkers tool_format = 3; // Auto-detected tool format markers from differential template analysis } + +// Fine-tuning messages + +message FineTuneRequest { + // Model identification + string model = 1; // HF model name or local path + string training_type = 2; // "lora", "loha", "lokr", "full" — what parameters to train + string training_method = 3; // "sft", "dpo", "grpo", "rloo", "reward", "kto", "orpo", "network_training" + + // Adapter config (universal across LoRA/LoHa/LoKr for LLM + diffusion) + int32 adapter_rank = 10; // LoRA rank (r), default 16 + int32 adapter_alpha = 11; // scaling factor, default 16 + float adapter_dropout = 12; // default 0.0 + repeated string target_modules = 13; // layer names to adapt + + // Universal training hyperparameters + float learning_rate = 20; // default 2e-4 + int32 num_epochs = 21; // default 3 + int32 batch_size = 22; // default 2 + int32 gradient_accumulation_steps = 23; // default 4 + int32 warmup_steps = 24; // default 5 + int32 max_steps = 25; // 0 = use epochs + int32 save_steps = 26; // 0 = only save final + float weight_decay = 27; // default 0.01 + bool gradient_checkpointing = 28; + string optimizer = 29; // adamw_8bit, adamw, sgd, adafactor, prodigy + int32 seed = 30; // default 3407 + string mixed_precision = 31; // fp16, bf16, fp8, no + + // Dataset + string dataset_source = 40; // HF dataset ID, local file/dir path + string dataset_split = 41; // train, test, etc. 
+ + // Output + string output_dir = 50; + string job_id = 51; // client-assigned or auto-generated + + // Resume training from a checkpoint + string resume_from_checkpoint = 55; // path to checkpoint dir to resume from + + // Backend-specific AND method-specific extensibility + map extra_options = 60; +} + +message FineTuneJobResult { + string job_id = 1; + bool success = 2; + string message = 3; +} + +message FineTuneProgressRequest { + string job_id = 1; +} + +message FineTuneProgressUpdate { + string job_id = 1; + int32 current_step = 2; + int32 total_steps = 3; + float current_epoch = 4; + float total_epochs = 5; + float loss = 6; + float learning_rate = 7; + float grad_norm = 8; + float eval_loss = 9; + float eta_seconds = 10; + float progress_percent = 11; + string status = 12; // queued, caching, loading_model, loading_dataset, training, saving, completed, failed, stopped + string message = 13; + string checkpoint_path = 14; // set when a checkpoint is saved + string sample_path = 15; // set when a sample is generated (video/image backends) + map extra_metrics = 16; // method-specific metrics +} + +message FineTuneStopRequest { + string job_id = 1; + bool save_checkpoint = 2; +} + +message ListCheckpointsRequest { + string output_dir = 1; +} + +message ListCheckpointsResponse { + repeated CheckpointInfo checkpoints = 1; +} + +message CheckpointInfo { + string path = 1; + int32 step = 2; + float epoch = 3; + float loss = 4; + string created_at = 5; +} + +message ExportModelRequest { + string checkpoint_path = 1; + string output_path = 2; + string export_format = 3; // lora, loha, lokr, merged_16bit, merged_4bit, gguf, diffusers + string quantization_method = 4; // for GGUF: q4_k_m, q5_k_m, q8_0, f16, etc. 
+ string model = 5; // base model name (for merge operations) + map extra_options = 6; +} diff --git a/backend/index.yaml b/backend/index.yaml index 8dde88256..8a8232747 100644 --- a/backend/index.yaml +++ b/backend/index.yaml @@ -3030,3 +3030,54 @@ uri: "quay.io/go-skynet/local-ai-backends:master-metal-darwin-arm64-voxtral" mirrors: - localai/localai-backends:master-metal-darwin-arm64-voxtral +- &trl + name: "trl" + alias: "trl" + license: apache-2.0 + description: | + HuggingFace TRL fine-tuning backend. Supports SFT, DPO, GRPO, RLOO, Reward, KTO, ORPO training methods. + Works on CPU and GPU. + urls: + - https://github.com/huggingface/trl + tags: + - fine-tuning + - LLM + - CPU + - GPU + - CUDA + capabilities: + default: "cpu-trl" + nvidia: "cuda12-trl" + nvidia-cuda-12: "cuda12-trl" + nvidia-cuda-13: "cuda13-trl" +## TRL backend images +- !!merge <<: *trl + name: "cpu-trl" + uri: "quay.io/go-skynet/local-ai-backends:latest-cpu-trl" + mirrors: + - localai/localai-backends:latest-cpu-trl +- !!merge <<: *trl + name: "cpu-trl-development" + uri: "quay.io/go-skynet/local-ai-backends:master-cpu-trl" + mirrors: + - localai/localai-backends:master-cpu-trl +- !!merge <<: *trl + name: "cuda12-trl" + uri: "quay.io/go-skynet/local-ai-backends:latest-cublas-cuda12-trl" + mirrors: + - localai/localai-backends:latest-cublas-cuda12-trl +- !!merge <<: *trl + name: "cuda12-trl-development" + uri: "quay.io/go-skynet/local-ai-backends:master-cublas-cuda12-trl" + mirrors: + - localai/localai-backends:master-cublas-cuda12-trl +- !!merge <<: *trl + name: "cuda13-trl" + uri: "quay.io/go-skynet/local-ai-backends:latest-cublas-cuda13-trl" + mirrors: + - localai/localai-backends:latest-cublas-cuda13-trl +- !!merge <<: *trl + name: "cuda13-trl-development" + uri: "quay.io/go-skynet/local-ai-backends:master-cublas-cuda13-trl" + mirrors: + - localai/localai-backends:master-cublas-cuda13-trl diff --git a/backend/python/trl/Makefile b/backend/python/trl/Makefile new file mode 100644 index 
000000000..ababb961c --- /dev/null +++ b/backend/python/trl/Makefile @@ -0,0 +1,26 @@ +# Version of llama.cpp to fetch convert_hf_to_gguf.py from (for GGUF export) +LLAMA_CPP_CONVERT_VERSION ?= master + +.PHONY: trl +trl: + LLAMA_CPP_CONVERT_VERSION=$(LLAMA_CPP_CONVERT_VERSION) bash install.sh + +.PHONY: run +run: trl + @echo "Running trl..." + bash run.sh + @echo "trl run." + +.PHONY: test +test: trl + @echo "Testing trl..." + bash test.sh + @echo "trl tested." + +.PHONY: protogen-clean +protogen-clean: + $(RM) backend_pb2_grpc.py backend_pb2.py + +.PHONY: clean +clean: protogen-clean + rm -rf venv __pycache__ diff --git a/backend/python/trl/backend.py b/backend/python/trl/backend.py new file mode 100644 index 000000000..c414e6fb6 --- /dev/null +++ b/backend/python/trl/backend.py @@ -0,0 +1,860 @@ +#!/usr/bin/env python3 +""" +TRL fine-tuning backend for LocalAI. + +Supports all TRL training methods (SFT, DPO, GRPO, RLOO, Reward, KTO, ORPO) +using standard HuggingFace transformers + PEFT. Works on both CPU and GPU. 
+""" +import argparse +import json +import os +import queue +import signal +import sys +import threading +import time +import uuid +from concurrent import futures + +import grpc +import backend_pb2 +import backend_pb2_grpc + +_ONE_DAY_IN_SECONDS = 60 * 60 * 24 +MAX_WORKERS = int(os.environ.get('PYTHON_GRPC_MAX_WORKERS', '4')) + + +class ProgressCallback: + """HuggingFace TrainerCallback that pushes progress updates to a queue.""" + + def __init__(self, job_id, progress_queue, total_epochs): + self.job_id = job_id + self.progress_queue = progress_queue + self.total_epochs = total_epochs + + def get_callback(self): + from transformers import TrainerCallback + + parent = self + + class _Callback(TrainerCallback): + def __init__(self): + self._train_start_time = None + + def on_train_begin(self, args, state, control, **kwargs): + self._train_start_time = time.time() + + def on_log(self, args, state, control, logs=None, **kwargs): + if logs is None: + return + total_steps = state.max_steps if state.max_steps > 0 else 0 + progress = (state.global_step / total_steps * 100) if total_steps > 0 else 0 + eta = 0.0 + if state.global_step > 0 and total_steps > 0 and self._train_start_time: + elapsed = time.time() - self._train_start_time + remaining_steps = total_steps - state.global_step + if state.global_step > 0: + eta = remaining_steps * (elapsed / state.global_step) + + extra_metrics = {} + for k, v in logs.items(): + if isinstance(v, (int, float)) and k not in ('loss', 'learning_rate', 'epoch', 'grad_norm', 'eval_loss'): + extra_metrics[k] = float(v) + + update = backend_pb2.FineTuneProgressUpdate( + job_id=parent.job_id, + current_step=state.global_step, + total_steps=total_steps, + current_epoch=float(logs.get('epoch', 0)), + total_epochs=float(parent.total_epochs), + loss=float(logs.get('loss', 0)), + learning_rate=float(logs.get('learning_rate', 0)), + grad_norm=float(logs.get('grad_norm', 0)), + eval_loss=float(logs.get('eval_loss', 0)), + eta_seconds=float(eta), + 
progress_percent=float(progress), + status="training", + extra_metrics=extra_metrics, + ) + parent.progress_queue.put(update) + + def on_prediction_step(self, args, state, control, **kwargs): + """Send periodic updates during evaluation so the UI doesn't freeze.""" + if not hasattr(self, '_eval_update_counter'): + self._eval_update_counter = 0 + self._eval_update_counter += 1 + # Throttle: send an update every 10 prediction steps + if self._eval_update_counter % 10 != 0: + return + total_steps = state.max_steps if state.max_steps > 0 else 0 + progress = (state.global_step / total_steps * 100) if total_steps > 0 else 0 + update = backend_pb2.FineTuneProgressUpdate( + job_id=parent.job_id, + current_step=state.global_step, + total_steps=total_steps, + current_epoch=float(state.epoch or 0), + total_epochs=float(parent.total_epochs), + progress_percent=float(progress), + status="training", + message=f"Evaluating... (batch {self._eval_update_counter})", + ) + parent.progress_queue.put(update) + + def on_evaluate(self, args, state, control, metrics=None, **kwargs): + """Report eval results once evaluation is done.""" + # Reset prediction counter for next eval round + self._eval_update_counter = 0 + + total_steps = state.max_steps if state.max_steps > 0 else 0 + progress = (state.global_step / total_steps * 100) if total_steps > 0 else 0 + + eval_loss = 0.0 + extra_metrics = {} + if metrics: + eval_loss = float(metrics.get('eval_loss', 0)) + for k, v in metrics.items(): + if isinstance(v, (int, float)) and k not in ('eval_loss', 'epoch'): + extra_metrics[k] = float(v) + + update = backend_pb2.FineTuneProgressUpdate( + job_id=parent.job_id, + current_step=state.global_step, + total_steps=total_steps, + current_epoch=float(state.epoch or 0), + total_epochs=float(parent.total_epochs), + eval_loss=eval_loss, + progress_percent=float(progress), + status="training", + message=f"Evaluation complete at step {state.global_step}", + extra_metrics=extra_metrics, + ) + 
parent.progress_queue.put(update) + + def on_save(self, args, state, control, **kwargs): + checkpoint_path = os.path.join(args.output_dir, f"checkpoint-{state.global_step}") + update = backend_pb2.FineTuneProgressUpdate( + job_id=parent.job_id, + current_step=state.global_step, + status="saving", + message=f"Checkpoint saved at step {state.global_step}", + checkpoint_path=checkpoint_path, + ) + parent.progress_queue.put(update) + + def on_train_end(self, args, state, control, **kwargs): + update = backend_pb2.FineTuneProgressUpdate( + job_id=parent.job_id, + current_step=state.global_step, + total_steps=state.max_steps, + progress_percent=100.0, + status="completed", + message="Training completed", + ) + parent.progress_queue.put(update) + + return _Callback() + + +class ActiveJob: + """Represents an active fine-tuning job.""" + + def __init__(self, job_id): + self.job_id = job_id + self.progress_queue = queue.Queue() + self.trainer = None + self.thread = None + self.model = None + self.tokenizer = None + self.error = None + self.completed = False + self.stopped = False + + +def _is_gated_repo_error(exc): + """Check if an exception is caused by a gated HuggingFace repo requiring authentication.""" + try: + from huggingface_hub.utils import GatedRepoError + if isinstance(exc, GatedRepoError): + return True + except ImportError: + pass + msg = str(exc).lower() + if "gated repo" in msg or "access to model" in msg: + return True + if hasattr(exc, 'response') and hasattr(exc.response, 'status_code'): + if exc.response.status_code in (401, 403): + return True + return False + + +class BackendServicer(backend_pb2_grpc.BackendServicer): + def __init__(self): + self.active_job = None + + def Health(self, request, context): + return backend_pb2.Reply(message=bytes("OK", 'utf-8')) + + def LoadModel(self, request, context): + """Accept LoadModel — actual model loading happens in StartFineTune.""" + return backend_pb2.Result(success=True, message="OK") + + def 
StartFineTune(self, request, context): + if self.active_job is not None and not self.active_job.completed: + return backend_pb2.FineTuneJobResult( + job_id="", + success=False, + message="A fine-tuning job is already running", + ) + + job_id = request.job_id if request.job_id else str(uuid.uuid4()) + job = ActiveJob(job_id) + self.active_job = job + + # Start training in background thread + thread = threading.Thread(target=self._run_training, args=(request, job), daemon=True) + job.thread = thread + thread.start() + + return backend_pb2.FineTuneJobResult( + job_id=job_id, + success=True, + message="Fine-tuning job started", + ) + + def _run_training(self, request, job): + try: + self._do_training(request, job) + except Exception as e: + if _is_gated_repo_error(e): + msg = (f"Model '{request.model}' is a gated HuggingFace repo and requires authentication. " + "Pass 'hf_token' in extra_options or set the HF_TOKEN environment variable.") + else: + msg = f"Training failed: {e}" + job.error = msg + job.completed = True + update = backend_pb2.FineTuneProgressUpdate( + job_id=job.job_id, + status="failed", + message=msg, + ) + job.progress_queue.put(update) + # Send sentinel + job.progress_queue.put(None) + + def _do_training(self, request, job): + import torch + from transformers import AutoModelForCausalLM, AutoTokenizer + from datasets import load_dataset, Dataset + + extra = dict(request.extra_options) + training_method = request.training_method or "sft" + training_type = request.training_type or "lora" + + # Send loading status + job.progress_queue.put(backend_pb2.FineTuneProgressUpdate( + job_id=job.job_id, status="loading_model", message=f"Loading model {request.model}", + )) + + # Determine device and dtype + device_map = "auto" if torch.cuda.is_available() else "cpu" + dtype = torch.float32 if not torch.cuda.is_available() else torch.bfloat16 + + # HuggingFace token for gated repos (from extra_options or HF_TOKEN env) + hf_token = extra.get("hf_token") or 
os.environ.get("HF_TOKEN") + + # Load model + model_kwargs = {"device_map": device_map, "torch_dtype": dtype} + if hf_token: + model_kwargs["token"] = hf_token + if extra.get("trust_remote_code", "false").lower() == "true": + model_kwargs["trust_remote_code"] = True + if extra.get("load_in_4bit", "false").lower() == "true" and torch.cuda.is_available(): + from transformers import BitsAndBytesConfig + model_kwargs["quantization_config"] = BitsAndBytesConfig(load_in_4bit=True) + + model = AutoModelForCausalLM.from_pretrained(request.model, **model_kwargs) + tokenizer = AutoTokenizer.from_pretrained(request.model, token=hf_token) + if tokenizer.pad_token is None: + tokenizer.pad_token = tokenizer.eos_token + + job.model = model + job.tokenizer = tokenizer + + # Apply LoRA if requested + if training_type == "lora": + from peft import LoraConfig, get_peft_model + lora_r = request.adapter_rank if request.adapter_rank > 0 else 16 + lora_alpha = request.adapter_alpha if request.adapter_alpha > 0 else 16 + lora_dropout = request.adapter_dropout if request.adapter_dropout > 0 else 0.0 + + target_modules = list(request.target_modules) if request.target_modules else None + peft_config = LoraConfig( + r=lora_r, + lora_alpha=lora_alpha, + lora_dropout=lora_dropout, + target_modules=target_modules or "all-linear", + bias="none", + task_type="CAUSAL_LM", + ) + model = get_peft_model(model, peft_config) + + # Load dataset + job.progress_queue.put(backend_pb2.FineTuneProgressUpdate( + job_id=job.job_id, status="loading_dataset", message="Loading dataset", + )) + + dataset_split = request.dataset_split or "train" + if os.path.exists(request.dataset_source): + if request.dataset_source.endswith('.json') or request.dataset_source.endswith('.jsonl'): + dataset = load_dataset("json", data_files=request.dataset_source, split=dataset_split) + elif request.dataset_source.endswith('.csv'): + dataset = load_dataset("csv", data_files=request.dataset_source, split=dataset_split) + else: + 
dataset = load_dataset(request.dataset_source, split=dataset_split) + else: + dataset = load_dataset(request.dataset_source, split=dataset_split) + + # Eval dataset setup + eval_dataset = None + eval_strategy = extra.get("eval_strategy", "steps") + eval_steps = int(extra.get("eval_steps", str(request.save_steps if request.save_steps > 0 else 500))) + + if eval_strategy != "no": + eval_split = extra.get("eval_split") + eval_dataset_source = extra.get("eval_dataset_source") + if eval_split: + # Load a specific split as eval dataset + if os.path.exists(request.dataset_source): + if request.dataset_source.endswith('.json') or request.dataset_source.endswith('.jsonl'): + eval_dataset = load_dataset("json", data_files=request.dataset_source, split=eval_split) + elif request.dataset_source.endswith('.csv'): + eval_dataset = load_dataset("csv", data_files=request.dataset_source, split=eval_split) + else: + eval_dataset = load_dataset(request.dataset_source, split=eval_split) + else: + eval_dataset = load_dataset(request.dataset_source, split=eval_split) + elif eval_dataset_source: + # Load eval dataset from a separate source + eval_dataset = load_dataset(eval_dataset_source, split="train") + else: + # Auto-split from training set + eval_split_ratio = float(extra.get("eval_split_ratio", "0.1")) + split = dataset.train_test_split(test_size=eval_split_ratio) + dataset = split["train"] + eval_dataset = split["test"] + + if eval_strategy == "no": + eval_dataset = None + + # Training config + output_dir = request.output_dir or f"./output-{job.job_id}" + num_epochs = request.num_epochs if request.num_epochs > 0 else 3 + batch_size = request.batch_size if request.batch_size > 0 else 2 + lr = request.learning_rate if request.learning_rate > 0 else 2e-4 + grad_accum = request.gradient_accumulation_steps if request.gradient_accumulation_steps > 0 else 4 + warmup_steps = request.warmup_steps if request.warmup_steps > 0 else 5 + weight_decay = request.weight_decay if 
request.weight_decay > 0 else 0.01 + max_steps = request.max_steps if request.max_steps > 0 else -1 + save_steps = request.save_steps if request.save_steps > 0 else 500 + seed = request.seed if request.seed > 0 else 3407 + optimizer = request.optimizer or "adamw_torch" + + # Checkpoint save controls + save_total_limit = int(extra.get("save_total_limit", "0")) or None # 0 = unlimited + save_strategy = extra.get("save_strategy", "steps") # steps, epoch, no + + # CPU vs GPU training args (can be overridden via extra_options) + use_cpu = not torch.cuda.is_available() + common_train_kwargs = {} + if use_cpu: + common_train_kwargs["use_cpu"] = True + common_train_kwargs["fp16"] = False + common_train_kwargs["bf16"] = False + common_train_kwargs["gradient_checkpointing"] = False + else: + common_train_kwargs["bf16"] = True + common_train_kwargs["gradient_checkpointing"] = request.gradient_checkpointing + + # Allow extra_options to override training kwargs + for flag in ("use_cpu", "bf16", "fp16", "gradient_checkpointing"): + if flag in extra: + common_train_kwargs[flag] = extra[flag].lower() == "true" + + # Create progress callback + progress_cb = ProgressCallback(job.job_id, job.progress_queue, num_epochs) + + # Build save kwargs (shared across all methods) + _save_kwargs = {} + if save_strategy == "steps" and save_steps > 0: + _save_kwargs["save_steps"] = save_steps + _save_kwargs["save_strategy"] = "steps" + elif save_strategy == "epoch": + _save_kwargs["save_strategy"] = "epoch" + elif save_strategy == "no": + _save_kwargs["save_strategy"] = "no" + else: + _save_kwargs["save_steps"] = save_steps + _save_kwargs["save_strategy"] = "steps" + if save_total_limit: + _save_kwargs["save_total_limit"] = save_total_limit + + # Eval kwargs + _eval_kwargs = {} + if eval_dataset is not None: + _eval_kwargs["eval_strategy"] = eval_strategy + _eval_kwargs["eval_steps"] = eval_steps + + # Common training arguments shared by all methods + _common_args = dict( + output_dir=output_dir, 
+ num_train_epochs=num_epochs, + per_device_train_batch_size=batch_size, + learning_rate=lr, + gradient_accumulation_steps=grad_accum, + warmup_steps=warmup_steps, + weight_decay=weight_decay, + max_steps=max_steps, + seed=seed, + optim=optimizer, + logging_steps=1, + report_to="none", + **_save_kwargs, + **common_train_kwargs, + **_eval_kwargs, + ) + + # Select trainer based on training method + if training_method == "sft": + from trl import SFTTrainer, SFTConfig + + max_length = int(extra.get("max_seq_length", "512")) + packing = extra.get("packing", "false").lower() == "true" + + training_args = SFTConfig( + max_length=max_length, + packing=packing, + **_common_args, + ) + + trainer = SFTTrainer( + model=model, + args=training_args, + train_dataset=dataset, + eval_dataset=eval_dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "dpo": + from trl import DPOTrainer, DPOConfig + + beta = float(extra.get("beta", "0.1")) + loss_type = extra.get("loss_type", "sigmoid") + max_length = int(extra.get("max_length", "512")) + + training_args = DPOConfig( + beta=beta, + loss_type=loss_type, + max_length=max_length, + **_common_args, + ) + + trainer = DPOTrainer( + model=model, + args=training_args, + train_dataset=dataset, + eval_dataset=eval_dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "grpo": + from trl import GRPOTrainer, GRPOConfig + + num_generations = int(extra.get("num_generations", "4")) + max_completion_length = int(extra.get("max_completion_length", "256")) + + training_args = GRPOConfig( + num_generations=num_generations, + max_completion_length=max_completion_length, + **_common_args, + ) + + # GRPO requires reward functions passed via extra_options as a JSON list + from reward_functions import build_reward_functions + + reward_funcs = [] + if extra.get("reward_funcs"): + reward_funcs = build_reward_functions(extra["reward_funcs"]) + + 
if not reward_funcs: + raise ValueError( + "GRPO requires at least one reward function. " + "Specify reward_functions in the request or " + "reward_funcs in extra_options." + ) + + trainer = GRPOTrainer( + model=model, + args=training_args, + train_dataset=dataset, + processing_class=tokenizer, + reward_funcs=reward_funcs, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "orpo": + from trl import ORPOTrainer, ORPOConfig + + beta = float(extra.get("beta", "0.1")) + max_length = int(extra.get("max_length", "512")) + + training_args = ORPOConfig( + beta=beta, + max_length=max_length, + **_common_args, + ) + + trainer = ORPOTrainer( + model=model, + args=training_args, + train_dataset=dataset, + eval_dataset=eval_dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "kto": + from trl import KTOTrainer, KTOConfig + + beta = float(extra.get("beta", "0.1")) + max_length = int(extra.get("max_length", "512")) + + training_args = KTOConfig( + beta=beta, + max_length=max_length, + **_common_args, + ) + + trainer = KTOTrainer( + model=model, + args=training_args, + train_dataset=dataset, + eval_dataset=eval_dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "rloo": + from trl import RLOOTrainer, RLOOConfig + + num_generations = int(extra.get("num_generations", "4")) + max_completion_length = int(extra.get("max_completion_length", "256")) + + training_args = RLOOConfig( + num_generations=num_generations, + max_new_tokens=max_completion_length, + **_common_args, + ) + + trainer = RLOOTrainer( + model=model, + args=training_args, + train_dataset=dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + elif training_method == "reward": + from trl import RewardTrainer, RewardConfig + + max_length = int(extra.get("max_length", "512")) + + training_args = RewardConfig( + max_length=max_length, + 
**_common_args, + ) + + trainer = RewardTrainer( + model=model, + args=training_args, + train_dataset=dataset, + eval_dataset=eval_dataset, + processing_class=tokenizer, + callbacks=[progress_cb.get_callback()], + ) + + else: + raise ValueError(f"Unsupported training method: {training_method}. " + "Supported: sft, dpo, grpo, orpo, kto, rloo, reward") + + job.trainer = trainer + + # Start training + job.progress_queue.put(backend_pb2.FineTuneProgressUpdate( + job_id=job.job_id, status="training", message="Training started", + )) + + resume_ckpt = request.resume_from_checkpoint if request.resume_from_checkpoint else None + trainer.train(resume_from_checkpoint=resume_ckpt) + + # Save final model + trainer.save_model(output_dir) + if tokenizer: + tokenizer.save_pretrained(output_dir) + + job.completed = True + # Sentinel to signal stream end + job.progress_queue.put(None) + + def FineTuneProgress(self, request, context): + if self.active_job is None or self.active_job.job_id != request.job_id: + context.set_code(grpc.StatusCode.NOT_FOUND) + context.set_details(f"Job {request.job_id} not found") + return + + job = self.active_job + while True: + try: + update = job.progress_queue.get(timeout=1.0) + if update is None: + break + yield update + if update.status in ("completed", "failed", "stopped"): + break + except queue.Empty: + if job.completed or job.stopped: + break + if not context.is_active(): + break + continue + + def StopFineTune(self, request, context): + # Stopping is handled by killing the process from Go via ShutdownModel. 
+ return backend_pb2.Result(success=True, message="OK") + + def ListCheckpoints(self, request, context): + output_dir = request.output_dir + if not os.path.isdir(output_dir): + return backend_pb2.ListCheckpointsResponse(checkpoints=[]) + + checkpoints = [] + for entry in sorted(os.listdir(output_dir)): + if entry.startswith("checkpoint-"): + ckpt_path = os.path.join(output_dir, entry) + if not os.path.isdir(ckpt_path): + continue + step = 0 + try: + step = int(entry.split("-")[1]) + except (IndexError, ValueError): + pass + + # Try to read trainer_state.json for metadata + loss = 0.0 + epoch = 0.0 + state_file = os.path.join(ckpt_path, "trainer_state.json") + if os.path.exists(state_file): + try: + with open(state_file) as f: + state = json.load(f) + if state.get("log_history"): + last_log = state["log_history"][-1] + loss = last_log.get("loss", 0.0) + epoch = last_log.get("epoch", 0.0) + except Exception: + pass + + created_at = time.strftime( + "%Y-%m-%dT%H:%M:%SZ", + time.gmtime(os.path.getmtime(ckpt_path)), + ) + + checkpoints.append(backend_pb2.CheckpointInfo( + path=ckpt_path, + step=step, + epoch=float(epoch), + loss=float(loss), + created_at=created_at, + )) + + return backend_pb2.ListCheckpointsResponse(checkpoints=checkpoints) + + def ExportModel(self, request, context): + export_format = request.export_format or "lora" + output_path = request.output_path + checkpoint_path = request.checkpoint_path + + # Extract HF token for gated model access + extra = dict(request.extra_options) if request.extra_options else {} + hf_token = extra.get("hf_token") or os.environ.get("HF_TOKEN") + + if not checkpoint_path or not os.path.isdir(checkpoint_path): + return backend_pb2.Result(success=False, message=f"Checkpoint not found: {checkpoint_path}") + + os.makedirs(output_path, exist_ok=True) + + try: + if export_format == "lora": + # Just copy the adapter files + import shutil + for f in os.listdir(checkpoint_path): + src = os.path.join(checkpoint_path, f) + dst = 
os.path.join(output_path, f) + if os.path.isfile(src): + shutil.copy2(src, dst) + + elif export_format in ("merged_16bit", "merged_4bit"): + import torch + from transformers import AutoModelForCausalLM, AutoTokenizer + from peft import PeftModel + + base_model_name = request.model + if not base_model_name: + return backend_pb2.Result(success=False, message="Base model name required for merge export") + + dtype = torch.float16 if export_format == "merged_16bit" else torch.float32 + base_model = AutoModelForCausalLM.from_pretrained(base_model_name, torch_dtype=dtype, token=hf_token) + model = PeftModel.from_pretrained(base_model, checkpoint_path) + merged = model.merge_and_unload() + merged.save_pretrained(output_path) + + tokenizer = AutoTokenizer.from_pretrained(base_model_name, token=hf_token) + tokenizer.save_pretrained(output_path) + + elif export_format == "gguf": + import torch + import subprocess + import shutil + from transformers import AutoModelForCausalLM, AutoTokenizer + from peft import PeftModel + + base_model_name = request.model + if not base_model_name: + return backend_pb2.Result(success=False, message="Base model name required for GGUF export") + + # Step 1: Merge LoRA into base model + merge_dir = os.path.join(output_path, "_hf_merged") + os.makedirs(merge_dir, exist_ok=True) + + base_model = AutoModelForCausalLM.from_pretrained(base_model_name, torch_dtype=torch.float16, token=hf_token) + model = PeftModel.from_pretrained(base_model, checkpoint_path) + merged = model.merge_and_unload() + merged.save_pretrained(merge_dir) + + tokenizer = AutoTokenizer.from_pretrained(base_model_name, token=hf_token) + tokenizer.save_pretrained(merge_dir) + + # Ensure tokenizer.model (SentencePiece) is present in merge_dir. + # Gemma models need this file for GGUF conversion to use the + # SentencePiece path; without it, the script falls back to BPE + # handling which fails on unrecognized pre-tokenizer hashes. 
+ sp_model_path = os.path.join(merge_dir, "tokenizer.model") + if not os.path.exists(sp_model_path): + sp_copied = False + # Method 1: Load the slow tokenizer which keeps the SP model file + try: + slow_tok = AutoTokenizer.from_pretrained(base_model_name, use_fast=False, token=hf_token) + if hasattr(slow_tok, 'vocab_file') and slow_tok.vocab_file and os.path.exists(slow_tok.vocab_file): + import shutil as _shutil + _shutil.copy2(slow_tok.vocab_file, sp_model_path) + sp_copied = True + print(f"Copied tokenizer.model from slow tokenizer cache") + except Exception as e: + print(f"Slow tokenizer method failed: {e}") + # Method 2: Download from HF hub + if not sp_copied: + try: + from huggingface_hub import hf_hub_download + cached_sp = hf_hub_download(repo_id=base_model_name, filename="tokenizer.model", token=hf_token) + import shutil as _shutil + _shutil.copy2(cached_sp, sp_model_path) + sp_copied = True + print(f"Copied tokenizer.model from HF hub") + except Exception as e: + print(f"HF hub download method failed: {e}") + if not sp_copied: + print(f"WARNING: Could not obtain tokenizer.model for {base_model_name}. " + "GGUF conversion may fail for SentencePiece models.") + + # Free GPU memory before conversion + del merged, model, base_model + if torch.cuda.is_available(): + torch.cuda.empty_cache() + + # Step 2: Convert to GGUF using convert_hf_to_gguf.py + quant = request.quantization_method or "auto" + outtype_map = {"f16": "f16", "f32": "f32", "bf16": "bf16", "q8_0": "q8_0", "auto": "auto"} + outtype = outtype_map.get(quant, "f16") + + gguf_filename = f"{os.path.basename(output_path)}-{outtype}.gguf" + gguf_path = os.path.join(output_path, gguf_filename) + + script_dir = os.path.dirname(os.path.abspath(__file__)) + convert_script = os.path.join(script_dir, "convert_hf_to_gguf.py") + if not os.path.exists(convert_script): + return backend_pb2.Result(success=False, + message="convert_hf_to_gguf.py not found. 
Install the GGUF conversion tools.") + + # Log merge_dir contents for debugging conversion issues + merge_files = os.listdir(merge_dir) if os.path.isdir(merge_dir) else [] + print(f"Merge dir contents: {merge_files}", flush=True) + + env = os.environ.copy() + env["NO_LOCAL_GGUF"] = "1" + cmd = [sys.executable, convert_script, merge_dir, "--outtype", outtype, "--outfile", gguf_path] + conv_result = subprocess.run(cmd, capture_output=True, text=True, timeout=3600, env=env) + if conv_result.returncode != 0: + diag = f"stdout: {conv_result.stdout[-300:]}\nstderr: {conv_result.stderr[-500:]}" + return backend_pb2.Result(success=False, + message=f"GGUF conversion failed: {diag}") + + # Clean up intermediate merged model + shutil.rmtree(merge_dir, ignore_errors=True) + else: + return backend_pb2.Result(success=False, message=f"Unsupported export format: {export_format}") + + except Exception as e: + if _is_gated_repo_error(e): + return backend_pb2.Result(success=False, + message=f"Model '{request.model}' is a gated HuggingFace repo and requires authentication. 
" + "Pass 'hf_token' in extra_options or set the HF_TOKEN environment variable.") + return backend_pb2.Result(success=False, message=f"Export failed: {e}") + + return backend_pb2.Result(success=True, message=f"Model exported to {output_path}") + + +def serve(address): + server = grpc.server( + futures.ThreadPoolExecutor(max_workers=MAX_WORKERS), + options=[ + ('grpc.max_message_length', 50 * 1024 * 1024), + ('grpc.max_send_message_length', 50 * 1024 * 1024), + ('grpc.max_receive_message_length', 50 * 1024 * 1024), + ], + ) + backend_pb2_grpc.add_BackendServicer_to_server(BackendServicer(), server) + server.add_insecure_port(address) + server.start() + print(f"TRL fine-tuning backend listening on {address}", file=sys.stderr, flush=True) + + # Handle graceful shutdown + def stop(signum, frame): + server.stop(0) + sys.exit(0) + + signal.signal(signal.SIGTERM, stop) + signal.signal(signal.SIGINT, stop) + + try: + while True: + time.sleep(_ONE_DAY_IN_SECONDS) + except KeyboardInterrupt: + server.stop(0) + + +if __name__ == "__main__": + parser = argparse.ArgumentParser(description="TRL fine-tuning gRPC backend") + parser.add_argument("--addr", default="localhost:50051", help="gRPC server address") + args = parser.parse_args() + serve(args.addr) diff --git a/backend/python/trl/install.sh b/backend/python/trl/install.sh new file mode 100644 index 000000000..6963e60ed --- /dev/null +++ b/backend/python/trl/install.sh @@ -0,0 +1,37 @@ +#!/bin/bash +set -e + +backend_dir=$(dirname $0) +if [ -d $backend_dir/common ]; then + source $backend_dir/common/libbackend.sh +else + source $backend_dir/../common/libbackend.sh +fi + +EXTRA_PIP_INSTALL_FLAGS+=" --upgrade --index-strategy=unsafe-first-match" +installRequirements + +# Fetch convert_hf_to_gguf.py and gguf package from the same llama.cpp version +LLAMA_CPP_CONVERT_VERSION="${LLAMA_CPP_CONVERT_VERSION:-master}" +CONVERT_SCRIPT="${EDIR}/convert_hf_to_gguf.py" +if [ ! 
-f "${CONVERT_SCRIPT}" ]; then + echo "Downloading convert_hf_to_gguf.py from llama.cpp (${LLAMA_CPP_CONVERT_VERSION})..." + curl -L --fail --retry 3 \ + "https://raw.githubusercontent.com/ggml-org/llama.cpp/${LLAMA_CPP_CONVERT_VERSION}/convert_hf_to_gguf.py" \ + -o "${CONVERT_SCRIPT}" || echo "Warning: Failed to download convert_hf_to_gguf.py. GGUF export will not be available." +fi + +# Install gguf package from the same llama.cpp commit to keep them in sync +GGUF_PIP_SPEC="gguf @ git+https://github.com/ggml-org/llama.cpp@${LLAMA_CPP_CONVERT_VERSION}#subdirectory=gguf-py" +echo "Installing gguf package from llama.cpp (${LLAMA_CPP_CONVERT_VERSION})..." +if [ "x${USE_PIP:-}" == "xtrue" ]; then + pip install "${GGUF_PIP_SPEC}" || { + echo "Warning: Failed to install gguf from llama.cpp commit, falling back to PyPI..." + pip install "gguf>=0.16.0" + } +else + uv pip install "${GGUF_PIP_SPEC}" || { + echo "Warning: Failed to install gguf from llama.cpp commit, falling back to PyPI..." + uv pip install "gguf>=0.16.0" + } +fi diff --git a/backend/python/trl/requirements-cpu.txt b/backend/python/trl/requirements-cpu.txt new file mode 100644 index 000000000..c67858542 --- /dev/null +++ b/backend/python/trl/requirements-cpu.txt @@ -0,0 +1,9 @@ +--extra-index-url https://download.pytorch.org/whl/cpu +torch==2.10.0 +trl +peft +datasets>=3.0.0 +transformers>=4.56.2 +accelerate>=1.4.0 +huggingface-hub>=1.3.0 +sentencepiece diff --git a/backend/python/trl/requirements-cublas12.txt b/backend/python/trl/requirements-cublas12.txt new file mode 100644 index 000000000..05f29591c --- /dev/null +++ b/backend/python/trl/requirements-cublas12.txt @@ -0,0 +1,9 @@ +torch==2.10.0 +trl +peft +datasets>=3.0.0 +transformers>=4.56.2 +accelerate>=1.4.0 +huggingface-hub>=1.3.0 +sentencepiece +bitsandbytes diff --git a/backend/python/trl/requirements-cublas13.txt b/backend/python/trl/requirements-cublas13.txt new file mode 100644 index 000000000..05f29591c --- /dev/null +++ 
b/backend/python/trl/requirements-cublas13.txt @@ -0,0 +1,9 @@ +torch==2.10.0 +trl +peft +datasets>=3.0.0 +transformers>=4.56.2 +accelerate>=1.4.0 +huggingface-hub>=1.3.0 +sentencepiece +bitsandbytes diff --git a/backend/python/trl/requirements.txt b/backend/python/trl/requirements.txt new file mode 100644 index 000000000..0834a8fcd --- /dev/null +++ b/backend/python/trl/requirements.txt @@ -0,0 +1,3 @@ +grpcio==1.78.1 +protobuf +certifi diff --git a/backend/python/trl/reward_functions.py b/backend/python/trl/reward_functions.py new file mode 100644 index 000000000..12074f80c --- /dev/null +++ b/backend/python/trl/reward_functions.py @@ -0,0 +1,236 @@ +""" +Built-in reward functions and inline function compiler for GRPO training. + +All reward functions follow TRL's signature: (completions, **kwargs) -> list[float] +""" + +import json +import re +import math +import string +import functools + + +# --------------------------------------------------------------------------- +# Built-in reward functions +# --------------------------------------------------------------------------- + +def format_reward(completions, **kwargs): + """Checks for <think>...</think> followed by an answer. Returns 1.0 or 0.0.""" + pattern = re.compile(r"<think>.*?</think>\s*\S", re.DOTALL) + return [1.0 if pattern.search(c) else 0.0 for c in completions] + + +def reasoning_accuracy_reward(completions, **kwargs): + """Extracts <answer>...</answer> 
content and compares to the expected answer.""" + answers = kwargs.get("answer", []) + if not answers: + return [0.0] * len(completions) + + pattern = re.compile(r"<answer>(.*?)</answer>", re.DOTALL) + scores = [] + for i, c in enumerate(completions): + expected = answers[i] if i < len(answers) else "" + match = pattern.search(c) + if match: + extracted = match.group(1).strip() + scores.append(1.0 if extracted.lower() == str(expected).strip().lower() else 0.0) + else: + scores.append(0.0) + return scores + + +def length_reward(completions, target_length=200, **kwargs): + """Score based on proximity to target_length. Returns [0, 1].""" + scores = [] + for c in completions: + length = len(c) + if target_length <= 0: + scores.append(0.0) + else: + diff = abs(length - target_length) / target_length + scores.append(max(0.0, 1.0 - diff)) + return scores + + +def xml_tag_reward(completions, **kwargs): + """Scores properly opened/closed XML tags (<think>, <answer>).""" + tags = ["think", "answer"] + scores = [] + for c in completions: + tag_score = 0.0 + for tag in tags: + if f"<{tag}>" in c and f"</{tag}>" in c: + tag_score += 0.5 + scores.append(min(tag_score, 1.0)) + return scores + + +def no_repetition_reward(completions, n=4, **kwargs): + """Penalizes n-gram repetition. Returns [0, 1].""" + scores = [] + for c in completions: + words = c.split() + if len(words) < n: + scores.append(1.0) + continue + ngrams = [tuple(words[i:i+n]) for i in range(len(words) - n + 1)] + unique = len(set(ngrams)) + total = len(ngrams) + scores.append(unique / total if total > 0 else 1.0) + return scores + + +def code_execution_reward(completions, **kwargs): + """Checks Python code block syntax validity via compile(). 
Returns 1.0 or 0.0.""" + pattern = re.compile(r"```python\s*\n(.*?)```", re.DOTALL) + scores = [] + for c in completions: + match = pattern.search(c) + if not match: + scores.append(0.0) + continue + code = match.group(1) + try: + compile(code, "", "exec") + scores.append(1.0) + except SyntaxError: + scores.append(0.0) + return scores + + +# --------------------------------------------------------------------------- +# Registry +# --------------------------------------------------------------------------- + +BUILTIN_REGISTRY = { + "format_reward": format_reward, + "reasoning_accuracy_reward": reasoning_accuracy_reward, + "length_reward": length_reward, + "xml_tag_reward": xml_tag_reward, + "no_repetition_reward": no_repetition_reward, + "code_execution_reward": code_execution_reward, +} + + +# --------------------------------------------------------------------------- +# Inline function compiler +# --------------------------------------------------------------------------- + +_SAFE_BUILTINS = { + "len": len, "int": int, "float": float, "str": str, "bool": bool, + "list": list, "dict": dict, "tuple": tuple, "set": set, + "range": range, "enumerate": enumerate, "zip": zip, + "map": map, "filter": filter, "sorted": sorted, + "min": min, "max": max, "sum": sum, "abs": abs, "round": round, + "any": any, "all": all, "isinstance": isinstance, "type": type, + "print": print, "True": True, "False": False, "None": None, + "ValueError": ValueError, "TypeError": TypeError, + "KeyError": KeyError, "IndexError": IndexError, +} + + +def compile_inline_reward(name, code): + """Compile user-provided code into a reward function. + + The code should be the body of a function that receives + `completions` (list[str]) and `**kwargs`, and returns list[float]. + + Available modules: re, math, json, string. 
+ """ + func_source = ( + f"def _user_reward_{name}(completions, **kwargs):\n" + + "\n".join(f" {line}" for line in code.splitlines()) + ) + + restricted_globals = { + "__builtins__": _SAFE_BUILTINS, + "re": re, + "math": math, + "json": json, + "string": string, + } + + try: + compiled = compile(func_source, f"", "exec") + except SyntaxError as e: + raise ValueError(f"Syntax error in inline reward function '{name}': {e}") + + exec(compiled, restricted_globals) + func = restricted_globals[f"_user_reward_{name}"] + + # Validate with a quick smoke test + try: + result = func(["test"], answer=["test"]) + if not isinstance(result, list): + raise ValueError( + f"Inline reward function '{name}' must return a list, got {type(result).__name__}" + ) + except Exception as e: + if "must return a list" in str(e): + raise + # Other errors during smoke test are acceptable (e.g. missing kwargs) + pass + + return func + + +# --------------------------------------------------------------------------- +# Dispatcher +# --------------------------------------------------------------------------- + +def build_reward_functions(specs_json): + """Parse a JSON list of reward function specs and return a list of callables. + + Each spec is a dict with: + - type: "builtin" or "inline" + - name: function name + - code: (inline only) Python function body + - params: (optional) dict of string params applied via functools.partial + """ + if isinstance(specs_json, str): + specs = json.loads(specs_json) + else: + specs = specs_json + + if not isinstance(specs, list): + raise ValueError("reward_funcs must be a JSON array of reward function specs") + + reward_funcs = [] + for spec in specs: + spec_type = spec.get("type", "builtin") + name = spec.get("name", "") + params = spec.get("params", {}) + + if spec_type == "builtin": + if name not in BUILTIN_REGISTRY: + available = ", ".join(sorted(BUILTIN_REGISTRY.keys())) + raise ValueError( + f"Unknown builtin reward function '{name}'. 
Available: {available}" + ) + func = BUILTIN_REGISTRY[name] + if params: + # Convert string params to appropriate types + typed_params = {} + for k, v in params.items(): + try: + typed_params[k] = int(v) + except (ValueError, TypeError): + try: + typed_params[k] = float(v) + except (ValueError, TypeError): + typed_params[k] = v + func = functools.partial(func, **typed_params) + reward_funcs.append(func) + + elif spec_type == "inline": + code = spec.get("code", "") + if not code.strip(): + raise ValueError(f"Inline reward function '{name}' has no code") + func = compile_inline_reward(name, code) + reward_funcs.append(func) + + else: + raise ValueError(f"Unknown reward function type '{spec_type}'. Use 'builtin' or 'inline'") + + return reward_funcs diff --git a/backend/python/trl/run.sh b/backend/python/trl/run.sh new file mode 100644 index 000000000..bd17c6e1d --- /dev/null +++ b/backend/python/trl/run.sh @@ -0,0 +1,10 @@ +#!/bin/bash + +backend_dir=$(dirname $0) +if [ -d $backend_dir/common ]; then + source $backend_dir/common/libbackend.sh +else + source $backend_dir/../common/libbackend.sh +fi + +startBackend $@ diff --git a/backend/python/trl/test.py b/backend/python/trl/test.py new file mode 100644 index 000000000..d77d4e9f0 --- /dev/null +++ b/backend/python/trl/test.py @@ -0,0 +1,58 @@ +""" +Test script for the TRL fine-tuning gRPC backend. 
+""" +import unittest +import subprocess +import time + +import grpc +import backend_pb2 +import backend_pb2_grpc + + +class TestBackendServicer(unittest.TestCase): + """Tests for the TRL fine-tuning gRPC service.""" + + def setUp(self): + self.service = subprocess.Popen( + ["python3", "backend.py", "--addr", "localhost:50051"] + ) + time.sleep(10) + + def tearDown(self): + self.service.kill() + self.service.wait() + + def test_server_startup(self): + """Test that the server starts and responds to health checks.""" + try: + self.setUp() + with grpc.insecure_channel("localhost:50051") as channel: + stub = backend_pb2_grpc.BackendStub(channel) + response = stub.Health(backend_pb2.HealthMessage()) + self.assertEqual(response.message, b'OK') + except Exception as err: + print(err) + self.fail("Server failed to start") + finally: + self.tearDown() + + def test_list_checkpoints_empty(self): + """Test listing checkpoints on a non-existent directory.""" + try: + self.setUp() + with grpc.insecure_channel("localhost:50051") as channel: + stub = backend_pb2_grpc.BackendStub(channel) + response = stub.ListCheckpoints( + backend_pb2.ListCheckpointsRequest(output_dir="/nonexistent") + ) + self.assertEqual(len(response.checkpoints), 0) + except Exception as err: + print(err) + self.fail("ListCheckpoints service failed") + finally: + self.tearDown() + + +if __name__ == '__main__': + unittest.main() diff --git a/backend/python/trl/test.sh b/backend/python/trl/test.sh new file mode 100644 index 000000000..eb59f2aaf --- /dev/null +++ b/backend/python/trl/test.sh @@ -0,0 +1,11 @@ +#!/bin/bash +set -e + +backend_dir=$(dirname $0) +if [ -d $backend_dir/common ]; then + source $backend_dir/common/libbackend.sh +else + source $backend_dir/../common/libbackend.sh +fi + +runUnittests diff --git a/core/cli/run.go b/core/cli/run.go index c614e123d..000dd3366 100644 --- a/core/cli/run.go +++ b/core/cli/run.go @@ -121,6 +121,9 @@ type RunCMD struct { AgentPoolCollectionDBPath string 
`env:"LOCALAI_AGENT_POOL_COLLECTION_DB_PATH" help:"Database path for agent collections" group:"agents"` AgentHubURL string `env:"LOCALAI_AGENT_HUB_URL" default:"https://agenthub.localai.io" help:"URL for the agent hub where users can browse and download agent configurations" group:"agents"` + // Fine-tuning + EnableFineTuning bool `env:"LOCALAI_ENABLE_FINETUNING" default:"false" help:"Enable fine-tuning support" group:"finetuning"` + // Authentication AuthEnabled bool `env:"LOCALAI_AUTH" default:"false" help:"Enable user authentication and authorization" group:"auth"` AuthDatabaseURL string `env:"LOCALAI_AUTH_DATABASE_URL,DATABASE_URL" help:"Database URL for auth (postgres:// or file path for SQLite). Defaults to {DataPath}/database.db" group:"auth"` @@ -326,6 +329,11 @@ func (r *RunCMD) Run(ctx *cliContext.Context) error { opts = append(opts, config.WithAgentHubURL(r.AgentHubURL)) } + // Fine-tuning + if r.EnableFineTuning { + opts = append(opts, config.EnableFineTuning) + } + // Authentication authEnabled := r.AuthEnabled || r.GitHubClientID != "" || r.OIDCClientID != "" if authEnabled { diff --git a/core/config/application_config.go b/core/config/application_config.go index 9c1be82d9..bb187be43 100644 --- a/core/config/application_config.go +++ b/core/config/application_config.go @@ -97,6 +97,9 @@ type ApplicationConfig struct { // Agent Pool (LocalAGI integration) AgentPool AgentPoolConfig + // Fine-tuning + FineTuning FineTuningConfig + // Authentication & Authorization Auth AuthConfig } @@ -142,6 +145,11 @@ type AgentPoolConfig struct { AgentHubURL string // default: "https://agenthub.localai.io" } +// FineTuningConfig holds configuration for fine-tuning support. 
+type FineTuningConfig struct { + Enabled bool +} + type AppOption func(*ApplicationConfig) func NewApplicationConfig(o ...AppOption) *ApplicationConfig { @@ -733,6 +741,12 @@ func WithAgentHubURL(url string) AppOption { } } +// Fine-tuning options + +var EnableFineTuning = func(o *ApplicationConfig) { + o.FineTuning.Enabled = true +} + // Auth options func WithAuthEnabled(enabled bool) AppOption { diff --git a/core/gallery/importers/local.go b/core/gallery/importers/local.go new file mode 100644 index 000000000..2a456cc60 --- /dev/null +++ b/core/gallery/importers/local.go @@ -0,0 +1,205 @@ +package importers + +import ( + "encoding/json" + "fmt" + "os" + "path/filepath" + "strings" + + "github.com/mudler/LocalAI/core/config" + "github.com/mudler/xlog" +) + +// ImportLocalPath scans a local directory for exported model files and produces +// a config.ModelConfig with the correct backend, model path, and options. +// Paths in the returned config are relative to modelsPath when possible so that +// the YAML config remains portable. +// +// Detection order: +// 1. GGUF files (*.gguf) — uses llama-cpp backend +// 2. LoRA adapter (adapter_config.json) — uses transformers backend with lora_adapter +// 3. Merged model (*.safetensors or pytorch_model*.bin + config.json) — uses transformers backend +func ImportLocalPath(dirPath, name string) (*config.ModelConfig, error) { + // Make paths relative to the models directory (parent of dirPath) + // so config YAML stays portable. + modelsDir := filepath.Dir(dirPath) + relPath := func(absPath string) string { + if rel, err := filepath.Rel(modelsDir, absPath); err == nil { + return rel + } + return absPath + } + + // 1. 
GGUF: check dirPath and dirPath_gguf/ (Unsloth convention) + ggufFile := findGGUF(dirPath) + if ggufFile == "" { + ggufSubdir := dirPath + "_gguf" + ggufFile = findGGUF(ggufSubdir) + } + if ggufFile != "" { + xlog.Info("ImportLocalPath: detected GGUF model", "path", ggufFile) + cfg := &config.ModelConfig{ + Name: name, + Backend: "llama-cpp", + KnownUsecaseStrings: []string{"chat"}, + Options: []string{"use_jinja:true"}, + } + cfg.Model = relPath(ggufFile) + cfg.TemplateConfig.UseTokenizerTemplate = true + cfg.Description = buildDescription(dirPath, "GGUF") + return cfg, nil + } + + // 2. LoRA adapter: look for adapter_config.json + + adapterConfigPath := filepath.Join(dirPath, "adapter_config.json") + if fileExists(adapterConfigPath) { + xlog.Info("ImportLocalPath: detected LoRA adapter", "path", dirPath) + baseModel := readBaseModel(dirPath) + cfg := &config.ModelConfig{ + Name: name, + Backend: "transformers", + KnownUsecaseStrings: []string{"chat"}, + } + cfg.Model = baseModel + cfg.TemplateConfig.UseTokenizerTemplate = true + cfg.LLMConfig.LoraAdapter = relPath(dirPath) + cfg.Description = buildDescription(dirPath, "LoRA adapter") + return cfg, nil + } + + // Also check for adapter_model.safetensors or adapter_model.bin without adapter_config.json + if fileExists(filepath.Join(dirPath, "adapter_model.safetensors")) || fileExists(filepath.Join(dirPath, "adapter_model.bin")) { + xlog.Info("ImportLocalPath: detected LoRA adapter (by model files)", "path", dirPath) + baseModel := readBaseModel(dirPath) + cfg := &config.ModelConfig{ + Name: name, + Backend: "transformers", + KnownUsecaseStrings: []string{"chat"}, + } + cfg.Model = baseModel + cfg.TemplateConfig.UseTokenizerTemplate = true + cfg.LLMConfig.LoraAdapter = relPath(dirPath) + cfg.Description = buildDescription(dirPath, "LoRA adapter") + return cfg, nil + } + + // 3. 
Merged model: *.safetensors or pytorch_model*.bin + config.json + if fileExists(filepath.Join(dirPath, "config.json")) && (hasFileWithSuffix(dirPath, ".safetensors") || hasFileWithPrefix(dirPath, "pytorch_model")) { + xlog.Info("ImportLocalPath: detected merged model", "path", dirPath) + cfg := &config.ModelConfig{ + Name: name, + Backend: "transformers", + KnownUsecaseStrings: []string{"chat"}, + } + cfg.Model = relPath(dirPath) + cfg.TemplateConfig.UseTokenizerTemplate = true + cfg.Description = buildDescription(dirPath, "merged model") + return cfg, nil + } + + return nil, fmt.Errorf("could not detect model format in directory %s", dirPath) +} + +// findGGUF returns the path to the first .gguf file found in dir, or "". +func findGGUF(dir string) string { + entries, err := os.ReadDir(dir) + if err != nil { + return "" + } + for _, e := range entries { + if !e.IsDir() && strings.HasSuffix(strings.ToLower(e.Name()), ".gguf") { + return filepath.Join(dir, e.Name()) + } + } + return "" +} + +// readBaseModel reads the base model name from adapter_config.json or export_metadata.json. +func readBaseModel(dirPath string) string { + // Try adapter_config.json → base_model_name_or_path (TRL writes this) + if data, err := os.ReadFile(filepath.Join(dirPath, "adapter_config.json")); err == nil { + var ac map[string]any + if json.Unmarshal(data, &ac) == nil { + if bm, ok := ac["base_model_name_or_path"].(string); ok && bm != "" { + return bm + } + } + } + + // Try export_metadata.json → base_model (Unsloth writes this) + if data, err := os.ReadFile(filepath.Join(dirPath, "export_metadata.json")); err == nil { + var meta map[string]any + if json.Unmarshal(data, &meta) == nil { + if bm, ok := meta["base_model"].(string); ok && bm != "" { + return bm + } + } + } + + return "" +} + +// buildDescription creates a human-readable description using available metadata. 
+func buildDescription(dirPath, formatLabel string) string { + base := "" + + // Try adapter_config.json + if data, err := os.ReadFile(filepath.Join(dirPath, "adapter_config.json")); err == nil { + var ac map[string]any + if json.Unmarshal(data, &ac) == nil { + if bm, ok := ac["base_model_name_or_path"].(string); ok && bm != "" { + base = bm + } + } + } + + // Try export_metadata.json + if base == "" { + if data, err := os.ReadFile(filepath.Join(dirPath, "export_metadata.json")); err == nil { + var meta map[string]any + if json.Unmarshal(data, &meta) == nil { + if bm, ok := meta["base_model"].(string); ok && bm != "" { + base = bm + } + } + } + } + + if base != "" { + return fmt.Sprintf("Fine-tuned from %s (%s)", base, formatLabel) + } + return fmt.Sprintf("Fine-tuned model (%s)", formatLabel) +} + +func fileExists(path string) bool { + info, err := os.Stat(path) + return err == nil && !info.IsDir() +} + +func hasFileWithSuffix(dir, suffix string) bool { + entries, err := os.ReadDir(dir) + if err != nil { + return false + } + for _, e := range entries { + if !e.IsDir() && strings.HasSuffix(strings.ToLower(e.Name()), suffix) { + return true + } + } + return false +} + +func hasFileWithPrefix(dir, prefix string) bool { + entries, err := os.ReadDir(dir) + if err != nil { + return false + } + for _, e := range entries { + if !e.IsDir() && strings.HasPrefix(e.Name(), prefix) { + return true + } + } + return false +} diff --git a/core/gallery/importers/local_test.go b/core/gallery/importers/local_test.go new file mode 100644 index 000000000..0de679462 --- /dev/null +++ b/core/gallery/importers/local_test.go @@ -0,0 +1,148 @@ +package importers_test + +import ( + "encoding/json" + "os" + "path/filepath" + + . "github.com/onsi/ginkgo/v2" + . 
"github.com/onsi/gomega" + + "github.com/mudler/LocalAI/core/gallery/importers" +) + +var _ = Describe("ImportLocalPath", func() { + var tmpDir string + + BeforeEach(func() { + var err error + tmpDir, err = os.MkdirTemp("", "importers-local-test") + Expect(err).ToNot(HaveOccurred()) + }) + + AfterEach(func() { + os.RemoveAll(tmpDir) + }) + + Context("GGUF detection", func() { + It("detects a GGUF file in the directory", func() { + modelDir := filepath.Join(tmpDir, "my-model") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(modelDir, "model-q4_k_m.gguf"), []byte("fake"), 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "my-model") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Backend).To(Equal("llama-cpp")) + Expect(cfg.Model).To(ContainSubstring(".gguf")) + Expect(cfg.TemplateConfig.UseTokenizerTemplate).To(BeTrue()) + Expect(cfg.KnownUsecaseStrings).To(ContainElement("chat")) + Expect(cfg.Options).To(ContainElement("use_jinja:true")) + }) + + It("detects GGUF in _gguf subdirectory", func() { + modelDir := filepath.Join(tmpDir, "my-model") + ggufDir := modelDir + "_gguf" + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + Expect(os.MkdirAll(ggufDir, 0755)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(ggufDir, "model.gguf"), []byte("fake"), 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "my-model") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Backend).To(Equal("llama-cpp")) + }) + }) + + Context("LoRA adapter detection", func() { + It("detects LoRA adapter via adapter_config.json", func() { + modelDir := filepath.Join(tmpDir, "lora-model") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + + adapterConfig := map[string]any{ + "base_model_name_or_path": "meta-llama/Llama-2-7b-hf", + "peft_type": "LORA", + } + data, _ := json.Marshal(adapterConfig) + Expect(os.WriteFile(filepath.Join(modelDir, "adapter_config.json"), data, 0644)).To(Succeed()) + + cfg, err := 
importers.ImportLocalPath(modelDir, "lora-model") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Backend).To(Equal("transformers")) + Expect(cfg.Model).To(Equal("meta-llama/Llama-2-7b-hf")) + Expect(cfg.LLMConfig.LoraAdapter).To(Equal("lora-model")) + Expect(cfg.TemplateConfig.UseTokenizerTemplate).To(BeTrue()) + }) + + It("reads base model from export_metadata.json as fallback", func() { + modelDir := filepath.Join(tmpDir, "lora-unsloth") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + + adapterConfig := map[string]any{"peft_type": "LORA"} + data, _ := json.Marshal(adapterConfig) + Expect(os.WriteFile(filepath.Join(modelDir, "adapter_config.json"), data, 0644)).To(Succeed()) + + metadata := map[string]any{"base_model": "unsloth/tinyllama-bnb-4bit"} + data, _ = json.Marshal(metadata) + Expect(os.WriteFile(filepath.Join(modelDir, "export_metadata.json"), data, 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "lora-unsloth") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Model).To(Equal("unsloth/tinyllama-bnb-4bit")) + }) + }) + + Context("Merged model detection", func() { + It("detects merged model with safetensors + config.json", func() { + modelDir := filepath.Join(tmpDir, "merged") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(modelDir, "config.json"), []byte("{}"), 0644)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(modelDir, "model.safetensors"), []byte("fake"), 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "merged") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Backend).To(Equal("transformers")) + Expect(cfg.Model).To(Equal("merged")) + Expect(cfg.TemplateConfig.UseTokenizerTemplate).To(BeTrue()) + }) + + It("detects merged model with pytorch_model files", func() { + modelDir := filepath.Join(tmpDir, "merged-pt") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(modelDir, "config.json"), []byte("{}"), 
0644)).To(Succeed()) + Expect(os.WriteFile(filepath.Join(modelDir, "pytorch_model-00001-of-00002.bin"), []byte("fake"), 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "merged-pt") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Backend).To(Equal("transformers")) + Expect(cfg.Model).To(Equal("merged-pt")) + }) + }) + + Context("fallback", func() { + It("returns error for empty directory", func() { + modelDir := filepath.Join(tmpDir, "empty") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + + _, err := importers.ImportLocalPath(modelDir, "empty") + Expect(err).To(HaveOccurred()) + Expect(err.Error()).To(ContainSubstring("could not detect model format")) + }) + }) + + Context("description", func() { + It("includes base model name in description", func() { + modelDir := filepath.Join(tmpDir, "desc-test") + Expect(os.MkdirAll(modelDir, 0755)).To(Succeed()) + + adapterConfig := map[string]any{ + "base_model_name_or_path": "TinyLlama/TinyLlama-1.1B", + } + data, _ := json.Marshal(adapterConfig) + Expect(os.WriteFile(filepath.Join(modelDir, "adapter_config.json"), data, 0644)).To(Succeed()) + + cfg, err := importers.ImportLocalPath(modelDir, "desc-test") + Expect(err).ToNot(HaveOccurred()) + Expect(cfg.Description).To(ContainSubstring("TinyLlama/TinyLlama-1.1B")) + Expect(cfg.Description).To(ContainSubstring("Fine-tuned from")) + }) + }) +}) diff --git a/core/http/app.go b/core/http/app.go index e2da479b5..696d394d2 100644 --- a/core/http/app.go +++ b/core/http/app.go @@ -302,6 +302,17 @@ func API(application *application.Application) (*echo.Echo, error) { mcpMw := auth.RequireFeature(application.AuthDB(), auth.FeatureMCP) routes.RegisterLocalAIRoutes(e, requestExtractor, application.ModelConfigLoader(), application.ModelLoader(), application.ApplicationConfig(), application.GalleryService(), opcache, application.TemplatesEvaluator(), application, adminMiddleware, mcpJobsMw, mcpMw) routes.RegisterAgentPoolRoutes(e, application, agentsMw, 
skillsMw, collectionsMw) + // Fine-tuning routes + if application.ApplicationConfig().FineTuning.Enabled { + fineTuningMw := auth.RequireFeature(application.AuthDB(), auth.FeatureFineTuning) + ftService := services.NewFineTuneService( + application.ApplicationConfig(), + application.ModelLoader(), + application.ModelConfigLoader(), + ) + routes.RegisterFineTuningRoutes(e, ftService, application.ApplicationConfig(), fineTuningMw) + } + routes.RegisterOpenAIRoutes(e, requestExtractor, application) routes.RegisterAnthropicRoutes(e, requestExtractor, application) routes.RegisterOpenResponsesRoutes(e, requestExtractor, application) diff --git a/core/http/auth/features.go b/core/http/auth/features.go index 85b4e60ec..1d7ff4f61 100644 --- a/core/http/auth/features.go +++ b/core/http/auth/features.go @@ -85,6 +85,18 @@ var RouteFeatureRegistry = []RouteFeature{ {"POST", "/stores/delete", FeatureStores}, {"POST", "/stores/get", FeatureStores}, {"POST", "/stores/find", FeatureStores}, + + // Fine-tuning + {"POST", "/api/fine-tuning/jobs", FeatureFineTuning}, + {"GET", "/api/fine-tuning/jobs", FeatureFineTuning}, + {"GET", "/api/fine-tuning/jobs/:id", FeatureFineTuning}, + {"POST", "/api/fine-tuning/jobs/:id/stop", FeatureFineTuning}, + {"DELETE", "/api/fine-tuning/jobs/:id", FeatureFineTuning}, + {"GET", "/api/fine-tuning/jobs/:id/progress", FeatureFineTuning}, + {"GET", "/api/fine-tuning/jobs/:id/checkpoints", FeatureFineTuning}, + {"POST", "/api/fine-tuning/jobs/:id/export", FeatureFineTuning}, + {"GET", "/api/fine-tuning/jobs/:id/download", FeatureFineTuning}, + {"POST", "/api/fine-tuning/datasets", FeatureFineTuning}, } // FeatureMeta describes a feature for the admin API/UI. @@ -104,6 +116,13 @@ func AgentFeatureMetas() []FeatureMeta { } } +// GeneralFeatureMetas returns metadata for general features. 
+func GeneralFeatureMetas() []FeatureMeta { + return []FeatureMeta{ + {FeatureFineTuning, "Fine-Tuning", false}, + } +} + // APIFeatureMetas returns metadata for API endpoint features. func APIFeatureMetas() []FeatureMeta { return []FeatureMeta{ diff --git a/core/http/auth/permissions.go b/core/http/auth/permissions.go index b2408ad4e..1fd9bbc8b 100644 --- a/core/http/auth/permissions.go +++ b/core/http/auth/permissions.go @@ -32,6 +32,9 @@ const ( FeatureCollections = "collections" FeatureMCPJobs = "mcp_jobs" + // General features (default OFF for new users) + FeatureFineTuning = "fine_tuning" + // API features (default ON for new users) FeatureChat = "chat" FeatureImages = "images" @@ -52,6 +55,9 @@ const ( // AgentFeatures lists agent-related features (default OFF). var AgentFeatures = []string{FeatureAgents, FeatureSkills, FeatureCollections, FeatureMCPJobs} +// GeneralFeatures lists general features (default OFF). +var GeneralFeatures = []string{FeatureFineTuning} + // APIFeatures lists API endpoint features (default ON). var APIFeatures = []string{ FeatureChat, FeatureImages, FeatureAudioSpeech, FeatureAudioTranscription, @@ -60,7 +66,7 @@ var APIFeatures = []string{ } // AllFeatures lists all known features (used by UI and validation). -var AllFeatures = append(append([]string{}, AgentFeatures...), APIFeatures...) +var AllFeatures = append(append(append([]string{}, AgentFeatures...), GeneralFeatures...), APIFeatures...) // defaultOnFeatures is the set of features that default to ON when absent from a user's permission map. 
var defaultOnFeatures = func() map[string]bool { diff --git a/core/http/endpoints/localai/agent_collections.go b/core/http/endpoints/localai/agent_collections.go index 022035ef4..dd4bd2370 100644 --- a/core/http/endpoints/localai/agent_collections.go +++ b/core/http/endpoints/localai/agent_collections.go @@ -80,13 +80,14 @@ func UploadToCollectionEndpoint(app *application.Application) echo.HandlerFunc { return c.JSON(http.StatusBadRequest, map[string]string{"error": err.Error()}) } defer src.Close() - if err := svc.UploadToCollectionForUser(userID, name, file.Filename, src); err != nil { + key, err := svc.UploadToCollectionForUser(userID, name, file.Filename, src) + if err != nil { if strings.Contains(err.Error(), "not found") { return c.JSON(http.StatusNotFound, map[string]string{"error": err.Error()}) } return c.JSON(http.StatusInternalServerError, map[string]string{"error": err.Error()}) } - return c.JSON(http.StatusOK, map[string]string{"status": "ok", "filename": file.Filename}) + return c.JSON(http.StatusOK, map[string]string{"status": "ok", "filename": file.Filename, "key": key}) } } diff --git a/core/http/endpoints/localai/finetune.go b/core/http/endpoints/localai/finetune.go new file mode 100644 index 000000000..fe735acb2 --- /dev/null +++ b/core/http/endpoints/localai/finetune.go @@ -0,0 +1,362 @@ +package localai + +import ( + "archive/tar" + "compress/gzip" + "encoding/json" + "fmt" + "io" + "net/http" + "os" + "path/filepath" + "strings" + + "github.com/labstack/echo/v4" + "github.com/mudler/LocalAI/core/config" + "github.com/mudler/LocalAI/core/gallery" + "github.com/mudler/LocalAI/core/schema" + "github.com/mudler/LocalAI/core/services" +) + +// StartFineTuneJobEndpoint starts a new fine-tuning job. 
+func StartFineTuneJobEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + + var req schema.FineTuneJobRequest + if err := c.Bind(&req); err != nil { + return c.JSON(http.StatusBadRequest, map[string]string{ + "error": "Invalid request: " + err.Error(), + }) + } + + if req.Model == "" { + return c.JSON(http.StatusBadRequest, map[string]string{ + "error": "model is required", + }) + } + if req.DatasetSource == "" { + return c.JSON(http.StatusBadRequest, map[string]string{ + "error": "dataset_source is required", + }) + } + + resp, err := ftService.StartJob(c.Request().Context(), userID, req) + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusCreated, resp) + } +} + +// ListFineTuneJobsEndpoint lists fine-tuning jobs for the current user. +func ListFineTuneJobsEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobs := ftService.ListJobs(userID) + if jobs == nil { + jobs = []*schema.FineTuneJob{} + } + return c.JSON(http.StatusOK, jobs) + } +} + +// GetFineTuneJobEndpoint gets a specific fine-tuning job. +func GetFineTuneJobEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + job, err := ftService.GetJob(userID, jobID) + if err != nil { + return c.JSON(http.StatusNotFound, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusOK, job) + } +} + +// StopFineTuneJobEndpoint stops a running fine-tuning job. 
+func StopFineTuneJobEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + // Check for save_checkpoint query param + saveCheckpoint := c.QueryParam("save_checkpoint") == "true" + + err := ftService.StopJob(c.Request().Context(), userID, jobID, saveCheckpoint) + if err != nil { + return c.JSON(http.StatusNotFound, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusOK, map[string]string{ + "status": "stopped", + "message": "Fine-tuning job stopped", + }) + } +} + +// DeleteFineTuneJobEndpoint deletes a fine-tuning job and its data. +func DeleteFineTuneJobEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + err := ftService.DeleteJob(userID, jobID) + if err != nil { + status := http.StatusInternalServerError + if strings.Contains(err.Error(), "not found") { + status = http.StatusNotFound + } else if strings.Contains(err.Error(), "cannot delete") { + status = http.StatusConflict + } + return c.JSON(status, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusOK, map[string]string{ + "status": "deleted", + "message": "Fine-tuning job deleted", + }) + } +} + +// FineTuneProgressEndpoint streams progress updates via SSE. 
+func FineTuneProgressEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + // Set SSE headers + c.Response().Header().Set("Content-Type", "text/event-stream") + c.Response().Header().Set("Cache-Control", "no-cache") + c.Response().Header().Set("Connection", "keep-alive") + c.Response().WriteHeader(http.StatusOK) + + err := ftService.StreamProgress(c.Request().Context(), userID, jobID, func(event *schema.FineTuneProgressEvent) { + data, err := json.Marshal(event) + if err != nil { + return + } + fmt.Fprintf(c.Response(), "data: %s\n\n", data) + c.Response().Flush() + }) + if err != nil { + // If headers already sent, we can't send a JSON error + fmt.Fprintf(c.Response(), "data: {\"status\":\"error\",\"message\":%q}\n\n", err.Error()) + c.Response().Flush() + } + + return nil + } +} + +// ListCheckpointsEndpoint lists checkpoints for a job. +func ListCheckpointsEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + checkpoints, err := ftService.ListCheckpoints(c.Request().Context(), userID, jobID) + if err != nil { + return c.JSON(http.StatusNotFound, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusOK, map[string]any{ + "checkpoints": checkpoints, + }) + } +} + +// ExportModelEndpoint exports a model from a checkpoint. 
+func ExportModelEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + var req schema.ExportRequest + if err := c.Bind(&req); err != nil { + return c.JSON(http.StatusBadRequest, map[string]string{ + "error": "Invalid request: " + err.Error(), + }) + } + + modelName, err := ftService.ExportModel(c.Request().Context(), userID, jobID, req) + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusAccepted, map[string]string{ + "status": "exporting", + "message": "Export started for model '" + modelName + "'", + "model_name": modelName, + }) + } +} + +// DownloadExportedModelEndpoint streams the exported model directory as a tar.gz archive. +func DownloadExportedModelEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + userID := getUserID(c) + jobID := c.Param("id") + + modelDir, modelName, err := ftService.GetExportedModelPath(userID, jobID) + if err != nil { + return c.JSON(http.StatusNotFound, map[string]string{ + "error": err.Error(), + }) + } + + c.Response().Header().Set("Content-Type", "application/gzip") + c.Response().Header().Set("Content-Disposition", fmt.Sprintf(`attachment; filename="%s.tar.gz"`, modelName)) + c.Response().WriteHeader(http.StatusOK) + + gw := gzip.NewWriter(c.Response()) + defer gw.Close() + + tw := tar.NewWriter(gw) + defer tw.Close() + + err = filepath.Walk(modelDir, func(path string, info os.FileInfo, walkErr error) error { + if walkErr != nil { + return walkErr + } + + relPath, err := filepath.Rel(modelDir, path) + if err != nil { + return err + } + + header, err := tar.FileInfoHeader(info, "") + if err != nil { + return err + } + header.Name = filepath.Join(modelName, relPath) + + if err := tw.WriteHeader(header); err != nil { + return err + } + + if info.IsDir() { + return nil + } + + f, err := 
os.Open(path) + if err != nil { + return err + } + defer f.Close() + + _, err = io.Copy(tw, f) + return err + }) + + if err != nil { + // Headers already sent, can't return JSON error + return err + } + + return nil + } +} + +// ListFineTuneBackendsEndpoint returns installed backends tagged with "fine-tuning". +func ListFineTuneBackendsEndpoint(appConfig *config.ApplicationConfig) echo.HandlerFunc { + return func(c echo.Context) error { + backends, err := gallery.AvailableBackends(appConfig.BackendGalleries, appConfig.SystemState) + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": "failed to list backends: " + err.Error(), + }) + } + + type backendInfo struct { + Name string `json:"name"` + Description string `json:"description,omitempty"` + Tags []string `json:"tags,omitempty"` + } + + var result []backendInfo + for _, b := range backends { + if !b.Installed { + continue + } + hasTag := false + for _, t := range b.Tags { + if strings.EqualFold(t, "fine-tuning") { + hasTag = true + break + } + } + if !hasTag { + continue + } + name := b.Name + if b.Alias != "" { + name = b.Alias + } + result = append(result, backendInfo{ + Name: name, + Description: b.Description, + Tags: b.Tags, + }) + } + + if result == nil { + result = []backendInfo{} + } + + return c.JSON(http.StatusOK, result) + } +} + +// UploadDatasetEndpoint handles dataset file upload. 
+func UploadDatasetEndpoint(ftService *services.FineTuneService) echo.HandlerFunc { + return func(c echo.Context) error { + file, err := c.FormFile("file") + if err != nil { + return c.JSON(http.StatusBadRequest, map[string]string{ + "error": "file is required", + }) + } + + src, err := file.Open() + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": "failed to open file", + }) + } + defer src.Close() + + data, err := io.ReadAll(src) + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": "failed to read file", + }) + } + + path, err := ftService.UploadDataset(file.Filename, data) + if err != nil { + return c.JSON(http.StatusInternalServerError, map[string]string{ + "error": err.Error(), + }) + } + + return c.JSON(http.StatusOK, map[string]string{ + "path": path, + }) + } +} diff --git a/core/http/react-ui/src/App.css b/core/http/react-ui/src/App.css index cc2fdb8c9..8ed05628c 100644 --- a/core/http/react-ui/src/App.css +++ b/core/http/react-ui/src/App.css @@ -208,6 +208,32 @@ overflow: hidden; } +.sidebar-section-toggle { + display: flex; + align-items: center; + justify-content: space-between; + width: 100%; + background: none; + border: none; + cursor: pointer; + font-family: inherit; + transition: color var(--duration-fast); +} + +.sidebar-section-toggle:hover { + color: var(--color-text-secondary); +} + +.sidebar-section-chevron { + font-size: 0.5rem; + transition: transform var(--duration-fast); + flex-shrink: 0; +} + +.sidebar-section-toggle.open .sidebar-section-chevron { + transform: rotate(90deg); +} + .nav-item { display: flex; align-items: center; @@ -392,6 +418,10 @@ display: none; } +.sidebar.collapsed .sidebar-section-chevron { + display: none; +} + .sidebar.collapsed .nav-item { justify-content: center; padding: 8px 0; @@ -612,14 +642,6 @@ .spinner-md .spinner-ring { width: 24px; height: 24px; } .spinner-lg .spinner-ring { width: 40px; height: 40px; } -.spinner-logo { 
- animation: pulse 1.2s ease-in-out infinite; - object-fit: contain; -} -.spinner-sm .spinner-logo { width: 16px; height: 16px; } -.spinner-md .spinner-logo { width: 24px; height: 24px; } -.spinner-lg .spinner-logo { width: 40px; height: 40px; } - /* Model selector */ .model-selector { background: var(--color-bg-tertiary); @@ -2646,6 +2668,43 @@ font-size: 0.625rem; } +/* Studio tabs */ +.studio-tabs { + display: flex; + gap: 0; + border-bottom: 1px solid var(--color-border-subtle); + padding: 0 var(--spacing-xl); + background: var(--color-bg-primary); + position: sticky; + top: 0; + z-index: 10; +} + +.studio-tab { + display: flex; + align-items: center; + gap: 6px; + background: none; + border: none; + padding: var(--spacing-sm) var(--spacing-md); + font-size: 0.8125rem; + font-family: inherit; + color: var(--color-text-secondary); + cursor: pointer; + border-bottom: 2px solid transparent; + transition: color var(--duration-fast), border-color var(--duration-fast); +} + +.studio-tab:hover { + color: var(--color-text-primary); +} + +.studio-tab-active { + color: var(--color-primary); + border-bottom-color: var(--color-primary); + font-weight: 500; +} + /* Two-column layout for media generation pages */ .media-layout { display: grid; diff --git a/core/http/react-ui/src/components/LoadingSpinner.jsx b/core/http/react-ui/src/components/LoadingSpinner.jsx index 23f858abe..b1c1b46a2 100644 --- a/core/http/react-ui/src/components/LoadingSpinner.jsx +++ b/core/http/react-ui/src/components/LoadingSpinner.jsx @@ -1,22 +1,8 @@ -import { useState } from 'react' -import { apiUrl } from '../utils/basePath' - export default function LoadingSpinner({ size = 'md', className = '' }) { const sizeClass = size === 'sm' ? 'spinner-sm' : size === 'lg' ? 'spinner-lg' : 'spinner-md' - const [imgFailed, setImgFailed] = useState(false) - return (
- {imgFailed ? ( -
- ) : ( - setImgFailed(true)} - /> - )} +
) } diff --git a/core/http/react-ui/src/components/Sidebar.jsx b/core/http/react-ui/src/components/Sidebar.jsx index eec32f88f..4b0ebc229 100644 --- a/core/http/react-ui/src/components/Sidebar.jsx +++ b/core/http/react-ui/src/components/Sidebar.jsx @@ -1,37 +1,57 @@ import { useState, useEffect } from 'react' -import { NavLink, useNavigate } from 'react-router-dom' +import { NavLink, useNavigate, useLocation } from 'react-router-dom' import ThemeToggle from './ThemeToggle' import { useAuth } from '../context/AuthContext' import { apiUrl } from '../utils/basePath' const COLLAPSED_KEY = 'localai_sidebar_collapsed' +const SECTIONS_KEY = 'localai_sidebar_sections' -const mainItems = [ +const topItems = [ { path: '/app', icon: 'fas fa-home', label: 'Home' }, { path: '/app/models', icon: 'fas fa-download', label: 'Install Models', adminOnly: true }, { path: '/app/chat', icon: 'fas fa-comments', label: 'Chat' }, - { path: '/app/image', icon: 'fas fa-image', label: 'Images' }, - { path: '/app/video', icon: 'fas fa-video', label: 'Video' }, - { path: '/app/tts', icon: 'fas fa-music', label: 'TTS' }, - { path: '/app/sound', icon: 'fas fa-volume-high', label: 'Sound' }, + { path: '/app/studio', icon: 'fas fa-palette', label: 'Studio' }, { path: '/app/talk', icon: 'fas fa-phone', label: 'Talk' }, - { path: '/app/usage', icon: 'fas fa-chart-bar', label: 'Usage', authOnly: true }, ] -const agentItems = [ - { path: '/app/agents', icon: 'fas fa-robot', label: 'Agents' }, - { path: '/app/skills', icon: 'fas fa-wand-magic-sparkles', label: 'Skills' }, - { path: '/app/collections', icon: 'fas fa-database', label: 'Memory' }, - { path: '/app/agent-jobs', icon: 'fas fa-tasks', label: 'MCP CI Jobs', feature: 'mcp' }, -] - -const systemItems = [ - { path: '/app/users', icon: 'fas fa-users', label: 'Users', adminOnly: true, authOnly: true }, - { path: '/app/backends', icon: 'fas fa-server', label: 'Backends', adminOnly: true }, - { path: '/app/traces', icon: 'fas fa-chart-line', label: 
'Traces', adminOnly: true }, - { path: '/app/p2p', icon: 'fas fa-circle-nodes', label: 'Swarm', adminOnly: true }, - { path: '/app/manage', icon: 'fas fa-desktop', label: 'System', adminOnly: true }, - { path: '/app/settings', icon: 'fas fa-cog', label: 'Settings', adminOnly: true }, +const sections = [ + { + id: 'tools', + title: 'Tools', + items: [ + { path: '/app/fine-tune', icon: 'fas fa-graduation-cap', label: 'Fine-Tune', feature: 'fine_tuning' }, + ], + }, + { + id: 'agents', + title: 'Agents', + featureMap: { + '/app/agents': 'agents', + '/app/skills': 'skills', + '/app/collections': 'collections', + '/app/agent-jobs': 'mcp_jobs', + }, + items: [ + { path: '/app/agents', icon: 'fas fa-robot', label: 'Agents' }, + { path: '/app/skills', icon: 'fas fa-wand-magic-sparkles', label: 'Skills' }, + { path: '/app/collections', icon: 'fas fa-database', label: 'Memory' }, + { path: '/app/agent-jobs', icon: 'fas fa-tasks', label: 'MCP CI Jobs', feature: 'mcp' }, + ], + }, + { + id: 'system', + title: 'System', + items: [ + { path: '/app/usage', icon: 'fas fa-chart-bar', label: 'Usage', authOnly: true }, + { path: '/app/users', icon: 'fas fa-users', label: 'Users', adminOnly: true, authOnly: true }, + { path: '/app/backends', icon: 'fas fa-server', label: 'Backends', adminOnly: true }, + { path: '/app/traces', icon: 'fas fa-chart-line', label: 'Traces', adminOnly: true }, + { path: '/app/p2p', icon: 'fas fa-circle-nodes', label: 'Swarm', adminOnly: true }, + { path: '/app/manage', icon: 'fas fa-desktop', label: 'System', adminOnly: true }, + { path: '/app/settings', icon: 'fas fa-cog', label: 'Settings', adminOnly: true }, + ], + }, ] function NavItem({ item, onClose, collapsed }) { @@ -51,18 +71,47 @@ function NavItem({ item, onClose, collapsed }) { ) } +function loadSectionState() { + try { + const stored = localStorage.getItem(SECTIONS_KEY) + return stored ? 
JSON.parse(stored) : {} + } catch (_) { + return {} + } +} + +function saveSectionState(state) { + try { localStorage.setItem(SECTIONS_KEY, JSON.stringify(state)) } catch (_) { /* ignore */ } +} + export default function Sidebar({ isOpen, onClose }) { const [features, setFeatures] = useState({}) const [collapsed, setCollapsed] = useState(() => { try { return localStorage.getItem(COLLAPSED_KEY) === 'true' } catch (_) { return false } }) + const [openSections, setOpenSections] = useState(loadSectionState) const { isAdmin, authEnabled, user, logout, hasFeature } = useAuth() const navigate = useNavigate() + const location = useLocation() useEffect(() => { fetch(apiUrl('/api/features')).then(r => r.json()).then(setFeatures).catch(() => {}) }, []) + // Auto-expand section containing the active route + useEffect(() => { + for (const section of sections) { + const match = section.items.some(item => location.pathname.startsWith(item.path)) + if (match && !openSections[section.id]) { + setOpenSections(prev => { + const next = { ...prev, [section.id]: true } + saveSectionState(next) + return next + }) + } + } + }, [location.pathname]) + const toggleCollapse = () => { setCollapsed(prev => { const next = !prev @@ -72,17 +121,34 @@ export default function Sidebar({ isOpen, onClose }) { }) } - const visibleMainItems = mainItems.filter(item => { - if (item.adminOnly && !isAdmin) return false - if (item.authOnly && !authEnabled) return false - return true - }) + const toggleSection = (id) => { + setOpenSections(prev => { + const next = { ...prev, [id]: !prev[id] } + saveSectionState(next) + return next + }) + } - const visibleSystemItems = systemItems.filter(item => { + const filterItem = (item) => { if (item.adminOnly && !isAdmin) return false if (item.authOnly && !authEnabled) return false + if (item.feature && features[item.feature] === false) return false + if (item.feature && !hasFeature(item.feature)) return false return true - }) + } + + const visibleTopItems = 
topItems.filter(filterItem) + + const getVisibleSectionItems = (section) => { + return section.items.filter(item => { + if (!filterItem(item)) return false + if (section.featureMap) { + const featureName = section.featureMap[item.path] + return featureName ? hasFeature(featureName) : isAdmin + } + return true + }) + } return ( <> @@ -104,57 +170,57 @@ export default function Sidebar({ isOpen, onClose }) { {/* Navigation */} {/* Footer */} diff --git a/core/http/react-ui/src/pages/FineTune.jsx b/core/http/react-ui/src/pages/FineTune.jsx new file mode 100644 index 000000000..606848754 --- /dev/null +++ b/core/http/react-ui/src/pages/FineTune.jsx @@ -0,0 +1,1525 @@ +import { useState, useEffect, useRef, useCallback } from 'react' +import { fineTuneApi } from '../utils/api' +import LoadingSpinner from '../components/LoadingSpinner' + +const TRAINING_METHODS = ['sft', 'dpo', 'grpo', 'rloo', 'reward', 'kto', 'orpo'] +const TRAINING_TYPES = ['lora', 'loha', 'lokr', 'full'] +const FALLBACK_BACKENDS = ['trl'] +const OPTIMIZERS = ['adamw_torch', 'adamw_8bit', 'sgd', 'adafactor', 'prodigy'] +const MIXED_PRECISION_OPTS = ['', 'fp16', 'bf16', 'no'] + +const BUILTIN_REWARDS = [ + { name: 'format_reward', description: 'Checks ... 
then answer format', params: [] }, + { name: 'reasoning_accuracy_reward', description: 'Compares content to dataset answer column', params: [] }, + { name: 'length_reward', description: 'Score based on proximity to target length', params: [{ key: 'target_length', default: '200', label: 'Target Length' }] }, + { name: 'xml_tag_reward', description: 'Scores properly opened/closed XML tags', params: [] }, + { name: 'no_repetition_reward', description: 'Penalizes n-gram repetition', params: [] }, + { name: 'code_execution_reward', description: 'Checks Python code block syntax validity', params: [] }, +] + +const statusBadgeClass = { + queued: '', + loading_model: 'badge-warning', + loading_dataset: 'badge-warning', + training: 'badge-info', + saving: 'badge-info', + completed: 'badge-success', + failed: 'badge-error', + stopped: '', +} + +function FormSection({ icon, title, children }) { + return ( +
+

+ + {title} +

+ {children} +
+ ) +} + +function KeyValueEditor({ entries, onChange }) { + const addEntry = () => onChange([...entries, { key: '', value: '' }]) + const removeEntry = (i) => onChange(entries.filter((_, idx) => idx !== i)) + const updateEntry = (i, field, val) => { + const updated = entries.map((e, idx) => idx === i ? { ...e, [field]: val } : e) + onChange(updated) + } + + return ( +
+ {entries.map((entry, i) => ( +
+ updateEntry(i, 'key', e.target.value)} + placeholder="Key" + style={{ flex: 1 }} + /> + updateEntry(i, 'value', e.target.value)} + placeholder="Value" + style={{ flex: 2 }} + /> + +
+ ))} + +
+ ) +} + +function CopyButton({ text }) { + const [copied, setCopied] = useState(false) + const handleCopy = (e) => { + e.stopPropagation() + navigator.clipboard.writeText(text).then(() => { + setCopied(true) + setTimeout(() => setCopied(false), 1500) + }) + } + return ( + + ) +} + +function JobCard({ job, isSelected, onSelect, onUseConfig, onDelete }) { + return ( +
onSelect(job)} + > +
+
+ {job.model} + + {job.backend} / {job.training_method || 'sft'} + +
+
+ + {['completed', 'stopped', 'failed'].includes(job.status) && ( + + )} + + {job.status} + +
+
+
+ ID: {job.id?.slice(0, 8)}... | Created: {job.created_at} +
+ {job.output_dir && ( +
+ + + {job.output_dir} + + +
+ )} + {job.message && ( +
+ + {job.message} +
+ )} +
+ ) +} + +function formatEta(seconds) { + if (!seconds || seconds <= 0) return '--' + const h = Math.floor(seconds / 3600) + const m = Math.floor((seconds % 3600) / 60) + const s = Math.floor(seconds % 60) + if (h > 0) return `${h}h ${m}m` + if (m > 0) return `${m}m ${s}s` + return `${s}s` +} + +function formatAxisValue(val, decimals) { + if (val >= 1) return val.toFixed(Math.min(decimals, 1)) + if (val >= 0.01) return val.toFixed(Math.min(decimals, 3)) + return val.toExponential(1) +} + +function SingleMetricChart({ data, valueKey, label, color, formatValue, events }) { + const [tooltip, setTooltip] = useState(null) + const svgRef = useRef(null) + + if (!data || data.length < 1) return null + + const pad = { top: 16, right: 12, bottom: 32, left: 52 } + const W = 400, H = 220 + const cw = W - pad.left - pad.right + const ch = H - pad.top - pad.bottom + + const steps = data.map(e => e.current_step) + const values = data.map(e => e[valueKey]) + + const minStep = Math.min(...steps), maxStep = Math.max(...steps) + const stepRange = maxStep - minStep || 1 + const minVal = Math.min(...values), maxVal = Math.max(...values) + const valRange = maxVal - minVal || 1 + const valPad = valRange * 0.05 + const yMin = Math.max(0, minVal - valPad), yMax = maxVal + valPad + const yRange = yMax - yMin || 1 + + const x = (step) => pad.left + ((step - minStep) / stepRange) * cw + const y = (val) => pad.top + (1 - (val - yMin) / yRange) * ch + + const points = data.map(e => `${x(e.current_step)},${y(e[valueKey])}`).join(' ') + + const xTickCount = Math.min(5, data.length) + const xTicks = Array.from({ length: xTickCount }, (_, i) => Math.round(minStep + (stepRange * i) / (xTickCount - 1))) + const yTickCount = 4 + const yTicks = Array.from({ length: yTickCount }, (_, i) => yMin + (yRange * i) / (yTickCount - 1)) + + // Epoch boundaries from the full events list if provided + const epochBoundaries = [] + const evts = events || data + for (let i = 1; i < evts.length; i++) { + const 
prevEpoch = Math.floor(evts[i - 1].current_epoch || 0) + const curEpoch = Math.floor(evts[i].current_epoch || 0) + if (curEpoch > prevEpoch && curEpoch > 0) { + epochBoundaries.push({ step: evts[i].current_step, epoch: curEpoch }) + } + } + + const fmtVal = formatValue || ((v) => formatAxisValue(v, 3)) + + const handleMouseMove = (e) => { + if (!svgRef.current) return + const rect = svgRef.current.getBoundingClientRect() + const mx = ((e.clientX - rect.left) / rect.width) * W + const step = minStep + ((mx - pad.left) / cw) * stepRange + let nearest = data[0], bestDist = Infinity + for (const d of data) { + const dist = Math.abs(d.current_step - step) + if (dist < bestDist) { bestDist = dist; nearest = d } + } + setTooltip({ x: x(nearest.current_step), y: y(nearest[valueKey]), data: nearest }) + } + + return ( +
+
+ + {label} +
+ setTooltip(null)} + > + {yTicks.map((val, i) => ( + + ))} + {epochBoundaries.map((eb, i) => ( + + + + ))} + + + {xTicks.map((step, i) => ( + {step} + ))} + + {yTicks.map((val, i) => ( + {fmtVal(val)} + ))} + Step + {tooltip && ( + + + + + + Step {tooltip.data.current_step} + + + {fmtVal(tooltip.data[valueKey])} + + + )} + +
+ ) +} + +function ChartsGrid({ events }) { + const lossData = events.filter(e => e.loss > 0) + const evalData = events.filter(e => e.eval_loss > 0) + const lrData = events.filter(e => e.learning_rate != null && e.learning_rate > 0) + const gradNormData = events.filter(e => e.grad_norm != null && e.grad_norm > 0) + + const fmtExp = (v) => v.toExponential(1) + + if (lossData.length < 2 && lrData.length < 2 && gradNormData.length < 2) return null + + return ( +
+ + {evalData.length >= 1 ? ( + + ) : ( +
+ + + Eval Loss — waiting for eval data + +
+ )} + + +
+ ) +} + +function TrainingMonitor({ job, onStop }) { + const [events, setEvents] = useState([]) + const [latest, setLatest] = useState(null) + const [connecting, setConnecting] = useState(true) + const eventSourceRef = useRef(null) + + useEffect(() => { + if (!job || !['queued', 'loading_model', 'loading_dataset', 'training', 'saving'].includes(job.status)) { + setConnecting(false) + return + } + + setConnecting(true) + setLatest(null) + setEvents([]) + + const url = fineTuneApi.progressUrl(job.id) + const es = new EventSource(url) + eventSourceRef.current = es + + es.onmessage = (e) => { + try { + setConnecting(false) + const data = JSON.parse(e.data) + setLatest(data) + if (data.loss > 0) { + setEvents(prev => [...prev, data]) + } + if (['completed', 'failed', 'stopped'].includes(data.status)) { + es.close() + } + } catch (_) {} + } + + es.onerror = () => { + setConnecting(false) + es.close() + } + + return () => { + es.close() + } + }, [job?.id]) + + if (!job) return null + + return ( +
+

+ + Training Monitor +

+ + {connecting && !latest && ( +
+ Connecting to training stream... +
+ )} + + {latest && ( +
+
+
Status
+
{latest.status}
+
+
+
Progress
+
{latest.progress_percent?.toFixed(1)}%
+
+
+
Step
+
{latest.current_step} / {latest.total_steps}
+
+
+
Loss
+
{latest.loss?.toFixed(4)}
+
+
+
Epoch
+
{latest.current_epoch?.toFixed(2)} / {latest.total_epochs?.toFixed(0)}
+
+
+
Learning Rate
+
{latest.learning_rate?.toExponential(2)}
+
+
+
ETA
+
{formatEta(latest.eta_seconds)}
+
+ {latest.extra_metrics?.tokens_per_second > 0 && ( +
+
Tokens/sec
+
{latest.extra_metrics.tokens_per_second.toFixed(0)}
+
+ )} +
+ )} + + {/* Progress bar */} + {latest && ( +
+
+
+ )} + + {/* Training charts (2x2 grid) */} + + + {latest?.message && ( +
+ + {latest.message} +
+ )} + + {['queued', 'loading_model', 'loading_dataset', 'training', 'saving'].includes(latest?.status || job.status) && ( + + )} +
+ ) +} + +function CheckpointsPanel({ job, onResume, onExportCheckpoint }) { + const [checkpoints, setCheckpoints] = useState([]) + const [loading, setLoading] = useState(false) + + useEffect(() => { + if (!job) return + setLoading(true) + fineTuneApi.listCheckpoints(job.id).then(r => { + setCheckpoints(r.checkpoints || []) + }).catch(() => {}).finally(() => setLoading(false)) + }, [job?.id]) + + if (!job) return null + if (loading) return
Loading checkpoints...
+ if (checkpoints.length === 0) return null + + return ( +
+

+ + Checkpoints +

+
+ + + + + + + + + + + + + {checkpoints.map(cp => ( + + + + + + + + + ))} + +
StepEpochLossCreatedPathActions
{cp.step}{cp.epoch?.toFixed(2)}{cp.loss?.toFixed(4)}{cp.created_at} + {cp.path} + + + +
+
+
+ ) +} + +const QUANT_PRESETS = ['q4_k_m', 'q5_k_m', 'q8_0', 'f16', 'q4_0', 'q5_0'] + +function ExportPanel({ job, prefilledCheckpoint }) { + const [checkpoints, setCheckpoints] = useState([]) + const [exportFormat, setExportFormat] = useState('lora') + const [quantMethod, setQuantMethod] = useState('q4_k_m') + const [modelName, setModelName] = useState('') + const [selectedCheckpoint, setSelectedCheckpoint] = useState('') + const [exporting, setExporting] = useState(false) + const [message, setMessage] = useState('') + const [exportedModelName, setExportedModelName] = useState('') + const pollRef = useRef(null) + + useEffect(() => { + if (!job) return + fineTuneApi.listCheckpoints(job.id).then(r => { + setCheckpoints(r.checkpoints || []) + }).catch(() => {}) + }, [job?.id]) + + // Apply prefilled checkpoint when set + useEffect(() => { + if (prefilledCheckpoint) { + setSelectedCheckpoint(prefilledCheckpoint.path || '') + } + }, [prefilledCheckpoint]) + + // Sync export state from job (e.g. 
on initial load or job list refresh) + useEffect(() => { + if (!job) return + if (job.export_status === 'exporting') { + setExporting(true) + setMessage(job.export_message || 'Export in progress...') + } else if (job.export_status === 'completed' && job.export_model_name) { + setExporting(false) + setExportedModelName(job.export_model_name) + setMessage(`Model exported and registered as "${job.export_model_name}"`) + } else if (job.export_status === 'failed') { + setExporting(false) + setMessage(`Export failed: ${job.export_message || 'unknown error'}`) + } + }, [job?.export_status, job?.export_model_name, job?.export_message]) + + // Poll for export completion + useEffect(() => { + if (!exporting || !job) return + + pollRef.current = setInterval(async () => { + try { + const updated = await fineTuneApi.getJob(job.id) + if (updated.export_status === 'completed') { + setExporting(false) + const name = updated.export_model_name || modelName || 'exported model' + setExportedModelName(name) + setMessage(`Model exported and registered as "${name}"`) + clearInterval(pollRef.current) + } else if (updated.export_status === 'failed') { + setExporting(false) + setMessage(`Export failed: ${updated.export_message || 'unknown error'}`) + clearInterval(pollRef.current) + } else if (updated.export_status === 'exporting' && updated.export_message) { + setMessage(updated.export_message) + } + } catch (_) {} + }, 3000) + + return () => clearInterval(pollRef.current) + }, [exporting, job?.id]) + + const handleExport = async () => { + setExporting(true) + setMessage('Export in progress...') + setExportedModelName('') + try { + await fineTuneApi.exportModel(job.id, { + name: modelName || undefined, + checkpoint_path: selectedCheckpoint || job.output_dir, + export_format: exportFormat, + quantization_method: exportFormat === 'gguf' ? 
quantMethod : '', + model: job.model, + }) + // Polling will pick up completion/failure + } catch (e) { + setMessage(`Export failed: ${e.message}`) + setExporting(false) + } + } + + // Show export panel for completed, stopped, and failed jobs (checkpoints may exist) + if (!job || !['completed', 'stopped', 'failed'].includes(job.status)) return null + + return ( +
+

+ + Export Model +

+ + {checkpoints.length > 0 && ( +
+ + +
+ )} + +
+
+ + +
+ {exportFormat === 'gguf' && ( +
+ + setQuantMethod(e.target.value)} + placeholder="e.g. q4_k_m, bf16, f32" + className="input" + /> + + {QUANT_PRESETS.map(q => ( + +
+ )} +
+ +
+ + setModelName(e.target.value)} + placeholder="e.g. my-finetuned-model" + className="input" + /> +
+ + + + {message && ( +
+ {exporting && } {message} + {exportedModelName && !message.includes('failed') && ( + + + Chat with {exportedModelName} + + + Download Archive + + + )} +
+ )} +
+ ) +} + +export default function FineTune() { + const [jobs, setJobs] = useState([]) + const [selectedJob, setSelectedJob] = useState(null) + const [showForm, setShowForm] = useState(false) + const [loading, setLoading] = useState(false) + const [error, setError] = useState('') + const [backends, setBackends] = useState([]) + const [exportCheckpoint, setExportCheckpoint] = useState(null) + + // Form state + const [model, setModel] = useState('') + const [backend, setBackend] = useState('') + const [trainingMethod, setTrainingMethod] = useState('sft') + const [trainingType, setTrainingType] = useState('lora') + const [datasetSource, setDatasetSource] = useState('') + const [datasetFile, setDatasetFile] = useState(null) + const [datasetSplit, setDatasetSplit] = useState('') + const [numEpochs, setNumEpochs] = useState(3) + const [batchSize, setBatchSize] = useState(2) + const [learningRate, setLearningRate] = useState(0.0002) + const [learningRateText, setLearningRateText] = useState('0.0002') + const [adapterRank, setAdapterRank] = useState(16) + const [adapterAlpha, setAdapterAlpha] = useState(16) + const [adapterDropout, setAdapterDropout] = useState(0) + const [targetModules, setTargetModules] = useState('') + const [gradAccum, setGradAccum] = useState(4) + const [warmupSteps, setWarmupSteps] = useState(5) + const [maxSteps, setMaxSteps] = useState(0) + const [saveSteps, setSaveSteps] = useState(500) + const [weightDecay, setWeightDecay] = useState(0) + const [maxSeqLength, setMaxSeqLength] = useState(2048) + const [optimizer, setOptimizer] = useState('adamw_torch') + const [gradCheckpointing, setGradCheckpointing] = useState(false) + const [seed, setSeed] = useState(0) + const [mixedPrecision, setMixedPrecision] = useState('') + const [extraOptions, setExtraOptions] = useState([]) + const [hfToken, setHfToken] = useState('') + const [showAdvanced, setShowAdvanced] = useState(false) + const [resumeFromCheckpoint, setResumeFromCheckpoint] = useState('') + const 
[saveTotalLimit, setSaveTotalLimit] = useState(0) + const [evalEnabled, setEvalEnabled] = useState(false) + const [evalStrategy, setEvalStrategy] = useState('steps') + const [evalSteps, setEvalSteps] = useState(0) + const [evalSplit, setEvalSplit] = useState('') + const [evalDatasetSource, setEvalDatasetSource] = useState('') + const [evalSplitRatio, setEvalSplitRatio] = useState(0.1) + const [rewardFunctions, setRewardFunctions] = useState([]) // [{type, name, code?, params?}] + const [showAddCustomReward, setShowAddCustomReward] = useState(false) + const [customRewardName, setCustomRewardName] = useState('') + const [customRewardCode, setCustomRewardCode] = useState('') + + const loadJobs = useCallback(async () => { + try { + const data = await fineTuneApi.listJobs() + setJobs(data || []) + } catch (_) {} + }, []) + + useEffect(() => { + loadJobs() + const interval = setInterval(loadJobs, 10000) + return () => clearInterval(interval) + }, [loadJobs]) + + useEffect(() => { + fineTuneApi.listBackends() + .then(data => { + const names = data && data.length > 0 ? 
data.map(b => b.name) : FALLBACK_BACKENDS + setBackends(names) + setBackend(prev => prev || names[0] || '') + }) + .catch(() => { + setBackends(FALLBACK_BACKENDS) + setBackend(prev => prev || FALLBACK_BACKENDS[0]) + }) + }, []) + + const handleSubmit = async (e) => { + e.preventDefault() + setLoading(true) + setError('') + + try { + let dsSource = datasetSource + if (datasetFile) { + const result = await fineTuneApi.uploadDataset(datasetFile) + dsSource = result.path + } + + const extra = {} + if (maxSeqLength) extra.max_seq_length = String(maxSeqLength) + if (hfToken.trim()) extra.hf_token = hfToken.trim() + if (saveTotalLimit > 0) extra.save_total_limit = String(saveTotalLimit) + if (evalEnabled) { + extra.eval_strategy = evalStrategy || 'steps' + if (evalSteps > 0) extra.eval_steps = String(evalSteps) + if (evalSplit.trim()) extra.eval_split = evalSplit.trim() + if (evalDatasetSource.trim()) extra.eval_dataset_source = evalDatasetSource.trim() + if (evalSplitRatio > 0 && evalSplitRatio !== 0.1) extra.eval_split_ratio = String(evalSplitRatio) + } else { + extra.eval_strategy = 'no' + } + for (const { key, value } of extraOptions) { + if (key.trim()) extra[key.trim()] = value + } + + const isAdapter = ['lora', 'loha', 'lokr'].includes(trainingType) + + const req = { + model, + backend, + training_method: trainingMethod, + training_type: trainingType, + dataset_source: dsSource, + dataset_split: datasetSplit || undefined, + num_epochs: numEpochs, + batch_size: batchSize, + learning_rate: learningRate, + adapter_rank: isAdapter ? adapterRank : 0, + adapter_alpha: isAdapter ? adapterAlpha : 0, + adapter_dropout: isAdapter && adapterDropout > 0 ? adapterDropout : undefined, + target_modules: isAdapter && targetModules.trim() ? targetModules.split(',').map(s => s.trim()) : undefined, + gradient_accumulation_steps: gradAccum, + warmup_steps: warmupSteps, + max_steps: maxSteps > 0 ? maxSteps : undefined, + save_steps: saveSteps > 0 ? 
saveSteps : undefined, + weight_decay: weightDecay > 0 ? weightDecay : undefined, + gradient_checkpointing: gradCheckpointing, + optimizer, + seed: seed > 0 ? seed : undefined, + mixed_precision: mixedPrecision || undefined, + resume_from_checkpoint: resumeFromCheckpoint || undefined, + extra_options: Object.keys(extra).length > 0 ? extra : undefined, + reward_functions: trainingMethod === 'grpo' && rewardFunctions.length > 0 ? rewardFunctions : undefined, + } + + const resp = await fineTuneApi.startJob(req) + setShowForm(false) + setResumeFromCheckpoint('') + await loadJobs() + + const newJob = { ...req, id: resp.id, status: 'queued', created_at: new Date().toISOString() } + setSelectedJob(newJob) + } catch (err) { + setError(err.message) + } + setLoading(false) + } + + const handleStop = async (jobId) => { + try { + await fineTuneApi.stopJob(jobId, true) + await loadJobs() + } catch (err) { + setError(err.message) + } + } + + const handleDelete = async (jobId) => { + if (!window.confirm('Delete this job and all its data (checkpoints, exported model)? This cannot be undone.')) return + try { + await fineTuneApi.deleteJob(jobId) + if (selectedJob?.id === jobId) setSelectedJob(null) + await loadJobs() + } catch (err) { + setError(err.message) + } + } + + const isAdapter = ['lora', 'loha', 'lokr'].includes(trainingType) + + const getFormConfig = () => { + const extra = {} + for (const { key, value } of extraOptions) { + if (key.trim()) extra[key.trim()] = value + } + return { + model, + backend, + training_method: trainingMethod, + training_type: trainingType, + adapter_rank: adapterRank, + adapter_alpha: adapterAlpha, + adapter_dropout: adapterDropout, + target_modules: targetModules.trim() ? 
targetModules.split(',').map(s => s.trim()) : [], + dataset_source: datasetSource, + dataset_split: datasetSplit, + num_epochs: numEpochs, + batch_size: batchSize, + learning_rate: learningRate, + gradient_accumulation_steps: gradAccum, + warmup_steps: warmupSteps, + max_steps: maxSteps, + save_steps: saveSteps, + weight_decay: weightDecay, + gradient_checkpointing: gradCheckpointing, + optimizer, + seed, + mixed_precision: mixedPrecision, + max_seq_length: maxSeqLength, + eval_strategy: evalEnabled ? (evalStrategy || 'steps') : 'no', + eval_steps: evalSteps, + eval_split: evalSplit, + eval_dataset_source: evalDatasetSource, + eval_split_ratio: evalSplitRatio, + extra_options: Object.keys(extra).length > 0 ? extra : {}, + reward_functions: rewardFunctions.length > 0 ? rewardFunctions : undefined, + } + } + + const applyFormConfig = (config) => { + if (config.model != null) setModel(config.model) + if (config.backend != null) setBackend(config.backend) + if (config.training_method != null) setTrainingMethod(config.training_method) + if (config.training_type != null) setTrainingType(config.training_type) + if (config.adapter_rank != null) setAdapterRank(Number(config.adapter_rank)) + if (config.adapter_alpha != null) setAdapterAlpha(Number(config.adapter_alpha)) + if (config.adapter_dropout != null) setAdapterDropout(Number(config.adapter_dropout)) + if (config.target_modules != null) { + const modules = Array.isArray(config.target_modules) + ? 
config.target_modules.join(', ') + : String(config.target_modules) + setTargetModules(modules) + } + if (config.dataset_source != null) setDatasetSource(config.dataset_source) + if (config.dataset_split != null) setDatasetSplit(config.dataset_split) + if (config.num_epochs != null) setNumEpochs(Number(config.num_epochs)) + if (config.batch_size != null) setBatchSize(Number(config.batch_size)) + if (config.learning_rate != null) { setLearningRate(Number(config.learning_rate)); setLearningRateText(String(config.learning_rate)) } + if (config.gradient_accumulation_steps != null) setGradAccum(Number(config.gradient_accumulation_steps)) + if (config.warmup_steps != null) setWarmupSteps(Number(config.warmup_steps)) + if (config.max_steps != null) setMaxSteps(Number(config.max_steps)) + if (config.save_steps != null) setSaveSteps(Number(config.save_steps)) + if (config.weight_decay != null) setWeightDecay(Number(config.weight_decay)) + if (config.gradient_checkpointing != null) setGradCheckpointing(Boolean(config.gradient_checkpointing)) + if (config.optimizer != null) setOptimizer(config.optimizer) + if (config.seed != null) setSeed(Number(config.seed)) + if (config.mixed_precision != null) setMixedPrecision(config.mixed_precision) + + // Handle max_seq_length: top-level field or inside extra_options + if (config.max_seq_length != null) { + setMaxSeqLength(Number(config.max_seq_length)) + } else if (config.extra_options?.max_seq_length != null) { + setMaxSeqLength(Number(config.extra_options.max_seq_length)) + } + + // Eval options — detect enabled state from strategy + const restoreEval = (strategy, steps, split, src, ratio) => { + if (strategy != null && strategy !== 'no') { + setEvalEnabled(true) + setEvalStrategy(strategy) + } else if (strategy === 'no') { + setEvalEnabled(false) + } + if (steps != null) setEvalSteps(Number(steps)) + if (split != null) setEvalSplit(split) + if (src != null) setEvalDatasetSource(src) + if (ratio != null) 
setEvalSplitRatio(Number(ratio)) + } + restoreEval(config.eval_strategy, config.eval_steps, config.eval_split, config.eval_dataset_source, config.eval_split_ratio) + // Also restore from extra_options if present (overrides top-level) + const eo = config.extra_options + if (eo) restoreEval(eo.eval_strategy, eo.eval_steps, eo.eval_split, eo.eval_dataset_source, eo.eval_split_ratio) + + // Handle save_total_limit from extra_options + if (config.extra_options?.save_total_limit != null) { + setSaveTotalLimit(Number(config.extra_options.save_total_limit)) + } + + // Convert extra_options object to [{key, value}] entries, filtering out handled keys + if (config.extra_options && typeof config.extra_options === 'object') { + const entries = Object.entries(config.extra_options) + .filter(([k]) => !['max_seq_length', 'save_total_limit', 'hf_token', 'eval_strategy', 'eval_steps', 'eval_split', 'eval_dataset_source', 'eval_split_ratio'].includes(k)) + .map(([key, value]) => ({ key, value: String(value) })) + setExtraOptions(entries) + } + + // Restore reward functions + if (Array.isArray(config.reward_functions)) { + setRewardFunctions(config.reward_functions) + } else { + setRewardFunctions([]) + } + } + + const handleExportConfig = () => { + const config = getFormConfig() + const json = JSON.stringify(config, null, 2) + const blob = new Blob([json], { type: 'application/json' }) + const url = URL.createObjectURL(blob) + const a = document.createElement('a') + a.href = url + a.download = 'finetune-config.json' + document.body.appendChild(a) + a.click() + document.body.removeChild(a) + URL.revokeObjectURL(url) + } + + const handleImportConfig = () => { + const input = document.createElement('input') + input.type = 'file' + input.accept = '.json' + input.onchange = (e) => { + const file = e.target.files[0] + if (!file) return + const reader = new FileReader() + reader.onload = (ev) => { + try { + const config = JSON.parse(ev.target.result) + applyFormConfig(config) + 
setShowForm(true) + setError('') + } catch { + setError('Failed to parse config file. Please ensure it is valid JSON.') + } + } + reader.readAsText(file) + } + input.click() + } + + const handleUseConfig = (job) => { + // Prefer the stored config if available, otherwise use the job fields + applyFormConfig(job.config || job) + setResumeFromCheckpoint('') + setShowForm(true) + } + + const handleResumeFromCheckpoint = (checkpoint) => { + if (!selectedJob) return + // Apply the original job's config + applyFormConfig(selectedJob.config || selectedJob) + setResumeFromCheckpoint(checkpoint.path) + setShowAdvanced(true) + setShowForm(true) + } + + const handleExportCheckpoint = (checkpoint) => { + setExportCheckpoint(checkpoint) + } + + return ( +
+
+
+

Fine-Tuning

+

Create and manage fine-tuning jobs

+
+
+ + +
+
+ + {error && ( +
+ {error} +
+ )} + + {showForm && ( +
+ + {resumeFromCheckpoint && ( +
+ + + Resuming from checkpoint: {resumeFromCheckpoint} + + +
+ )} + + +
+
+ + +
+
+ + +
+
+ + setModel(e.target.value)} placeholder="e.g. TinyLlama/TinyLlama-1.1B-Chat-v1.0" className="input" required /> +
+
+
+ + setHfToken(e.target.value)} placeholder="hf_..." className="input" /> +
+
+ + +
+
+ + +
+ {isAdapter && ( + <> +
+ + setAdapterRank(Number(e.target.value))} className="input" min={1} /> +
+
+ + setAdapterAlpha(Number(e.target.value))} className="input" min={1} /> +
+
+ + setAdapterDropout(Number(e.target.value))} className="input" min={0} max={1} step={0.05} /> +
+ + )} +
+ {isAdapter && ( +
+ + setTargetModules(e.target.value)} placeholder="e.g. q_proj, v_proj, k_proj, o_proj" className="input" /> +
+ )} +
+ + +
+
+ + setDatasetSource(e.target.value)} placeholder="e.g. tatsu-lab/alpaca" className="input" /> +
+
+ + setDatasetSplit(e.target.value)} placeholder="e.g. train" className="input" /> +
+
+ + setDatasetFile(e.target.files[0])} accept=".json,.jsonl,.csv" className="input" style={{ padding: '6px' }} /> +
+
+
+ + {trainingMethod === 'grpo' && ( + +
+ GRPO requires at least one reward function. Select built-in functions or add custom ones. +
+ + {/* Built-in reward functions */} +
+ {BUILTIN_REWARDS.map(builtin => { + const isSelected = rewardFunctions.some(rf => rf.type === 'builtin' && rf.name === builtin.name) + const selectedRf = rewardFunctions.find(rf => rf.type === 'builtin' && rf.name === builtin.name) + return ( +
+ + {isSelected && builtin.params.length > 0 && ( +
+ {builtin.params.map(param => ( +
+ + { + setRewardFunctions(prev => prev.map(rf => + rf.type === 'builtin' && rf.name === builtin.name + ? { ...rf, params: { ...(rf.params || {}), [param.key]: e.target.value } } + : rf + )) + }} + /> +
+ ))} +
+ )} +
+ ) + })} +
+ + {/* Custom inline reward functions */} + {rewardFunctions.filter(rf => rf.type === 'inline').map((rf, idx) => ( +
+
+ + + {rf.name} + + +
+
+                    {rf.code}
+                  
+
+ ))} + + {/* Add custom reward button / form */} + {showAddCustomReward ? ( +
+
+ + setCustomRewardName(e.target.value)} + placeholder="e.g. my_custom_reward" style={{ maxWidth: '300px' }} /> +
+
+ +