Compare commits

2 Commits

Author     SHA1        Message                                      Date
jmorganca  bb1a5617b6  readme: add instructions to build with MLX   2026-01-15 09:52:56 -08:00
jmorganca  0d3648c1be  glm-image wip                                 2026-01-14 16:46:50 -08:00
39 changed files with 4716 additions and 575 deletions

View File

@@ -322,7 +322,6 @@ See the [API documentation](./docs/api.md) for all endpoints.
### Web & Desktop
- [Onyx](https://github.com/onyx-dot-app/onyx)
- [Open WebUI](https://github.com/open-webui/open-webui)
- [SwiftChat (macOS with ReactNative)](https://github.com/aws-samples/swift-chat)
- [Enchanted (macOS native)](https://github.com/AugustDev/enchanted)

View File

@@ -116,7 +116,7 @@ func generateInteractive(cmd *cobra.Command, opts runOptions) error {
Prompt: ">>> ",
AltPrompt: "... ",
Placeholder: "Send a message (/? for help)",
AltPlaceholder: "Press Enter to send",
AltPlaceholder: `Use """ to end multi-line input`,
})
if err != nil {
return err

View File

@@ -21,7 +21,6 @@ ollama pull glm-4.7:cloud
To use Ollama with tools that expect the Anthropic API (like Claude Code), set these environment variables:
```shell
export ANTHROPIC_AUTH_TOKEN=ollama # required but ignored
export ANTHROPIC_BASE_URL=http://localhost:11434
export ANTHROPIC_API_KEY=ollama # required but ignored
```
@@ -248,13 +247,12 @@ curl -X POST http://localhost:11434/v1/messages \
[Claude Code](https://code.claude.com/docs/en/overview) can be configured to use Ollama as its backend:
```shell
ANTHROPIC_AUTH_TOKEN=ollama ANTHROPIC_BASE_URL=http://localhost:11434 ANTHROPIC_API_KEY=ollama claude --model qwen3-coder
ANTHROPIC_BASE_URL=http://localhost:11434 ANTHROPIC_API_KEY=ollama claude --model qwen3-coder
```
Or set the environment variables in your shell profile:
```shell
export ANTHROPIC_AUTH_TOKEN=ollama
export ANTHROPIC_BASE_URL=http://localhost:11434
export ANTHROPIC_API_KEY=ollama
```

View File

@@ -110,7 +110,7 @@ More Ollama [Python example](https://github.com/ollama/ollama-python/blob/main/e
import { Ollama } from "ollama";
const client = new Ollama();
const results = await client.webSearch("what is ollama?");
const results = await client.webSearch({ query: "what is ollama?" });
console.log(JSON.stringify(results, null, 2));
```
@@ -213,7 +213,7 @@ models](https://ollama.com/models)\n\nAvailable for macOS, Windows, and Linux',
import { Ollama } from "ollama";
const client = new Ollama();
const fetchResult = await client.webFetch("https://ollama.com");
const fetchResult = await client.webFetch({ url: "https://ollama.com" });
console.log(JSON.stringify(fetchResult, null, 2));
```

View File

@@ -111,9 +111,7 @@
"/integrations/zed",
"/integrations/roo-code",
"/integrations/n8n",
"/integrations/xcode",
"/integrations/onyx",
"/integrations/marimo"
"/integrations/xcode"
]
},
{

View File

@@ -22,7 +22,7 @@ Please refer to the [GPU docs](./gpu).
## How can I specify the context window size?
By default, Ollama uses a context window size of 4096 tokens.
By default, Ollama uses a context window size of 2048 tokens.
This can be overridden with the `OLLAMA_CONTEXT_LENGTH` environment variable. For example, to set the default context window to 8K, use:
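Editorial aside on this FAQ entry: the context window can also be set per request from client code. Below is a minimal Go sketch assuming the standard `num_ctx` option and a placeholder model name (`llama3.2`); `OLLAMA_CONTEXT_LENGTH` remains the way to change the server-wide default.

```go
package main

import (
	"context"
	"fmt"
	"log"

	"github.com/ollama/ollama/api"
)

func main() {
	client, err := api.ClientFromEnvironment()
	if err != nil {
		log.Fatal(err)
	}
	req := &api.ChatRequest{
		Model:    "llama3.2", // placeholder model name
		Messages: []api.Message{{Role: "user", Content: "hello"}},
		// Request an 8K context window for this call only (assumed "num_ctx" option).
		Options: map[string]any{"num_ctx": 8192},
	}
	if err := client.Chat(context.Background(), req, func(r api.ChatResponse) error {
		fmt.Print(r.Message.Content)
		return nil
	}); err != nil {
		log.Fatal(err)
	}
}
```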

View File

Nine binary image files removed (screenshots used by the marimo and Onyx integration docs below; 80–306 KiB each). Binary contents not shown.
View File

@@ -25,7 +25,6 @@ Claude Code connects to Ollama using the Anthropic-compatible API.
1. Set the environment variables:
```shell
export ANTHROPIC_AUTH_TOKEN=ollama
export ANTHROPIC_BASE_URL=http://localhost:11434
export ANTHROPIC_API_KEY=ollama
```
@@ -39,7 +38,7 @@ claude --model qwen3-coder
Or run with environment variables inline:
```shell
ANTHROPIC_AUTH_TOKEN=ollama ANTHROPIC_BASE_URL=http://localhost:11434 ANTHROPIC_API_KEY=ollama claude --model qwen3-coder
ANTHROPIC_BASE_URL=http://localhost:11434 ANTHROPIC_API_KEY=ollama claude --model qwen3-coder
```
## Connecting to ollama.com

View File

@@ -1,73 +0,0 @@
---
title: marimo
---
## Install
Install [marimo](https://marimo.io). You can use `pip` or `uv` for this. You
can also use `uv` to create a sandboxed environment for marimo by running:
```
uvx marimo edit --sandbox notebook.py
```
## Usage with Ollama
1. In marimo, open the user settings and go to the AI tab. From here
you can find and configure Ollama as an AI provider. For local use you
would typically point the base URL to `http://localhost:11434/v1`.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/marimo-settings.png"
alt="Ollama settings in marimo"
width="50%"
/>
</div>
2. Once the AI provider is set up, you can turn on/off specific AI models you'd like to access.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/marimo-models.png"
alt="Selecting an Ollama model"
width="50%"
/>
</div>
3. You can also add a model to the list of available models by scrolling to the bottom and using the UI there.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/marimo-add-model.png"
alt="Adding a new Ollama model"
width="50%"
/>
</div>
4. Once configured, you can now use Ollama for AI chats in marimo.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/marimo-chat.png"
alt="Configure code completion"
width="50%"
/>
</div>
5. Alternatively, you can use Ollama for **inline code completion** in marimo. This can be configured in the "AI Features" tab.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/marimo-code-completion.png"
alt="Configure code completion"
width="50%"
/>
</div>
## Connecting to ollama.com
1. Sign in to Ollama Cloud via `ollama signin`.
2. In the Ollama model settings, add a model that Ollama hosts, like `gpt-oss:120b`.
3. You can now refer to this model in marimo!

View File

@@ -1,63 +0,0 @@
---
title: Onyx
---
## Overview
[Onyx](http://onyx.app/) is a self-hostable Chat UI that integrates with all Ollama models. Features include:
- Creating custom Agents
- Web search
- Deep Research
- RAG over uploaded documents and connected apps
- Connectors to applications like Google Drive, Email, Slack, etc.
- MCP and OpenAPI Actions support
- Image generation
- User/Groups management, RBAC, SSO, etc.
Onyx can be deployed for single users or large organizations.
## Install Onyx
Deploy Onyx with the [quickstart guide](https://docs.onyx.app/deployment/getting_started/quickstart).
<Info>
Resourcing/scaling docs [here](https://docs.onyx.app/deployment/getting_started/resourcing).
</Info>
## Usage with Ollama
1. Log in to your Onyx deployment (create an account first).
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/onyx-login.png"
alt="Onyx Login Page"
width="75%"
/>
</div>
2. In the setup process, select `Ollama` as the LLM provider.
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/onyx-ollama-llm.png"
alt="Onyx Set Up Form"
width="75%"
/>
</div>
3. Provide your **Ollama API URL** and select your models.
<Note>If you're running Onyx in Docker, to access your computer's local network use `http://host.docker.internal` instead of `http://127.0.0.1`.</Note>
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/onyx-ollama-form.png"
alt="Selecting Ollama Models"
width="75%"
/>
</div>
You can also connect Onyx Cloud using the `Ollama Cloud` tab during setup.
## Send your first query
<div style={{ display: 'flex', justifyContent: 'center' }}>
<img
src="/images/onyx-query.png"
alt="Onyx Query Example"
width="75%"
/>
</div>

View File

@@ -1,5 +1,5 @@
---
title: Linux
title: "Linux"
---
## Install
@@ -13,15 +13,14 @@ curl -fsSL https://ollama.com/install.sh | sh
## Manual install
<Note>
If you are upgrading from a prior version, you should remove the old libraries
with `sudo rm -rf /usr/lib/ollama` first.
If you are upgrading from a prior version, you should remove the old libraries with `sudo rm -rf /usr/lib/ollama` first.
</Note>
Download and extract the package:
```shell
curl -fsSL https://ollama.com/download/ollama-linux-amd64.tar.zst \
| sudo tar x -C /usr
curl -fsSL https://ollama.com/download/ollama-linux-amd64.tgz \
| sudo tar zx -C /usr
```
Start Ollama:
@@ -41,8 +40,8 @@ ollama -v
If you have an AMD GPU, also download and extract the additional ROCm package:
```shell
curl -fsSL https://ollama.com/download/ollama-linux-amd64-rocm.tar.zst \
| sudo tar x -C /usr
curl -fsSL https://ollama.com/download/ollama-linux-amd64-rocm.tgz \
| sudo tar zx -C /usr
```
### ARM64 install
@@ -50,8 +49,8 @@ curl -fsSL https://ollama.com/download/ollama-linux-amd64-rocm.tar.zst \
Download and extract the ARM64-specific package:
```shell
curl -fsSL https://ollama.com/download/ollama-linux-arm64.tar.zst \
| sudo tar x -C /usr
curl -fsSL https://ollama.com/download/ollama-linux-arm64.tgz \
| sudo tar zx -C /usr
```
### Adding Ollama as a startup service (recommended)
@@ -113,11 +112,7 @@ sudo systemctl status ollama
```
<Note>
While AMD has contributed the `amdgpu` driver upstream to the official linux
kernel source, the version is older and may not support all ROCm features. We
recommend you install the latest driver from
https://www.amd.com/en/support/linux-drivers for best support of your Radeon
GPU.
While AMD has contributed the `amdgpu` driver upstream to the official linux kernel source, the version is older and may not support all ROCm features. We recommend you install the latest driver from https://www.amd.com/en/support/linux-drivers for best support of your Radeon GPU.
</Note>
## Customizing
@@ -146,8 +141,8 @@ curl -fsSL https://ollama.com/install.sh | sh
Or by re-downloading Ollama:
```shell
curl -fsSL https://ollama.com/download/ollama-linux-amd64.tar.zst \
| sudo tar x -C /usr
curl -fsSL https://ollama.com/download/ollama-linux-amd64.tgz \
| sudo tar zx -C /usr
```
## Installing specific versions
@@ -196,4 +191,4 @@ Remove the downloaded models and Ollama service user and group:
sudo userdel ollama
sudo groupdel ollama
sudo rm -r /usr/share/ollama
```
```

View File

@@ -131,7 +131,7 @@ func TestAPIToolCalling(t *testing.T) {
t.Errorf("unexpected tool called: got %q want %q", lastToolCall.Function.Name, "get_weather")
}
if _, ok := lastToolCall.Function.Arguments.Get("location"); !ok {
if _, ok := lastToolCall.Function.Arguments["location"]; !ok {
t.Errorf("expected tool arguments to include 'location', got: %s", lastToolCall.Function.Arguments.String())
}
case <-ctx.Done():

View File

@@ -8,7 +8,6 @@ import (
"math/rand"
"net/http"
"strings"
"time"
"github.com/gin-gonic/gin"
@@ -442,7 +441,6 @@ type ResponsesWriter struct {
stream bool
responseID string
itemID string
request openai.ResponsesRequest
}
func (w *ResponsesWriter) writeEvent(eventType string, data any) error {
@@ -480,9 +478,7 @@ func (w *ResponsesWriter) writeResponse(data []byte) (int, error) {
// Non-streaming response
w.ResponseWriter.Header().Set("Content-Type", "application/json")
response := openai.ToResponse(w.model, w.responseID, w.itemID, chatResponse, w.request)
completedAt := time.Now().Unix()
response.CompletedAt = &completedAt
response := openai.ToResponse(w.model, w.responseID, w.itemID, chatResponse)
return len(data), json.NewEncoder(w.ResponseWriter).Encode(response)
}
@@ -527,12 +523,11 @@ func ResponsesMiddleware() gin.HandlerFunc {
w := &ResponsesWriter{
BaseWriter: BaseWriter{ResponseWriter: c.Writer},
converter: openai.NewResponsesStreamConverter(responseID, itemID, req.Model, req),
converter: openai.NewResponsesStreamConverter(responseID, itemID, req.Model),
model: req.Model,
stream: streamRequested,
responseID: responseID,
itemID: itemID,
request: req,
}
// Set headers based on streaming mode

View File

@@ -630,10 +630,6 @@ func nameFromToolCallID(messages []Message, toolCallID string) string {
// decodeImageURL decodes a base64 data URI into raw image bytes.
func decodeImageURL(url string) (api.ImageData, error) {
if strings.HasPrefix(url, "http://") || strings.HasPrefix(url, "https://") {
return nil, errors.New("image URLs are not currently supported, please use base64 encoded data instead")
}
types := []string{"jpeg", "jpg", "png", "webp"}
// Support blank mime type to match /api/chat's behavior of taking just unadorned base64

View File

@@ -4,7 +4,6 @@ import (
"encoding/json"
"fmt"
"math/rand"
"time"
"github.com/ollama/ollama/api"
)
@@ -266,9 +265,9 @@ type ResponsesText struct {
type ResponsesTool struct {
Type string `json:"type"` // "function"
Name string `json:"name"`
Description *string `json:"description"` // nullable but required
Strict *bool `json:"strict"` // nullable but required
Parameters map[string]any `json:"parameters"` // nullable but required
Description string `json:"description,omitempty"`
Strict bool `json:"strict,omitempty"`
Parameters map[string]any `json:"parameters,omitempty"`
}
type ResponsesRequest struct {
@@ -476,16 +475,11 @@ func convertTool(t ResponsesTool) (api.Tool, error) {
}
}
var description string
if t.Description != nil {
description = *t.Description
}
return api.Tool{
Type: t.Type,
Function: api.ToolFunction{
Name: t.Name,
Description: description,
Description: t.Description,
Parameters: params,
},
}, nil
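Editorial note on the `ResponsesTool` change above: switching from nullable pointer fields to plain values with `omitempty` also changes the wire format, since empty fields are now omitted instead of being serialized as `null`. A minimal sketch with trimmed stand-in structs (names are illustrative, not from this file):

```go
package main

import (
	"encoding/json"
	"fmt"
)

// toolOld mirrors the previous shape: a nullable pointer that always appears in the JSON.
type toolOld struct {
	Name        string  `json:"name"`
	Description *string `json:"description"`
}

// toolNew mirrors the new shape: a plain value that is dropped when empty.
type toolNew struct {
	Name        string `json:"name"`
	Description string `json:"description,omitempty"`
}

func main() {
	o, _ := json.Marshal(toolOld{Name: "get_weather"})
	n, _ := json.Marshal(toolNew{Name: "get_weather"})
	fmt.Println(string(o)) // {"name":"get_weather","description":null}
	fmt.Println(string(n)) // {"name":"get_weather"}
}
```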
@@ -522,60 +516,17 @@ func convertInputMessage(m ResponsesInputMessage) (api.Message, error) {
// Response types for the Responses API
// ResponsesTextField represents the text output configuration in the response.
type ResponsesTextField struct {
Format ResponsesTextFormat `json:"format"`
}
// ResponsesReasoningOutput represents reasoning configuration in the response.
type ResponsesReasoningOutput struct {
Effort *string `json:"effort,omitempty"`
Summary *string `json:"summary,omitempty"`
}
// ResponsesError represents an error in the response.
type ResponsesError struct {
Code string `json:"code"`
Message string `json:"message"`
}
// ResponsesIncompleteDetails represents details about why a response was incomplete.
type ResponsesIncompleteDetails struct {
Reason string `json:"reason"`
}
type ResponsesResponse struct {
ID string `json:"id"`
Object string `json:"object"`
CreatedAt int64 `json:"created_at"`
CompletedAt *int64 `json:"completed_at"`
Status string `json:"status"`
IncompleteDetails *ResponsesIncompleteDetails `json:"incomplete_details"`
Model string `json:"model"`
PreviousResponseID *string `json:"previous_response_id"`
Instructions *string `json:"instructions"`
Output []ResponsesOutputItem `json:"output"`
Error *ResponsesError `json:"error"`
Tools []ResponsesTool `json:"tools"`
ToolChoice any `json:"tool_choice"`
Truncation string `json:"truncation"`
ParallelToolCalls bool `json:"parallel_tool_calls"`
Text ResponsesTextField `json:"text"`
TopP float64 `json:"top_p"`
PresencePenalty float64 `json:"presence_penalty"`
FrequencyPenalty float64 `json:"frequency_penalty"`
TopLogprobs int `json:"top_logprobs"`
Temperature float64 `json:"temperature"`
Reasoning *ResponsesReasoningOutput `json:"reasoning"`
Usage *ResponsesUsage `json:"usage"`
MaxOutputTokens *int `json:"max_output_tokens"`
MaxToolCalls *int `json:"max_tool_calls"`
Store bool `json:"store"`
Background bool `json:"background"`
ServiceTier string `json:"service_tier"`
Metadata map[string]any `json:"metadata"`
SafetyIdentifier *string `json:"safety_identifier"`
PromptCacheKey *string `json:"prompt_cache_key"`
ID string `json:"id"`
Object string `json:"object"`
CreatedAt int64 `json:"created_at"`
Status string `json:"status"`
Model string `json:"model"`
Output []ResponsesOutputItem `json:"output"`
Usage *ResponsesUsage `json:"usage,omitempty"`
// TODO(drifkin): add `temperature` and `top_p` to the response, but this
// requires additional plumbing to find the effective values since the
// defaults can come from the model or the request
}
type ResponsesOutputItem struct {
@@ -599,39 +550,18 @@ type ResponsesReasoningSummary struct {
}
type ResponsesOutputContent struct {
Type string `json:"type"` // "output_text"
Text string `json:"text"`
Annotations []any `json:"annotations"`
Logprobs []any `json:"logprobs"`
}
type ResponsesInputTokensDetails struct {
CachedTokens int `json:"cached_tokens"`
}
type ResponsesOutputTokensDetails struct {
ReasoningTokens int `json:"reasoning_tokens"`
Type string `json:"type"` // "output_text"
Text string `json:"text"`
}
type ResponsesUsage struct {
InputTokens int `json:"input_tokens"`
OutputTokens int `json:"output_tokens"`
TotalTokens int `json:"total_tokens"`
InputTokensDetails ResponsesInputTokensDetails `json:"input_tokens_details"`
OutputTokensDetails ResponsesOutputTokensDetails `json:"output_tokens_details"`
InputTokens int `json:"input_tokens"`
OutputTokens int `json:"output_tokens"`
TotalTokens int `json:"total_tokens"`
}
// derefFloat64 returns the value of a float64 pointer, or a default if nil.
func derefFloat64(p *float64, def float64) float64 {
if p != nil {
return *p
}
return def
}
// ToResponse converts an api.ChatResponse to a Responses API response.
// The request is used to echo back request parameters in the response.
func ToResponse(model, responseID, itemID string, chatResponse api.ChatResponse, request ResponsesRequest) ResponsesResponse {
// ToResponse converts an api.ChatResponse to a Responses API response
func ToResponse(model, responseID, itemID string, chatResponse api.ChatResponse) ResponsesResponse {
var output []ResponsesOutputItem
// Add reasoning item if thinking is present
@@ -655,7 +585,6 @@ func ToResponse(model, responseID, itemID string, chatResponse api.ChatResponse,
output = append(output, ResponsesOutputItem{
ID: fmt.Sprintf("fc_%s_%d", responseID, i),
Type: "function_call",
Status: "completed",
CallID: tc.ID,
Name: tc.Function.Name,
Arguments: tc.Function.Arguments,
@@ -669,90 +598,25 @@ func ToResponse(model, responseID, itemID string, chatResponse api.ChatResponse,
Role: "assistant",
Content: []ResponsesOutputContent{
{
Type: "output_text",
Text: chatResponse.Message.Content,
Annotations: []any{},
Logprobs: []any{},
Type: "output_text",
Text: chatResponse.Message.Content,
},
},
})
}
var instructions *string
if request.Instructions != "" {
instructions = &request.Instructions
}
// Build truncation with default
truncation := "disabled"
if request.Truncation != nil {
truncation = *request.Truncation
}
tools := request.Tools
if tools == nil {
tools = []ResponsesTool{}
}
text := ResponsesTextField{
Format: ResponsesTextFormat{Type: "text"},
}
if request.Text != nil && request.Text.Format != nil {
text.Format = *request.Text.Format
}
// Build reasoning output from request
var reasoning *ResponsesReasoningOutput
if request.Reasoning.Effort != "" || request.Reasoning.Summary != "" {
reasoning = &ResponsesReasoningOutput{}
if request.Reasoning.Effort != "" {
reasoning.Effort = &request.Reasoning.Effort
}
if request.Reasoning.Summary != "" {
reasoning.Summary = &request.Reasoning.Summary
}
}
return ResponsesResponse{
ID: responseID,
Object: "response",
CreatedAt: chatResponse.CreatedAt.Unix(),
CompletedAt: nil, // Set by middleware when writing final response
Status: "completed",
IncompleteDetails: nil, // Only populated if response incomplete
Model: model,
PreviousResponseID: nil, // Not supported
Instructions: instructions,
Output: output,
Error: nil, // Only populated on failure
Tools: tools,
ToolChoice: "auto", // Default value
Truncation: truncation,
ParallelToolCalls: true, // Default value
Text: text,
TopP: derefFloat64(request.TopP, 1.0),
PresencePenalty: 0, // Default value
FrequencyPenalty: 0, // Default value
TopLogprobs: 0, // Default value
Temperature: derefFloat64(request.Temperature, 1.0),
Reasoning: reasoning,
ID: responseID,
Object: "response",
CreatedAt: chatResponse.CreatedAt.Unix(),
Status: "completed",
Model: model,
Output: output,
Usage: &ResponsesUsage{
InputTokens: chatResponse.PromptEvalCount,
OutputTokens: chatResponse.EvalCount,
TotalTokens: chatResponse.PromptEvalCount + chatResponse.EvalCount,
// TODO(drifkin): wire through the actual values
InputTokensDetails: ResponsesInputTokensDetails{CachedTokens: 0},
// TODO(drifkin): wire through the actual values
OutputTokensDetails: ResponsesOutputTokensDetails{ReasoningTokens: 0},
},
MaxOutputTokens: request.MaxOutputTokens,
MaxToolCalls: nil, // Not supported
Store: false, // We don't store responses
Background: request.Background,
ServiceTier: "default", // Default value
Metadata: map[string]any{},
SafetyIdentifier: nil, // Not supported
PromptCacheKey: nil, // Not supported
}
}
@@ -772,7 +636,6 @@ type ResponsesStreamConverter struct {
responseID string
itemID string
model string
request ResponsesRequest
// State tracking (mutated across Process calls)
firstWrite bool
@@ -805,12 +668,11 @@ func (c *ResponsesStreamConverter) newEvent(eventType string, data map[string]an
}
// NewResponsesStreamConverter creates a new converter with the given configuration.
func NewResponsesStreamConverter(responseID, itemID, model string, request ResponsesRequest) *ResponsesStreamConverter {
func NewResponsesStreamConverter(responseID, itemID, model string) *ResponsesStreamConverter {
return &ResponsesStreamConverter{
responseID: responseID,
itemID: itemID,
model: model,
request: request,
firstWrite: true,
}
}
@@ -855,120 +717,25 @@ func (c *ResponsesStreamConverter) Process(r api.ChatResponse) []ResponsesStream
return events
}
// buildResponseObject creates a full response object with all required fields for streaming events.
func (c *ResponsesStreamConverter) buildResponseObject(status string, output []any, usage map[string]any) map[string]any {
var instructions any = nil
if c.request.Instructions != "" {
instructions = c.request.Instructions
}
truncation := "disabled"
if c.request.Truncation != nil {
truncation = *c.request.Truncation
}
var tools []any
if c.request.Tools != nil {
for _, t := range c.request.Tools {
tools = append(tools, map[string]any{
"type": t.Type,
"name": t.Name,
"description": t.Description,
"strict": t.Strict,
"parameters": t.Parameters,
})
}
}
if tools == nil {
tools = []any{}
}
textFormat := map[string]any{"type": "text"}
if c.request.Text != nil && c.request.Text.Format != nil {
textFormat = map[string]any{
"type": c.request.Text.Format.Type,
}
if c.request.Text.Format.Name != "" {
textFormat["name"] = c.request.Text.Format.Name
}
if c.request.Text.Format.Schema != nil {
textFormat["schema"] = c.request.Text.Format.Schema
}
if c.request.Text.Format.Strict != nil {
textFormat["strict"] = *c.request.Text.Format.Strict
}
}
var reasoning any = nil
if c.request.Reasoning.Effort != "" || c.request.Reasoning.Summary != "" {
r := map[string]any{}
if c.request.Reasoning.Effort != "" {
r["effort"] = c.request.Reasoning.Effort
} else {
r["effort"] = nil
}
if c.request.Reasoning.Summary != "" {
r["summary"] = c.request.Reasoning.Summary
} else {
r["summary"] = nil
}
reasoning = r
}
// Build top_p and temperature with defaults
topP := 1.0
if c.request.TopP != nil {
topP = *c.request.TopP
}
temperature := 1.0
if c.request.Temperature != nil {
temperature = *c.request.Temperature
}
return map[string]any{
"id": c.responseID,
"object": "response",
"created_at": time.Now().Unix(),
"completed_at": nil,
"status": status,
"incomplete_details": nil,
"model": c.model,
"previous_response_id": nil,
"instructions": instructions,
"output": output,
"error": nil,
"tools": tools,
"tool_choice": "auto",
"truncation": truncation,
"parallel_tool_calls": true,
"text": map[string]any{"format": textFormat},
"top_p": topP,
"presence_penalty": 0,
"frequency_penalty": 0,
"top_logprobs": 0,
"temperature": temperature,
"reasoning": reasoning,
"usage": usage,
"max_output_tokens": c.request.MaxOutputTokens,
"max_tool_calls": nil,
"store": false,
"background": c.request.Background,
"service_tier": "default",
"metadata": map[string]any{},
"safety_identifier": nil,
"prompt_cache_key": nil,
}
}
func (c *ResponsesStreamConverter) createResponseCreatedEvent() ResponsesStreamEvent {
return c.newEvent("response.created", map[string]any{
"response": c.buildResponseObject("in_progress", []any{}, nil),
"response": map[string]any{
"id": c.responseID,
"object": "response",
"status": "in_progress",
"output": []any{},
},
})
}
func (c *ResponsesStreamConverter) createResponseInProgressEvent() ResponsesStreamEvent {
return c.newEvent("response.in_progress", map[string]any{
"response": c.buildResponseObject("in_progress", []any{}, nil),
"response": map[string]any{
"id": c.responseID,
"object": "response",
"status": "in_progress",
"output": []any{},
},
})
}
@@ -995,10 +762,9 @@ func (c *ResponsesStreamConverter) processThinking(thinking string) []ResponsesS
// Emit delta
events = append(events, c.newEvent("response.reasoning_summary_text.delta", map[string]any{
"item_id": c.reasoningItemID,
"output_index": c.outputIndex,
"summary_index": 0,
"delta": thinking,
"item_id": c.reasoningItemID,
"output_index": c.outputIndex,
"delta": thinking,
}))
// TODO(drifkin): consider adding
@@ -1017,10 +783,9 @@ func (c *ResponsesStreamConverter) finishReasoning() []ResponsesStreamEvent {
events := []ResponsesStreamEvent{
c.newEvent("response.reasoning_summary_text.done", map[string]any{
"item_id": c.reasoningItemID,
"output_index": c.outputIndex,
"summary_index": 0,
"text": c.accumulatedThinking,
"item_id": c.reasoningItemID,
"output_index": c.outputIndex,
"text": c.accumulatedThinking,
}),
c.newEvent("response.output_item.done", map[string]any{
"output_index": c.outputIndex,
@@ -1133,10 +898,8 @@ func (c *ResponsesStreamConverter) processTextContent(content string) []Response
"output_index": c.outputIndex,
"content_index": c.contentIndex,
"part": map[string]any{
"type": "output_text",
"text": "",
"annotations": []any{},
"logprobs": []any{},
"type": "output_text",
"text": "",
},
}))
}
@@ -1150,7 +913,6 @@ func (c *ResponsesStreamConverter) processTextContent(content string) []Response
"output_index": c.outputIndex,
"content_index": 0,
"delta": content,
"logprobs": []any{},
}))
return events
@@ -1182,10 +944,8 @@ func (c *ResponsesStreamConverter) buildFinalOutput() []any {
"status": "completed",
"role": "assistant",
"content": []map[string]any{{
"type": "output_text",
"text": c.accumulatedText,
"annotations": []any{},
"logprobs": []any{},
"type": "output_text",
"text": c.accumulatedText,
}},
})
}
@@ -1207,7 +967,6 @@ func (c *ResponsesStreamConverter) processCompletion(r api.ChatResponse) []Respo
"output_index": c.outputIndex,
"content_index": 0,
"text": c.accumulatedText,
"logprobs": []any{},
}))
// response.content_part.done
@@ -1216,10 +975,8 @@ func (c *ResponsesStreamConverter) processCompletion(r api.ChatResponse) []Respo
"output_index": c.outputIndex,
"content_index": 0,
"part": map[string]any{
"type": "output_text",
"text": c.accumulatedText,
"annotations": []any{},
"logprobs": []any{},
"type": "output_text",
"text": c.accumulatedText,
},
}))
@@ -1232,31 +989,26 @@ func (c *ResponsesStreamConverter) processCompletion(r api.ChatResponse) []Respo
"status": "completed",
"role": "assistant",
"content": []map[string]any{{
"type": "output_text",
"text": c.accumulatedText,
"annotations": []any{},
"logprobs": []any{},
"type": "output_text",
"text": c.accumulatedText,
}},
},
}))
}
// response.completed
usage := map[string]any{
"input_tokens": r.PromptEvalCount,
"output_tokens": r.EvalCount,
"total_tokens": r.PromptEvalCount + r.EvalCount,
"input_tokens_details": map[string]any{
"cached_tokens": 0,
},
"output_tokens_details": map[string]any{
"reasoning_tokens": 0,
},
}
response := c.buildResponseObject("completed", c.buildFinalOutput(), usage)
response["completed_at"] = time.Now().Unix()
events = append(events, c.newEvent("response.completed", map[string]any{
"response": response,
"response": map[string]any{
"id": c.responseID,
"object": "response",
"status": "completed",
"output": c.buildFinalOutput(),
"usage": map[string]any{
"input_tokens": r.PromptEvalCount,
"output_tokens": r.EvalCount,
"total_tokens": r.PromptEvalCount + r.EvalCount,
},
},
}))
return events

View File

@@ -850,7 +850,7 @@ func TestFromResponsesRequest_Images(t *testing.T) {
}
func TestResponsesStreamConverter_TextOnly(t *testing.T) {
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
// First chunk with content
events := converter.Process(api.ChatResponse{
@@ -916,7 +916,7 @@ func TestResponsesStreamConverter_TextOnly(t *testing.T) {
}
func TestResponsesStreamConverter_ToolCalls(t *testing.T) {
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
events := converter.Process(api.ChatResponse{
Message: api.Message{
@@ -952,7 +952,7 @@ func TestResponsesStreamConverter_ToolCalls(t *testing.T) {
}
func TestResponsesStreamConverter_Reasoning(t *testing.T) {
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
// First chunk with thinking
events := converter.Process(api.ChatResponse{
@@ -1267,7 +1267,7 @@ func TestToResponse_WithReasoning(t *testing.T) {
Content: "The answer is 42",
},
Done: true,
}, ResponsesRequest{})
})
// Should have 2 output items: reasoning + message
if len(response.Output) != 2 {
@@ -1638,7 +1638,7 @@ func TestFromResponsesRequest_ShorthandFormats(t *testing.T) {
func TestResponsesStreamConverter_OutputIncludesContent(t *testing.T) {
// Verify that response.output_item.done includes content field for messages
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
// First chunk
converter.Process(api.ChatResponse{
@@ -1686,7 +1686,7 @@ func TestResponsesStreamConverter_OutputIncludesContent(t *testing.T) {
func TestResponsesStreamConverter_ResponseCompletedIncludesOutput(t *testing.T) {
// Verify that response.completed includes the output array
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
// Process some content
converter.Process(api.ChatResponse{
@@ -1730,7 +1730,7 @@ func TestResponsesStreamConverter_ResponseCompletedIncludesOutput(t *testing.T)
func TestResponsesStreamConverter_ResponseCreatedIncludesOutput(t *testing.T) {
// Verify that response.created includes an empty output array
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
events := converter.Process(api.ChatResponse{
Message: api.Message{Content: "Hi"},
@@ -1757,7 +1757,7 @@ func TestResponsesStreamConverter_ResponseCreatedIncludesOutput(t *testing.T) {
func TestResponsesStreamConverter_SequenceNumbers(t *testing.T) {
// Verify that events include incrementing sequence numbers
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
events := converter.Process(api.ChatResponse{
Message: api.Message{Content: "Hello"},
@@ -1791,7 +1791,7 @@ func TestResponsesStreamConverter_SequenceNumbers(t *testing.T) {
func TestResponsesStreamConverter_FunctionCallStatus(t *testing.T) {
// Verify that function call items include status field
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b", ResponsesRequest{})
converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b")
events := converter.Process(api.ChatResponse{
Message: api.Message{

View File

@@ -5,7 +5,6 @@ import (
"fmt"
"io"
"os"
"strings"
)
type Prompt struct {
@@ -37,11 +36,10 @@ type Terminal struct {
}
type Instance struct {
Prompt *Prompt
Terminal *Terminal
History *History
Pasting bool
pastedLines []string
Prompt *Prompt
Terminal *Terminal
History *History
Pasting bool
}
func New(prompt Prompt) (*Instance, error) {
@@ -176,8 +174,6 @@ func (i *Instance) Readline() (string, error) {
case CharEsc:
esc = true
case CharInterrupt:
i.pastedLines = nil
i.Prompt.UseAlt = false
return "", ErrInterrupt
case CharPrev:
i.historyPrev(buf, &currentLineBuf)
@@ -192,23 +188,7 @@ func (i *Instance) Readline() (string, error) {
case CharForward:
buf.MoveRight()
case CharBackspace, CharCtrlH:
if buf.IsEmpty() && len(i.pastedLines) > 0 {
lastIdx := len(i.pastedLines) - 1
prevLine := i.pastedLines[lastIdx]
i.pastedLines = i.pastedLines[:lastIdx]
fmt.Print(CursorBOL + ClearToEOL + CursorUp + CursorBOL + ClearToEOL)
if len(i.pastedLines) == 0 {
fmt.Print(i.Prompt.Prompt)
i.Prompt.UseAlt = false
} else {
fmt.Print(i.Prompt.AltPrompt)
}
for _, r := range prevLine {
buf.Add(r)
}
} else {
buf.Remove()
}
buf.Remove()
case CharTab:
// todo: convert back to real tabs
for range 8 {
@@ -231,28 +211,13 @@ func (i *Instance) Readline() (string, error) {
case CharCtrlZ:
fd := os.Stdin.Fd()
return handleCharCtrlZ(fd, i.Terminal.termios)
case CharCtrlJ:
i.pastedLines = append(i.pastedLines, buf.String())
buf.Buf.Clear()
buf.Pos = 0
buf.DisplayPos = 0
buf.LineHasSpace.Clear()
fmt.Println()
fmt.Print(i.Prompt.AltPrompt)
i.Prompt.UseAlt = true
continue
case CharEnter:
case CharEnter, CharCtrlJ:
output := buf.String()
if len(i.pastedLines) > 0 {
output = strings.Join(i.pastedLines, "\n") + "\n" + output
i.pastedLines = nil
}
if output != "" {
i.History.Add(output)
}
buf.MoveToEnd()
fmt.Println()
i.Prompt.UseAlt = false
return output, nil
default:

View File

@@ -179,7 +179,7 @@ _build_macapp() {
fi
rm -f dist/Ollama-darwin.zip
ditto -c -k --norsrc --keepParent dist/Ollama.app dist/Ollama-darwin.zip
ditto -c -k --keepParent dist/Ollama.app dist/Ollama-darwin.zip
(cd dist/Ollama.app/Contents/Resources/; tar -cf - ollama ollama-mlx *.so *.dylib *.metallib 2>/dev/null) | gzip -9vc > dist/ollama-darwin.tgz
# Notarize and Staple
@@ -187,7 +187,7 @@ _build_macapp() {
$(xcrun -f notarytool) submit dist/Ollama-darwin.zip --wait --timeout 20m --apple-id "$APPLE_ID" --password "$APPLE_PASSWORD" --team-id "$APPLE_TEAM_ID"
rm -f dist/Ollama-darwin.zip
$(xcrun -f stapler) staple dist/Ollama.app
ditto -c -k --norsrc --keepParent dist/Ollama.app dist/Ollama-darwin.zip
ditto -c -k --keepParent dist/Ollama.app dist/Ollama-darwin.zip
rm -f dist/Ollama.dmg

View File

@@ -25,6 +25,14 @@ import (
"github.com/ollama/ollama/x/tools"
)
// MultilineState tracks the state of multiline input
type MultilineState int
const (
MultilineNone MultilineState = iota
MultilineSystem
)
// Tool output capping constants
const (
// localModelTokenLimit is the token limit for local models (smaller context).
@@ -648,7 +656,7 @@ func GenerateInteractive(cmd *cobra.Command, modelName string, wordWrap bool, op
Prompt: ">>> ",
AltPrompt: "... ",
Placeholder: "Send a message (/? for help)",
AltPlaceholder: "Press Enter to send",
AltPlaceholder: `Use """ to end multi-line input`,
})
if err != nil {
return err
@@ -699,6 +707,7 @@ func GenerateInteractive(cmd *cobra.Command, modelName string, wordWrap bool, op
var sb strings.Builder
var format string
var system string
var multiline MultilineState = MultilineNone
for {
line, err := scanner.Readline()
@@ -712,12 +721,37 @@ func GenerateInteractive(cmd *cobra.Command, modelName string, wordWrap bool, op
}
scanner.Prompt.UseAlt = false
sb.Reset()
multiline = MultilineNone
continue
case err != nil:
return err
}
switch {
case multiline != MultilineNone:
// check if there's a multiline terminating string
before, ok := strings.CutSuffix(line, `"""`)
sb.WriteString(before)
if !ok {
fmt.Fprintln(&sb)
continue
}
switch multiline {
case MultilineSystem:
system = sb.String()
newMessage := api.Message{Role: "system", Content: system}
if len(messages) > 0 && messages[len(messages)-1].Role == "system" {
messages[len(messages)-1] = newMessage
} else {
messages = append(messages, newMessage)
}
fmt.Println("Set system message.")
sb.Reset()
}
multiline = MultilineNone
scanner.Prompt.UseAlt = false
case strings.HasPrefix(line, "/exit"), strings.HasPrefix(line, "/bye"):
return nil
case strings.HasPrefix(line, "/clear"):
@@ -826,18 +860,41 @@ func GenerateInteractive(cmd *cobra.Command, modelName string, wordWrap bool, op
options[args[2]] = fp[args[2]]
case "system":
if len(args) < 3 {
fmt.Println("Usage: /set system <message>")
fmt.Println("Usage: /set system <message> or /set system \"\"\"<multi-line message>\"\"\"")
continue
}
system = strings.Join(args[2:], " ")
newMessage := api.Message{Role: "system", Content: system}
multiline = MultilineSystem
line := strings.Join(args[2:], " ")
line, ok := strings.CutPrefix(line, `"""`)
if !ok {
multiline = MultilineNone
} else {
// only cut suffix if the line is multiline
line, ok = strings.CutSuffix(line, `"""`)
if ok {
multiline = MultilineNone
}
}
sb.WriteString(line)
if multiline != MultilineNone {
scanner.Prompt.UseAlt = true
continue
}
system = sb.String()
newMessage := api.Message{Role: "system", Content: sb.String()}
// Check if the slice is not empty and the last message is from 'system'
if len(messages) > 0 && messages[len(messages)-1].Role == "system" {
// Replace the last message
messages[len(messages)-1] = newMessage
} else {
messages = append(messages, newMessage)
}
fmt.Println("Set system message.")
sb.Reset()
continue
default:
fmt.Printf("Unknown command '/set %s'. Type /? for help\n", args[1])
@@ -1024,7 +1081,7 @@ func GenerateInteractive(cmd *cobra.Command, modelName string, wordWrap bool, op
sb.WriteString(line)
}
if sb.Len() > 0 {
if sb.Len() > 0 && multiline == MultilineNone {
newMessage := api.Message{Role: "user", Content: sb.String()}
messages = append(messages, newMessage)
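Editorial sketch of the multi-line behavior introduced by the hunks above: input that opens with `"""` keeps accumulating lines until a closing `"""` is seen, using `strings.CutPrefix` and `strings.CutSuffix` as in the diff. The function below is illustrative only; its name and shape are not from the repository.

```go
package main

import (
	"fmt"
	"strings"
)

// collectMultiline mimics the `"""` handling: a leading `"""` starts a block
// that ends at a trailing `"""`; anything else is treated as single-line input.
func collectMultiline(lines []string) (string, bool) {
	var sb strings.Builder
	multiline := false
	for _, line := range lines {
		if !multiline {
			rest, ok := strings.CutPrefix(line, `"""`)
			if !ok {
				return line, true // plain single-line input
			}
			if body, closed := strings.CutSuffix(rest, `"""`); closed {
				return body, true // opened and closed on the same line
			}
			sb.WriteString(rest + "\n")
			multiline = true
			continue
		}
		if body, closed := strings.CutSuffix(line, `"""`); closed {
			return sb.String() + body, true
		}
		sb.WriteString(line + "\n")
	}
	return sb.String(), false // input ended before the closing """
}

func main() {
	out, done := collectMultiline([]string{`"""You are concise.`, "Answer briefly.", `Be kind."""`})
	fmt.Println(done) // true
	fmt.Println(out)  // the three lines joined with newlines
}
```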

View File

@@ -11,9 +11,11 @@ import (
"os"
"path/filepath"
"runtime/pprof"
"strings"
"github.com/ollama/ollama/x/imagegen/mlx"
"github.com/ollama/ollama/x/imagegen/models/gemma3"
"github.com/ollama/ollama/x/imagegen/models/glm_image"
"github.com/ollama/ollama/x/imagegen/models/gpt_oss"
"github.com/ollama/ollama/x/imagegen/models/llama"
"github.com/ollama/ollama/x/imagegen/models/qwen_image"
@@ -61,6 +63,7 @@ func main() {
// Legacy mode flags
zimageFlag := flag.Bool("zimage", false, "Z-Image generation")
glmImageFlag := flag.Bool("glm-image", false, "GLM-Image generation")
qwenImage := flag.Bool("qwen-image", false, "Qwen-Image text-to-image generation")
qwenImageEdit := flag.Bool("qwen-image-edit", false, "Qwen-Image-Edit image editing")
var inputImages stringSlice
@@ -117,6 +120,33 @@ func main() {
if err == nil {
err = saveImageArray(img, *out)
}
case *glmImageFlag:
m := &glm_image.Model{}
// Use LoadFromPath if model path looks like a directory, otherwise use Load (ollama manifest)
var loadErr error
if strings.HasPrefix(*modelPath, ".") || strings.HasPrefix(*modelPath, "/") {
loadErr = m.LoadFromPath(*modelPath)
} else {
loadErr = m.Load(*modelPath)
}
if loadErr != nil {
log.Fatal(loadErr)
}
var img *mlx.Array
img, err = m.GenerateFromConfig(context.Background(), &glm_image.GenerateConfig{
Prompt: *prompt,
Width: int32(*width),
Height: int32(*height),
Steps: *steps,
Seed: *seed,
Temperature: float32(*temperature),
TopP: float32(*topP),
GuidanceScale: float32(*cfgScale),
MaxVisualTokens: int32(*maxTokens),
})
if err == nil {
err = saveImageArray(img, *out)
}
case *qwenImage:
m, loadErr := qwen_image.LoadPersistent(*modelPath)
if loadErr != nil {

View File

@@ -48,7 +48,7 @@ func CreateModel(modelName, modelDir, quantize string, createLayer LayerCreator,
var totalParams int64 // Count parameters from original tensor shapes
// Components to process - extract individual tensors from each
components := []string{"text_encoder", "transformer", "vae"}
components := []string{"text_encoder", "transformer", "vae", "vision_language_encoder"}
for _, component := range components {
componentDir := filepath.Join(modelDir, component)
@@ -126,10 +126,13 @@ func CreateModel(modelName, modelDir, quantize string, createLayer LayerCreator,
"text_encoder/generation_config.json",
"transformer/config.json",
"vae/config.json",
"vision_language_encoder/config.json",
"scheduler/scheduler_config.json",
"tokenizer/tokenizer.json",
"tokenizer/tokenizer_config.json",
"tokenizer/vocab.json",
"processor/tokenizer.json", // GLM-Image main tokenizer
"processor/tokenizer_config.json", // GLM-Image tokenizer config
}
for _, cfgPath := range configFiles {

x/imagegen/imagegen.md (new file, 19 lines)
View File

@@ -0,0 +1,19 @@
# Image generation models (experimental)
Experimental image generation models are available for **macOS** in Ollama:
## Available models
- [Z-Image-Turbo](https://ollama.com/x/z-image-turbo)
```
ollama run x/z-image-turbo
```
> **Note**: [`x`](https://ollama.com/x) is a username on ollama.com where the maintainer team uploads experimental models.
More models coming soon:
1. Qwen-Image-2512
2. Qwen-Image-Edit-2511
3. GLM-Image

View File

@@ -27,6 +27,7 @@ var modelVRAMEstimates = map[string]uint64{
"ZImagePipeline": 21 * GB, // ~21GB for Z-Image (text encoder + transformer + VAE)
"FluxPipeline": 21 * GB, // ~21GB for Flux (same architecture)
"QwenImagePipeline": 80 * GB, // TODO: verify actual requirements, using conservative estimate for now
"GlmImagePipeline": 80 * GB, // ~34GB weights + ~46GB working memory for 9B+7B hybrid model
}
// CheckPlatformSupport validates that image generation is supported on the current platform.

View File

@@ -0,0 +1,693 @@
//go:build mlx
// Package glm_image implements the GLM-Image hybrid AR + diffusion model.
package glm_image
import (
"context"
"fmt"
"math"
"path/filepath"
"time"
"github.com/ollama/ollama/x/imagegen"
"github.com/ollama/ollama/x/imagegen/mlx"
)
// ByT5Tokenizer is a simple byte-level tokenizer for ByT5
// ByT5 uses bytes as tokens: each byte (0-255) maps to token ID (3-258)
// Special tokens: 0=pad, 1=eos, 2=unk
type ByT5Tokenizer struct {
PadTokenID int32
EOSTokenID int32
UNKTokenID int32
}
// NewByT5Tokenizer creates a new ByT5 tokenizer
func NewByT5Tokenizer() *ByT5Tokenizer {
return &ByT5Tokenizer{
PadTokenID: 0,
EOSTokenID: 1,
UNKTokenID: 2,
}
}
// Encode converts a string to token IDs
func (t *ByT5Tokenizer) Encode(text string) []int32 {
bytes := []byte(text)
tokens := make([]int32, len(bytes))
for i, b := range bytes {
// Standard ByT5 tokenization: bytes 0-255 map to tokens 3-258
// (tokens 0, 1, 2 are PAD, EOS, UNK)
tokens[i] = int32(b) + 3
}
return tokens
}
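// Editorial note (not part of the original file): with this mapping,
// Encode("Hi") yields [75, 108], since 'H' (72) and 'i' (105) are each
// shifted past the three special tokens; Decode reverses the shift.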
// Decode converts token IDs back to a string
func (t *ByT5Tokenizer) Decode(tokens []int32) string {
bytes := make([]byte, 0, len(tokens))
for _, tok := range tokens {
if tok >= 3 && tok < 259 {
bytes = append(bytes, byte(tok-3))
}
}
return string(bytes)
}
// GenerateConfig holds all options for image generation.
type GenerateConfig struct {
Prompt string
NegativePrompt string // For CFG (optional, not typically used with GLM-Image)
GuidanceScale float32 // Guidance scale (default: 1.5)
Width int32 // Image width (default: 1024, must be divisible by 32)
Height int32 // Image height (default: 1024, must be divisible by 32)
Steps int // Diffusion denoising steps (default: 50)
Seed int64 // Random seed
Progress ProgressFunc // Optional progress callback
// AR generation options
MaxVisualTokens int32 // Max visual tokens to generate (default: 256)
Temperature float32 // AR sampling temperature (default: 0.9)
TopP float32 // Nucleus sampling (default: 0.75)
}
// ProgressFunc is called during generation with stage and step progress.
type ProgressFunc func(stage string, step, totalSteps int)
// Model represents a GLM-Image hybrid model.
type Model struct {
ModelName string
Tokenizer *ByT5Tokenizer // For T5 text encoder (glyph embeddings)
GLMTokenizer *GLMTokenizer // For AR model (visual token generation)
TextEncoder *T5TextEncoder
VisionLanguageEncoder *VisionLanguageEncoder
Transformer *DiffusionTransformer
VAEDecoder *VAEDecoder
}
// Load loads the GLM-Image model from ollama blob storage.
func (m *Model) Load(modelName string) error {
fmt.Printf("Loading GLM-Image model from manifest: %s...\n", modelName)
start := time.Now()
if mlx.GPUIsAvailable() {
mlx.SetDefaultDeviceGPU()
mlx.EnableCompile()
}
m.ModelName = modelName
// Load manifest
manifest, err := imagegen.LoadManifest(modelName)
if err != nil {
return fmt.Errorf("load manifest: %w", err)
}
// Create ByT5 tokenizer (byte-level, no vocabulary file needed)
// Used for T5 text encoder (glyph embeddings)
fmt.Print(" Creating ByT5 tokenizer... ")
m.Tokenizer = NewByT5Tokenizer()
fmt.Println("✓")
// Load GLM tokenizer for AR model (visual token generation)
fmt.Print(" Loading GLM tokenizer... ")
glmTok, err := NewGLMTokenizer(manifest)
if err != nil {
return fmt.Errorf("glm tokenizer: %w", err)
}
m.GLMTokenizer = glmTok
fmt.Println("✓")
// Load T5 text encoder (~830MB)
m.TextEncoder = &T5TextEncoder{}
if err := m.TextEncoder.Load(manifest); err != nil {
return fmt.Errorf("text encoder: %w", err)
}
mlx.Eval(mlx.Collect(m.TextEncoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load vision-language encoder (~19GB, 9B params)
m.VisionLanguageEncoder = &VisionLanguageEncoder{}
if err := m.VisionLanguageEncoder.Load(manifest); err != nil {
return fmt.Errorf("vision language encoder: %w", err)
}
mlx.Eval(mlx.Collect(m.VisionLanguageEncoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load diffusion transformer (~13GB, 7B params)
m.Transformer = &DiffusionTransformer{}
if err := m.Transformer.Load(manifest); err != nil {
return fmt.Errorf("transformer: %w", err)
}
mlx.Eval(mlx.Collect(m.Transformer)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load VAE decoder (~775MB)
m.VAEDecoder = &VAEDecoder{}
if err := m.VAEDecoder.Load(manifest); err != nil {
return fmt.Errorf("VAE decoder: %w", err)
}
mlx.Eval(mlx.Collect(m.VAEDecoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
mem := mlx.MetalGetActiveMemory()
fmt.Printf(" Loaded in %.2fs (%.1f GB VRAM)\n", time.Since(start).Seconds(), float64(mem)/(1024*1024*1024))
return nil
}
// LoadFromPath loads the model from a directory path (not ollama manifest)
func (m *Model) LoadFromPath(modelPath string) error {
fmt.Printf("Loading GLM-Image model from path: %s...\n", modelPath)
start := time.Now()
if mlx.GPUIsAvailable() {
mlx.SetDefaultDeviceGPU()
mlx.EnableCompile()
}
m.ModelName = modelPath
// Create ByT5 tokenizer (byte-level, no vocabulary file needed)
fmt.Print(" Creating ByT5 tokenizer... ")
m.Tokenizer = NewByT5Tokenizer()
fmt.Println("✓")
// Load GLM tokenizer for AR model (visual token generation)
fmt.Print(" Loading GLM tokenizer... ")
glmTok, err := NewGLMTokenizerFromPath(modelPath)
if err != nil {
return fmt.Errorf("glm tokenizer: %w", err)
}
m.GLMTokenizer = glmTok
fmt.Println("✓")
// Load T5 text encoder
m.TextEncoder = &T5TextEncoder{}
if err := m.TextEncoder.LoadFromPath(filepath.Join(modelPath, "text_encoder")); err != nil {
return fmt.Errorf("text encoder: %w", err)
}
mlx.Eval(mlx.Collect(m.TextEncoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load vision-language encoder
m.VisionLanguageEncoder = &VisionLanguageEncoder{}
if err := m.VisionLanguageEncoder.LoadFromPath(filepath.Join(modelPath, "vision_language_encoder")); err != nil {
return fmt.Errorf("vision language encoder: %w", err)
}
mlx.Eval(mlx.Collect(m.VisionLanguageEncoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load diffusion transformer
m.Transformer = &DiffusionTransformer{}
if err := m.Transformer.LoadFromPath(filepath.Join(modelPath, "transformer")); err != nil {
return fmt.Errorf("transformer: %w", err)
}
mlx.Eval(mlx.Collect(m.Transformer)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
// Load VAE decoder
m.VAEDecoder = &VAEDecoder{}
if err := m.VAEDecoder.LoadFromPath(filepath.Join(modelPath, "vae")); err != nil {
return fmt.Errorf("VAE decoder: %w", err)
}
mlx.Eval(mlx.Collect(m.VAEDecoder)...)
fmt.Printf(" (%.1f GB, peak %.1f GB)\n",
float64(mlx.MetalGetActiveMemory())/(1024*1024*1024),
float64(mlx.MetalGetPeakMemory())/(1024*1024*1024))
mem := mlx.MetalGetActiveMemory()
fmt.Printf(" Loaded in %.2fs (%.1f GB VRAM)\n", time.Since(start).Seconds(), float64(mem)/(1024*1024*1024))
return nil
}
// Generate creates an image from a prompt.
func (m *Model) Generate(prompt string, width, height int32, steps int, seed int64) (*mlx.Array, error) {
return m.GenerateFromConfig(context.Background(), &GenerateConfig{
Prompt: prompt,
Width: width,
Height: height,
Steps: steps,
Seed: seed,
})
}
// GenerateWithProgress creates an image with progress callback.
func (m *Model) GenerateWithProgress(prompt string, width, height int32, steps int, seed int64, progress ProgressFunc) (*mlx.Array, error) {
return m.GenerateFromConfig(context.Background(), &GenerateConfig{
Prompt: prompt,
Width: width,
Height: height,
Steps: steps,
Seed: seed,
Progress: progress,
})
}
// GenerateFromConfig generates an image using the unified config struct.
func (m *Model) GenerateFromConfig(ctx context.Context, cfg *GenerateConfig) (*mlx.Array, error) {
start := time.Now()
result, err := m.generate(ctx, cfg)
if err != nil {
return nil, err
}
fmt.Printf("Generated in %.2fs (%d diffusion steps)\n", time.Since(start).Seconds(), cfg.Steps)
return result, nil
}
// GenerateImage implements model.ImageModel interface.
func (m *Model) GenerateImage(ctx context.Context, prompt string, width, height int32, steps int, seed int64) (*mlx.Array, error) {
return m.Generate(prompt, width, height, steps, seed)
}
// generate is the internal generation pipeline.
func (m *Model) generate(ctx context.Context, cfg *GenerateConfig) (*mlx.Array, error) {
// Apply defaults
if cfg.Width <= 0 {
cfg.Width = 1024
}
if cfg.Height <= 0 {
cfg.Height = 1024
}
if cfg.Steps <= 0 {
cfg.Steps = 50
}
if cfg.GuidanceScale <= 0 {
cfg.GuidanceScale = 1.5
}
// Calculate MaxVisualTokens based on image dimensions
// GLM-Image generates TWO grids of visual tokens:
// 1. First: prev (small) grid - prevTokenH × prevTokenW tokens
// 2. Then: target (large) grid - tokenH × tokenW tokens
// After generation, we extract only the TARGET grid tokens for diffusion.
factor := int32(32)
tokenH := cfg.Height / factor
tokenW := cfg.Width / factor
targetGridTokens := tokenH * tokenW
// Compute prev grid dimensions using diffusers formula:
// ratio = token_h / token_w
// prev_token_h = int(sqrt(ratio) * 16)
// prev_token_w = int(sqrt(1/ratio) * 16)
ratio := float64(tokenH) / float64(tokenW)
prevTokenH := int32(math.Sqrt(ratio) * 16)
prevTokenW := int32(math.Sqrt(1/ratio) * 16)
prevGridTokens := prevTokenH * prevTokenW
// Total tokens to generate = prev grid + target grid
// (diffusers does max_new_tokens = total + 1 for EOS, but we stop on EOS anyway)
cfg.MaxVisualTokens = prevGridTokens + targetGridTokens
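// Editorial worked example (not part of the original file): for a 1024x1024
// image, tokenH = tokenW = 1024/32 = 32, so the target grid has 1024 tokens;
// ratio = 1 gives prevTokenH = prevTokenW = 16, a prev grid of 256 tokens,
// and MaxVisualTokens = 256 + 1024 = 1280.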
if cfg.Temperature <= 0 {
cfg.Temperature = 0.9
}
if cfg.TopP <= 0 {
cfg.TopP = 0.75
}
// Ensure dimensions are divisible by 32
cfg.Width = (cfg.Width / 32) * 32
cfg.Height = (cfg.Height / 32) * 32
tcfg := m.Transformer.Config
latentH := cfg.Height / 8
latentW := cfg.Width / 8
// Progress callback helper
progress := func(stage string, step, total int) {
if cfg.Progress != nil {
cfg.Progress(stage, step, total)
}
}
// === PHASE 1: T5 Text Encoding ===
fmt.Println("[T5] Encoding glyph text...")
progress("text_encoding", 0, 1)
textEmbed := m.TextEncoder.EncodePrompt(m.Tokenizer, cfg.Prompt)
mlx.Keep(textEmbed)
mlx.Eval(textEmbed)
fmt.Printf("[T5] Done, shape: %v\n", textEmbed.Shape())
progress("text_encoding", 1, 1)
// === PHASE 2: AR Visual Token Generation ===
fmt.Printf("[AR] Generating %d visual tokens...\n", cfg.MaxVisualTokens)
progress("ar_generation", 0, int(cfg.MaxVisualTokens))
visualTokens := m.VisionLanguageEncoder.Generate(
cfg.Prompt,
m.GLMTokenizer,
cfg.MaxVisualTokens,
cfg.Temperature,
cfg.TopP,
cfg.Seed,
cfg.Height,
cfg.Width,
func(step int) {
if step%100 == 0 || step < 10 {
fmt.Printf("[AR] Step %d/%d\n", step, cfg.MaxVisualTokens)
}
progress("ar_generation", step, int(cfg.MaxVisualTokens))
},
)
mlx.Keep(visualTokens)
mlx.Eval(visualTokens)
fmt.Printf("[AR] Done generating visual tokens\n")
progress("ar_generation", int(cfg.MaxVisualTokens), int(cfg.MaxVisualTokens))
vtShape := visualTokens.Shape()
totalGenerated := vtShape[1]
fmt.Printf("[AR] Generated %d tokens total\n", totalGenerated)
// Extract only the TARGET grid tokens (skip the prev grid tokens)
// diffusers: large_image_tokens = outputs[input_length + large_image_start_offset : ...]
// large_image_start_offset = prev_grid_size
var targetGridVisualTokens *mlx.Array
if totalGenerated >= prevGridTokens+targetGridTokens {
// Full generation completed - extract target grid
targetGridVisualTokens = mlx.Slice(visualTokens,
[]int32{0, prevGridTokens},
[]int32{1, prevGridTokens + targetGridTokens})
mlx.Keep(targetGridVisualTokens)
mlx.Eval(targetGridVisualTokens)
} else if totalGenerated > prevGridTokens {
// Partial target grid - take what we have
actualTargetTokens := totalGenerated - prevGridTokens
targetGridVisualTokens = mlx.Slice(visualTokens,
[]int32{0, prevGridTokens},
[]int32{1, totalGenerated})
mlx.Keep(targetGridVisualTokens)
mlx.Eval(targetGridVisualTokens)
fmt.Printf("WARNING: Partial target grid: got %d/%d target tokens\n",
actualTargetTokens, targetGridTokens)
} else {
// Not enough tokens - EOS came too early
return nil, fmt.Errorf("AR generation stopped too early: got %d tokens, need at least %d (prev grid) + 1",
totalGenerated, prevGridTokens)
}
// === PHASE 3: Diffusion Decoding ===
// Setup scheduler with dynamic shift based on image size
scheduler := NewFlowMatchScheduler(DefaultSchedulerConfig())
imgSeqLen := (latentH / tcfg.PatchSize) * (latentW / tcfg.PatchSize)
scheduler.SetTimestepsWithDynamicShift(cfg.Steps, imgSeqLen)
// Initialize noise latents [B, C, H, W]
latents := scheduler.InitNoise([]int32{1, tcfg.InChannels, latentH, latentW}, cfg.Seed)
mlx.Eval(latents)
// Upsample TARGET grid visual tokens 2x to match patch count (matching diffusers)
// target_grid tokens -> 2x upsample -> patch_count
// e.g., 32x32=1024 tokens -> 64x64=4096 patches for 1024x1024
visualTokensUpsampled := upsampleTokens(targetGridVisualTokens, tokenH, tokenW, 2)
// Prepare prior embeddings from upsampled visual tokens (VQ codebook lookup + projection)
priorEmbed := m.Transformer.EmbedPriorTokens(visualTokensUpsampled)
mlx.Keep(priorEmbed)
mlx.Eval(priorEmbed)
// Prepare text conditioning (project T5 embeddings)
textCond := m.Transformer.ProjectTextEmbeddings(textEmbed)
mlx.Keep(textCond)
mlx.Eval(textCond)
// === CFG Setup ===
// For classifier-free guidance, we need unconditional (negative) text embeddings
// GLM-Image uses empty string "" for negative prompt
doCFG := cfg.GuidanceScale > 1.0
var negativeTextCond *mlx.Array
if doCFG {
// Encode empty string for negative prompt
negativeTextEmbed := m.TextEncoder.EncodePrompt(m.Tokenizer, "")
mlx.Keep(negativeTextEmbed)
mlx.Eval(negativeTextEmbed)
negativeTextCond = m.Transformer.ProjectTextEmbeddings(negativeTextEmbed)
mlx.Keep(negativeTextCond)
mlx.Eval(negativeTextCond)
negativeTextEmbed.Free()
}
// Prepare conditioning inputs
targetSize := mlx.NewArray([]float32{float32(cfg.Height), float32(cfg.Width)}, []int32{1, 2})
cropCoords := mlx.NewArray([]float32{0, 0}, []int32{1, 2}) // Default: no crop offset
targetSize = mlx.ToBFloat16(targetSize)
cropCoords = mlx.ToBFloat16(cropCoords)
mlx.Keep(targetSize)
mlx.Keep(cropCoords)
mlx.Eval(targetSize, cropCoords)
pH := latentH / tcfg.PatchSize
pW := latentW / tcfg.PatchSize
// Denoising loop
fmt.Printf("[Diffusion] Starting %d denoising steps...\n", cfg.Steps)
progress("diffusion", 0, cfg.Steps)
for i := 0; i < cfg.Steps; i++ {
fmt.Printf("[Diffusion] Step %d/%d (timestep=%.1f)\n", i+1, cfg.Steps, scheduler.Timesteps[i]-1)
// Check for cancellation
if ctx != nil {
select {
case <-ctx.Done():
textEmbed.Free()
visualTokens.Free()
// visualTokensUpsampled points to visualTokens, don't double-free
priorEmbed.Free()
textCond.Free()
latents.Free()
return nil, ctx.Err()
default:
}
}
// Get timestep value for the transformer
// scheduler.Timesteps contains raw timestep values (from 1000 down to 1)
// Pass timestep - 1 to match diffusers: timestep = t.expand(latents.shape[0]) - 1
timestepVal := scheduler.Timesteps[i] - 1
timestep := mlx.ToBFloat16(mlx.NewArray([]float32{timestepVal}, []int32{1}))
// Patchify latents [B, C, H, W] -> [B, L, C*p*p]
patches := PatchifyLatents(latents, tcfg.PatchSize)
// Transformer forward with MMDiT architecture
// Conditional pass (with text + prior embeddings)
outputCond := m.Transformer.ForwardWithPriorDrop(
patches,
priorEmbed,
textCond,
timestep,
targetSize,
cropCoords,
pH,
pW,
false, // priorTokenDrop = false for conditional
)
// Unpatchify [B, L, C*p*p] -> [B, C, H, W]
noisePredCond := UnpatchifyLatents(outputCond, latentH, latentW, tcfg.PatchSize, tcfg.OutChannels)
var noisePred *mlx.Array
if doCFG {
// Unconditional pass (empty text, dropped prior embeddings)
outputUncond := m.Transformer.ForwardWithPriorDrop(
patches,
priorEmbed, // Still passed but will be ignored due to priorTokenDrop=true
negativeTextCond,
timestep,
targetSize,
cropCoords,
pH,
pW,
true, // priorTokenDrop = true for unconditional
)
noisePredUncond := UnpatchifyLatents(outputUncond, latentH, latentW, tcfg.PatchSize, tcfg.OutChannels)
// CFG formula: noise_pred = uncond + guidance_scale * (cond - uncond)
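// With guidance_scale = 1.0 this reduces to the conditional prediction alone;
// larger values push the result further from the unconditional baseline.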
diff := mlx.Sub(noisePredCond, noisePredUncond)
scaled := mlx.MulScalar(diff, cfg.GuidanceScale)
noisePred = mlx.Add(noisePredUncond, scaled)
} else {
noisePred = noisePredCond
}
// Scheduler step
oldLatents := latents
latents = scheduler.Step(noisePred, latents, i)
mlx.Eval(latents)
oldLatents.Free()
progress("diffusion", i+1, cfg.Steps)
}
// Cleanup intermediate arrays
textEmbed.Free()
visualTokens.Free()
// visualTokensUpsampled points to visualTokens, don't double-free
priorEmbed.Free()
textCond.Free()
if negativeTextCond != nil {
negativeTextCond.Free()
}
targetSize.Free()
cropCoords.Free()
// === PHASE 4: VAE Decode ===
progress("vae_decode", 0, 1)
decoded := m.VAEDecoder.Decode(latents)
mlx.Eval(decoded)
latents.Free()
progress("vae_decode", 1, 1)
return decoded, nil
}
// upsampleTokens performs nearest-neighbor upsampling of visual tokens
// Converts from prev_grid (e.g., 16x16) to target_grid (e.g., 32x32 for 2x, 64x64 for 4x)
// scale must be 2 or 4
//
// Handles early EOS gracefully: if tokens has fewer than prevH*prevW elements,
// missing tokens are padded with 0 (visual token padding value).
func upsampleTokens(tokens *mlx.Array, prevH, prevW int32, scale int32) *mlx.Array {
// tokens: [1, N] where N <= prevH*prevW (may be shorter if early EOS)
// Each token at (i, j) becomes scale*scale tokens in the output
mlx.Eval(tokens)
tokenData := tokens.DataInt32()
numTokens := int32(len(tokenData))
expectedTokens := prevH * prevW
// Warn if we got fewer tokens than expected (early EOS)
if numTokens < expectedTokens {
fmt.Printf("WARNING: upsampleTokens got %d tokens, expected %d (padding with 0)\n",
numTokens, expectedTokens)
}
targetH := prevH * scale
targetW := prevW * scale
upsampled := make([]int32, targetH*targetW)
for i := int32(0); i < prevH; i++ {
for j := int32(0); j < prevW; j++ {
srcIdx := i*prevW + j
// Handle early EOS: use 0 (padding) for missing tokens
var val int32
if srcIdx < numTokens {
val = tokenData[srcIdx]
} else {
val = 0 // Padding token
}
// Place in scale*scale positions
dstI := i * scale
dstJ := j * scale
for di := int32(0); di < scale; di++ {
for dj := int32(0); dj < scale; dj++ {
upsampled[(dstI+di)*targetW+(dstJ+dj)] = val
}
}
}
}
return mlx.NewArrayInt32(upsampled, []int32{1, targetH * targetW})
}
// PatchifyLatents converts [B, C, H, W] to [B, L, C*p*p]
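// Example (illustrative values: patch size p = 2, C = 16 latent channels):
// a [1, 16, 128, 128] latent gives pH = pW = 64, i.e. a [1, 4096, 64] output.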
func PatchifyLatents(latents *mlx.Array, patchSize int32) *mlx.Array {
shape := latents.Shape()
B := shape[0]
C := shape[1]
H := shape[2]
W := shape[3]
pH := H / patchSize
pW := W / patchSize
// Reshape: [B, C, H, W] -> [B, C, pH, p, pW, p]
x := mlx.Reshape(latents, B, C, pH, patchSize, pW, patchSize)
// Transpose: -> [B, pH, pW, C, p, p]
x = mlx.Transpose(x, 0, 2, 4, 1, 3, 5)
// Flatten: -> [B, pH*pW, C*p*p]
return mlx.Reshape(x, B, pH*pW, C*patchSize*patchSize)
}
// UnpatchifyLatents converts [B, L, C*p*p] back to [B, C, H, W]
func UnpatchifyLatents(patches *mlx.Array, H, W, patchSize, channels int32) *mlx.Array {
shape := patches.Shape()
B := shape[0]
pH := H / patchSize
pW := W / patchSize
// Reshape: [B, L, C*p*p] -> [B, pH, pW, C, p, p]
x := mlx.Reshape(patches, B, pH, pW, channels, patchSize, patchSize)
// Transpose: -> [B, C, pH, p, pW, p]
x = mlx.Transpose(x, 0, 3, 1, 4, 2, 5)
// Reshape: -> [B, C, H, W]
return mlx.Reshape(x, B, channels, pH*patchSize, pW*patchSize)
}
// CalculateShift computes the dynamic shift for flow matching based on image sequence length.
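// Worked example with the default scheduler config (base_shift 0.25, max_shift 0.75,
// base_image_seq_len 256): for imgSeqLen = 4096, m = sqrt(4096/256) = 4, so the
// shift is 4*0.75 + 0.25 = 3.25.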
func CalculateShift(imgSeqLen int32) float32 {
cfg := DefaultSchedulerConfig()
if !cfg.UseDynamicShifting {
return 0
}
// Sqrt-based shift calculation (matches diffusers)
m := float32(math.Sqrt(float64(imgSeqLen) / float64(cfg.BaseImageSeqLen)))
return m*cfg.MaxShift + cfg.BaseShift
}
// UpsampleTokens2x upsamples token IDs by 2x using nearest neighbor interpolation
// tokens: [B, H*W] -> [B, (H*2)*(W*2)]
// This matches diffusers' _upsample_token_ids function
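// For example, a 16x16 grid of 256 token IDs becomes a 32x32 grid of 1024 IDs,
// with each source ID repeated across a 2x2 block.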
func UpsampleTokens2x(tokens *mlx.Array, gridH, gridW int32) *mlx.Array {
shape := tokens.Shape()
B := shape[0]
// Reshape to [B, 1, H, W] for interpolation
tokens = mlx.Reshape(tokens, B, 1, gridH, gridW)
// Convert to float for interpolation
tokensFloat := mlx.AsType(tokens, mlx.DtypeFloat32)
// 2x nearest neighbor upsample
// [B, 1, H, W] -> [B, 1, H*2, W*2]
upsampled := nearestUpsample2x(tokensFloat)
// Convert back to int and reshape to [B, H*2*W*2]
upsampled = mlx.AsType(upsampled, mlx.DtypeInt32)
return mlx.Reshape(upsampled, B, gridH*2*gridW*2)
}
// nearestUpsample2x performs 2x nearest neighbor upsampling on NCHW tensor
func nearestUpsample2x(x *mlx.Array) *mlx.Array {
shape := x.Shape()
B := shape[0]
C := shape[1]
H := shape[2]
W := shape[3]
// Repeat each element 2x2
// [B, C, H, W] -> [B, C, H, 1, W, 1] -> [B, C, H, 2, W, 2] -> [B, C, H*2, W*2]
x = mlx.Reshape(x, B, C, H, 1, W, 1)
// Tile to repeat each pixel 2x2
x = mlx.Tile(x, []int32{1, 1, 1, 2, 1, 2})
// Reshape to final size
return mlx.Reshape(x, B, C, H*2, W*2)
}

View File

@@ -0,0 +1,358 @@
//go:build mlx
package glm_image
import (
"encoding/json"
"fmt"
"os"
"path/filepath"
"sort"
"strings"
"github.com/ollama/ollama/x/imagegen"
)
// GLMTokenizer implements the GLM tokenizer for the AR model
// This is a BPE-style tokenizer with ignore_merges=true, meaning it does
// greedy longest-match tokenization from the vocab without runtime merging.
type GLMTokenizer struct {
Vocab map[string]int32 // token string -> token ID
VocabReverse map[int32]string // token ID -> token string
SpecialTokens map[string]int32 // special token strings -> IDs
// Special token IDs
SopTokenID int32 // <sop> = grid_bos_token (167845)
EopTokenID int32 // <eop> = grid_eos_token (167846)
BosTokenID int32 // <|dit_token_16384|> = visual BOS (16384)
EosTokenID int32 // <|dit_token_16385|> = visual EOS (16385)
PadTokenID int32
// Sorted vocab keys by length (longest first) for greedy matching
sortedTokens []string
}
// tokenizerJSON represents the structure of tokenizer.json
type tokenizerJSON struct {
Model struct {
Vocab map[string]int32 `json:"vocab"`
} `json:"model"`
AddedTokens []struct {
ID int32 `json:"id"`
Content string `json:"content"`
Special bool `json:"special"`
} `json:"added_tokens"`
}
// NewGLMTokenizer creates a GLM tokenizer from the model manifest
func NewGLMTokenizer(manifest *imagegen.ModelManifest) (*GLMTokenizer, error) {
// Read tokenizer.json from processor directory in manifest
data, err := manifest.ReadConfig("processor/tokenizer.json")
if err != nil {
return nil, fmt.Errorf("failed to read tokenizer.json from manifest: %w", err)
}
var tj tokenizerJSON
if err := json.Unmarshal(data, &tj); err != nil {
return nil, fmt.Errorf("failed to parse tokenizer.json: %w", err)
}
tok := &GLMTokenizer{
Vocab: make(map[string]int32),
VocabReverse: make(map[int32]string),
SpecialTokens: make(map[string]int32),
}
// Load vocab from model section
for token, id := range tj.Model.Vocab {
tok.Vocab[token] = id
tok.VocabReverse[id] = token
}
// Load added tokens (special tokens including dit_tokens)
for _, at := range tj.AddedTokens {
tok.Vocab[at.Content] = at.ID
tok.VocabReverse[at.ID] = at.Content
if at.Special {
tok.SpecialTokens[at.Content] = at.ID
}
}
// Set special token IDs
tok.SopTokenID = 167845 // <sop>
tok.EopTokenID = 167846 // <eop>
tok.BosTokenID = 16384 // <|dit_token_16384|>
tok.EosTokenID = 16385 // <|dit_token_16385|>
tok.PadTokenID = 16385 // Same as EOS
// Build sorted token list for greedy matching (longest first)
tok.sortedTokens = make([]string, 0, len(tok.Vocab))
for token := range tok.Vocab {
tok.sortedTokens = append(tok.sortedTokens, token)
}
sort.Slice(tok.sortedTokens, func(i, j int) bool {
return len(tok.sortedTokens[i]) > len(tok.sortedTokens[j])
})
fmt.Printf("Loaded GLM tokenizer with %d tokens\n", len(tok.Vocab))
return tok, nil
}
// NewGLMTokenizerFromPath creates a GLM tokenizer from a directory path
func NewGLMTokenizerFromPath(modelPath string) (*GLMTokenizer, error) {
// Read tokenizer.json from processor directory
tokenizerPath := filepath.Join(modelPath, "processor", "tokenizer.json")
data, err := os.ReadFile(tokenizerPath)
if err != nil {
return nil, fmt.Errorf("failed to read tokenizer.json: %w", err)
}
var tj tokenizerJSON
if err := json.Unmarshal(data, &tj); err != nil {
return nil, fmt.Errorf("failed to parse tokenizer.json: %w", err)
}
tok := &GLMTokenizer{
Vocab: make(map[string]int32),
VocabReverse: make(map[int32]string),
SpecialTokens: make(map[string]int32),
}
// Load vocab from model section
for token, id := range tj.Model.Vocab {
tok.Vocab[token] = id
tok.VocabReverse[id] = token
}
// Load added tokens (special tokens including dit_tokens)
for _, at := range tj.AddedTokens {
tok.Vocab[at.Content] = at.ID
tok.VocabReverse[at.ID] = at.Content
if at.Special {
tok.SpecialTokens[at.Content] = at.ID
}
}
// Set special token IDs
tok.SopTokenID = 167845 // <sop>
tok.EopTokenID = 167846 // <eop>
tok.BosTokenID = 16384 // <|dit_token_16384|>
tok.EosTokenID = 16385 // <|dit_token_16385|>
tok.PadTokenID = 16385 // Same as EOS
// Build sorted token list for greedy matching (longest first)
tok.sortedTokens = make([]string, 0, len(tok.Vocab))
for token := range tok.Vocab {
tok.sortedTokens = append(tok.sortedTokens, token)
}
sort.Slice(tok.sortedTokens, func(i, j int) bool {
return len(tok.sortedTokens[i]) > len(tok.sortedTokens[j])
})
fmt.Printf("Loaded GLM tokenizer with %d tokens\n", len(tok.Vocab))
return tok, nil
}
// Encode tokenizes a string into token IDs
// This uses greedy longest-match tokenization with GPT-2 style space handling
func (t *GLMTokenizer) Encode(text string) []int32 {
if text == "" {
return []int32{}
}
var tokens []int32
// First, check for and handle special tokens
// Replace special tokens with placeholders, encode, then restore
specialReplacements := make(map[string]int32)
for special, id := range t.SpecialTokens {
if strings.Contains(text, special) {
specialReplacements[special] = id
}
}
// Process text character by character with special token handling
i := 0
isFirstToken := true
for i < len(text) {
// Check for special tokens first
foundSpecial := false
for special, id := range specialReplacements {
if strings.HasPrefix(text[i:], special) {
tokens = append(tokens, id)
i += len(special)
isFirstToken = false
foundSpecial = true
break
}
}
if foundSpecial {
continue
}
// Handle regular text with GPT-2 style space prefix
// "Ġ" (U+0120) represents a space before a token
remaining := text[i:]
// Try to find the longest matching token
matched := false
for _, token := range t.sortedTokens {
// Skip special tokens in regular matching
if _, isSpecial := t.SpecialTokens[token]; isSpecial {
continue
}
// Check if this token matches
tokenText := token
// Handle the Ġ prefix (represents space)
if strings.HasPrefix(token, "Ġ") {
// This token expects a leading space
if i > 0 || !isFirstToken {
// Check if remaining starts with space + token content
tokenContent := token[len("Ġ"):]
if strings.HasPrefix(remaining, " "+tokenContent) {
tokens = append(tokens, t.Vocab[token])
i += 1 + len(tokenContent) // space + content
isFirstToken = false
matched = true
break
}
}
} else {
// Regular token without space prefix
if strings.HasPrefix(remaining, tokenText) {
tokens = append(tokens, t.Vocab[token])
i += len(tokenText)
isFirstToken = false
matched = true
break
}
}
}
if !matched {
// No token found - skip this character (or use UNK)
// For now, just skip unknown characters
i++
}
}
return tokens
}
// EncodeForGeneration encodes a prompt with grid tokens for image generation
// Format: {prompt}<sop>{token_h} {token_w}<eop><sop>{prev_h} {prev_w}<eop><|dit_token_16384|>
//
// Uses GPT-2 style tokenization where " 32" becomes "Ġ32" (a single token with
// space prefix), matching the HuggingFace tokenizer behavior.
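//
// Example (1024x1024 target): tokenH = tokenW = 1024/32 = 32 and
// prevTokenH = prevTokenW = 16, so the encoded suffix is:
//
//	<sop>32 32<eop><sop>16 16<eop><|dit_token_16384|>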
func (t *GLMTokenizer) EncodeForGeneration(prompt string, targetHeight, targetWidth int32) []int32 {
// Calculate grid dimensions
factor := int32(32)
height := (targetHeight / factor) * factor
width := (targetWidth / factor) * factor
tokenH := height / factor
tokenW := width / factor
// Calculate previous grid dimensions
ratio := float64(tokenH) / float64(tokenW)
prevTokenH := int32(sqrt(ratio) * 16)
prevTokenW := int32(sqrt(1.0/ratio) * 16)
// Encode the prompt text
promptTokens := t.Encode(prompt)
// Build the full sequence:
// [prompt tokens] <sop> [tokenH] [Ġ+tokenW] <eop> <sop> [prevH] [Ġ+prevW] <eop> <bos>
// Note: HF tokenizer treats " 32" as "Ġ32" (single token), not "Ġ" + "32"
var tokens []int32
tokens = append(tokens, promptTokens...)
// First grid: <sop> H W <eop>
// First number has no space prefix, second number has space prefix (Ġ)
tokens = append(tokens, t.SopTokenID)
tokens = append(tokens, t.encodeNumber(tokenH)...)
tokens = append(tokens, t.encodeSpaceNumber(tokenW)...) // " W" as Ġ+W
tokens = append(tokens, t.EopTokenID)
// Second grid: <sop> prevH prevW <eop>
tokens = append(tokens, t.SopTokenID)
tokens = append(tokens, t.encodeNumber(prevTokenH)...)
tokens = append(tokens, t.encodeSpaceNumber(prevTokenW)...) // " prevW" as Ġ+prevW
tokens = append(tokens, t.EopTokenID)
// BOS token (start of image generation)
tokens = append(tokens, t.BosTokenID)
return tokens
}
// encodeNumber encodes a number - first tries as a whole token, falls back to digit-by-digit
func (t *GLMTokenizer) encodeNumber(n int32) []int32 {
s := fmt.Sprintf("%d", n)
// First try: look up the whole number as a single token
if id, ok := t.Vocab[s]; ok {
return []int32{id}
}
// Fallback: encode digit by digit
var tokens []int32
for _, c := range s {
if id, ok := t.Vocab[string(c)]; ok {
tokens = append(tokens, id)
}
}
return tokens
}
// encodeSpaceNumber encodes " N" as "ĠN" (space-prefixed number) matching HF tokenizer
// GPT-2 style: " 32" becomes single token "Ġ32", not "Ġ" + "32"
func (t *GLMTokenizer) encodeSpaceNumber(n int32) []int32 {
s := fmt.Sprintf("%d", n)
// First try: look up "Ġ{number}" as a single token (e.g., "Ġ32")
spaceToken := "Ġ" + s
if id, ok := t.Vocab[spaceToken]; ok {
return []int32{id}
}
// Fallback: bare space Ġ + number tokens
var tokens []int32
if spaceID, ok := t.Vocab["Ġ"]; ok {
tokens = append(tokens, spaceID)
}
tokens = append(tokens, t.encodeNumber(n)...)
return tokens
}
// sqrt computes the square root of x using Newton's method
func sqrt(x float64) float64 {
if x <= 0 {
return 0
}
// Newton's method
z := x
for i := 0; i < 10; i++ {
z = z - (z*z-x)/(2*z)
}
return z
}
// Decode converts token IDs back to a string
func (t *GLMTokenizer) Decode(tokens []int32) string {
var sb strings.Builder
for _, id := range tokens {
if token, ok := t.VocabReverse[id]; ok {
// Handle Ġ prefix (convert back to space)
if strings.HasPrefix(token, "Ġ") {
sb.WriteString(" ")
sb.WriteString(token[len("Ġ"):])
} else {
sb.WriteString(token)
}
}
}
return sb.String()
}

View File

@@ -0,0 +1,159 @@
//go:build mlx
package glm_image
import (
"math"
"github.com/ollama/ollama/x/imagegen/mlx"
)
// FlowMatchSchedulerConfig holds scheduler configuration
type FlowMatchSchedulerConfig struct {
NumTrainTimesteps int32 `json:"num_train_timesteps"` // 1000
BaseShift float32 `json:"base_shift"` // 0.25
MaxShift float32 `json:"max_shift"` // 0.75
BaseImageSeqLen int32 `json:"base_image_seq_len"` // 256
MaxImageSeqLen int32 `json:"max_image_seq_len"` // 4096
UseDynamicShifting bool `json:"use_dynamic_shifting"` // true
TimeShiftType string `json:"time_shift_type"` // "linear"
}
// DefaultSchedulerConfig returns the default config for GLM-Image
func DefaultSchedulerConfig() *FlowMatchSchedulerConfig {
return &FlowMatchSchedulerConfig{
NumTrainTimesteps: 1000,
BaseShift: 0.25,
MaxShift: 0.75,
BaseImageSeqLen: 256,
MaxImageSeqLen: 4096,
UseDynamicShifting: true,
TimeShiftType: "linear",
}
}
// FlowMatchScheduler implements FlowMatchEulerDiscreteScheduler
type FlowMatchScheduler struct {
Config *FlowMatchSchedulerConfig
Timesteps []float32 // Raw timesteps for transformer conditioning (unshifted)
Sigmas []float32 // Shifted sigmas for Euler step calculation
NumSteps int
}
// NewFlowMatchScheduler creates a new scheduler
func NewFlowMatchScheduler(cfg *FlowMatchSchedulerConfig) *FlowMatchScheduler {
return &FlowMatchScheduler{Config: cfg}
}
// SetTimestepsWithDynamicShift sets timesteps with dynamic shifting based on image size
// Following diffusers: raw timesteps are used for conditioning, shifted sigmas for step calculation
func (s *FlowMatchScheduler) SetTimestepsWithDynamicShift(numSteps int, imgSeqLen int32) {
s.NumSteps = numSteps
// Calculate shift (mu) based on image sequence length
mu := s.calculateShift(imgSeqLen)
// Create timesteps: linspace from sigma_max_t to sigma_min_t
// sigma_max = 1.0, sigma_min ~= 0.001 (near 0 but not exactly 0)
// Then apply time shift and append terminal sigma=0
s.Timesteps = make([]float32, numSteps)
s.Sigmas = make([]float32, numSteps+1) // +1 for terminal sigma
numTrainTimesteps := float32(s.Config.NumTrainTimesteps)
// Create base sigmas: linspace from 1.0 to small value (matching diffusers)
for i := 0; i < numSteps; i++ {
// linspace from 1000 down to 1 (sigma_min * num_train_timesteps)
tRaw := numTrainTimesteps - float32(i)*(numTrainTimesteps-1.0)/float32(numSteps-1)
s.Timesteps[i] = tRaw
// Convert to sigma [0, 1]
sigma := tRaw / numTrainTimesteps
// Apply time shift if enabled
if s.Config.UseDynamicShifting && mu > 0 {
sigma = s.applyShift(mu, sigma)
}
s.Sigmas[i] = sigma
}
// Append terminal sigma = 0 (the final clean image)
s.Sigmas[numSteps] = 0
}
// calculateShift computes dynamic shift based on image sequence length
// Uses the sqrt-based formula from diffusers:
// m = (image_seq_len / base_seq_len) ** 0.5
// mu = m * max_shift + base_shift
func (s *FlowMatchScheduler) calculateShift(imgSeqLen int32) float32 {
cfg := s.Config
if !cfg.UseDynamicShifting {
return 0
}
// Sqrt-based shift calculation (matches diffusers pipeline_glm_image.py)
m := float32(math.Sqrt(float64(imgSeqLen) / float64(cfg.BaseImageSeqLen)))
mu := m*cfg.MaxShift + cfg.BaseShift
return mu
}
// applyShift applies time shift transformation
// mu: the computed shift value
// t: sigma value in [0, 1]
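// Worked example (linear shift): with mu = 3.25 and t = 0.5, 1/t - 1 = 1,
// so the shifted sigma is 3.25 / (3.25 + 1) ≈ 0.765.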
func (s *FlowMatchScheduler) applyShift(mu float32, t float32) float32 {
if t <= 0 {
return 0
}
if t >= 1 {
return 1
}
// The exponent (named sigma in diffusers) is 1.0 for both shift types
sigma := float32(1.0)
if s.Config.TimeShiftType == "linear" {
// Linear: mu / (mu + (1/t - 1)^sigma)
return mu / (mu + float32(math.Pow(float64(1.0/t-1.0), float64(sigma))))
}
// Exponential (default): exp(mu) / (exp(mu) + (1/t - 1)^sigma)
expMu := float32(math.Exp(float64(mu)))
return expMu / (expMu + float32(math.Pow(float64(1.0/t-1.0), float64(sigma))))
}
// Step performs one denoising step
func (s *FlowMatchScheduler) Step(modelOutput, sample *mlx.Array, stepIdx int) *mlx.Array {
sigma := s.Sigmas[stepIdx]
sigmaNext := s.Sigmas[stepIdx+1]
// Euler step: x_{t-dt} = x_t + dt * v_t
dt := sigmaNext - sigma // Negative (going from noise to clean)
scaledOutput := mlx.MulScalar(modelOutput, dt)
return mlx.Add(sample, scaledOutput)
}
// InitNoise creates initial noise
func (s *FlowMatchScheduler) InitNoise(shape []int32, seed int64) *mlx.Array {
return mlx.RandomNormalWithDtype(shape, uint64(seed), mlx.DtypeBFloat16)
}
// AddNoise adds noise to clean samples for a given timestep (for img2img)
func (s *FlowMatchScheduler) AddNoise(cleanSample, noise *mlx.Array, timestepIdx int) *mlx.Array {
// In flow matching: x_t = (1-sigma) * x_0 + sigma * noise
// Use sigmas (shifted) for the interpolation
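// At sigma = 1 the result is pure noise; at sigma = 0 it is the clean sample unchanged.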
sigma := s.Sigmas[timestepIdx]
oneMinusSigma := 1.0 - sigma
scaledClean := mlx.MulScalar(cleanSample, oneMinusSigma)
scaledNoise := mlx.MulScalar(noise, sigma)
return mlx.Add(scaledClean, scaledNoise)
}
// GetTimesteps returns all timesteps
func (s *FlowMatchScheduler) GetTimesteps() []float32 {
return s.Timesteps
}

View File

@@ -0,0 +1,497 @@
//go:build mlx
package glm_image
import (
"encoding/json"
"fmt"
"math"
"os"
"path/filepath"
"regexp"
"github.com/ollama/ollama/x/imagegen"
"github.com/ollama/ollama/x/imagegen/mlx"
"github.com/ollama/ollama/x/imagegen/nn"
"github.com/ollama/ollama/x/imagegen/safetensors"
)
// T5Config holds T5 encoder configuration
type T5Config struct {
DModel int32 `json:"d_model"` // 1472
DFF int32 `json:"d_ff"` // 3584
DKV int32 `json:"d_kv"` // 64
NumHeads int32 `json:"num_heads"` // 6
NumLayers int32 `json:"num_layers"` // 12
VocabSize int32 `json:"vocab_size"` // 384 (byte-level)
LayerNormEps float32 `json:"layer_norm_epsilon"` // 1e-6
IsGatedAct bool `json:"is_gated_act"` // true (gated-gelu)
// Relative position bias
RelativeAttentionNumBuckets int32 `json:"relative_attention_num_buckets"` // 32
RelativeAttentionMaxDistance int32 `json:"relative_attention_max_distance"` // 128
}
// T5TextEncoder is the T5 encoder for text conditioning
type T5TextEncoder struct {
Config *T5Config
// Embedding (shared for ByT5)
SharedEmbed *nn.Embedding `weight:"shared"`
// Encoder layers
Layers []*T5Block `weight:"encoder.block"`
// Final layer norm
FinalNorm *T5LayerNorm `weight:"encoder.final_layer_norm"`
// Relative position bias (from first layer, shared across all)
RelativeAttentionBias *mlx.Array `weight:"encoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight"`
}
// T5Block is a single T5 encoder block
type T5Block struct {
// Self attention
Layer0 *T5LayerSelfAttention `weight:"layer.0"`
// FFN
Layer1 *T5LayerFF `weight:"layer.1"`
}
// T5LayerSelfAttention is T5's self-attention layer
type T5LayerSelfAttention struct {
SelfAttention *T5Attention `weight:"SelfAttention"`
LayerNorm *T5LayerNorm `weight:"layer_norm"`
}
// T5Attention implements T5's relative attention
type T5Attention struct {
Q *mlx.Array `weight:"q.weight"` // No bias in T5
K *mlx.Array `weight:"k.weight"`
V *mlx.Array `weight:"v.weight"`
O *mlx.Array `weight:"o.weight"`
NHeads int32
DKV int32
Scale float32
}
// T5LayerFF is T5's feedforward layer with gated-gelu
type T5LayerFF struct {
DenseReluDense *T5DenseGatedGelu `weight:"DenseReluDense"`
LayerNorm *T5LayerNorm `weight:"layer_norm"`
}
// T5DenseGatedGelu is T5's gated-gelu FFN
type T5DenseGatedGelu struct {
Wi0 *mlx.Array `weight:"wi_0.weight"` // gate projection
Wi1 *mlx.Array `weight:"wi_1.weight"` // up projection
Wo *mlx.Array `weight:"wo.weight"` // down projection
}
// T5LayerNorm is T5's RMSNorm variant (no bias, no mean subtraction)
type T5LayerNorm struct {
Weight *mlx.Array `weight:"weight"`
Eps float32
}
// Load loads the T5 text encoder from manifest
func (m *T5TextEncoder) Load(manifest *imagegen.ModelManifest) error {
fmt.Print(" Loading T5 text encoder... ")
// Load config
var cfg T5Config
if err := manifest.ReadConfigJSON("text_encoder/config.json", &cfg); err != nil {
return fmt.Errorf("config: %w", err)
}
m.Config = &cfg
// Pre-allocate layers
m.Layers = make([]*T5Block, cfg.NumLayers)
// Load weights
weights, err := imagegen.LoadWeightsFromManifest(manifest, "text_encoder")
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(0); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
m.initComputedFields()
fmt.Println("✓")
return nil
}
// LoadFromPath loads the T5 text encoder from a directory path
func (m *T5TextEncoder) LoadFromPath(path string) error {
fmt.Print(" Loading T5 text encoder... ")
// Load config
var cfg T5Config
configPath := filepath.Join(path, "config.json")
data, err := os.ReadFile(configPath)
if err != nil {
return fmt.Errorf("read config: %w", err)
}
if err := json.Unmarshal(data, &cfg); err != nil {
return fmt.Errorf("parse config: %w", err)
}
m.Config = &cfg
// Pre-allocate layers
m.Layers = make([]*T5Block, cfg.NumLayers)
// Load weights from safetensors files
weights, err := safetensors.LoadModelWeights(path)
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(0); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
m.initComputedFields()
fmt.Println("✓")
return nil
}
func (m *T5TextEncoder) initComputedFields() {
cfg := m.Config
m.FinalNorm.Eps = cfg.LayerNormEps
for _, block := range m.Layers {
attn := block.Layer0.SelfAttention
attn.NHeads = cfg.NumHeads
attn.DKV = cfg.DKV
attn.Scale = float32(1.0 / math.Sqrt(float64(cfg.DKV)))
block.Layer0.LayerNorm.Eps = cfg.LayerNormEps
block.Layer1.LayerNorm.Eps = cfg.LayerNormEps
}
}
// Forward encodes text tokens
func (m *T5TextEncoder) Forward(tokens *mlx.Array) *mlx.Array {
cfg := m.Config
// Get embeddings
h := m.SharedEmbed.Forward(tokens)
// Compute relative position bias once
seqLen := tokens.Shape()[1]
posBias := m.computeRelativePositionBias(seqLen)
// Forward through layers
for _, block := range m.Layers {
h = block.Forward(h, posBias, cfg.LayerNormEps)
}
// Final norm
h = m.FinalNorm.Forward(h)
return h
}
// extractGlyphTexts extracts quoted text (glyphs) from the prompt
// This matches diffusers' get_glyph_texts from pipeline_glm_image.py
// Glyph texts are used for text rendering guidance in the generated image
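// For example, the prompt `a poster that says "GRAND OPENING"` yields
// glyphTexts = ["GRAND OPENING"].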
func extractGlyphTexts(prompt string) []string {
var glyphTexts []string
// Extract text in single quotes: 'text'
re1 := regexp.MustCompile(`'([^']*)'`)
for _, match := range re1.FindAllStringSubmatch(prompt, -1) {
if len(match) > 1 {
glyphTexts = append(glyphTexts, match[1])
}
}
// Extract text in Unicode curly double quotes: “text”
re2 := regexp.MustCompile(`“([^“”]*)”`)
for _, match := range re2.FindAllStringSubmatch(prompt, -1) {
if len(match) > 1 {
glyphTexts = append(glyphTexts, match[1])
}
}
// Extract text in ASCII double quotes: "text"
re3 := regexp.MustCompile(`"([^"]*)"`)
for _, match := range re3.FindAllStringSubmatch(prompt, -1) {
if len(match) > 1 {
glyphTexts = append(glyphTexts, match[1])
}
}
// Extract text in Japanese quotes: 「text」
re4 := regexp.MustCompile(`「([^「」]*)」`)
for _, match := range re4.FindAllStringSubmatch(prompt, -1) {
if len(match) > 1 {
glyphTexts = append(glyphTexts, match[1])
}
}
return glyphTexts
}
// EncodePrompt encodes the prompt text using the ByT5 tokenizer and encoder
// This provides text conditioning for the diffusion transformer via the glyph projector
//
// IMPORTANT: This encodes only the GLYPH TEXTS (quoted strings in the prompt), not the
// full prompt. Glyph texts are used for text rendering guidance in the generated image.
// Multiple glyph texts are encoded and concatenated to form the conditioning signal.
// This matches diffusers' _get_glyph_embeds() behavior.
func (m *T5TextEncoder) EncodePrompt(tok *ByT5Tokenizer, prompt string) *mlx.Array {
// Extract glyph texts from prompt (text in quotes)
glyphTexts := extractGlyphTexts(prompt)
// If no glyph texts found, encode empty string (matches diffusers: [""] fallback)
if len(glyphTexts) == 0 {
glyphTexts = []string{""}
}
// Encode each glyph text and collect token sequences
// Matching diffusers' _get_glyph_embeds() which batches all glyph texts
var allTokenSeqs [][]int32
for _, glyphText := range glyphTexts {
// ByT5 uses byte-level encoding: each byte (0-255) -> token (3-258)
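// For illustration, the glyph text "Hi" maps to [75, 108] ('H' = byte 72 -> 75,
// 'i' = byte 105 -> 108) before the EOS token (1) is appended below.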
tokens := tok.Encode(glyphText)
// Add EOS token (1) at the end to match HuggingFace tokenizer behavior
tokens = append(tokens, tok.EOSTokenID)
allTokenSeqs = append(allTokenSeqs, tokens)
}
// Process each glyph text through the encoder
var allEmbeddings []*mlx.Array
for _, tokens := range allTokenSeqs {
tokenLen := len(tokens)
if tokenLen == 0 {
continue
}
// Create token array [1, L]
tokensArr := mlx.NewArrayInt32(tokens, []int32{1, int32(tokenLen)})
// Forward through encoder
output := m.Forward(tokensArr)
mlx.Eval(output)
allEmbeddings = append(allEmbeddings, output)
}
// Concatenate all glyph embeddings along sequence dimension
var output *mlx.Array
if len(allEmbeddings) == 0 {
// Fallback: return single zero embedding
output = mlx.Zeros([]int32{1, 1, m.Config.DModel}, mlx.DtypeBFloat16)
} else if len(allEmbeddings) == 1 {
output = allEmbeddings[0]
} else {
output = mlx.Concatenate(allEmbeddings, 1)
}
mlx.Eval(output)
return output
}
// computeRelativePositionBias computes T5's relative position encoding
func (m *T5TextEncoder) computeRelativePositionBias(seqLen int32) *mlx.Array {
cfg := m.Config
// Create relative position matrix
// For each (query_pos, key_pos) pair, compute bucketed relative position
numBuckets := cfg.RelativeAttentionNumBuckets
maxDistance := cfg.RelativeAttentionMaxDistance
// Create position indices
contextPos := make([]int32, seqLen*seqLen)
memoryPos := make([]int32, seqLen*seqLen)
for i := int32(0); i < seqLen; i++ {
for j := int32(0); j < seqLen; j++ {
contextPos[i*seqLen+j] = i
memoryPos[i*seqLen+j] = j
}
}
// Compute relative positions and bucket them
buckets := make([]int32, seqLen*seqLen)
for i := int32(0); i < seqLen*seqLen; i++ {
relPos := memoryPos[i] - contextPos[i]
buckets[i] = relativePositionBucket(relPos, numBuckets, maxDistance, false)
}
// Create bucket indices array
bucketsArr := mlx.NewArrayInt32(buckets, []int32{seqLen, seqLen})
// Look up bias: RelativeAttentionBias shape is [numBuckets, numHeads] = [32, 6]
// Take along axis 0 (buckets dimension) -> [seqLen, seqLen, numHeads]
bias := mlx.Take(m.RelativeAttentionBias, bucketsArr, 0) // [seqLen, seqLen, numHeads]
// Transpose to [numHeads, seqLen, seqLen]
bias = mlx.Transpose(bias, 2, 0, 1) // [numHeads, seqLen, seqLen]
bias = mlx.ExpandDims(bias, 0) // [1, numHeads, seqLen, seqLen]
return bias
}
// relativePositionBucket computes the bucket for a relative position
func relativePositionBucket(relativePosition int32, numBuckets int32, maxDistance int32, bidirectional bool) int32 {
var bucket int32 = 0
var n int32 = -relativePosition
if bidirectional {
numBuckets /= 2
if n < 0 {
bucket += numBuckets
n = -n
}
} else {
if n < 0 {
n = 0
}
}
// Half buckets are for exact positions, half are for log-spaced
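// With the defaults used here (32 buckets, max distance 128), relative distances
// up to 15 map one-to-one to buckets 0-15; longer distances share log-spaced
// buckets and are clamped to bucket 31.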
maxExact := numBuckets / 2
if n < maxExact {
bucket += n
} else {
// Log-spaced buckets
logVal := math.Log(float64(n)/float64(maxExact)) / math.Log(float64(maxDistance)/float64(maxExact))
bucket += maxExact + int32(logVal*float64(numBuckets-maxExact))
if bucket > numBuckets-1 {
bucket = numBuckets - 1
}
}
return bucket
}
// Forward for T5Block
func (b *T5Block) Forward(x *mlx.Array, posBias *mlx.Array, eps float32) *mlx.Array {
// Self attention with residual
h := b.Layer0.Forward(x, posBias, eps)
// FFN with residual
h = b.Layer1.Forward(h, eps)
return h
}
// Forward for T5LayerSelfAttention
func (l *T5LayerSelfAttention) Forward(x *mlx.Array, posBias *mlx.Array, eps float32) *mlx.Array {
// Pre-norm
normed := l.LayerNorm.Forward(x)
// Attention
attnOut := l.SelfAttention.Forward(normed, posBias)
// Residual
return mlx.Add(x, attnOut)
}
// Forward for T5Attention
func (attn *T5Attention) Forward(x *mlx.Array, posBias *mlx.Array) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
D := shape[2]
// Q, K, V projections (no bias)
// Weights are [out_features, in_features], so we use matmul with transpose
q := mlx.Matmul(x, mlx.Transpose(attn.Q, 1, 0))
k := mlx.Matmul(x, mlx.Transpose(attn.K, 1, 0))
v := mlx.Matmul(x, mlx.Transpose(attn.V, 1, 0))
// Reshape to [B, L, nheads, d_kv]
q = mlx.Reshape(q, B, L, attn.NHeads, attn.DKV)
k = mlx.Reshape(k, B, L, attn.NHeads, attn.DKV)
v = mlx.Reshape(v, B, L, attn.NHeads, attn.DKV)
// Transpose to [B, nheads, L, d_kv]
q = mlx.Transpose(q, 0, 2, 1, 3)
k = mlx.Transpose(k, 0, 2, 1, 3)
v = mlx.Transpose(v, 0, 2, 1, 3)
// Attention scores with relative position bias
// T5 uses UNSCALED dot-product attention: scores = q @ k.T + pos_bias
// (no 1/sqrt(d_k) scale factor like in standard transformers)
scores := mlx.Matmul(q, mlx.Transpose(k, 0, 1, 3, 2))
scores = mlx.Add(scores, posBias)
// Softmax
attnWeights := mlx.Softmax(scores, -1)
// Attend to values
out := mlx.Matmul(attnWeights, v)
// Transpose back [B, nheads, L, d_kv] -> [B, L, nheads, d_kv]
out = mlx.Transpose(out, 0, 2, 1, 3)
// Reshape to [B, L, D]
out = mlx.Reshape(out, B, L, attn.NHeads*attn.DKV)
// Output projection
out = mlx.Matmul(out, mlx.Transpose(attn.O, 1, 0))
_ = D // Silence unused warning
return out
}
// Forward for T5LayerFF
func (l *T5LayerFF) Forward(x *mlx.Array, eps float32) *mlx.Array {
// Pre-norm
normed := l.LayerNorm.Forward(x)
// FFN
ffOut := l.DenseReluDense.Forward(normed)
// Residual
return mlx.Add(x, ffOut)
}
// geluNew implements the GELU activation with tanh approximation (gelu_new)
// This matches HuggingFace transformers' gelu_new/OpenAI GPT implementation
// Formula: 0.5 * x * (1 + tanh(sqrt(2/π) * (x + 0.044715 * x³)))
func geluNew(x *mlx.Array) *mlx.Array {
sqrt2OverPi := float32(0.7978845608) // sqrt(2/π)
coeff := float32(0.044715)
x3 := mlx.Mul(mlx.Mul(x, x), x)
inner := mlx.MulScalar(mlx.Add(x, mlx.MulScalar(x3, coeff)), sqrt2OverPi)
return mlx.Mul(mlx.MulScalar(x, 0.5), mlx.AddScalar(mlx.Tanh(inner), 1.0))
}
// Forward for T5DenseGatedGelu (gated-gelu activation)
func (d *T5DenseGatedGelu) Forward(x *mlx.Array) *mlx.Array {
// Gate projection with GELU activation (T5 v1.1/ByT5 uses gelu_new)
gate := mlx.Matmul(x, mlx.Transpose(d.Wi0, 1, 0))
gate = geluNew(gate)
// Up projection
up := mlx.Matmul(x, mlx.Transpose(d.Wi1, 1, 0))
// Gated output
h := mlx.Mul(gate, up)
// Down projection
return mlx.Matmul(h, mlx.Transpose(d.Wo, 1, 0))
}
// Forward for T5LayerNorm (RMSNorm variant)
func (ln *T5LayerNorm) Forward(x *mlx.Array) *mlx.Array {
// T5 uses RMSNorm: x * rsqrt(mean(x^2) + eps) * weight
variance := mlx.Mean(mlx.Square(x), -1, true)
x = mlx.Mul(x, mlx.RSqrt(mlx.AddScalar(variance, ln.Eps)))
return mlx.Mul(x, ln.Weight)
}

View File

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1,477 @@
//go:build mlx
package glm_image
import (
"encoding/json"
"fmt"
"os"
"path/filepath"
"github.com/ollama/ollama/x/imagegen"
"github.com/ollama/ollama/x/imagegen/mlx"
"github.com/ollama/ollama/x/imagegen/safetensors"
)
// VAEConfig holds VAE decoder configuration
type VAEConfig struct {
InChannels int32 `json:"in_channels"` // 3
OutChannels int32 `json:"out_channels"` // 3
LatentChannels int32 `json:"latent_channels"` // 16
BlockOutChannels []int32 `json:"block_out_channels"` // [128, 512, 1024, 1024]
LayersPerBlock int32 `json:"layers_per_block"` // 3
NormNumGroups int32 `json:"norm_num_groups"` // 32
ScalingFactor float32 `json:"scaling_factor"` // 0.18215
ShiftFactor *float32 `json:"shift_factor"` // null
LatentsMean []float32 `json:"latents_mean"` // [16 values]
LatentsStd []float32 `json:"latents_std"` // [16 values]
}
// VAEDecoder is the VAE latent decoder
type VAEDecoder struct {
Config *VAEConfig
// Decoder components
ConvIn *VAEConv2d `weight:"decoder.conv_in"`
MidBlock *VAEMidBlock `weight:"decoder.mid_block"`
UpBlocks []*VAEUpBlock `weight:"decoder.up_blocks"`
ConvNormOut *GroupNorm `weight:"decoder.conv_norm_out"`
ConvOut *VAEConv2d `weight:"decoder.conv_out"`
}
// VAEConv2d is a 2D convolution layer
type VAEConv2d struct {
Weight *mlx.Array `weight:"weight"`
Bias *mlx.Array `weight:"bias"`
Stride int32
Padding int32
}
// GroupNorm is group normalization
type GroupNorm struct {
Weight *mlx.Array `weight:"weight"`
Bias *mlx.Array `weight:"bias"`
NumGroups int32
Eps float32
}
// VAEMidBlock is the middle block of the VAE
type VAEMidBlock struct {
Resnets []*VAEResnetBlock `weight:"resnets"`
}
// VAEUpBlock is an upsampling block
type VAEUpBlock struct {
Resnets []*VAEResnetBlock `weight:"resnets"`
Upsamplers []*VAEUpsampler `weight:"upsamplers"`
}
// VAEResnetBlock is a residual block
type VAEResnetBlock struct {
Norm1 *GroupNorm `weight:"norm1"`
Conv1 *VAEConv2d `weight:"conv1"`
Norm2 *GroupNorm `weight:"norm2"`
Conv2 *VAEConv2d `weight:"conv2"`
ConvShortcut *VAEConv2d `weight:"conv_shortcut,optional"` // Optional, for channel mismatch
}
// VAEUpsampler is an upsampling layer
type VAEUpsampler struct {
Conv *VAEConv2d `weight:"conv"`
}
// Load loads the VAE decoder from manifest
func (m *VAEDecoder) Load(manifest *imagegen.ModelManifest) error {
fmt.Print(" Loading VAE decoder... ")
// Load config
var cfg VAEConfig
if err := manifest.ReadConfigJSON("vae/config.json", &cfg); err != nil {
return fmt.Errorf("config: %w", err)
}
m.Config = &cfg
// Initialize structure based on config
numBlocks := len(cfg.BlockOutChannels)
m.UpBlocks = make([]*VAEUpBlock, numBlocks)
// Pre-allocate MidBlock resnets (VAE mid_block typically has 2 resnets)
m.MidBlock = &VAEMidBlock{
Resnets: make([]*VAEResnetBlock, 2),
}
// Pre-allocate UpBlocks with their resnets and upsamplers
// VAE decoder has layers_per_block+1 resnets per up_block (to match encoder)
// All up_blocks except the last have an upsampler
for i := 0; i < numBlocks; i++ {
numResnets := cfg.LayersPerBlock + 1 // typically 4 resnets
m.UpBlocks[i] = &VAEUpBlock{
Resnets: make([]*VAEResnetBlock, numResnets),
}
// All blocks except the last have an upsampler
if i < numBlocks-1 {
m.UpBlocks[i].Upsamplers = make([]*VAEUpsampler, 1)
}
}
// Load weights
weights, err := imagegen.LoadWeightsFromManifest(manifest, "vae")
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(mlx.DtypeBFloat16); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
// Initialize GroupNorm parameters
m.initGroupNorms()
fmt.Println("✓")
return nil
}
// LoadFromPath loads the VAE decoder from a directory path
func (m *VAEDecoder) LoadFromPath(path string) error {
fmt.Print(" Loading VAE decoder... ")
// Load config
var cfg VAEConfig
configPath := filepath.Join(path, "config.json")
data, err := os.ReadFile(configPath)
if err != nil {
return fmt.Errorf("read config: %w", err)
}
if err := json.Unmarshal(data, &cfg); err != nil {
return fmt.Errorf("parse config: %w", err)
}
m.Config = &cfg
// Initialize structure based on config
numBlocks := len(cfg.BlockOutChannels)
m.UpBlocks = make([]*VAEUpBlock, numBlocks)
// Pre-allocate MidBlock resnets (VAE mid_block typically has 2 resnets)
m.MidBlock = &VAEMidBlock{
Resnets: make([]*VAEResnetBlock, 2),
}
// Pre-allocate UpBlocks with their resnets and upsamplers
for i := 0; i < numBlocks; i++ {
numResnets := cfg.LayersPerBlock + 1
m.UpBlocks[i] = &VAEUpBlock{
Resnets: make([]*VAEResnetBlock, numResnets),
}
if i < numBlocks-1 {
m.UpBlocks[i].Upsamplers = make([]*VAEUpsampler, 1)
}
}
// Load weights from safetensors files
weights, err := safetensors.LoadModelWeights(path)
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(mlx.DtypeBFloat16); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
// Initialize GroupNorm parameters
m.initGroupNorms()
fmt.Println("✓")
return nil
}
func (m *VAEDecoder) initGroupNorms() {
cfg := m.Config
numGroups := cfg.NormNumGroups
eps := float32(1e-6) // Must match diffusers VAE (1e-6, not 1e-5)
if m.ConvNormOut != nil {
m.ConvNormOut.NumGroups = numGroups
m.ConvNormOut.Eps = eps
}
if m.MidBlock != nil {
for _, resnet := range m.MidBlock.Resnets {
if resnet.Norm1 != nil {
resnet.Norm1.NumGroups = numGroups
resnet.Norm1.Eps = eps
}
if resnet.Norm2 != nil {
resnet.Norm2.NumGroups = numGroups
resnet.Norm2.Eps = eps
}
}
}
for _, upBlock := range m.UpBlocks {
if upBlock == nil {
continue
}
for _, resnet := range upBlock.Resnets {
if resnet == nil {
continue
}
if resnet.Norm1 != nil {
resnet.Norm1.NumGroups = numGroups
resnet.Norm1.Eps = eps
}
if resnet.Norm2 != nil {
resnet.Norm2.NumGroups = numGroups
resnet.Norm2.Eps = eps
}
}
}
}
// Decode decodes latents to an image
func (m *VAEDecoder) Decode(latents *mlx.Array) *mlx.Array {
cfg := m.Config
// Apply latent denormalization if mean/std are provided
// This matches diffusers GLM-Image: latents = latents * std + mean
// Note: GLM-Image does NOT divide by scaling_factor (unlike standard SD VAEs)
if len(cfg.LatentsMean) > 0 && len(cfg.LatentsStd) > 0 {
latents = m.denormalizeLatents(latents)
}
// Convert from NCHW to NHWC for processing
// [B, C, H, W] -> [B, H, W, C]
x := mlx.Transpose(latents, 0, 2, 3, 1)
// Initial convolution
x = m.ConvIn.Forward(x)
// Mid block
x = m.MidBlock.Forward(x)
// Up blocks (forward order - index 0 is at lowest resolution/highest channels)
for i := 0; i < len(m.UpBlocks); i++ {
if m.UpBlocks[i] != nil {
x = m.UpBlocks[i].Forward(x)
}
}
// Final normalization and convolution
x = m.ConvNormOut.Forward(x)
x = mlx.SiLU(x)
x = m.ConvOut.Forward(x)
// Convert back to NCHW
// [B, H, W, C] -> [B, C, H, W]
x = mlx.Transpose(x, 0, 3, 1, 2)
// Clamp to valid range and convert to [0, 1]
x = mlx.ClipScalar(x, -1.0, 1.0, true, true)
x = mlx.AddScalar(x, 1.0)
x = mlx.DivScalar(x, 2.0)
return x
}
// denormalizeLatents applies the latent mean/std denormalization
func (m *VAEDecoder) denormalizeLatents(latents *mlx.Array) *mlx.Array {
cfg := m.Config
// Create mean and std arrays [1, C, 1, 1] for broadcasting
mean := mlx.NewArray(cfg.LatentsMean, []int32{1, int32(len(cfg.LatentsMean)), 1, 1})
std := mlx.NewArray(cfg.LatentsStd, []int32{1, int32(len(cfg.LatentsStd)), 1, 1})
// Denormalize: latents * std + mean
latents = mlx.Mul(latents, std)
latents = mlx.Add(latents, mean)
return latents
}
// Forward for VAEConv2d
func (c *VAEConv2d) Forward(x *mlx.Array) *mlx.Array {
// x: [B, H, W, C_in] (NHWC)
// PyTorch weight: [C_out, C_in, kH, kW] (OIHW)
// MLX conv2d expects weight: [C_out, kH, kW, C_in] (OHWI)
// So we need to transpose from OIHW to OHWI
stride := c.Stride
if stride == 0 {
stride = 1
}
padding := c.Padding
if padding == 0 {
// Default to same padding for 3x3 kernels
wShape := c.Weight.Shape()
if len(wShape) >= 3 && wShape[2] == 3 {
padding = 1
}
}
// Transpose weight from OIHW [out, in, h, w] to OHWI [out, h, w, in]
weight := mlx.Transpose(c.Weight, 0, 2, 3, 1)
out := mlx.Conv2d(x, weight, stride, padding)
if c.Bias != nil {
// Bias: [C_out] -> [1, 1, 1, C_out]
bias := mlx.Reshape(c.Bias, 1, 1, 1, -1)
out = mlx.Add(out, bias)
}
return out
}
// Forward for GroupNorm
func (gn *GroupNorm) Forward(x *mlx.Array) *mlx.Array {
// x: [B, H, W, C] (NHWC)
shape := x.Shape()
B := shape[0]
H := shape[1]
W := shape[2]
C := shape[3]
numGroups := gn.NumGroups
if numGroups == 0 {
numGroups = 32
}
groupSize := C / numGroups
// Reshape to [B, H, W, groups, groupSize]
x = mlx.Reshape(x, B, H, W, numGroups, groupSize)
// Compute mean and variance per group
mean := mlx.Mean(x, 1, true)
mean = mlx.Mean(mean, 2, true)
mean = mlx.Mean(mean, 4, true)
xCentered := mlx.Sub(x, mean)
variance := mlx.Mean(mlx.Square(xCentered), 1, true)
variance = mlx.Mean(variance, 2, true)
variance = mlx.Mean(variance, 4, true)
// Normalize
xNorm := mlx.Div(xCentered, mlx.Sqrt(mlx.AddScalar(variance, gn.Eps)))
// Reshape back
xNorm = mlx.Reshape(xNorm, B, H, W, C)
// Scale and shift
if gn.Weight != nil {
weight := mlx.Reshape(gn.Weight, 1, 1, 1, C)
xNorm = mlx.Mul(xNorm, weight)
}
if gn.Bias != nil {
bias := mlx.Reshape(gn.Bias, 1, 1, 1, C)
xNorm = mlx.Add(xNorm, bias)
}
return xNorm
}
// Forward for VAEMidBlock
func (mb *VAEMidBlock) Forward(x *mlx.Array) *mlx.Array {
for _, resnet := range mb.Resnets {
x = resnet.Forward(x)
}
return x
}
// Forward for VAEUpBlock
func (ub *VAEUpBlock) Forward(x *mlx.Array) *mlx.Array {
// Apply resnets
for _, resnet := range ub.Resnets {
if resnet != nil {
x = resnet.Forward(x)
}
}
// Apply upsamplers
for _, upsampler := range ub.Upsamplers {
if upsampler != nil {
x = upsampler.Forward(x)
}
}
return x
}
// Forward for VAEResnetBlock
func (rb *VAEResnetBlock) Forward(x *mlx.Array) *mlx.Array {
residual := x
// First norm + activation + conv
h := rb.Norm1.Forward(x)
h = mlx.SiLU(h)
h = rb.Conv1.Forward(h)
// Second norm + activation + conv
h = rb.Norm2.Forward(h)
h = mlx.SiLU(h)
h = rb.Conv2.Forward(h)
// Shortcut for channel mismatch
if rb.ConvShortcut != nil {
residual = rb.ConvShortcut.Forward(residual)
}
return mlx.Add(h, residual)
}
// Forward for VAEUpsampler (2x nearest neighbor upsample + conv)
func (us *VAEUpsampler) Forward(x *mlx.Array) *mlx.Array {
// x: [B, H, W, C]
// 2x nearest neighbor upsample
x = upsample2x(x)
// Conv
if us.Conv != nil {
x = us.Conv.Forward(x)
}
return x
}
// upsample2x performs 2x nearest neighbor upsampling.
// Input and output are in NHWC format: [B, H, W, C] -> [B, H*2, W*2, C]
func upsample2x(x *mlx.Array) *mlx.Array {
shape := x.Shape()
B := shape[0]
H := shape[1]
W := shape[2]
C := shape[3]
// Create indices [0, 0, 1, 1, 2, 2, ...] for nearest neighbor
hIndices := make([]int32, H*2)
for i := int32(0); i < H; i++ {
hIndices[i*2] = i
hIndices[i*2+1] = i
}
wIndices := make([]int32, W*2)
for i := int32(0); i < W; i++ {
wIndices[i*2] = i
wIndices[i*2+1] = i
}
hIdx := mlx.NewArrayInt32(hIndices, []int32{H * 2})
wIdx := mlx.NewArrayInt32(wIndices, []int32{W * 2})
// Take along height axis
x = mlx.Reshape(x, B*H, W, C)
x = mlx.Take(x, wIdx, 1) // [B*H, W*2, C]
x = mlx.Reshape(x, B, H, W*2, C)
// Take along width axis - transpose to [B, W*2, H, C], take, transpose back
x = mlx.Transpose(x, 0, 2, 1, 3) // [B, W*2, H, C]
x = mlx.Reshape(x, B*(W*2), H, C)
x = mlx.Take(x, hIdx, 1) // [B*(W*2), H*2, C]
x = mlx.Reshape(x, B, W*2, H*2, C)
x = mlx.Transpose(x, 0, 2, 1, 3) // [B, H*2, W*2, C]
return x
}

View File

@@ -0,0 +1,982 @@
//go:build mlx
package glm_image
import (
"encoding/json"
"fmt"
"math"
"os"
"path/filepath"
"github.com/ollama/ollama/x/imagegen"
"github.com/ollama/ollama/x/imagegen/cache"
"github.com/ollama/ollama/x/imagegen/mlx"
"github.com/ollama/ollama/x/imagegen/nn"
"github.com/ollama/ollama/x/imagegen/safetensors"
)
// VisionLanguageConfig holds GLM-Image AR generator configuration
type VisionLanguageConfig struct {
// Text model config
HiddenSize int32 `json:"hidden_size"` // 4096
NumHiddenLayers int32 `json:"num_hidden_layers"` // 40
IntermediateSize int32 `json:"intermediate_size"` // 13696
NumAttentionHeads int32 `json:"num_attention_heads"` // 32
NumKeyValueHeads int32 `json:"num_key_value_heads"` // 2
VocabSize int32 `json:"vocab_size"` // 168064
RMSNormEps float32 `json:"rms_norm_eps"` // 1e-5
// RoPE config
RopeTheta float32 `json:"rope_theta"` // 10000
PartialRotaryFactor float32 `json:"partial_rotary_factor"` // 0.5
MRoPESection []int32 `json:"mrope_section"` // [8, 12, 12]
// Visual token config
VisionVocabSize int32 `json:"vision_vocab_size"` // 16512
ImageStartTokenID int32 `json:"image_start_token_id"` // 16384
ImageEndTokenID int32 `json:"image_end_token_id"` // 16385
ImageTokenID int32 `json:"image_token_id"` // 167855
// Computed
HeadDim int32
}
// VisionLanguageEncoder is the 9B AR generator
type VisionLanguageEncoder struct {
Config *VisionLanguageConfig
// Embedding
EmbedTokens *nn.Embedding `weight:"model.language_model.embed_tokens"`
// Transformer layers
Layers []*GLMBlock `weight:"model.language_model.layers"`
// Final norm
FinalNorm *nn.RMSNorm `weight:"model.language_model.norm"`
// LM Head
LMHead *mlx.Array `weight:"lm_head.weight"`
}
// GLMBlock is a single transformer block in GLM-4 style
type GLMBlock struct {
// Pre-attention norm (GLM uses post-LN variant)
InputLayerNorm *nn.RMSNorm `weight:"input_layernorm"`
PostSelfAttnNorm *nn.RMSNorm `weight:"post_self_attn_layernorm"`
PostAttnLayerNorm *nn.RMSNorm `weight:"post_attention_layernorm"`
PostMLPLayerNorm *nn.RMSNorm `weight:"post_mlp_layernorm"`
// Attention
SelfAttn *GLMAttention `weight:"self_attn"`
// MLP (fused gate_up)
MLP *GLMMLP `weight:"mlp"`
}
// GLMAttention implements GQA with partial rotary and MRoPE
type GLMAttention struct {
QProj *mlx.Array `weight:"q_proj.weight"`
KProj *mlx.Array `weight:"k_proj.weight"`
VProj *mlx.Array `weight:"v_proj.weight"`
OProj *mlx.Array `weight:"o_proj.weight"`
// QKV have biases in GLM
QBias *mlx.Array `weight:"q_proj.bias"`
KBias *mlx.Array `weight:"k_proj.bias"`
VBias *mlx.Array `weight:"v_proj.bias"`
// Computed
NHeads int32
NKVHeads int32
HeadDim int32
Scale float32
PartialRotary float32 // Only rotate this fraction of head_dim
RopeTheta float32
MRoPESection []int32 // [8, 12, 12] - frequency pairs per dimension (temporal, height, width)
}
// ARCache holds KV caches for all layers using the shared cache implementation
type ARCache struct {
Layers []cache.Cache
}
// NewARCache creates a new cache for the given number of layers
func NewARCache(numLayers int32) *ARCache {
layers := make([]cache.Cache, numLayers)
for i := range layers {
layers[i] = cache.NewKVCache()
}
return &ARCache{Layers: layers}
}
// Free releases all cached tensors
func (c *ARCache) Free() {
for _, layer := range c.Layers {
for _, arr := range layer.State() {
if arr != nil {
arr.Free()
}
}
}
}
// GLMMLP implements fused gate_up SwiGLU MLP
type GLMMLP struct {
// GLM uses fused gate_up_proj: [hidden, 2*intermediate]
GateUpProj *mlx.Array `weight:"gate_up_proj.weight"`
DownProj *mlx.Array `weight:"down_proj.weight"`
}
// Load loads the vision-language encoder from manifest
func (m *VisionLanguageEncoder) Load(manifest *imagegen.ModelManifest) error {
fmt.Print(" Loading vision-language encoder... ")
// Load config
var rawCfg struct {
TextConfig struct {
HiddenSize int32 `json:"hidden_size"`
NumHiddenLayers int32 `json:"num_hidden_layers"`
IntermediateSize int32 `json:"intermediate_size"`
NumAttentionHeads int32 `json:"num_attention_heads"`
NumKeyValueHeads int32 `json:"num_key_value_heads"`
VocabSize int32 `json:"vocab_size"`
RMSNormEps float32 `json:"rms_norm_eps"`
VisionVocabSize int32 `json:"vision_vocab_size"`
RopeParameters struct {
RopeTheta float32 `json:"rope_theta"`
PartialRotaryFactor float32 `json:"partial_rotary_factor"`
MRoPESection []int32 `json:"mrope_section"`
} `json:"rope_parameters"`
} `json:"text_config"`
ImageStartTokenID int32 `json:"image_start_token_id"`
ImageEndTokenID int32 `json:"image_end_token_id"`
ImageTokenID int32 `json:"image_token_id"`
}
if err := manifest.ReadConfigJSON("vision_language_encoder/config.json", &rawCfg); err != nil {
return fmt.Errorf("config: %w", err)
}
cfg := &VisionLanguageConfig{
HiddenSize: rawCfg.TextConfig.HiddenSize,
NumHiddenLayers: rawCfg.TextConfig.NumHiddenLayers,
IntermediateSize: rawCfg.TextConfig.IntermediateSize,
NumAttentionHeads: rawCfg.TextConfig.NumAttentionHeads,
NumKeyValueHeads: rawCfg.TextConfig.NumKeyValueHeads,
VocabSize: rawCfg.TextConfig.VocabSize,
RMSNormEps: rawCfg.TextConfig.RMSNormEps,
VisionVocabSize: rawCfg.TextConfig.VisionVocabSize,
RopeTheta: rawCfg.TextConfig.RopeParameters.RopeTheta,
PartialRotaryFactor: rawCfg.TextConfig.RopeParameters.PartialRotaryFactor,
MRoPESection: rawCfg.TextConfig.RopeParameters.MRoPESection,
ImageStartTokenID: rawCfg.ImageStartTokenID,
ImageEndTokenID: rawCfg.ImageEndTokenID,
ImageTokenID: rawCfg.ImageTokenID,
}
cfg.HeadDim = cfg.HiddenSize / cfg.NumAttentionHeads
m.Config = cfg
// Pre-allocate layers
m.Layers = make([]*GLMBlock, cfg.NumHiddenLayers)
// Load weights
weights, err := imagegen.LoadWeightsFromManifest(manifest, "vision_language_encoder")
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(mlx.DtypeBFloat16); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
m.initComputedFields()
fmt.Printf("✓ [%d layers]\n", cfg.NumHiddenLayers)
return nil
}
// LoadFromPath loads the vision-language encoder from a directory path
func (m *VisionLanguageEncoder) LoadFromPath(path string) error {
fmt.Print(" Loading vision-language encoder... ")
// Load config
var rawCfg struct {
TextConfig struct {
HiddenSize int32 `json:"hidden_size"`
NumHiddenLayers int32 `json:"num_hidden_layers"`
IntermediateSize int32 `json:"intermediate_size"`
NumAttentionHeads int32 `json:"num_attention_heads"`
NumKeyValueHeads int32 `json:"num_key_value_heads"`
VocabSize int32 `json:"vocab_size"`
RMSNormEps float32 `json:"rms_norm_eps"`
VisionVocabSize int32 `json:"vision_vocab_size"`
RopeParameters struct {
RopeTheta float32 `json:"rope_theta"`
PartialRotaryFactor float32 `json:"partial_rotary_factor"`
MRoPESection []int32 `json:"mrope_section"`
} `json:"rope_parameters"`
} `json:"text_config"`
ImageStartTokenID int32 `json:"image_start_token_id"`
ImageEndTokenID int32 `json:"image_end_token_id"`
ImageTokenID int32 `json:"image_token_id"`
}
configPath := filepath.Join(path, "config.json")
data, err := os.ReadFile(configPath)
if err != nil {
return fmt.Errorf("read config: %w", err)
}
if err := json.Unmarshal(data, &rawCfg); err != nil {
return fmt.Errorf("parse config: %w", err)
}
cfg := &VisionLanguageConfig{
HiddenSize: rawCfg.TextConfig.HiddenSize,
NumHiddenLayers: rawCfg.TextConfig.NumHiddenLayers,
IntermediateSize: rawCfg.TextConfig.IntermediateSize,
NumAttentionHeads: rawCfg.TextConfig.NumAttentionHeads,
NumKeyValueHeads: rawCfg.TextConfig.NumKeyValueHeads,
VocabSize: rawCfg.TextConfig.VocabSize,
RMSNormEps: rawCfg.TextConfig.RMSNormEps,
VisionVocabSize: rawCfg.TextConfig.VisionVocabSize,
RopeTheta: rawCfg.TextConfig.RopeParameters.RopeTheta,
PartialRotaryFactor: rawCfg.TextConfig.RopeParameters.PartialRotaryFactor,
MRoPESection: rawCfg.TextConfig.RopeParameters.MRoPESection,
ImageStartTokenID: rawCfg.ImageStartTokenID,
ImageEndTokenID: rawCfg.ImageEndTokenID,
ImageTokenID: rawCfg.ImageTokenID,
}
cfg.HeadDim = cfg.HiddenSize / cfg.NumAttentionHeads
m.Config = cfg
// Pre-allocate layers
m.Layers = make([]*GLMBlock, cfg.NumHiddenLayers)
// Load weights
weights, err := safetensors.LoadModelWeights(path)
if err != nil {
return fmt.Errorf("weights: %w", err)
}
if err := weights.Load(mlx.DtypeBFloat16); err != nil {
return fmt.Errorf("load weights: %w", err)
}
defer weights.ReleaseAll()
if err := safetensors.LoadModule(m, weights, ""); err != nil {
return fmt.Errorf("load module: %w", err)
}
m.initComputedFields()
fmt.Printf("✓ [%d layers]\n", cfg.NumHiddenLayers)
return nil
}
func (m *VisionLanguageEncoder) initComputedFields() {
cfg := m.Config
for _, block := range m.Layers {
block.SelfAttn.NHeads = cfg.NumAttentionHeads
block.SelfAttn.NKVHeads = cfg.NumKeyValueHeads
block.SelfAttn.HeadDim = cfg.HeadDim
block.SelfAttn.Scale = float32(1.0 / math.Sqrt(float64(cfg.HeadDim)))
block.SelfAttn.PartialRotary = cfg.PartialRotaryFactor
block.SelfAttn.RopeTheta = cfg.RopeTheta
block.SelfAttn.MRoPESection = cfg.MRoPESection
// Set norm eps
block.InputLayerNorm.Eps = cfg.RMSNormEps
block.PostSelfAttnNorm.Eps = cfg.RMSNormEps
block.PostAttnLayerNorm.Eps = cfg.RMSNormEps
block.PostMLPLayerNorm.Eps = cfg.RMSNormEps
}
m.FinalNorm.Eps = cfg.RMSNormEps
}
// Generate autoregressively generates visual tokens with KV caching
func (m *VisionLanguageEncoder) Generate(
prompt string,
tok *GLMTokenizer,
maxTokens int32,
temperature float32,
topP float32,
seed int64,
targetHeight, targetWidth int32,
progressFn func(int),
) *mlx.Array {
cfg := m.Config
// Encode prompt with grid tokens using GLM tokenizer
// Format: {prompt}<sop>{h} {w}<eop><sop>{prev_h} {prev_w}<eop><|dit_token_16384|>
tokens := tok.EncodeForGeneration(prompt, targetHeight, targetWidth)
// Calculate grid dimensions for MRoPE position IDs
factor := int32(32)
tokenH := targetHeight / factor
tokenW := targetWidth / factor
ratio := float64(tokenH) / float64(tokenW)
prevTokenH := int32(math.Sqrt(ratio) * 16)
prevTokenW := int32(math.Sqrt(1.0/ratio) * 16)
prevGridSize := prevTokenH * prevTokenW
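// Illustrative sizing example (assuming a 1024x1024 target): tokenH = tokenW = 1024/32 = 32,
// ratio = 1.0, so prevTokenH = prevTokenW = 16 and prevGridSize = 256. Generation therefore
// covers a coarse 16x16 "prev" grid followed by the full 32x32 target grid.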
// Create KV cache for all layers
cache := NewARCache(cfg.NumHiddenLayers)
defer cache.Free()
// ===== PREFILL PHASE =====
// Process entire prompt at once, populate cache
promptLen := int32(len(tokens))
tokenArr := mlx.NewArrayInt32(tokens, []int32{1, promptLen})
h := m.EmbedTokens.Forward(tokenArr)
tokenArr.Free()
mlx.Eval(h)
// Compute position IDs for prefill (text tokens use same position for all dims)
prefillPositions := make([][]int32, 3)
for dim := 0; dim < 3; dim++ {
prefillPositions[dim] = make([]int32, promptLen)
for i := int32(0); i < promptLen; i++ {
prefillPositions[dim][i] = i
}
}
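// Example: prompt token 5 gets position 5 in all three MRoPE streams (temporal, height, width).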
// Forward through layers (prefill)
for i, layer := range m.Layers {
oldH := h
h = layer.ForwardWithCache(h, promptLen, 0, cfg.RMSNormEps, cache.Layers[i], prefillPositions)
if i > 0 { // Don't free the embedding output on the first layer
oldH.Free()
}
}
// Eval h and cache arrays together so cache is materialized
evalArgs := []*mlx.Array{h}
for _, lc := range cache.Layers {
evalArgs = append(evalArgs, lc.State()...)
}
mlx.Eval(evalArgs...)
// Final norm and get logits for last position
preNormH := h
h = m.FinalNorm.Forward(h, cfg.RMSNormEps)
preNormH.Free()
lastH := mlx.Slice(h, []int32{0, promptLen - 1, 0}, []int32{1, promptLen, cfg.HiddenSize})
h.Free()
lastH = mlx.Reshape(lastH, 1, cfg.HiddenSize)
logits := mlx.Matmul(lastH, mlx.Transpose(m.LMHead, 1, 0))
lastH.Free()
// Sample first token
var sampleCounter int64 = 0
nextToken := sampleVisualToken(logits, temperature, topP, cfg, seed, &sampleCounter)
logits.Free()
// AR generation loop with caching
// Visual tokens are stored as VQ codebook indices [0, 16383]
// The LM head outputs indices [0, 16511] where:
// - [0, 16383] are VQ codes
// - 16384 is BOS
// - 16385 is EOS
visualTokens := make([]int32, 0, maxTokens)
posOffset := promptLen
visualTokenIdx := int32(0) // Index within visual token sequence for grid position calculation
// Preallocate slice for old cache state to reuse
oldCacheState := make([]*mlx.Array, 0, len(m.Layers)*2)
for i := int32(0); i < maxTokens; i++ {
if progressFn != nil {
progressFn(int(i))
}
// Check for end token (EOS = 16385)
if nextToken == cfg.ImageEndTokenID {
break
}
// Skip BOS token (16384), only store actual VQ codes [0, 16383]
if nextToken == cfg.ImageStartTokenID {
// BOS token - skip storing but continue generation
} else if nextToken < cfg.ImageStartTokenID {
// This is an actual VQ code [0, 16383] - store it
visualTokens = append(visualTokens, nextToken)
}
// Tokens >= 16386 are other special tokens, skip them
// ===== DECODE PHASE =====
// Save old cache state before forward (to free after eval)
oldCacheState = oldCacheState[:0]
for _, lc := range cache.Layers {
oldCacheState = append(oldCacheState, lc.State()...)
}
// Only process the new token, use cached K,V
tokenArr := mlx.NewArrayInt32([]int32{nextToken}, []int32{1, 1})
h := m.EmbedTokens.Forward(tokenArr)
tokenArr.Free()
// Compute MRoPE position IDs for this visual token
// Visual tokens are arranged in two grids: prev grid then target grid
// Position dimensions: [temporal, height, width]
decodePositions := computeVisualTokenPositions(
visualTokenIdx, posOffset, promptLen,
prevTokenH, prevTokenW, prevGridSize,
tokenH, tokenW,
)
// Forward through layers (decode with cache)
for j, layer := range m.Layers {
oldH := h
h = layer.ForwardWithCache(h, 1, posOffset, cfg.RMSNormEps, cache.Layers[j], decodePositions)
if j > 0 { // Don't free the embedding on first layer
oldH.Free()
}
}
// Eval h and new cache state
newCacheState := make([]*mlx.Array, 0, len(m.Layers)*2)
for _, lc := range cache.Layers {
newCacheState = append(newCacheState, lc.State()...)
}
mlx.Eval(append([]*mlx.Array{h}, newCacheState...)...)
// Free old cache state (now that new state is evaluated)
for _, arr := range oldCacheState {
if arr != nil {
arr.Free()
}
}
// Final norm
preNormH := h
h = m.FinalNorm.Forward(h, cfg.RMSNormEps)
preNormH.Free()
// Get logits (h is already [1, 1, hidden_size])
h = mlx.Reshape(h, 1, cfg.HiddenSize)
logits := mlx.Matmul(h, mlx.Transpose(m.LMHead, 1, 0))
h.Free()
// Sample next token
nextToken = sampleVisualToken(logits, temperature, topP, cfg, seed, &sampleCounter)
logits.Free()
posOffset++
visualTokenIdx++
// Periodically clear cache to release intermediate memory
if i%256 == 0 {
mlx.ClearCache()
}
}
if len(visualTokens) == 0 {
// Return at least one token to avoid empty tensor issues
visualTokens = append(visualTokens, 0)
}
return mlx.NewArrayInt32(visualTokens, []int32{1, int32(len(visualTokens))})
}
// computeVisualTokenPositions computes MRoPE position IDs for a visual token
// Returns [3][1] position IDs for temporal, height, and width dimensions
//
// MRoPE position encoding for GLM-Image visual tokens:
// - temporal: CONSTANT within each grid (= decode_pos at grid start)
// - height: decode_pos + row index within grid
// - width: decode_pos + column index within grid
//
// Between grids, decode_pos advances by max(grid_h, grid_w) to ensure
// sufficient positional separation.
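//
// Worked example (illustrative): with promptLen=32, prevH=prevW=16 (prevSize=256) and
// targetW=32, the prev grid starts at decode_pos 32 and the target grid at 32+16=48.
// The token at visualIdx=300 lands in the target grid (300-256=44, so row 1, col 12),
// giving positions [48, 49, 60] for (temporal, height, width).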
func computeVisualTokenPositions(
visualIdx int32, absPos int32, promptLen int32,
prevH, prevW, prevSize int32,
targetH, targetW int32,
) [][]int32 {
positions := make([][]int32, 3)
for dim := 0; dim < 3; dim++ {
positions[dim] = make([]int32, 1)
}
// First grid (prev grid) starts at decode_pos = promptLen
prevGridDecodePos := promptLen
// Second grid (target grid) starts after first grid
// next_pos = prev_decode_pos + max(prevH, prevW)
maxPrev := prevH
if prevW > maxPrev {
maxPrev = prevW
}
targetGridDecodePos := prevGridDecodePos + maxPrev
// Compute position IDs based on which grid the token is in
if visualIdx < prevSize {
// Token is in the prev grid (prev_token_h × prev_token_w)
row := visualIdx / prevW
col := visualIdx % prevW
// temporal is CONSTANT for all tokens in this grid
positions[0][0] = prevGridDecodePos
// height and width are relative to grid's decode_pos
positions[1][0] = prevGridDecodePos + row
positions[2][0] = prevGridDecodePos + col
} else {
// Token is in the target grid (token_h × token_w)
targetIdx := visualIdx - prevSize
row := targetIdx / targetW
col := targetIdx % targetW
// temporal is CONSTANT for all tokens in this grid
positions[0][0] = targetGridDecodePos
// height and width are relative to grid's decode_pos
positions[1][0] = targetGridDecodePos + row
positions[2][0] = targetGridDecodePos + col
}
_ = targetH // Kept in the signature for documentation; not needed by the computation
_ = absPos // No longer used - kept for API compatibility
return positions
}
// sampleVisualToken samples from the visual vocabulary using top-p (nucleus) sampling
// Note: for GLM-Image, greedy decoding is not used because it can produce repetitive outputs
// Returns a visual token ID in range [0, 16511] which directly indexes into the embedding table
// sampleCounter is incremented for each call to ensure different random values
func sampleVisualToken(logits *mlx.Array, temperature float32, topP float32, cfg *VisionLanguageConfig, seed int64, sampleCounter *int64) int32 {
// The LMHead outputs logits for visual tokens only (shape [1, 16512])
// Output index directly corresponds to vocab ID [0, 16511]
// No offset needed - the visual tokens are at vocab IDs [0, 16511]
visualLogits := logits
// Apply temperature
if temperature != 1.0 && temperature > 0 {
visualLogits = mlx.DivScalar(visualLogits, temperature)
}
// Apply softmax to get probabilities
probs := mlx.Softmax(visualLogits, -1)
mlx.Eval(probs)
// Get the sampled index using top-p sampling
// This directly gives us the vocab ID in [0, 16511]
// Special tokens: 16384 = BOS, 16385 = EOS
// Use seed + counter for reproducible but different random values
effectiveSeed := seed + *sampleCounter
*sampleCounter++
return sampleTopP(probs, topP, effectiveSeed)
}
// sampleTopP implements nucleus (top-p) sampling
// probs: [1, vocab_size] probability distribution
// topP: cumulative probability threshold (e.g., 0.75)
// seed: random seed for reproducible sampling
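//
// Worked example (illustrative): for sorted probs [0.5, 0.3, 0.15, 0.05] and topP=0.75, the
// cumulative sums are [0.5, 0.8, 0.95, 1.0]; the loop stops at index 1 (0.8 >= 0.75), so
// cutoffIdx=2 and totalProb=0.8. The renormalized truncated distribution is [0.625, 0.375],
// and a uniform draw r selects index 0 when r < 0.625, index 1 otherwise.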
func sampleTopP(probs *mlx.Array, topP float32, seed int64) int32 {
// Negate probs for descending sort (Argsort only does ascending)
negProbs := mlx.MulScalar(probs, -1)
sortedIndices := mlx.Argsort(negProbs, -1)
sortedProbs := mlx.TakeAlongAxis(probs, sortedIndices, -1)
cumProbs := mlx.Cumsum(sortedProbs, -1)
mlx.Eval(sortedIndices, sortedProbs, cumProbs)
// Find cutoff index where cumulative probability exceeds topP
probsData := sortedProbs.Data()
cumProbsData := cumProbs.Data()
indicesData := sortedIndices.DataInt32()
// Find the cutoff index and the total probability mass to keep (renormalized below)
var cutoffIdx int
var totalProb float32
for i, cp := range cumProbsData {
totalProb += probsData[i]
if cp >= topP {
cutoffIdx = i + 1 // Include this token
break
}
}
if cutoffIdx == 0 {
cutoffIdx = len(probsData) // Use all tokens if topP is very high
}
// Sample from the truncated distribution
// Renormalize the truncated probabilities
truncatedProbs := make([]float32, cutoffIdx)
for i := 0; i < cutoffIdx; i++ {
truncatedProbs[i] = probsData[i] / totalProb
}
// Sample using random number with provided seed for reproducibility
r := mlx.RandomUniform([]int32{1}, uint64(seed))
mlx.Eval(r)
randVal := r.Data()[0]
// Find the sampled token
var cumulative float32
for i := 0; i < cutoffIdx; i++ {
cumulative += truncatedProbs[i]
if randVal < cumulative {
return indicesData[i]
}
}
// Fallback to the last token in truncated set
return indicesData[cutoffIdx-1]
}
// Forward for GLMBlock
func (b *GLMBlock) Forward(x *mlx.Array, seqLen int32, eps float32) *mlx.Array {
return b.ForwardWithCache(x, seqLen, 0, eps, nil, nil)
}
// ForwardWithCache performs block forward with optional KV caching and MRoPE
// positionIDs: [3][L] - position indices for MRoPE (nil = use sequential positions)
func (b *GLMBlock) ForwardWithCache(x *mlx.Array, seqLen int32, posOffset int32, eps float32, kvcache cache.Cache, positionIDs [][]int32) *mlx.Array {
// Pre-attention norm
normed := b.InputLayerNorm.Forward(x, eps)
// Self-attention with RoPE/MRoPE and cache
attnOut := b.SelfAttn.ForwardWithCache(normed, seqLen, posOffset, kvcache, positionIDs)
// Post-attention norm (GLM-4 style)
attnOut = b.PostSelfAttnNorm.Forward(attnOut, eps)
// Residual connection
x = mlx.Add(x, attnOut)
// Post-attention layer norm
normed = b.PostAttnLayerNorm.Forward(x, eps)
// MLP
mlpOut := b.MLP.Forward(normed)
// Post-MLP norm
mlpOut = b.PostMLPLayerNorm.Forward(mlpOut, eps)
// Residual connection
x = mlx.Add(x, mlpOut)
return x
}
// Forward runs attention without a KV cache (convenience wrapper around ForwardWithCache)
func (attn *GLMAttention) Forward(x *mlx.Array, seqLen int32) *mlx.Array {
return attn.ForwardWithCache(x, seqLen, 0, nil, nil)
}
// ForwardWithCache performs attention with optional KV caching and MRoPE
// posOffset is the position offset for RoPE (0 for prefill, cached_len for decode)
// positionIDs: [3][L] - if nil, uses sequential positions for all dims (text mode)
// kvcache is updated in-place if provided
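//
// Shape sketch (illustrative, assuming hidden=4096, 32 query heads, 2 KV heads, head_dim=128):
// x [B, L, 4096] -> q [B, L, 32, 128] and k/v [B, L, 2, 128]; after transposing to
// [B, heads, L, 128] and merging with a cache of P past positions, k/v are [B, 2, P+L, 128],
// repeated 16x for GQA, and attention returns [B, 32, L, 128], flattened back to [B, L, 4096].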
func (attn *GLMAttention) ForwardWithCache(x *mlx.Array, seqLen int32, posOffset int32, kvcache cache.Cache, positionIDs [][]int32) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
// Q, K, V projections
q := mlx.Matmul(x, mlx.Transpose(attn.QProj, 1, 0))
k := mlx.Matmul(x, mlx.Transpose(attn.KProj, 1, 0))
v := mlx.Matmul(x, mlx.Transpose(attn.VProj, 1, 0))
// Add biases
if attn.QBias != nil {
q = mlx.Add(q, attn.QBias)
}
if attn.KBias != nil {
k = mlx.Add(k, attn.KBias)
}
if attn.VBias != nil {
v = mlx.Add(v, attn.VBias)
}
// Reshape to [B, L, nheads, head_dim]
q = mlx.Reshape(q, B, L, attn.NHeads, attn.HeadDim)
k = mlx.Reshape(k, B, L, attn.NKVHeads, attn.HeadDim)
v = mlx.Reshape(v, B, L, attn.NKVHeads, attn.HeadDim)
// Apply partial RoPE or MRoPE
rotaryDim := int32(float32(attn.HeadDim) * attn.PartialRotary)
if len(attn.MRoPESection) == 3 && positionIDs != nil {
// Use MRoPE with explicit position IDs
q = applyPartialMRoPE(q, positionIDs, rotaryDim, attn.RopeTheta, attn.MRoPESection)
k = applyPartialMRoPE(k, positionIDs, rotaryDim, attn.RopeTheta, attn.MRoPESection)
} else if len(attn.MRoPESection) == 3 {
// Use MRoPE with sequential positions (same for all dims - text mode)
seqPositions := make([][]int32, 3)
for dim := 0; dim < 3; dim++ {
seqPositions[dim] = make([]int32, L)
for i := int32(0); i < L; i++ {
seqPositions[dim][i] = i + posOffset
}
}
q = applyPartialMRoPE(q, seqPositions, rotaryDim, attn.RopeTheta, attn.MRoPESection)
k = applyPartialMRoPE(k, seqPositions, rotaryDim, attn.RopeTheta, attn.MRoPESection)
} else {
// Fallback to standard RoPE
q = applyPartialRoPEWithOffset(q, L, posOffset, rotaryDim, attn.RopeTheta)
k = applyPartialRoPEWithOffset(k, L, posOffset, rotaryDim, attn.RopeTheta)
}
// Transpose to [B, nheads, L, head_dim]
q = mlx.Transpose(q, 0, 2, 1, 3)
k = mlx.Transpose(k, 0, 2, 1, 3)
v = mlx.Transpose(v, 0, 2, 1, 3)
// Update cache and get full K, V for attention
if kvcache != nil {
k, v = kvcache.Update(k, v, int(L))
}
// Repeat KV for GQA
kExpanded := k
vExpanded := v
if attn.NKVHeads < attn.NHeads {
repeats := attn.NHeads / attn.NKVHeads
kExpanded = repeatKV(k, repeats)
vExpanded = repeatKV(v, repeats)
}
// Scaled dot-product attention with causal mask
out := mlx.ScaledDotProductAttention(q, kExpanded, vExpanded, attn.Scale, true)
// Transpose back [B, nheads, L, head_dim] -> [B, L, nheads, head_dim]
out = mlx.Transpose(out, 0, 2, 1, 3)
// Reshape to [B, L, hidden_size]
out = mlx.Reshape(out, B, L, attn.NHeads*attn.HeadDim)
// Output projection
out = mlx.Matmul(out, mlx.Transpose(attn.OProj, 1, 0))
return out
}
// applyPartialRoPE applies RoPE to only the first rotaryDim dimensions
func applyPartialRoPE(x *mlx.Array, seqLen int32, rotaryDim int32, theta float32) *mlx.Array {
return applyPartialRoPEWithOffset(x, seqLen, 0, rotaryDim, theta)
}
// applyPartialRoPEWithOffset applies RoPE with a position offset
func applyPartialRoPEWithOffset(x *mlx.Array, seqLen int32, posOffset int32, rotaryDim int32, theta float32) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
H := shape[2]
D := shape[3]
if rotaryDim <= 0 || rotaryDim > D {
rotaryDim = D
}
// Split into rotary and pass-through parts
xRot := mlx.Slice(x, []int32{0, 0, 0, 0}, []int32{B, L, H, rotaryDim})
xPass := mlx.Slice(x, []int32{0, 0, 0, rotaryDim}, []int32{B, L, H, D})
// Apply RoPE to rotary part with position offset
xRot = applyRoPEWithOffset(xRot, L, posOffset, theta)
// Concatenate back
return mlx.Concatenate([]*mlx.Array{xRot, xPass}, 3)
}
// applyPartialMRoPE applies Multi-dimensional RoPE (MRoPE) to the first rotaryDim dimensions
// positionIDs: [3, L] - position indices for each dimension (temporal, height, width)
// mrope_section: [8, 12, 12] - frequency pairs per dimension
// For text tokens: all 3 dimensions have the same sequential position
// For image tokens: temporal=seq_idx, height=row, width=col
func applyPartialMRoPE(x *mlx.Array, positionIDs [][]int32, rotaryDim int32, theta float32, mropeSection []int32) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
H := shape[2]
D := shape[3]
if rotaryDim <= 0 || rotaryDim > D {
rotaryDim = D
}
// Split into rotary and pass-through parts
xRot := mlx.Slice(x, []int32{0, 0, 0, 0}, []int32{B, L, H, rotaryDim})
xPass := mlx.Slice(x, []int32{0, 0, 0, rotaryDim}, []int32{B, L, H, D})
// Apply MRoPE to rotary part
xRot = applyMRoPE(xRot, positionIDs, theta, mropeSection)
// Concatenate back
return mlx.Concatenate([]*mlx.Array{xRot, xPass}, 3)
}
// applyMRoPE applies multi-dimensional rotary position embedding
// x: [B, L, H, D] where D is the rotary dimension
// positionIDs: [3][L] - positions for temporal, height, width dimensions
// mropeSection: [8, 12, 12] - frequency pairs per dimension
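//
// Frequency layout (illustrative): with mropeSection=[8, 12, 12] and rotary dim D=64, the
// half=32 frequency pairs split as temporal -> global indices 0..7, height -> 8..19,
// width -> 20..31, each scaled by 1/theta^(2*idx/D). The three angle blocks are concatenated
// to [L, 32] and duplicated to [L, 64] before taking cos/sin.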
func applyMRoPE(x *mlx.Array, positionIDs [][]int32, theta float32, mropeSection []int32) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
H := shape[2]
D := shape[3]
half := D / 2
// Validate mrope_section sums to half (number of frequency pairs)
var totalPairs int32
for _, s := range mropeSection {
totalPairs += s
}
if totalPairs != half {
// Fallback to standard RoPE if section doesn't match
return applyRoPEWithOffset(x, L, 0, theta)
}
// Build angles for each position dimension (matching Python's MRoPE approach)
// Python: compute freqs for all dims, then apply_mrope selects freq ranges, then duplicate
// Order: [temporal_8, height_12, width_12] -> duplicate -> [t8, h12, w12, t8, h12, w12]
angleVals := make([]*mlx.Array, 3)
freqOffset := int32(0)
for dim := 0; dim < 3; dim++ {
numPairs := mropeSection[dim]
if numPairs == 0 {
continue
}
// Compute inverse frequencies for this section
// Each dimension uses DIFFERENT frequency ranges:
// - Temporal: frequencies 0 to section[0]-1
// - Height: frequencies section[0] to section[0]+section[1]-1
// - Width: frequencies section[0]+section[1] to sum(section)-1
freqsArr := make([]float32, numPairs)
for i := int32(0); i < numPairs; i++ {
globalIdx := freqOffset + i
freqsArr[i] = float32(1.0 / math.Pow(float64(theta), float64(2*globalIdx)/float64(D)))
}
freqs := mlx.NewArray(freqsArr, []int32{numPairs})
// Position indices for this dimension
posArr := make([]float32, L)
for i := int32(0); i < L; i++ {
posArr[i] = float32(positionIDs[dim][i])
}
pos := mlx.NewArray(posArr, []int32{L})
// Compute angles: [L, numPairs] = outer(pos, freqs)
posExpanded := mlx.Reshape(pos, L, 1)
freqsExpanded := mlx.Reshape(freqs, 1, numPairs)
angleVals[dim] = mlx.Mul(posExpanded, freqsExpanded)
freqOffset += numPairs
}
// Concatenate all sections: [L, half] = [L, 32]
allAngles := mlx.Concatenate(angleVals, 1)
// Duplicate AFTER concatenation: [L, D] = [L, 64]
// This gives: [temporal_8, height_12, width_12, temporal_8, height_12, width_12]
allAngles = mlx.Concatenate([]*mlx.Array{allAngles, allAngles}, 1)
// Compute cos/sin
allCos := mlx.Cos(allAngles)
allSin := mlx.Sin(allAngles)
// Reshape for broadcasting: [1, L, 1, D] to match x [B, L, H, D]
allCos = mlx.Reshape(allCos, 1, L, 1, D)
allSin = mlx.Reshape(allSin, 1, L, 1, D)
// x_rotated = cat([-x_imag, x_real], dim=-1)
x1 := mlx.Slice(x, []int32{0, 0, 0, 0}, []int32{B, L, H, half}) // x_real
x2 := mlx.Slice(x, []int32{0, 0, 0, half}, []int32{B, L, H, D}) // x_imag
x2Neg := mlx.MulScalar(x2, -1) // -x_imag
xRotated := mlx.Concatenate([]*mlx.Array{x2Neg, x1}, 3) // [-x_imag, x_real]
// out = x * cos + x_rotated * sin
return mlx.Add(mlx.Mul(x, allCos), mlx.Mul(xRotated, allSin))
}
// applyRoPE applies rotary position embedding
func applyRoPE(x *mlx.Array, seqLen int32, theta float32) *mlx.Array {
return applyRoPEWithOffset(x, seqLen, 0, theta)
}
// applyRoPEWithOffset applies rotary position embedding with position offset
// Uses the split-half approach (matches diffusers GLM-Image with use_real_unbind_dim=-2)
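//
// Rotation sketch: for a pair (a, b) taken from positions i and i+half of the head dimension,
// the output is (a*cos - b*sin, b*cos + a*sin), i.e. the usual RoPE rotation applied in
// split-half layout rather than on interleaved pairs.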
func applyRoPEWithOffset(x *mlx.Array, seqLen int32, posOffset int32, theta float32) *mlx.Array {
shape := x.Shape()
B := shape[0]
L := shape[1]
H := shape[2]
D := shape[3]
half := D / 2
// Compute inverse frequencies: 1 / (theta^(2i/d))
freqsArr := make([]float32, half)
for i := int32(0); i < half; i++ {
freqsArr[i] = float32(1.0 / math.Pow(float64(theta), float64(2*i)/float64(D)))
}
freqs := mlx.NewArray(freqsArr, []int32{half})
// Position indices with offset
posArr := make([]float32, L)
for i := int32(0); i < L; i++ {
posArr[i] = float32(i + posOffset)
}
pos := mlx.NewArray(posArr, []int32{L})
// Compute angles: [L, half] = outer(pos, freqs)
posExpanded := mlx.Reshape(pos, L, 1)
freqsExpanded := mlx.Reshape(freqs, 1, half)
angles := mlx.Mul(posExpanded, freqsExpanded)
// Duplicate angles to match diffusers: cat([angles, angles], dim=-1) -> [L, D]
anglesDup := mlx.Concatenate([]*mlx.Array{angles, angles}, 1)
// Cos and sin: [L, 1, D] for broadcasting to [B, L, H, D]
cosVals := mlx.Cos(anglesDup)
sinVals := mlx.Sin(anglesDup)
cosVals = mlx.Reshape(cosVals, L, 1, D)
sinVals = mlx.Reshape(sinVals, L, 1, D)
// x_rotated = cat([-x_imag, x_real], dim=-1) where x_real=x[..., :half], x_imag=x[..., half:]
x1 := mlx.Slice(x, []int32{0, 0, 0, 0}, []int32{B, L, H, half}) // x_real
x2 := mlx.Slice(x, []int32{0, 0, 0, half}, []int32{B, L, H, D}) // x_imag
x2Neg := mlx.MulScalar(x2, -1) // -x_imag
xRotated := mlx.Concatenate([]*mlx.Array{x2Neg, x1}, 3) // [-x_imag, x_real]
// out = x * cos + x_rotated * sin
return mlx.Add(mlx.Mul(x, cosVals), mlx.Mul(xRotated, sinVals))
}
// repeatKV repeats key/value heads for GQA
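// Example (illustrative): with 2 KV heads repeated 16x, [1, 2, L, 128] expands to
// [1, 2, 1, L, 128], tiles to [1, 2, 16, L, 128], and reshapes to [1, 32, L, 128].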
func repeatKV(x *mlx.Array, repeats int32) *mlx.Array {
if repeats == 1 {
return x
}
shape := x.Shape()
// x: [B, nkvheads, L, head_dim]
x = mlx.ExpandDims(x, 2)
// x: [B, nkvheads, 1, L, head_dim]
x = mlx.Tile(x, []int32{1, 1, repeats, 1, 1})
// x: [B, nkvheads, repeats, L, head_dim]
return mlx.Reshape(x, shape[0], shape[1]*repeats, shape[2], shape[3])
}
// Forward for GLMMLP (fused gate_up SwiGLU)
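// Sketch (assuming GateUpProj is stored as [2*intermediate, hidden]): gateUp is
// [B, L, 2*intermediate]; the first half is the gate, the second half the up projection,
// and silu(gate) * up is mapped back to hidden size by DownProj.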
func (m *GLMMLP) Forward(x *mlx.Array) *mlx.Array {
// gate_up_proj outputs [gate, up] concatenated
gateUp := mlx.Matmul(x, mlx.Transpose(m.GateUpProj, 1, 0))
shape := gateUp.Shape()
halfDim := shape[len(shape)-1] / 2
// Split into gate and up
gate := mlx.Slice(gateUp, []int32{0, 0, 0}, []int32{shape[0], shape[1], halfDim})
up := mlx.Slice(gateUp, []int32{0, 0, halfDim}, []int32{shape[0], shape[1], shape[2]})
// SwiGLU: silu(gate) * up
gate = mlx.SiLU(gate)
h := mlx.Mul(gate, up)
// Down projection
return mlx.Matmul(h, mlx.Transpose(m.DownProj, 1, 0))
}

View File

@@ -19,9 +19,15 @@ import (
"github.com/ollama/ollama/x/imagegen"
"github.com/ollama/ollama/x/imagegen/mlx"
"github.com/ollama/ollama/x/imagegen/models/glm_image"
"github.com/ollama/ollama/x/imagegen/models/zimage"
)
// ImageModel is the interface for image generation models
type ImageModel interface {
GenerateImage(ctx context.Context, prompt string, width, height int32, steps int, seed int64) (*mlx.Array, error)
}
// Request is the image generation request format
type Request struct {
Prompt string `json:"prompt"`
@@ -41,8 +47,9 @@ type Response struct {
// Server holds the model and handles requests
type Server struct {
mu sync.Mutex
model *zimage.Model
model ImageModel
modelName string
modelType string // pipeline class name, e.g. "ZImagePipeline" or "GlmImagePipeline"
}
// Execute is the entry point for the image runner subprocess
@@ -72,15 +79,35 @@ func Execute(args []string) error {
requiredMemory/(1024*1024*1024), availableMemory/(1024*1024*1024))
}
// Load model
model := &zimage.Model{}
if err := model.Load(*modelName); err != nil {
return fmt.Errorf("failed to load model: %w", err)
// Detect model type and load appropriate model
modelType, err := detectModelType(*modelName)
if err != nil {
return fmt.Errorf("failed to detect model type: %w", err)
}
var model ImageModel
switch modelType {
case "GlmImagePipeline":
slog.Info("loading GLM-Image model")
m := &glm_image.Model{}
if err := m.Load(*modelName); err != nil {
return fmt.Errorf("failed to load GLM-Image model: %w", err)
}
model = m
default:
// Default to zimage for ZImagePipeline, FluxPipeline, and unknown types
slog.Info("loading Z-Image model")
m := &zimage.Model{}
if err := m.Load(*modelName); err != nil {
return fmt.Errorf("failed to load Z-Image model: %w", err)
}
model = m
}
server := &Server{
model: model,
modelName: *modelName,
modelType: modelType,
}
// Set up HTTP handlers
@@ -144,7 +171,13 @@ func (s *Server) completionHandler(w http.ResponseWriter, r *http.Request) {
req.Height = 1024
}
if req.Steps <= 0 {
req.Steps = 9
// Default steps depend on model type
switch s.modelType {
case "GlmImagePipeline":
req.Steps = 50 // GLM-Image default
default:
req.Steps = 9 // Z-Image turbo default
}
}
if req.Seed <= 0 {
req.Seed = time.Now().UnixNano()
@@ -159,25 +192,9 @@ func (s *Server) completionHandler(w http.ResponseWriter, r *http.Request) {
return
}
// Generate image
// Generate image using interface method
ctx := r.Context()
img, err := s.model.GenerateFromConfig(ctx, &zimage.GenerateConfig{
Prompt: req.Prompt,
Width: req.Width,
Height: req.Height,
Steps: req.Steps,
Seed: req.Seed,
Progress: func(step, total int) {
resp := Response{
Content: fmt.Sprintf("\rGenerating: step %d/%d", step, total),
Done: false,
}
data, _ := json.Marshal(resp)
w.Write(data)
w.Write([]byte("\n"))
flusher.Flush()
},
})
img, err := s.model.GenerateImage(ctx, req.Prompt, req.Width, req.Height, req.Steps, req.Seed)
if err != nil {
// Don't send error for cancellation
@@ -216,3 +233,35 @@ func (s *Server) completionHandler(w http.ResponseWriter, r *http.Request) {
w.Write([]byte("\n"))
flusher.Flush()
}
// detectModelType reads the model manifest and returns the pipeline class name
func detectModelType(modelName string) (string, error) {
manifest, err := imagegen.LoadManifest(modelName)
if err != nil {
return "", err
}
data, err := manifest.ReadConfig("model_index.json")
if err != nil {
return "ZImagePipeline", nil // Default to Z-Image
}
// Try both _class_name (diffusers format) and architecture (ollama format)
var index struct {
ClassName string `json:"_class_name"`
Architecture string `json:"architecture"`
}
if err := json.Unmarshal(data, &index); err != nil {
return "ZImagePipeline", nil
}
// Prefer _class_name, fall back to architecture
className := index.ClassName
if className == "" {
className = index.Architecture
}
if className == "" {
return "ZImagePipeline", nil
}
return className, nil
}
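// Example (illustrative) model_index.json values this function maps to a pipeline type:
//   {"_class_name": "GlmImagePipeline", ...}  -> "GlmImagePipeline"
//   {"architecture": "ZImagePipeline", ...}   -> "ZImagePipeline"
//   missing or unparsable config              -> "ZImagePipeline" (default)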