From 088205339ccaf1c17c7360b2404a2699ec12aa56 Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Thu, 12 Feb 2026 18:13:03 +0100 Subject: [PATCH] chore(model gallery): add voxcpm, whisperx, moonshine-tiny (#8534) Signed-off-by: Ettore Di Giacinto --- gallery/index.yaml | 60 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 60 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index bf47fcb8f..7f4edfaf4 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -52,6 +52,66 @@ - filename: voxtral-model/tekken.json uri: https://huggingface.co/mistralai/Voxtral-Mini-4B-Realtime-2602/resolve/main/tekken.json sha256: 8434af1d39eba99f0ef46cf1450bf1a63fa941a26933a1ef5dbbf4adf0d00e44 +- name: moonshine-tiny + license: apache-2.0 + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + description: | + Moonshine Tiny is a lightweight speech-to-text model optimized for fast transcription. It is designed for efficient on-device ASR with high accuracy relative to its size. + urls: + - https://github.com/moonshine-ai/moonshine + tags: + - stt + - speech-to-text + - asr + - audio-transcription + - cpu + - gpu + overrides: + backend: moonshine + known_usecases: + - transcript + parameters: + model: moonshine/tiny +- name: whisperx-tiny + license: mit + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + description: | + WhisperX Tiny is a fast and accurate speech recognition model with speaker diarization capabilities. Built on OpenAI's Whisper with additional features for alignment and speaker segmentation. + urls: + - https://github.com/m-bain/whisperX + tags: + - stt + - speech-to-text + - asr + - audio-transcription + - speaker-diarization + - cpu + - gpu + overrides: + backend: whisperx + known_usecases: + - transcript + parameters: + model: tiny +- name: voxcpm-1.5 + license: apache-2.0 + url: "github:mudler/LocalAI/gallery/virtual.yaml@master" + description: | + VoxCPM 1.5 is an end-to-end text-to-speech (TTS) model from ModelBest. It features zero-shot voice cloning and high-quality speech synthesis capabilities. + urls: + - https://huggingface.co/openbmb/VoxCPM1.5 + tags: + - tts + - text-to-speech + - voice-cloning + - cpu + - gpu + overrides: + backend: voxcpm + known_usecases: + - tts + parameters: + model: openbmb/VoxCPM1.5 - name: "ace-step-turbo" license: mit tags: