From 11c5fd677d244a88e4cd262e4a8e81531335b5ed Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto <mudler@localai.io>
Date: Mon, 25 May 2026 19:33:55 +0000
Subject: [PATCH] fix(gallery/ltx-2.3): add vae_decode_only:false for i2v /
 flf2v
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

LTX-2.3 i2v inference fails inside generate_video with:

  [ERROR] LTXAV image conditioning requires VAE encoder weights;
  create the context with vae_decode_only=false

Without vae_decode_only:false in the options block, gosd.cpp creates
the sd_ctx with VAE encoder weights freed, so latent encoding of the
init_image is impossible. Adding the option mirrors what we already
do for Wan i2v entries.

Affects all six LTX-2.3 entries (dev/distilled × UD-Q4_K_M, Q4_K_M,
Q8_0). T2V wasn't impacted by the missing option since it has no
init image to encode, which is why the earlier T2V smoke test passed.

Assisted-by: Claude:claude-opus-4-7
---
 gallery/index.yaml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/gallery/index.yaml b/gallery/index.yaml
index 08d410ac4..88871d300 100644
--- a/gallery/index.yaml
+++ b/gallery/index.yaml
@@ -30845,6 +30845,7 @@
       model: ltx-2.3-22b-dev-UD-Q4_K_M.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-dev_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors
@@ -30877,6 +30878,7 @@
       model: ltx-2.3-22b-dev-Q4_K_M.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-dev_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors
@@ -30909,6 +30911,7 @@
       model: ltx-2.3-22b-dev-Q8_0.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-dev_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors
@@ -30969,6 +30972,7 @@
       model: ltx-2.3-22b-distilled-UD-Q4_K_M.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors
@@ -31000,6 +31004,7 @@
       model: ltx-2.3-22b-distilled-Q4_K_M.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors
@@ -31031,6 +31036,7 @@
       model: ltx-2.3-22b-distilled-Q8_0.gguf
     options:
       - diffusion_model
+      - "vae_decode_only:false"
       - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf
       - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors
       - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors