From 11c5fd677d244a88e4cd262e4a8e81531335b5ed Mon Sep 17 00:00:00 2001 From: Ettore Di Giacinto Date: Mon, 25 May 2026 19:33:55 +0000 Subject: [PATCH] fix(gallery/ltx-2.3): add vae_decode_only:false for i2v / flf2v MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit LTX-2.3 i2v inference fails inside generate_video with: [ERROR] LTXAV image conditioning requires VAE encoder weights; create the context with vae_decode_only=false Without vae_decode_only:false in the options block, gosd.cpp creates the sd_ctx with VAE encoder weights freed, so latent encoding of the init_image is impossible. Adding the option mirrors what we already do for Wan i2v entries. Affects all six LTX-2.3 entries (dev/distilled × UD-Q4_K_M, Q4_K_M, Q8_0). T2V wasn't impacted by the missing option since it has no init image to encode, which is why the earlier T2V smoke test passed. Assisted-by: Claude:claude-opus-4-7 --- gallery/index.yaml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/gallery/index.yaml b/gallery/index.yaml index 08d410ac4..88871d300 100644 --- a/gallery/index.yaml +++ b/gallery/index.yaml @@ -30845,6 +30845,7 @@ model: ltx-2.3-22b-dev-UD-Q4_K_M.gguf options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-dev_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors @@ -30877,6 +30878,7 @@ model: ltx-2.3-22b-dev-Q4_K_M.gguf options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-dev_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors @@ -30909,6 +30911,7 @@ model: ltx-2.3-22b-dev-Q8_0.gguf options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-dev_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-dev_audio_vae.safetensors @@ -30969,6 +30972,7 @@ model: ltx-2.3-22b-distilled-UD-Q4_K_M.gguf 
options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors @@ -31000,6 +31004,7 @@ model: ltx-2.3-22b-distilled-Q4_K_M.gguf options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors @@ -31031,6 +31036,7 @@ model: ltx-2.3-22b-distilled-Q8_0.gguf options: - diffusion_model + - "vae_decode_only:false" - llm_path:gemma-3-12b-it-qat-UD-Q4_K_XL.gguf - vae_path:ltx-2.3-22b-distilled_video_vae.safetensors - audio_vae_path:ltx-2.3-22b-distilled_audio_vae.safetensors