Instructions to use vidfom/Ltx-3 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- llama-cpp-python
How to use vidfom/Ltx-3 with llama-cpp-python:
# !pip install llama-cpp-python from llama_cpp import Llama llm = Llama.from_pretrained( repo_id="vidfom/Ltx-3", filename="ComfyUI/models/text_encoders/gemma-3-12b-it-qat-UD-Q4_K_XL.gguf", )
llm.create_chat_completion( messages = "No input example has been defined for this model task." )
- Notebooks
- Google Colab
- Kaggle
- Local Apps
- llama.cpp
How to use vidfom/Ltx-3 with llama.cpp:
Install from brew
brew install llama.cpp # Start a local OpenAI-compatible server with a web UI: llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL # Run inference directly in the terminal: llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL
Install from WinGet (Windows)
winget install llama.cpp # Start a local OpenAI-compatible server with a web UI: llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL # Run inference directly in the terminal: llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL
Use pre-built binary
# Download pre-built binary from: # https://github.com/ggerganov/llama.cpp/releases # Start a local OpenAI-compatible server with a web UI: ./llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL # Run inference directly in the terminal: ./llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL
Build from source code
git clone https://github.com/ggerganov/llama.cpp.git cd llama.cpp cmake -B build cmake --build build -j --target llama-server llama-cli # Start a local OpenAI-compatible server with a web UI: ./build/bin/llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL # Run inference directly in the terminal: ./build/bin/llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL
Use Docker
docker model run hf.co/vidfom/Ltx-3:UD-Q4_K_XL
- LM Studio
- Jan
- Ollama
How to use vidfom/Ltx-3 with Ollama:
ollama run hf.co/vidfom/Ltx-3:UD-Q4_K_XL
- Unsloth Studio new
How to use vidfom/Ltx-3 with Unsloth Studio:
Install Unsloth Studio (macOS, Linux, WSL)
curl -fsSL https://unsloth.ai/install.sh | sh # Run unsloth studio unsloth studio -H 0.0.0.0 -p 8888 # Then open http://localhost:8888 in your browser # Search for vidfom/Ltx-3 to start chatting
Install Unsloth Studio (Windows)
irm https://unsloth.ai/install.ps1 | iex # Run unsloth studio unsloth studio -H 0.0.0.0 -p 8888 # Then open http://localhost:8888 in your browser # Search for vidfom/Ltx-3 to start chatting
Using HuggingFace Spaces for Unsloth
# No setup required # Open https://huggingface.co/spaces/unsloth/studio in your browser # Search for vidfom/Ltx-3 to start chatting
- Docker Model Runner
How to use vidfom/Ltx-3 with Docker Model Runner:
docker model run hf.co/vidfom/Ltx-3:UD-Q4_K_XL
- Lemonade
How to use vidfom/Ltx-3 with Lemonade:
Pull the model
# Download Lemonade from https://lemonade-server.ai/ lemonade pull vidfom/Ltx-3:UD-Q4_K_XL
Run and chat with the model
lemonade run user.Ltx-3-UD-Q4_K_XL
List all available models
lemonade list
| import torch | |
| from torch import Tensor | |
| from .flux.layers import DoubleStreamBlockIPA, SingleStreamBlockIPA | |
| from comfy.ldm.flux.layers import timestep_embedding | |
| from types import MethodType | |
| def FluxUpdateModules(bi, ip_attn_procs, image_emb): | |
| flux_model = bi.model | |
| bi.add_object_patch(f"diffusion_model.forward_orig", MethodType(forward_orig_ipa, flux_model.diffusion_model)) | |
| for i, original in enumerate(flux_model.diffusion_model.double_blocks): | |
| patch_name = f"double_blocks.{i}" | |
| maybe_patched_layer = bi.get_model_object(f"diffusion_model.{patch_name}") | |
| # if there's already a patch there, collect its adapters and replace it | |
| procs = [ip_attn_procs[patch_name]] | |
| embs = [image_emb] | |
| if isinstance(maybe_patched_layer, DoubleStreamBlockIPA): | |
| procs = maybe_patched_layer.ip_adapter + procs | |
| embs = maybe_patched_layer.image_emb + embs | |
| # initial ipa models with image embeddings | |
| new_layer = DoubleStreamBlockIPA(original, procs, embs) | |
| # for example, ComfyUI internally uses model.add_patches to add loras | |
| bi.add_object_patch(f"diffusion_model.{patch_name}", new_layer) | |
| for i, original in enumerate(flux_model.diffusion_model.single_blocks): | |
| patch_name = f"single_blocks.{i}" | |
| maybe_patched_layer = bi.get_model_object(f"diffusion_model.{patch_name}") | |
| procs = [ip_attn_procs[patch_name]] | |
| embs = [image_emb] | |
| if isinstance(maybe_patched_layer, SingleStreamBlockIPA): | |
| procs = maybe_patched_layer.ip_adapter + procs | |
| embs = maybe_patched_layer.image_emb + embs | |
| # initial ipa models with image embeddings | |
| new_layer = SingleStreamBlockIPA(original, procs, embs) | |
| bi.add_object_patch(f"diffusion_model.{patch_name}", new_layer) | |
| def is_model_pathched(model): | |
| def test(mod): | |
| if isinstance(mod, DoubleStreamBlockIPA): | |
| return True | |
| else: | |
| for p in mod.children(): | |
| if test(p): | |
| return True | |
| return False | |
| result = test(model) | |
| return result | |
| def forward_orig_ipa( | |
| self, | |
| img: Tensor, | |
| img_ids: Tensor, | |
| txt: Tensor, | |
| txt_ids: Tensor, | |
| timesteps: Tensor, | |
| y: Tensor, | |
| guidance: Tensor|None = None, | |
| control=None, | |
| transformer_options={}, | |
| attn_mask: Tensor = None, | |
| ) -> Tensor: | |
| patches_replace = transformer_options.get("patches_replace", {}) | |
| if img.ndim != 3 or txt.ndim != 3: | |
| raise ValueError("Input img and txt tensors must have 3 dimensions.") | |
| # running on sequences img | |
| img = self.img_in(img) | |
| vec = self.time_in(timestep_embedding(timesteps, 256).to(img.dtype)) | |
| if self.params.guidance_embed: | |
| if guidance is None: | |
| raise ValueError("Didn't get guidance strength for guidance distilled model.") | |
| vec = vec + self.guidance_in(timestep_embedding(guidance, 256).to(img.dtype)) | |
| vec = vec + self.vector_in(y[:,:self.params.vec_in_dim]) | |
| txt = self.txt_in(txt) | |
| ids = torch.cat((txt_ids, img_ids), dim=1) | |
| pe = self.pe_embedder(ids) | |
| blocks_replace = patches_replace.get("dit", {}) | |
| for i, block in enumerate(self.double_blocks): | |
| if ("double_block", i) in blocks_replace: | |
| def block_wrap(args): | |
| out = {} | |
| if isinstance(block, DoubleStreamBlockIPA): # ipadaper | |
| out["img"], out["txt"] = block(img=args["img"], txt=args["txt"], vec=args["vec"], pe=args["pe"], t=args["timesteps"], attn_mask=args.get("attn_mask")) | |
| else: | |
| out["img"], out["txt"] = block(img=args["img"], txt=args["txt"], vec=args["vec"], pe=args["pe"], attn_mask=args.get("attn_mask")) | |
| return out | |
| out = blocks_replace[("double_block", i)]({"img": img, "txt": txt, "vec": vec, "pe": pe, "timesteps": timesteps, "attn_mask": attn_mask}, {"original_block": block_wrap}) | |
| txt = out["txt"] | |
| img = out["img"] | |
| else: | |
| if isinstance(block, DoubleStreamBlockIPA): # ipadaper | |
| img, txt = block(img=img, txt=txt, vec=vec, pe=pe, t=timesteps, attn_mask=attn_mask) | |
| else: | |
| img, txt = block(img=img, txt=txt, vec=vec, pe=pe, attn_mask=attn_mask) | |
| if control is not None: # Controlnet | |
| control_i = control.get("input") | |
| if i < len(control_i): | |
| add = control_i[i] | |
| if add is not None: | |
| img += add | |
| img = torch.cat((txt, img), 1) | |
| for i, block in enumerate(self.single_blocks): | |
| if ("single_block", i) in blocks_replace: | |
| def block_wrap(args): | |
| out = {} | |
| if isinstance(block, SingleStreamBlockIPA): # ipadaper | |
| out["img"] = block(args["img"], vec=args["vec"], pe=args["pe"], t=args["timesteps"], attn_mask=args.get("attn_mask")) | |
| else: | |
| out["img"] = block(args["img"], vec=args["vec"], pe=args["pe"], attn_mask=args.get("attn_mask")) | |
| return out | |
| out = blocks_replace[("single_block", i)]({"img": img, "vec": vec, "pe": pe, "timesteps": timesteps, "attn_mask": attn_mask}, {"original_block": block_wrap}) | |
| img = out["img"] | |
| else: | |
| if isinstance(block, SingleStreamBlockIPA): # ipadaper | |
| img = block(img, vec=vec, pe=pe, t=timesteps, attn_mask=attn_mask) | |
| else: | |
| img = block(img, vec=vec, pe=pe, attn_mask=attn_mask) | |
| if control is not None: # Controlnet | |
| control_o = control.get("output") | |
| if i < len(control_o): | |
| add = control_o[i] | |
| if add is not None: | |
| img[:, txt.shape[1] :, ...] += add | |
| img = img[:, txt.shape[1] :, ...] | |
| img = self.final_layer(img, vec) # (N, T, patch_size ** 2 * out_channels) | |
| return img |