Instructions to use vidfom/Ltx-3 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use vidfom/Ltx-3 with llama-cpp-python:

# !pip install llama-cpp-python

from llama_cpp import Llama

llm = Llama.from_pretrained(
	repo_id="vidfom/Ltx-3",
	filename="ComfyUI/models/text_encoders/gemma-3-12b-it-qat-UD-Q4_K_XL.gguf",
)

llm.create_chat_completion(
	messages = "No input example has been defined for this model task."
)

Notebooks
Google Colab
Kaggle
Local Apps

llama.cpp

How to use vidfom/Ltx-3 with llama.cpp:

Install from brew

brew install llama.cpp
# Start a local OpenAI-compatible server with a web UI:
llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL
# Run inference directly in the terminal:
llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL

Install from WinGet (Windows)

winget install llama.cpp
# Start a local OpenAI-compatible server with a web UI:
llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL
# Run inference directly in the terminal:
llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL

Use pre-built binary

# Download pre-built binary from:
# https://github.com/ggerganov/llama.cpp/releases
# Start a local OpenAI-compatible server with a web UI:
./llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL
# Run inference directly in the terminal:
./llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL

Build from source code

git clone https://github.com/ggerganov/llama.cpp.git
cd llama.cpp
cmake -B build
cmake --build build -j --target llama-server llama-cli
# Start a local OpenAI-compatible server with a web UI:
./build/bin/llama-server -hf vidfom/Ltx-3:UD-Q4_K_XL
# Run inference directly in the terminal:
./build/bin/llama-cli -hf vidfom/Ltx-3:UD-Q4_K_XL

Use Docker

docker model run hf.co/vidfom/Ltx-3:UD-Q4_K_XL

LM Studio
Jan
Ollama
How to use vidfom/Ltx-3 with Ollama:
```
ollama run hf.co/vidfom/Ltx-3:UD-Q4_K_XL
```

Unsloth Studio new

How to use vidfom/Ltx-3 with Unsloth Studio:

Install Unsloth Studio (macOS, Linux, WSL)

curl -fsSL https://unsloth.ai/install.sh | sh
# Run unsloth studio
unsloth studio -H 0.0.0.0 -p 8888
# Then open http://localhost:8888 in your browser
# Search for vidfom/Ltx-3 to start chatting

Install Unsloth Studio (Windows)

irm https://unsloth.ai/install.ps1 | iex
# Run unsloth studio
unsloth studio -H 0.0.0.0 -p 8888
# Then open http://localhost:8888 in your browser
# Search for vidfom/Ltx-3 to start chatting

Using HuggingFace Spaces for Unsloth

# No setup required
# Open https://huggingface.co/spaces/unsloth/studio in your browser
# Search for vidfom/Ltx-3 to start chatting

Docker Model Runner
How to use vidfom/Ltx-3 with Docker Model Runner:
```
docker model run hf.co/vidfom/Ltx-3:UD-Q4_K_XL
```

Lemonade

How to use vidfom/Ltx-3 with Lemonade:

Pull the model

# Download Lemonade from https://lemonade-server.ai/
lemonade pull vidfom/Ltx-3:UD-Q4_K_XL

Run and chat with the model

lemonade run user.Ltx-3-UD-Q4_K_XL

List all available models

lemonade list

Ltx-3 / ComfyUI /comfy_execution /caching.py

vidfom

Upload folder using huggingface_hub

e00eceb verified about 2 months ago

raw

history blame contribute delete

20.7 kB

	import asyncio
	import bisect
	import itertools
	import psutil
	import time
	import torch
	from typing import Sequence, Mapping, Dict
	from comfy_execution.graph import DynamicPrompt
	from abc import ABC, abstractmethod

	import nodes

	from comfy_execution.graph_utils import is_link

	NODE_CLASS_CONTAINS_UNIQUE_ID: Dict[str, bool] = {}


	def include_unique_id_in_input(class_type: str) -> bool:
	if class_type in NODE_CLASS_CONTAINS_UNIQUE_ID:
	return NODE_CLASS_CONTAINS_UNIQUE_ID[class_type]
	class_def = nodes.NODE_CLASS_MAPPINGS[class_type]
	NODE_CLASS_CONTAINS_UNIQUE_ID[class_type] = "UNIQUE_ID" in class_def.INPUT_TYPES().get("hidden", {}).values()
	return NODE_CLASS_CONTAINS_UNIQUE_ID[class_type]

	class CacheKeySet(ABC):
	def __init__(self, dynprompt, node_ids, is_changed_cache):
	self.keys = {}
	self.subcache_keys = {}

	@abstractmethod
	async def add_keys(self, node_ids):
	raise NotImplementedError()

	def all_node_ids(self):
	return set(self.keys.keys())

	def get_used_keys(self):
	return self.keys.values()

	def get_used_subcache_keys(self):
	return self.subcache_keys.values()

	def get_data_key(self, node_id):
	return self.keys.get(node_id, None)

	def get_subcache_key(self, node_id):
	return self.subcache_keys.get(node_id, None)

	class Unhashable:
	def __init__(self):
	self.value = float("NaN")

	def to_hashable(obj):
	# So that we don't infinitely recurse since frozenset and tuples
	# are Sequences.
	if isinstance(obj, (int, float, str, bool, bytes, type(None))):
	return obj
	elif isinstance(obj, Mapping):
	return frozenset([(to_hashable(k), to_hashable(v)) for k, v in sorted(obj.items())])
	elif isinstance(obj, Sequence):
	return frozenset(zip(itertools.count(), [to_hashable(i) for i in obj]))
	else:
	# TODO - Support other objects like tensors?
	return Unhashable()

	class CacheKeySetID(CacheKeySet):
	def __init__(self, dynprompt, node_ids, is_changed_cache):
	super().__init__(dynprompt, node_ids, is_changed_cache)
	self.dynprompt = dynprompt

	async def add_keys(self, node_ids):
	for node_id in node_ids:
	if node_id in self.keys:
	continue
	if not self.dynprompt.has_node(node_id):
	continue
	node = self.dynprompt.get_node(node_id)
	self.keys[node_id] = (node_id, node["class_type"])
	self.subcache_keys[node_id] = (node_id, node["class_type"])

	class CacheKeySetInputSignature(CacheKeySet):
	def __init__(self, dynprompt, node_ids, is_changed_cache):
	super().__init__(dynprompt, node_ids, is_changed_cache)
	self.dynprompt = dynprompt
	self.is_changed_cache = is_changed_cache

	def include_node_id_in_input(self) -> bool:
	return False

	async def add_keys(self, node_ids):
	for node_id in node_ids:
	if node_id in self.keys:
	continue
	if not self.dynprompt.has_node(node_id):
	continue
	node = self.dynprompt.get_node(node_id)
	self.keys[node_id] = await self.get_node_signature(self.dynprompt, node_id)
	self.subcache_keys[node_id] = (node_id, node["class_type"])

	async def get_node_signature(self, dynprompt, node_id):
	signature = []
	ancestors, order_mapping = self.get_ordered_ancestry(dynprompt, node_id)
	signature.append(await self.get_immediate_node_signature(dynprompt, node_id, order_mapping))
	for ancestor_id in ancestors:
	signature.append(await self.get_immediate_node_signature(dynprompt, ancestor_id, order_mapping))
	return to_hashable(signature)

	async def get_immediate_node_signature(self, dynprompt, node_id, ancestor_order_mapping):
	if not dynprompt.has_node(node_id):
	# This node doesn't exist -- we can't cache it.
	return [float("NaN")]
	node = dynprompt.get_node(node_id)
	class_type = node["class_type"]
	class_def = nodes.NODE_CLASS_MAPPINGS[class_type]
	signature = [class_type, await self.is_changed_cache.get(node_id)]
	if self.include_node_id_in_input() or (hasattr(class_def, "NOT_IDEMPOTENT") and class_def.NOT_IDEMPOTENT) or include_unique_id_in_input(class_type):
	signature.append(node_id)
	inputs = node["inputs"]
	for key in sorted(inputs.keys()):
	if is_link(inputs[key]):
	(ancestor_id, ancestor_socket) = inputs[key]
	ancestor_index = ancestor_order_mapping[ancestor_id]
	signature.append((key,("ANCESTOR", ancestor_index, ancestor_socket)))
	else:
	signature.append((key, inputs[key]))
	return signature

	# This function returns a list of all ancestors of the given node. The order of the list is
	# deterministic based on which specific inputs the ancestor is connected by.
	def get_ordered_ancestry(self, dynprompt, node_id):
	ancestors = []
	order_mapping = {}
	self.get_ordered_ancestry_internal(dynprompt, node_id, ancestors, order_mapping)
	return ancestors, order_mapping

	def get_ordered_ancestry_internal(self, dynprompt, node_id, ancestors, order_mapping):
	if not dynprompt.has_node(node_id):
	return
	inputs = dynprompt.get_node(node_id)["inputs"]
	input_keys = sorted(inputs.keys())
	for key in input_keys:
	if is_link(inputs[key]):
	ancestor_id = inputs[key][0]
	if ancestor_id not in order_mapping:
	ancestors.append(ancestor_id)
	order_mapping[ancestor_id] = len(ancestors) - 1
	self.get_ordered_ancestry_internal(dynprompt, ancestor_id, ancestors, order_mapping)

	class BasicCache:
	def __init__(self, key_class, enable_providers=False):
	self.key_class = key_class
	self.initialized = False
	self.enable_providers = enable_providers
	self.dynprompt: DynamicPrompt
	self.cache_key_set: CacheKeySet
	self.cache = {}
	self.subcaches = {}
	self._pending_store_tasks: set = set()

	async def set_prompt(self, dynprompt, node_ids, is_changed_cache):
	self.dynprompt = dynprompt
	self.cache_key_set = self.key_class(dynprompt, node_ids, is_changed_cache)
	await self.cache_key_set.add_keys(node_ids)
	self.is_changed_cache = is_changed_cache
	self.initialized = True

	def all_node_ids(self):
	assert self.initialized
	node_ids = self.cache_key_set.all_node_ids()
	for subcache in self.subcaches.values():
	node_ids = node_ids.union(subcache.all_node_ids())
	return node_ids

	def _clean_cache(self):
	preserve_keys = set(self.cache_key_set.get_used_keys())
	to_remove = []
	for key in self.cache:
	if key not in preserve_keys:
	to_remove.append(key)
	for key in to_remove:
	del self.cache[key]

	def _clean_subcaches(self):
	preserve_subcaches = set(self.cache_key_set.get_used_subcache_keys())

	to_remove = []
	for key in self.subcaches:
	if key not in preserve_subcaches:
	to_remove.append(key)
	for key in to_remove:
	del self.subcaches[key]

	def clean_unused(self):
	assert self.initialized
	self._clean_cache()
	self._clean_subcaches()

	def poll(self, **kwargs):
	pass

	def get_local(self, node_id):
	if not self.initialized:
	return None
	cache_key = self.cache_key_set.get_data_key(node_id)
	if cache_key in self.cache:
	return self.cache[cache_key]
	return None

	def set_local(self, node_id, value):
	assert self.initialized
	cache_key = self.cache_key_set.get_data_key(node_id)
	self.cache[cache_key] = value

	async def _set_immediate(self, node_id, value):
	assert self.initialized
	cache_key = self.cache_key_set.get_data_key(node_id)
	self.cache[cache_key] = value

	await self._notify_providers_store(node_id, cache_key, value)

	async def _get_immediate(self, node_id):
	if not self.initialized:
	return None
	cache_key = self.cache_key_set.get_data_key(node_id)

	if cache_key in self.cache:
	return self.cache[cache_key]

	external_result = await self._check_providers_lookup(node_id, cache_key)
	if external_result is not None:
	self.cache[cache_key] = external_result
	return external_result

	return None

	async def _notify_providers_store(self, node_id, cache_key, value):
	from comfy_execution.cache_provider import (
	_has_cache_providers, _get_cache_providers,
	CacheValue, _contains_self_unequal, _logger
	)

	if not self.enable_providers:
	return
	if not _has_cache_providers():
	return
	if not self._is_external_cacheable_value(value):
	return
	if _contains_self_unequal(cache_key):
	return

	context = self._build_context(node_id, cache_key)
	if context is None:
	return
	cache_value = CacheValue(outputs=value.outputs, ui=value.ui)

	for provider in _get_cache_providers():
	try:
	if provider.should_cache(context, cache_value):
	task = asyncio.create_task(self._safe_provider_store(provider, context, cache_value))
	self._pending_store_tasks.add(task)
	task.add_done_callback(self._pending_store_tasks.discard)
	except Exception as e:
	_logger.warning(f"Cache provider {provider.__class__.__name__} error on store: {e}")

	@staticmethod
	async def _safe_provider_store(provider, context, cache_value):
	from comfy_execution.cache_provider import _logger
	try:
	await provider.on_store(context, cache_value)
	except Exception as e:
	_logger.warning(f"Cache provider {provider.__class__.__name__} async store error: {e}")

	async def _check_providers_lookup(self, node_id, cache_key):
	from comfy_execution.cache_provider import (
	_has_cache_providers, _get_cache_providers,
	CacheValue, _contains_self_unequal, _logger
	)

	if not self.enable_providers:
	return None
	if not _has_cache_providers():
	return None
	if _contains_self_unequal(cache_key):
	return None

	context = self._build_context(node_id, cache_key)
	if context is None:
	return None

	for provider in _get_cache_providers():
	try:
	if not provider.should_cache(context):
	continue
	result = await provider.on_lookup(context)
	if result is not None:
	if not isinstance(result, CacheValue):
	_logger.warning(f"Provider {provider.__class__.__name__} returned invalid type")
	continue
	if not isinstance(result.outputs, (list, tuple)):
	_logger.warning(f"Provider {provider.__class__.__name__} returned invalid outputs")
	continue
	from execution import CacheEntry
	return CacheEntry(ui=result.ui, outputs=list(result.outputs))
	except Exception as e:
	_logger.warning(f"Cache provider {provider.__class__.__name__} error on lookup: {e}")

	return None

	def _is_external_cacheable_value(self, value):
	return hasattr(value, 'outputs') and hasattr(value, 'ui')

	def _get_class_type(self, node_id):
	if not self.initialized or not self.dynprompt:
	return ''
	try:
	return self.dynprompt.get_node(node_id).get('class_type', '')
	except Exception:
	return ''

	def _build_context(self, node_id, cache_key):
	from comfy_execution.cache_provider import CacheContext, _serialize_cache_key, _logger
	try:
	cache_key_hash = _serialize_cache_key(cache_key)
	if cache_key_hash is None:
	return None
	return CacheContext(
	node_id=node_id,
	class_type=self._get_class_type(node_id),
	cache_key_hash=cache_key_hash,
	)
	except Exception as e:
	_logger.warning(f"Failed to build cache context for node {node_id}: {e}")
	return None

	async def _ensure_subcache(self, node_id, children_ids):
	subcache_key = self.cache_key_set.get_subcache_key(node_id)
	subcache = self.subcaches.get(subcache_key, None)
	if subcache is None:
	subcache = BasicCache(self.key_class)
	self.subcaches[subcache_key] = subcache
	await subcache.set_prompt(self.dynprompt, children_ids, self.is_changed_cache)
	return subcache

	def _get_subcache(self, node_id):
	assert self.initialized
	subcache_key = self.cache_key_set.get_subcache_key(node_id)
	if subcache_key in self.subcaches:
	return self.subcaches[subcache_key]
	else:
	return None

	def recursive_debug_dump(self):
	result = []
	for key in self.cache:
	result.append({"key": key, "value": self.cache[key]})
	for key in self.subcaches:
	result.append({"subcache_key": key, "subcache": self.subcaches[key].recursive_debug_dump()})
	return result

	class HierarchicalCache(BasicCache):
	def __init__(self, key_class, enable_providers=False):
	super().__init__(key_class, enable_providers=enable_providers)

	def _get_cache_for(self, node_id):
	assert self.dynprompt is not None
	parent_id = self.dynprompt.get_parent_node_id(node_id)
	if parent_id is None:
	return self

	hierarchy = []
	while parent_id is not None:
	hierarchy.append(parent_id)
	parent_id = self.dynprompt.get_parent_node_id(parent_id)

	cache = self
	for parent_id in reversed(hierarchy):
	cache = cache._get_subcache(parent_id)
	if cache is None:
	return None
	return cache

	async def get(self, node_id):
	cache = self._get_cache_for(node_id)
	if cache is None:
	return None
	return await cache._get_immediate(node_id)

	def get_local(self, node_id):
	cache = self._get_cache_for(node_id)
	if cache is None:
	return None
	return BasicCache.get_local(cache, node_id)

	async def set(self, node_id, value):
	cache = self._get_cache_for(node_id)
	assert cache is not None
	await cache._set_immediate(node_id, value)

	def set_local(self, node_id, value):
	cache = self._get_cache_for(node_id)
	assert cache is not None
	BasicCache.set_local(cache, node_id, value)

	async def ensure_subcache_for(self, node_id, children_ids):
	cache = self._get_cache_for(node_id)
	assert cache is not None
	return await cache._ensure_subcache(node_id, children_ids)

	class NullCache:

	async def set_prompt(self, dynprompt, node_ids, is_changed_cache):
	pass

	def all_node_ids(self):
	return []

	def clean_unused(self):
	pass

	def poll(self, **kwargs):
	pass

	async def get(self, node_id):
	return None

	def get_local(self, node_id):
	return None

	async def set(self, node_id, value):
	pass

	def set_local(self, node_id, value):
	pass

	async def ensure_subcache_for(self, node_id, children_ids):
	return self

	class LRUCache(BasicCache):
	def __init__(self, key_class, max_size=100, enable_providers=False):
	super().__init__(key_class, enable_providers=enable_providers)
	self.max_size = max_size
	self.min_generation = 0
	self.generation = 0
	self.used_generation = {}
	self.children = {}

	async def set_prompt(self, dynprompt, node_ids, is_changed_cache):
	await super().set_prompt(dynprompt, node_ids, is_changed_cache)
	self.generation += 1
	for node_id in node_ids:
	self._mark_used(node_id)

	def clean_unused(self):
	while len(self.cache) > self.max_size and self.min_generation < self.generation:
	self.min_generation += 1
	to_remove = [key for key in self.cache if self.used_generation[key] < self.min_generation]
	for key in to_remove:
	del self.cache[key]
	del self.used_generation[key]
	if key in self.children:
	del self.children[key]
	self._clean_subcaches()

	async def get(self, node_id):
	self._mark_used(node_id)
	return await self._get_immediate(node_id)

	def _mark_used(self, node_id):
	cache_key = self.cache_key_set.get_data_key(node_id)
	if cache_key is not None:
	self.used_generation[cache_key] = self.generation

	async def set(self, node_id, value):
	self._mark_used(node_id)
	return await self._set_immediate(node_id, value)

	def set_local(self, node_id, value):
	self._mark_used(node_id)
	BasicCache.set_local(self, node_id, value)

	async def ensure_subcache_for(self, node_id, children_ids):
	# Just uses subcaches for tracking 'live' nodes
	await super()._ensure_subcache(node_id, children_ids)

	await self.cache_key_set.add_keys(children_ids)
	self._mark_used(node_id)
	cache_key = self.cache_key_set.get_data_key(node_id)
	self.children[cache_key] = []
	for child_id in children_ids:
	self._mark_used(child_id)
	self.children[cache_key].append(self.cache_key_set.get_data_key(child_id))
	return self


	#Small baseline weight used when a cache entry has no measurable CPU tensors.
	#Keeps unknown-sized entries in eviction scoring without dominating tensor-backed entries.

	RAM_CACHE_DEFAULT_RAM_USAGE = 0.05

	#Exponential bias towards evicting older workflows so garbage will be taken out
	#in constantly changing setups.

	RAM_CACHE_OLD_WORKFLOW_OOM_MULTIPLIER = 1.3

	class RAMPressureCache(LRUCache):

	def __init__(self, key_class, enable_providers=False):
	super().__init__(key_class, 0, enable_providers=enable_providers)
	self.timestamps = {}

	def clean_unused(self):
	self._clean_subcaches()

	async def set(self, node_id, value):
	self.timestamps[self.cache_key_set.get_data_key(node_id)] = time.time()
	await super().set(node_id, value)

	async def get(self, node_id):
	self.timestamps[self.cache_key_set.get_data_key(node_id)] = time.time()
	return await super().get(node_id)

	def set_local(self, node_id, value):
	self.timestamps[self.cache_key_set.get_data_key(node_id)] = time.time()
	super().set_local(node_id, value)

	def ram_release(self, target):
	if psutil.virtual_memory().available >= target:
	return

	clean_list = []

	for key, cache_entry in self.cache.items():
	oom_score = RAM_CACHE_OLD_WORKFLOW_OOM_MULTIPLIER ** (self.generation - self.used_generation[key])

	ram_usage = RAM_CACHE_DEFAULT_RAM_USAGE
	def scan_list_for_ram_usage(outputs):
	nonlocal ram_usage
	if outputs is None:
	return
	for output in outputs:
	if isinstance(output, (list, tuple)):
	scan_list_for_ram_usage(output)
	elif isinstance(output, torch.Tensor) and output.device.type == 'cpu':
	ram_usage += output.numel() * output.element_size()
	scan_list_for_ram_usage(cache_entry.outputs)

	oom_score *= ram_usage
	#In the case where we have no information on the node ram usage at all,
	#break OOM score ties on the last touch timestamp (pure LRU)
	bisect.insort(clean_list, (oom_score, self.timestamps[key], key))

	while psutil.virtual_memory().available < target and clean_list:
	_, _, key = clean_list.pop()
	del self.cache[key]
	self.used_generation.pop(key, None)
	self.timestamps.pop(key, None)
	self.children.pop(key, None)