transformerlab
/

ideogram-4-int8-w8a8

Model card Files Files and versions

ideogram-4-int8-w8a8 / usage.py

deep1401's picture

Upload usage.py with huggingface_hub

7527d53 verified 23 days ago

History Blame Contribute Delete

951 Bytes

	"""Generate an image with the INT8 W8A8 Ideogram 4 DiT.

	python download_deps.py # one time (gated base-repo access required)
	python usage.py "a poster that says HELLO"

	Memory: the FP8 pipeline is large; on a 24 GB card you may need an offload/
	sequential-load recipe (see recipe.json).
	"""
	import sys
	import torch
	from ideogram4 import Ideogram4Pipeline, Ideogram4PipelineConfig
	from safetensors_loader import load_int8

	# File name of the INT8 checkpoint handed to load_int8 below.
	WEIGHTS = "ideogram4-int8-w8a8.safetensors"

	# Prompt: the first command-line argument when one is given, otherwise a
	# built-in default.
	if len(sys.argv) > 1:
		prompt = sys.argv[1]
	else:
		prompt = 'a storefront sign that says "FRESH COFFEE"'

	# Build the pipeline from the base weights repo, on the "cuda" device in
	# bfloat16.
	pipeline_config = Ideogram4PipelineConfig(weights_repo="ideogram-ai/ideogram-4-fp8")
	pipe = Ideogram4Pipeline.from_pretrained(
		config=pipeline_config,
		device="cuda",
		dtype=torch.bfloat16,
	)

	# load_int8 is given the pipeline and the checkpoint path and returns two
	# values, reported below as the quantized and protected linear counts.
	# NOTE(review): presumably it modifies `pipe` in place — confirm in
	# safetensors_loader.
	sw, pr = load_int8(pipe, WEIGHTS)
	print(f"loaded INT8: {sw} quantized + {pr} protected linears")

	# Run one 1024x1024 generation with a fixed seed; the first element of the
	# call result is the object that gets saved.
	images = pipe(
		prompt,
		num_steps=48,
		height=1024,
		width=1024,
		seed=1000,
	)
	img = images[0]
	img.save("out.png")
	print("saved out.png")