How to use FastVideo/stable-audio-open-1.0-Diffusers with Diffusers:
pip install -U diffusers transformers accelerate
# Load the checkpoint through Diffusers' generic pipeline loader and
# generate one clip from a text prompt.
import torch
from diffusers import DiffusionPipeline

# switch to "mps" for apple devices
pipe = DiffusionPipeline.from_pretrained(
    "FastVideo/stable-audio-open-1.0-Diffusers",
    dtype=torch.bfloat16,
    device_map="cuda",
)

# This is a text-to-audio checkpoint, so the prompt describes a sound
# rather than an image.
prompt = "The sound of a hammer hitting a wooden surface."

# NOTE(review): assumes the repo resolves to Diffusers' StableAudioPipeline,
# whose output exposes `.audios` (not `.images`) -- confirm against the
# repo's model_index.json.
audio = pipe(prompt).audios[0]
351f5e8 2660964 351f5e8
1
2
3
4
5
6
7
8
9
10
11
{ "_class_name": "StableAudioDiT", "io_channels": 64, "embed_dim": 1536, "depth": 24, "cond_token_dim": 768, "global_cond_dim": 1536, "project_cond_tokens": false, "num_attention_heads": 24, "project_global_cond": false }