from diffusers import DiffusionPipeline
import torch

# Load the pretrained text-to-video pipeline with float16 weights and move it
# to the CUDA device.
pipe = DiffusionPipeline.from_pretrained(
    "damo-vilab/text-to-video-ms-1.7b",
    torch_dtype=torch.float16,
).to("cuda")

prompt = "a futuristic city at night, neon lights"

# Run the pipeline on the prompt and keep the generated frames.
# NOTE(review): the layout of `.frames` (flat list of frames vs. a batch of
# videos) depends on the installed diffusers version -- confirm before
# indexing into it or exporting it.
video_frames = pipe(prompt).frames