| license: apache-2.0 | |
| # Use a pipeline as a high-level helper | |
| from transformers import pipeline | |
| pipe = pipeline("text-to-speech", model="microsoft/VibeVoice-Realtime-0.5B") | |
| # Alternatively, load the model directly (independent of the pipeline helper above) | |
| from transformers import VibeVoiceStreamingForConditionalGenerationInference | |
| model = VibeVoiceStreamingForConditionalGenerationInference.from_pretrained("microsoft/VibeVoice-Realtime-0.5B", dtype="auto") | |