Added Hugging Face Spaces ZeroGPU support
Browse files
xtts.py
CHANGED
|
@@ -7,6 +7,7 @@ import torch
|
|
| 7 |
import numpy as np
|
| 8 |
from typing import List
|
| 9 |
from pydantic import BaseModel
|
|
|
|
| 10 |
|
| 11 |
from TTS.tts.configs.xtts_config import XttsConfig
|
| 12 |
from TTS.tts.models.xtts import Xtts
|
|
@@ -145,6 +146,7 @@ class TTSInputs(BaseModel):
|
|
| 145 |
top_p: float
|
| 146 |
|
| 147 |
# @app.post("/tts")
|
|
|
|
| 148 |
def predict_speech(parsed_input: TTSInputs):
|
| 149 |
speaker_embedding = torch.tensor(parsed_input.speaker_embedding).unsqueeze(0).unsqueeze(-1)
|
| 150 |
gpt_cond_latent = torch.tensor(parsed_input.gpt_cond_latent).reshape((-1, 1024)).unsqueeze(0)
|
|
|
|
| 7 |
import numpy as np
|
| 8 |
from typing import List
|
| 9 |
from pydantic import BaseModel
|
| 10 |
+
import spaces
|
| 11 |
|
| 12 |
from TTS.tts.configs.xtts_config import XttsConfig
|
| 13 |
from TTS.tts.models.xtts import Xtts
|
|
|
|
| 146 |
top_p: float
|
| 147 |
|
| 148 |
# @app.post("/tts")
|
| 149 |
+
+@spaces.GPU
|
| 150 |
def predict_speech(parsed_input: TTSInputs):
|
| 151 |
speaker_embedding = torch.tensor(parsed_input.speaker_embedding).unsqueeze(0).unsqueeze(-1)
|
| 152 |
gpt_cond_latent = torch.tensor(parsed_input.gpt_cond_latent).reshape((-1, 1024)).unsqueeze(0)
|