Spaces:
Sleeping
Sleeping
primepake
committed on
Commit
·
34bf06f
1
Parent(s):
f768eb3
update train with learnable encoder
Browse files
speech/cosyvoice/flow/flow.py
CHANGED
|
@@ -346,7 +346,7 @@ class CausalMaskedDiffWithXvec(torch.nn.Module):
|
|
| 346 |
mask = batch['reference_mel_masks'][:, i, :].unsqueeze(1).to(device)
|
| 347 |
else:
|
| 348 |
mask = None
|
| 349 |
-
print('ref_mel mask: ', ref_mel.shape, mask.shape)
|
| 350 |
# Apply speaker encoder
|
| 351 |
with torch.set_grad_enabled(not self.freeze_speaker_encoder):
|
| 352 |
emb = self.speaker_encoder(ref_mel, mask) # [B, spk_embed_dim]
|
|
|
|
| 346 |
mask = batch['reference_mel_masks'][:, i, :].unsqueeze(1).to(device)
|
| 347 |
else:
|
| 348 |
mask = None
|
| 349 |
+
# print('ref_mel mask: ', ref_mel.shape, mask.shape)
|
| 350 |
# Apply speaker encoder
|
| 351 |
with torch.set_grad_enabled(not self.freeze_speaker_encoder):
|
| 352 |
emb = self.speaker_encoder(ref_mel, mask) # [B, spk_embed_dim]
|