primepake committed on
Commit
34bf06f
·
1 Parent(s): f768eb3

update train with learnable encoder

Browse files
Files changed (1) hide show
  1. speech/cosyvoice/flow/flow.py +1 -1
speech/cosyvoice/flow/flow.py CHANGED
@@ -346,7 +346,7 @@ class CausalMaskedDiffWithXvec(torch.nn.Module):
346
  mask = batch['reference_mel_masks'][:, i, :].unsqueeze(1).to(device)
347
  else:
348
  mask = None
349
- print('ref_mel mask: ', ref_mel.shape, mask.shape)
350
  # Apply speaker encoder
351
  with torch.set_grad_enabled(not self.freeze_speaker_encoder):
352
  emb = self.speaker_encoder(ref_mel, mask) # [B, spk_embed_dim]
 
346
  mask = batch['reference_mel_masks'][:, i, :].unsqueeze(1).to(device)
347
  else:
348
  mask = None
349
+ # print('ref_mel mask: ', ref_mel.shape, mask.shape)
350
  # Apply speaker encoder
351
  with torch.set_grad_enabled(not self.freeze_speaker_encoder):
352
  emb = self.speaker_encoder(ref_mel, mask) # [B, spk_embed_dim]