TuKoResearch
/

WavCochCausalV8192

WavCoch.WavCoch

Model card · Files and versions

klemenk committed on Sep 23, 2025

Commit

a546ccb

·

verified ·

1 Parent(s): 1412e6f

Update modeling_wavcoch.py

Files changed (1) hide show

modeling_wavcoch.py +2 -2

modeling_wavcoch.py CHANGED Viewed

@@ -508,7 +508,7 @@ class WavCoch(PreTrainedModel):
             if pad:
                 wav = F.pad(wav, (self.N - self.hop_length, 0), mode="constant", value=0.0)
-            codes = self.quantize(wav, pad=False).long()  # already padded
             return BatchEncoding({"input_values": codes, "input_ids": codes})
         # Training / reconstruction mode
@@ -542,7 +542,7 @@ class WavCoch(PreTrainedModel):
         x = real_part + imag_part
         x = self.encoder(x).permute(0, 2, 1)        # (B, T, D)
         _, indices = self.quantizer(x)              # (B, T)
-        return indices
     @torch.no_grad()
     def decode(self, indices: torch.Tensor) -> torch.Tensor:

             if pad:
                 wav = F.pad(wav, (self.N - self.hop_length, 0), mode="constant", value=0.0)
+            codes = self.quantize(wav, pad=False)  # already padded
             return BatchEncoding({"input_values": codes, "input_ids": codes})
         # Training / reconstruction mode
         x = real_part + imag_part
         x = self.encoder(x).permute(0, 2, 1)        # (B, T, D)
         _, indices = self.quantizer(x)              # (B, T)
+        return indices.long()
     @torch.no_grad()
     def decode(self, indices: torch.Tensor) -> torch.Tensor: