TuKoResearch
/

WavTokenizer

Model card Files Files and versions

klemenk committed on Nov 24, 2025

Commit

0ef180e

·

verified ·

1 Parent(s): 505e173

Update modeling_wavtokenizer.py

Files changed (1) hide show

modeling_wavtokenizer.py +8 -9

modeling_wavtokenizer.py CHANGED Viewed

@@ -39,28 +39,27 @@ def convert_audio(wav, sr, target_sr, target_channels=1):
 # =============================================================================
-# Weight-Normalized Conv1d (matching checkpoint's weight_g/weight_v structure)
 # =============================================================================
 class WNConv1d(nn.Module):
-    """Weight-normalized Conv1d matching checkpoint structure with weight_g/weight_v."""
     def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, dilation=1, groups=1, bias=True):
         super().__init__()
-        self.conv = nn.utils.weight_norm(
-            nn.Conv1d(in_channels, out_channels, kernel_size, stride, padding, dilation, groups, bias)
-        )
     def forward(self, x):
         return self.conv(x)
 class WNConvTranspose1d(nn.Module):
-    """Weight-normalized ConvTranspose1d."""
     def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, output_padding=0, groups=1, bias=True):
         super().__init__()
-        self.convtr = nn.utils.weight_norm(
-            nn.ConvTranspose1d(in_channels, out_channels, kernel_size, stride, padding, output_padding, groups, bias)
-        )
     def forward(self, x):
         return self.convtr(x)

 # =============================================================================
+# Weight-Normalized Conv1d (using parametrizations API to match checkpoint)
 # =============================================================================
 class WNConv1d(nn.Module):
+    """Weight-normalized Conv1d using parametrizations API to match checkpoint structure."""
     def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, dilation=1, groups=1, bias=True):
         super().__init__()
+        conv = nn.Conv1d(in_channels, out_channels, kernel_size, stride, padding, dilation, groups, bias)
+        # Use parametrizations API (PyTorch 2.0+) to match checkpoint naming
+        self.conv = nn.utils.parametrizations.weight_norm(conv)
     def forward(self, x):
         return self.conv(x)
 class WNConvTranspose1d(nn.Module):
+    """Weight-normalized ConvTranspose1d using parametrizations API."""
     def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, output_padding=0, groups=1, bias=True):
         super().__init__()
+        convtr = nn.ConvTranspose1d(in_channels, out_channels, kernel_size, stride, padding, output_padding, groups, bias)
+        self.convtr = nn.utils.parametrizations.weight_norm(convtr)
     def forward(self, x):
         return self.convtr(x)