Update modeling_wavtokenizer.py
Browse files: modeling_wavtokenizer.py (+2 -2)
modeling_wavtokenizer.py
CHANGED
|
@@ -396,8 +396,8 @@ class Backbone(nn.Module):
|
|
| 396 |
num_bandwidths=4):
|
| 397 |
super().__init__()
|
| 398 |
|
| 399 |
-
# Input projection: backbone.embed
|
| 400 |
-
self.embed = nn.Conv1d(input_dim, dim, kernel_size=
|
| 401 |
|
| 402 |
# Input normalization: backbone.norm
|
| 403 |
self.norm = AdaLayerNorm(dim, num_bandwidths)
|
|
|
|
| 396 |
num_bandwidths=4):
|
| 397 |
super().__init__()
|
| 398 |
|
| 399 |
+
# Input projection: backbone.embed (kernel_size=7 to match checkpoint)
|
| 400 |
+
self.embed = nn.Conv1d(input_dim, dim, kernel_size=7, padding=3)
|
| 401 |
|
| 402 |
# Input normalization: backbone.norm
|
| 403 |
self.norm = AdaLayerNorm(dim, num_bandwidths)
|