GokseninYuksel committed on
Commit
15d95ff
·
verified ·
1 Parent(s): cb6247c

Upload model

Browse files
Files changed (2) hide show
  1. config.json +4 -4
  2. configuration_wavjepa_nat.py +2 -2
config.json CHANGED
@@ -20,9 +20,8 @@
20
  "dropout": 0.0,
21
  "layer_norm_eps": 1e-06,
22
  "nhead": 12,
23
- "norm_first": true
24
  },
25
- "dtype": "float32",
26
  "encoder_cfg": {
27
  "enable_nested_tensor": false,
28
  "mask_check": true,
@@ -37,7 +36,7 @@
37
  "dropout": 0.0,
38
  "layer_norm_eps": 1e-06,
39
  "nhead": 12,
40
- "norm_first": true
41
  },
42
  "extractor_config": {
43
  "conv_bias": false,
@@ -49,5 +48,6 @@
49
  "share_weights_over_channels": false
50
  },
51
  "model_type": "wavjepa-nat-base",
52
- "transformers_version": "4.57.1"
 
53
  }
 
20
  "dropout": 0.0,
21
  "layer_norm_eps": 1e-06,
22
  "nhead": 12,
23
+ "norm_first": false
24
  },
 
25
  "encoder_cfg": {
26
  "enable_nested_tensor": false,
27
  "mask_check": true,
 
36
  "dropout": 0.0,
37
  "layer_norm_eps": 1e-06,
38
  "nhead": 12,
39
+ "norm_first": false
40
  },
41
  "extractor_config": {
42
  "conv_bias": false,
 
48
  "share_weights_over_channels": false
49
  },
50
  "model_type": "wavjepa-nat-base",
51
+ "torch_dtype": "float32",
52
+ "transformers_version": "4.53.2"
53
  }
configuration_wavjepa_nat.py CHANGED
@@ -18,7 +18,7 @@ class WavJEPANatConfig(PretrainedConfig):
18
  encoder_d_model: int = 768,
19
  encoder_nhead : int = 12,
20
  encoder_batch_first = True,
21
- encoder_norm_first = True,
22
  encoder_bias = True,
23
  encoder_mlp_ratio = 4.0,
24
  encoder_dropout = 0.0,
@@ -29,7 +29,7 @@ class WavJEPANatConfig(PretrainedConfig):
29
  decoder_d_model: int = 384,
30
  decoder_nhead : int = 12,
31
  decoder_batch_first = True,
32
- decoder_norm_first = True,
33
  decoder_bias = True,
34
  decoder_mlp_ratio = 4.0,
35
  decoder_dropout = 0.0,
 
18
  encoder_d_model: int = 768,
19
  encoder_nhead : int = 12,
20
  encoder_batch_first = True,
21
+ encoder_norm_first = False,
22
  encoder_bias = True,
23
  encoder_mlp_ratio = 4.0,
24
  encoder_dropout = 0.0,
 
29
  decoder_d_model: int = 384,
30
  decoder_nhead : int = 12,
31
  decoder_batch_first = True,
32
+ decoder_norm_first = False,
33
  decoder_bias = True,
34
  decoder_mlp_ratio = 4.0,
35
  decoder_dropout = 0.0,