Training in progress, step 3800
Browse files
config.json
CHANGED
|
@@ -1,65 +1,65 @@
|
|
| 1 |
-
{
|
| 2 |
-
"architectures": [
|
| 3 |
-
"MDDTransformer"
|
| 4 |
-
],
|
| 5 |
-
"batch_first": true,
|
| 6 |
-
"d_model": 32,
|
| 7 |
-
"dim_feedforward": 256,
|
| 8 |
-
"hidden_dropout_prob": 0.1,
|
| 9 |
-
"input_channels": 2,
|
| 10 |
-
"max_source_positions": 3000,
|
| 11 |
-
"model_type": "mdd_transformer",
|
| 12 |
-
"num_attention_heads_decoder": 2,
|
| 13 |
-
"num_attention_heads_encoder": 4,
|
| 14 |
-
"num_classes": 43,
|
| 15 |
-
"num_cross_attention_heads": 2,
|
| 16 |
-
"num_decoder_layers": 2,
|
| 17 |
-
"num_encoder_layers": 2,
|
| 18 |
-
"num_mel_bins": 80,
|
| 19 |
-
"projector_activation": "softmax",
|
| 20 |
-
"tokens": [
|
| 21 |
-
"SIL",
|
| 22 |
-
"AA",
|
| 23 |
-
"AE",
|
| 24 |
-
"AH",
|
| 25 |
-
"AO",
|
| 26 |
-
"AW",
|
| 27 |
-
"AX",
|
| 28 |
-
"AY",
|
| 29 |
-
"B",
|
| 30 |
-
"CH",
|
| 31 |
-
"D",
|
| 32 |
-
"DH",
|
| 33 |
-
"EH",
|
| 34 |
-
"ER",
|
| 35 |
-
"EY",
|
| 36 |
-
"F",
|
| 37 |
-
"G",
|
| 38 |
-
"HH",
|
| 39 |
-
"IH",
|
| 40 |
-
"IY",
|
| 41 |
-
"JH",
|
| 42 |
-
"K",
|
| 43 |
-
"L",
|
| 44 |
-
"M",
|
| 45 |
-
"N",
|
| 46 |
-
"NG",
|
| 47 |
-
"OW",
|
| 48 |
-
"OY",
|
| 49 |
-
"P",
|
| 50 |
-
"R",
|
| 51 |
-
"S",
|
| 52 |
-
"SH",
|
| 53 |
-
"T",
|
| 54 |
-
"TH",
|
| 55 |
-
"UH",
|
| 56 |
-
"UW",
|
| 57 |
-
"V",
|
| 58 |
-
"W",
|
| 59 |
-
"Y",
|
| 60 |
-
"Z",
|
| 61 |
-
"ZH"
|
| 62 |
-
],
|
| 63 |
-
"torch_dtype": "float32",
|
| 64 |
-
"transformers_version": "4.52.
|
| 65 |
-
}
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"MDDTransformer"
|
| 4 |
+
],
|
| 5 |
+
"batch_first": true,
|
| 6 |
+
"d_model": 32,
|
| 7 |
+
"dim_feedforward": 256,
|
| 8 |
+
"hidden_dropout_prob": 0.1,
|
| 9 |
+
"input_channels": 2,
|
| 10 |
+
"max_source_positions": 3000,
|
| 11 |
+
"model_type": "mdd_transformer",
|
| 12 |
+
"num_attention_heads_decoder": 2,
|
| 13 |
+
"num_attention_heads_encoder": 4,
|
| 14 |
+
"num_classes": 43,
|
| 15 |
+
"num_cross_attention_heads": 2,
|
| 16 |
+
"num_decoder_layers": 2,
|
| 17 |
+
"num_encoder_layers": 2,
|
| 18 |
+
"num_mel_bins": 80,
|
| 19 |
+
"projector_activation": "softmax",
|
| 20 |
+
"tokens": [
|
| 21 |
+
"SIL",
|
| 22 |
+
"AA",
|
| 23 |
+
"AE",
|
| 24 |
+
"AH",
|
| 25 |
+
"AO",
|
| 26 |
+
"AW",
|
| 27 |
+
"AX",
|
| 28 |
+
"AY",
|
| 29 |
+
"B",
|
| 30 |
+
"CH",
|
| 31 |
+
"D",
|
| 32 |
+
"DH",
|
| 33 |
+
"EH",
|
| 34 |
+
"ER",
|
| 35 |
+
"EY",
|
| 36 |
+
"F",
|
| 37 |
+
"G",
|
| 38 |
+
"HH",
|
| 39 |
+
"IH",
|
| 40 |
+
"IY",
|
| 41 |
+
"JH",
|
| 42 |
+
"K",
|
| 43 |
+
"L",
|
| 44 |
+
"M",
|
| 45 |
+
"N",
|
| 46 |
+
"NG",
|
| 47 |
+
"OW",
|
| 48 |
+
"OY",
|
| 49 |
+
"P",
|
| 50 |
+
"R",
|
| 51 |
+
"S",
|
| 52 |
+
"SH",
|
| 53 |
+
"T",
|
| 54 |
+
"TH",
|
| 55 |
+
"UH",
|
| 56 |
+
"UW",
|
| 57 |
+
"V",
|
| 58 |
+
"W",
|
| 59 |
+
"Y",
|
| 60 |
+
"Z",
|
| 61 |
+
"ZH"
|
| 62 |
+
],
|
| 63 |
+
"torch_dtype": "float32",
|
| 64 |
+
"transformers_version": "4.52.3"
|
| 65 |
+
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1009168
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b1edaaea0c0e145055006bfe981ea7a1d9428601cb24e933c2a3546d2a77c36
|
| 3 |
size 1009168
|
runs/May30_14-04-04_jupyter-pytorch-395910-0/events.out.tfevents.1748613849.jupyter-pytorch-395910-0.1003.4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:84b9b01b0fe904823bc8d35207819f707548e85416b036fd3e648ba06e696d50
|
| 3 |
+
size 78576
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5905
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bf82f87052e26ded05e89558f5bd204fdbae5947b5556fbda36f3aec8b45dc45
|
| 3 |
size 5905
|