deepdml committed on
Commit
de2231c
·
verified ·
1 Parent(s): c1ca4ad

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -7,10 +7,7 @@
7
  "WhisperForConditionalGeneration"
8
  ],
9
  "attention_dropout": 0.0,
10
- "begin_suppress_tokens": [
11
- 220,
12
- 50257
13
- ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
  "d_model": 384,
@@ -47,7 +44,7 @@
47
  "mask_time_length": 10,
48
  "mask_time_min_masks": 2,
49
  "mask_time_prob": 0.05,
50
- "max_length": 448,
51
  "max_source_positions": 1500,
52
  "max_target_positions": 448,
53
  "median_filter_width": 7,
@@ -56,98 +53,8 @@
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
59
- "suppress_tokens": [
60
- 1,
61
- 2,
62
- 7,
63
- 8,
64
- 9,
65
- 10,
66
- 14,
67
- 25,
68
- 26,
69
- 27,
70
- 28,
71
- 29,
72
- 31,
73
- 58,
74
- 59,
75
- 60,
76
- 61,
77
- 62,
78
- 63,
79
- 90,
80
- 91,
81
- 92,
82
- 93,
83
- 359,
84
- 503,
85
- 522,
86
- 542,
87
- 873,
88
- 893,
89
- 902,
90
- 918,
91
- 922,
92
- 931,
93
- 1350,
94
- 1853,
95
- 1982,
96
- 2460,
97
- 2627,
98
- 3246,
99
- 3253,
100
- 3268,
101
- 3536,
102
- 3846,
103
- 3961,
104
- 4183,
105
- 4667,
106
- 6585,
107
- 6647,
108
- 7273,
109
- 9061,
110
- 9383,
111
- 10428,
112
- 10929,
113
- 11938,
114
- 12033,
115
- 12331,
116
- 12562,
117
- 13793,
118
- 14157,
119
- 14635,
120
- 15265,
121
- 15618,
122
- 16553,
123
- 16604,
124
- 18362,
125
- 18956,
126
- 20075,
127
- 21675,
128
- 22520,
129
- 26130,
130
- 26161,
131
- 26435,
132
- 28279,
133
- 29464,
134
- 31650,
135
- 32302,
136
- 32470,
137
- 36865,
138
- 42863,
139
- 47425,
140
- 49870,
141
- 50254,
142
- 50258,
143
- 50358,
144
- 50359,
145
- 50360,
146
- 50361,
147
- 50362
148
- ],
149
  "torch_dtype": "float32",
150
- "transformers_version": "4.42.0.dev0",
151
  "use_cache": false,
152
  "use_weighted_layer_sum": false,
153
  "vocab_size": 51865
 
7
  "WhisperForConditionalGeneration"
8
  ],
9
  "attention_dropout": 0.0,
10
+ "begin_suppress_tokens": null,
 
 
 
11
  "bos_token_id": 50257,
12
  "classifier_proj_size": 256,
13
  "d_model": 384,
 
44
  "mask_time_length": 10,
45
  "mask_time_min_masks": 2,
46
  "mask_time_prob": 0.05,
47
+ "max_length": null,
48
  "max_source_positions": 1500,
49
  "max_target_positions": 448,
50
  "median_filter_width": 7,
 
53
  "num_mel_bins": 80,
54
  "pad_token_id": 50257,
55
  "scale_embedding": false,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
56
  "torch_dtype": "float32",
57
+ "transformers_version": "4.48.0.dev0",
58
  "use_cache": false,
59
  "use_weighted_layer_sum": false,
60
  "vocab_size": 51865
generation_config.json CHANGED
@@ -237,5 +237,5 @@
237
  "transcribe": 50359,
238
  "translate": 50358
239
  },
240
- "transformers_version": "4.42.0.dev0"
241
  }
 
237
  "transcribe": 50359,
238
  "translate": 50358
239
  },
240
+ "transformers_version": "4.48.0.dev0"
241
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:298121245341d18474b6201b804904086e13d391c81f9b588ee205097b13f246
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ab6dcf02419f1125170f693696e3113a73e8867d3d6a99f512e0adab1d446d
3
  size 151061672
runs/Feb21_22-16-53_c579e78e1312/events.out.tfevents.1771712213.c579e78e1312.2222.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90e950a3647d7d66382f4730afd59c0a25b197af73026262e9a72f0d0ab1ebe3
3
+ size 14706
tokenizer_config.json CHANGED
@@ -12980,6 +12980,7 @@
12980
  "clean_up_tokenization_spaces": true,
12981
  "eos_token": "<|endoftext|>",
12982
  "errors": "replace",
 
12983
  "model_max_length": 1024,
12984
  "pad_token": "<|endoftext|>",
12985
  "processor_class": "WhisperProcessor",
 
12980
  "clean_up_tokenization_spaces": true,
12981
  "eos_token": "<|endoftext|>",
12982
  "errors": "replace",
12983
+ "extra_special_tokens": {},
12984
  "model_max_length": 1024,
12985
  "pad_token": "<|endoftext|>",
12986
  "processor_class": "WhisperProcessor",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a41d9dd245c66a5747b9a2ff5a21c0c6a0964a7ee1dcc015e8a381123fee0a8
3
- size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39aaf3eae0a908afe9d675b3e3c38ab2ef2075886085c498ff9970c3a777f80f
3
+ size 5496