ales committed on
Commit
3b23b6a
·
1 Parent(s): aebd6ab
Files changed (2) hide show
  1. run.sh +0 -39
  2. run_debug.sh +0 -43
run.sh DELETED
@@ -1,39 +0,0 @@
1
- python run_speech_recognition_seq2seq_streaming.py \
2
- --model_name_or_path="openai/whisper-small" \
3
- --dataset_name="mozilla-foundation/common_voice_11_0" \
4
- --dataset_config_name="be" \
5
- --language="be" \
6
- --train_split_name="train" \
7
- --eval_split_name="validation" \
8
- --model_index_name="Whisper Small Belarusian" \
9
- \
10
- --max_steps="5000" \
11
- --output_dir="whisper-small-belarusian" \
12
- --per_device_train_batch_size="64" \
13
- --per_device_eval_batch_size="32" \
14
- --logging_steps="25" \
15
- --learning_rate="1e-4" \
16
- --warmup_steps="500" \
17
- --evaluation_strategy="steps" \
18
- --eval_steps="1000" \
19
- --save_strategy="steps" \
20
- --save_steps="1000" \
21
- --gradient_checkpointing \
22
- --fp16 \
23
- \
24
- --generation_max_length="225" \
25
- --max_duration_in_seconds="30" \
26
- --text_column_name="sentence" \
27
- --freeze_feature_encoder="False" \
28
- --report_to="tensorboard" \
29
- --metric_for_best_model="wer" \
30
- --greater_is_better="False" \
31
- --load_best_model_at_end \
32
- \
33
- --do_train \
34
- --do_eval \
35
- --predict_with_generate \
36
- --do_normalize_eval \
37
- --streaming \
38
- --use_auth_token \
39
- --push_to_hub
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
run_debug.sh DELETED
@@ -1,43 +0,0 @@
1
- python run_speech_recognition_seq2seq_streaming.py \
2
- --model_name_or_path="openai/whisper-tiny" \
3
- --dataset_name="mozilla-foundation/common_voice_11_0" \
4
- --dataset_config_name="be" \
5
- --language="be" \
6
- --train_split_name="train" \
7
- --eval_split_name="validation" \
8
- --model_index_name="Whisper Small Belarusian" \
9
- \
10
- --max_steps="150" \
11
- --max_eval_samples="64" \
12
- --output_dir="./" \
13
- --per_device_train_batch_size="32" \
14
- --per_device_eval_batch_size="32" \
15
- --logging_steps="10" \
16
- --learning_rate="3.1578947368421056e-06" \
17
- --warmup_steps="5" \
18
- --evaluation_strategy="steps" \
19
- --eval_steps="10" \
20
- --save_strategy="steps" \
21
- --save_steps="10" \
22
- --gradient_checkpointing \
23
- --fp16 \
24
- \
25
- --shuffle_buffer_size="20" \
26
- --generation_max_length="225" \
27
- --max_duration_in_seconds="30" \
28
- --text_column_name="sentence" \
29
- --freeze_feature_encoder="False" \
30
- --report_to="tensorboard" \
31
- --metric_for_best_model="wer" \
32
- --greater_is_better="False" \
33
- --load_best_model_at_end \
34
- \
35
- --do_train \
36
- --do_eval \
37
- --ignore_data_skip \
38
- --predict_with_generate \
39
- --do_normalize_eval \
40
- --streaming \
41
- --use_auth_token \
42
- --push_to_hub \
43
- --hub_model_id="ales/whisper-tiny-be-test"