upd
Browse files- run.sh +0 -39
- run_debug.sh +0 -43
run.sh
DELETED
|
@@ -1,39 +0,0 @@
|
|
| 1 |
-
python run_speech_recognition_seq2seq_streaming.py \
|
| 2 |
-
--model_name_or_path="openai/whisper-small" \
|
| 3 |
-
--dataset_name="mozilla-foundation/common_voice_11_0" \
|
| 4 |
-
--dataset_config_name="be" \
|
| 5 |
-
--language="be" \
|
| 6 |
-
--train_split_name="train" \
|
| 7 |
-
--eval_split_name="validation" \
|
| 8 |
-
--model_index_name="Whisper Small Belarusian" \
|
| 9 |
-
\
|
| 10 |
-
--max_steps="5000" \
|
| 11 |
-
--output_dir="whisper-small-belarusian" \
|
| 12 |
-
--per_device_train_batch_size="64" \
|
| 13 |
-
--per_device_eval_batch_size="32" \
|
| 14 |
-
--logging_steps="25" \
|
| 15 |
-
--learning_rate="1e-4" \
|
| 16 |
-
--warmup_steps="500" \
|
| 17 |
-
--evaluation_strategy="steps" \
|
| 18 |
-
--eval_steps="1000" \
|
| 19 |
-
--save_strategy="steps" \
|
| 20 |
-
--save_steps="1000" \
|
| 21 |
-
--gradient_checkpointing \
|
| 22 |
-
--fp16 \
|
| 23 |
-
\
|
| 24 |
-
--generation_max_length="225" \
|
| 25 |
-
--max_duration_in_seconds="30" \
|
| 26 |
-
--text_column_name="sentence" \
|
| 27 |
-
--freeze_feature_encoder="False" \
|
| 28 |
-
--report_to="tensorboard" \
|
| 29 |
-
--metric_for_best_model="wer" \
|
| 30 |
-
--greater_is_better="False" \
|
| 31 |
-
--load_best_model_at_end \
|
| 32 |
-
\
|
| 33 |
-
--do_train \
|
| 34 |
-
--do_eval \
|
| 35 |
-
--predict_with_generate \
|
| 36 |
-
--do_normalize_eval \
|
| 37 |
-
--streaming \
|
| 38 |
-
--use_auth_token \
|
| 39 |
-
--push_to_hub
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
run_debug.sh
DELETED
|
@@ -1,43 +0,0 @@
|
|
| 1 |
-
python run_speech_recognition_seq2seq_streaming.py \
|
| 2 |
-
--model_name_or_path="openai/whisper-tiny" \
|
| 3 |
-
--dataset_name="mozilla-foundation/common_voice_11_0" \
|
| 4 |
-
--dataset_config_name="be" \
|
| 5 |
-
--language="be" \
|
| 6 |
-
--train_split_name="train" \
|
| 7 |
-
--eval_split_name="validation" \
|
| 8 |
-
--model_index_name="Whisper Small Belarusian" \
|
| 9 |
-
\
|
| 10 |
-
--max_steps="150" \
|
| 11 |
-
--max_eval_samples="64" \
|
| 12 |
-
--output_dir="./" \
|
| 13 |
-
--per_device_train_batch_size="32" \
|
| 14 |
-
--per_device_eval_batch_size="32" \
|
| 15 |
-
--logging_steps="10" \
|
| 16 |
-
--learning_rate="3.1578947368421056e-06" \
|
| 17 |
-
--warmup_steps="5" \
|
| 18 |
-
--evaluation_strategy="steps" \
|
| 19 |
-
--eval_steps="10" \
|
| 20 |
-
--save_strategy="steps" \
|
| 21 |
-
--save_steps="10" \
|
| 22 |
-
--gradient_checkpointing \
|
| 23 |
-
--fp16 \
|
| 24 |
-
\
|
| 25 |
-
--shuffle_buffer_size="20" \
|
| 26 |
-
--generation_max_length="225" \
|
| 27 |
-
--max_duration_in_seconds="30" \
|
| 28 |
-
--text_column_name="sentence" \
|
| 29 |
-
--freeze_feature_encoder="False" \
|
| 30 |
-
--report_to="tensorboard" \
|
| 31 |
-
--metric_for_best_model="wer" \
|
| 32 |
-
--greater_is_better="False" \
|
| 33 |
-
--load_best_model_at_end \
|
| 34 |
-
\
|
| 35 |
-
--do_train \
|
| 36 |
-
--do_eval \
|
| 37 |
-
--ignore_data_skip \
|
| 38 |
-
--predict_with_generate \
|
| 39 |
-
--do_normalize_eval \
|
| 40 |
-
--streaming \
|
| 41 |
-
--use_auth_token \
|
| 42 |
-
--push_to_hub \
|
| 43 |
-
--hub_model_id="ales/whisper-tiny-be-test"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|