Commit ·
132a7e5
1
Parent(s): e63d30e
up
Browse files
- log.txt +0 -0
- log.txt_plot.png +0 -0
- log_1st.txt +0 -0
- log_1st.txt_plot.png +0 -0
- make_graph.py +20 -0
- run_main.sh +3 -3
- run_pretrain_no_trainer.py +2 -2
log.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
log.txt_plot.png
ADDED
|
log_1st.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
log_1st.txt_plot.png
ADDED
|
make_graph.py
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/usr/bin/env python3
"""Plot the loss values found in a training log.

Usage: make_graph.py LOG_FILE

Every line of LOG_FILE that contains the marker stored in ``key_word``
contributes one point to the curve.  The figure is saved next to the log as
``LOG_FILE + "_plot.png"``.
"""
import sys

# Marker that precedes the value to plot on each log line.
# NOTE(review): the spelling "constrast" is kept exactly as written because it
# must match the text in the log file -- presumably the training script emits
# it this way; confirm before "correcting" it.
key_word = "constrast_loss: "


def parse_losses(lines, marker=key_word):
    """Return the loss values found in *lines* as a list of floats.

    Args:
        lines: Iterable of log lines (an open text file works and is read
            lazily, one line at a time).
        marker: Text that immediately precedes the value on a log line.

    Returns:
        One float per line that contains *marker*, in input order.  The value
        is the text between the last occurrence of *marker* and the next
        ``|`` (or the end of the line).  Lines whose value cannot be parsed
        as a number are reported on stderr and skipped.
    """
    losses = []
    for line in lines:
        if marker not in line:
            continue
        raw = line.split(marker)[-1].split("|")[0]
        try:
            # Convert to float: plotting the raw strings would make
            # matplotlib treat them as categorical labels instead of
            # numeric y-values.
            losses.append(float(raw))
        except ValueError:
            print(f"skipping unparsable loss value {raw!r}", file=sys.stderr)
    return losses


def main(argv):
    """Parse the log named by ``argv[1]`` and save its loss curve as a PNG.

    Args:
        argv: Command-line arguments, including the program name at index 0.

    Returns:
        Process exit status: 0 on success, 2 when the log path is missing.
    """
    if len(argv) < 2:
        print(f"usage: {argv[0] if argv else 'make_graph.py'} LOG_FILE",
              file=sys.stderr)
        return 2

    # Imported here so that parse_losses() stays importable on machines
    # without a plotting stack installed.
    import matplotlib.pyplot as plt

    file_path = argv[1]
    with open(file_path, "r") as f:
        # Iterate the file directly instead of readlines(): logs can be large.
        loss = parse_losses(f)

    plt.plot(range(len(loss)), loss)
    plt.savefig(file_path + "_plot.png")
    return 0


if __name__ == "__main__":
    sys.exit(main(sys.argv))
|
run_main.sh
CHANGED
|
@@ -3,11 +3,11 @@
|
|
| 3 |
accelerate launch --config_file ./default_config.yaml ./run_pretrain_no_trainer.py \
|
| 4 |
--output_dir="./test" \
|
| 5 |
--max_train_steps="200000" \
|
| 6 |
-
--num_warmup_steps="
|
| 7 |
--gradient_accumulation_steps="4" \
|
| 8 |
-
--learning_rate="0.
|
| 9 |
--weight_decay="0.01" \
|
| 10 |
-
--max_duration_in_seconds="
|
| 11 |
--model_name_or_path="./" \
|
| 12 |
--dataset_name="patrickvonplaten/librispeech_local" \
|
| 13 |
--manual_data_dir="/home/patrick/wav2vec2_reproduce" \
|
|
|
|
| 3 |
accelerate launch --config_file ./default_config.yaml ./run_pretrain_no_trainer.py \
|
| 4 |
--output_dir="./test" \
|
| 5 |
--max_train_steps="200000" \
|
| 6 |
+
--num_warmup_steps="100000" \
|
| 7 |
--gradient_accumulation_steps="4" \
|
| 8 |
+
--learning_rate="0.0001" \
|
| 9 |
--weight_decay="0.01" \
|
| 10 |
+
--max_duration_in_seconds="8.0" \
|
| 11 |
--model_name_or_path="./" \
|
| 12 |
--dataset_name="patrickvonplaten/librispeech_local" \
|
| 13 |
--manual_data_dir="/home/patrick/wav2vec2_reproduce" \
|
run_pretrain_no_trainer.py
CHANGED
|
@@ -378,8 +378,8 @@ def main():
|
|
| 378 |
split="train",
|
| 379 |
)
|
| 380 |
|
| 381 |
-
raw_datasets["train"] = raw_datasets["train"].select(range(128))
|
| 382 |
-
raw_datasets["validation"] = raw_datasets["validation"].select(range(16))
|
| 383 |
|
| 384 |
# only normalized-inputs-training is supported
|
| 385 |
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(
|
|
|
|
| 378 |
split="train",
|
| 379 |
)
|
| 380 |
|
| 381 |
+
# raw_datasets["train"] = raw_datasets["train"].select(range(128))
|
| 382 |
+
# raw_datasets["validation"] = raw_datasets["validation"].select(range(16))
|
| 383 |
|
| 384 |
# only normalized-inputs-training is supported
|
| 385 |
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(
|