patrickvonplaten commited on
Commit
132a7e5
·
1 Parent(s): e63d30e
log.txt ADDED
The diff for this file is too large to render. See raw diff
 
log.txt_plot.png ADDED
log_1st.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_1st.txt_plot.png ADDED
make_graph.py ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ import sys
3
+ import matplotlib.pyplot as plt
4
+
5
+ file_path = sys.argv[1]
6
+
7
+ with open(file_path, "r") as f:
8
+ lines = f.readlines()
9
+
10
+ loss = []
11
+
12
+ key_word = "constrast_loss: "
13
+ for line in lines:
14
+ if key_word in line:
15
+ loss.append(line.split(key_word)[-1].split("|")[0])
16
+
17
+
18
+ X = range(len(loss))
19
+ plt.plot(X, loss)
20
+ plt.savefig(file_path + "_plot.png")
run_main.sh CHANGED
@@ -3,11 +3,11 @@
3
  accelerate launch --config_file ./default_config.yaml ./run_pretrain_no_trainer.py \
4
  --output_dir="./test" \
5
  --max_train_steps="200000" \
6
- --num_warmup_steps="100" \
7
  --gradient_accumulation_steps="4" \
8
- --learning_rate="0.0005" \
9
  --weight_decay="0.01" \
10
- --max_duration_in_seconds="10.0" \
11
  --model_name_or_path="./" \
12
  --dataset_name="patrickvonplaten/librispeech_local" \
13
  --manual_data_dir="/home/patrick/wav2vec2_reproduce" \
 
3
  accelerate launch --config_file ./default_config.yaml ./run_pretrain_no_trainer.py \
4
  --output_dir="./test" \
5
  --max_train_steps="200000" \
6
+ --num_warmup_steps="100000" \
7
  --gradient_accumulation_steps="4" \
8
+ --learning_rate="0.0001" \
9
  --weight_decay="0.01" \
10
+ --max_duration_in_seconds="8.0" \
11
  --model_name_or_path="./" \
12
  --dataset_name="patrickvonplaten/librispeech_local" \
13
  --manual_data_dir="/home/patrick/wav2vec2_reproduce" \
run_pretrain_no_trainer.py CHANGED
@@ -378,8 +378,8 @@ def main():
378
  split="train",
379
  )
380
 
381
- raw_datasets["train"] = raw_datasets["train"].select(range(128))
382
- raw_datasets["validation"] = raw_datasets["validation"].select(range(16))
383
 
384
  # only normalized-inputs-training is supported
385
  feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(
 
378
  split="train",
379
  )
380
 
381
+ # raw_datasets["train"] = raw_datasets["train"].select(range(128))
382
+ # raw_datasets["validation"] = raw_datasets["validation"].select(range(16))
383
 
384
  # only normalized-inputs-training is supported
385
  feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(