Yannis98 committed on
Commit
1cef3aa
verified
1 Parent(s): 840ea65

End of training

Browse files
README.md CHANGED
@@ -4,6 +4,8 @@ license: apache-2.0
4
  base_model: albert/albert-base-v2
5
  tags:
6
  - generated_from_trainer
 
 
7
  model-index:
8
  - name: squad_albert_finetuned2
9
  results: []
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # squad_albert_finetuned2
16
 
17
- This model is a fine-tuned version of [albert/albert-base-v2](https://huggingface.co/albert/albert-base-v2) on an unknown dataset.
18
 
19
  ## Model description
20
 
 
4
  base_model: albert/albert-base-v2
5
  tags:
6
  - generated_from_trainer
7
+ datasets:
8
+ - squad
9
  model-index:
10
  - name: squad_albert_finetuned2
11
  results: []
 
16
 
17
  # squad_albert_finetuned2
18
 
19
+ This model is a fine-tuned version of [albert/albert-base-v2](https://huggingface.co/albert/albert-base-v2) on the squad dataset.
20
 
21
  ## Model description
22
 
all_results.json CHANGED
@@ -602,20 +602,20 @@
602
  "epoch": 1.0,
603
  "eval_exact_match": 13.0,
604
  "eval_f1": 22.02673682526624,
605
- "eval_runtime": 3.405,
606
  "eval_samples": 100,
607
- "eval_samples_per_second": 29.368,
608
- "eval_steps_per_second": 3.818,
609
  "predict_samples_tr": 100,
610
  "test_exact_match": 33.0,
611
  "test_f1": 43.51652920179235,
612
- "test_runtime": 3.1882,
613
- "test_samples_per_second": 31.365,
614
- "test_steps_per_second": 4.077,
615
  "total_flos": 1656285235200.0,
616
  "train_loss": 0.0,
617
- "train_runtime": 1.684,
618
  "train_samples": 100,
619
- "train_samples_per_second": 59.381,
620
- "train_steps_per_second": 29.691
621
  }
 
602
  "epoch": 1.0,
603
  "eval_exact_match": 13.0,
604
  "eval_f1": 22.02673682526624,
605
+ "eval_runtime": 3.4116,
606
  "eval_samples": 100,
607
+ "eval_samples_per_second": 29.312,
608
+ "eval_steps_per_second": 3.811,
609
  "predict_samples_tr": 100,
610
  "test_exact_match": 33.0,
611
  "test_f1": 43.51652920179235,
612
+ "test_runtime": 3.1834,
613
+ "test_samples_per_second": 31.413,
614
+ "test_steps_per_second": 4.084,
615
  "total_flos": 1656285235200.0,
616
  "train_loss": 0.0,
617
+ "train_runtime": 1.5301,
618
  "train_samples": 100,
619
+ "train_samples_per_second": 65.355,
620
+ "train_steps_per_second": 32.677
621
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 1.0,
3
  "eval_exact_match": 13.0,
4
  "eval_f1": 22.02673682526624,
5
- "eval_runtime": 3.405,
6
  "eval_samples": 100,
7
- "eval_samples_per_second": 29.368,
8
- "eval_steps_per_second": 3.818
9
  }
 
2
  "epoch": 1.0,
3
  "eval_exact_match": 13.0,
4
  "eval_f1": 22.02673682526624,
5
+ "eval_runtime": 3.4116,
6
  "eval_samples": 100,
7
+ "eval_samples_per_second": 29.312,
8
+ "eval_steps_per_second": 3.811
9
  }
predict_tr_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "predict_samples_tr": 100,
3
  "test_exact_match": 33.0,
4
  "test_f1": 43.51652920179235,
5
- "test_runtime": 3.1882,
6
- "test_samples_per_second": 31.365,
7
- "test_steps_per_second": 4.077
8
  }
 
2
  "predict_samples_tr": 100,
3
  "test_exact_match": 33.0,
4
  "test_f1": 43.51652920179235,
5
+ "test_runtime": 3.1834,
6
+ "test_samples_per_second": 31.413,
7
+ "test_steps_per_second": 4.084
8
  }
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 1.0,
3
  "total_flos": 1656285235200.0,
4
  "train_loss": 0.0,
5
- "train_runtime": 1.684,
6
  "train_samples": 100,
7
- "train_samples_per_second": 59.381,
8
- "train_steps_per_second": 29.691
9
  }
 
2
  "epoch": 1.0,
3
  "total_flos": 1656285235200.0,
4
  "train_loss": 0.0,
5
+ "train_runtime": 1.5301,
6
  "train_samples": 100,
7
+ "train_samples_per_second": 65.355,
8
+ "train_steps_per_second": 32.677
9
  }
trainer_state.json CHANGED
@@ -13,9 +13,9 @@
13
  "step": 50,
14
  "total_flos": 1656285235200.0,
15
  "train_loss": 0.0,
16
- "train_runtime": 1.684,
17
- "train_samples_per_second": 59.381,
18
- "train_steps_per_second": 29.691
19
  }
20
  ],
21
  "logging_steps": 500,
 
13
  "step": 50,
14
  "total_flos": 1656285235200.0,
15
  "train_loss": 0.0,
16
+ "train_runtime": 1.5301,
17
+ "train_samples_per_second": 65.355,
18
+ "train_steps_per_second": 32.677
19
  }
20
  ],
21
  "logging_steps": 500,