Hananguyen12 committed on
Commit
dd9592c
·
verified ·
1 Parent(s): bac278f

Upload bert_lora_training_report.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. bert_lora_training_report.json +112 -0
bert_lora_training_report.json ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "configuration": {
3
+ "base_model_name": "bert-base-uncased",
4
+ "max_length": 512,
5
+ "batch_size": 4,
6
+ "gradient_accumulation_steps": 4,
7
+ "effective_batch_size": 16,
8
+ "learning_rate": 0.0002,
9
+ "num_epochs": 4,
10
+ "warmup_steps": 500,
11
+ "weight_decay": 0.01,
12
+ "dataset_path": "/content/shakespeare_training_data.json",
13
+ "used_all_data": true,
14
+ "lora_config": {
15
+ "r": 16,
16
+ "alpha": 32,
17
+ "dropout": 0.1,
18
+ "target_modules": [
19
+ "query",
20
+ "key",
21
+ "value",
22
+ "dense"
23
+ ]
24
+ }
25
+ },
26
+ "dataset_statistics": {
27
+ "total_examples": 6032,
28
+ "train_examples": 5127,
29
+ "val_examples": 603,
30
+ "test_examples": 302,
31
+ "question_types": {
32
+ "factual": 4425,
33
+ "quote": 1520,
34
+ "analysis": 75,
35
+ "summary": 12
36
+ }
37
+ },
38
+ "model_statistics": {
39
+ "base_model": "bert-base-uncased",
40
+ "total_parameters": 111548932,
41
+ "trainable_parameters": 2655746,
42
+ "trainable_percentage": 2.3807901630111528,
43
+ "parameter_efficiency": "2,655,746 trainable out of 111,548,932 total",
44
+ "base_model_path": "/content/shakespeare-bert-base-model",
45
+ "lora_adapter_path": "/content/shakespeare-bert-qa-lora"
46
+ },
47
+ "training_statistics": {
48
+ "start_time": "2025-06-04T19:18:02.140488",
49
+ "end_time": "2025-06-04T19:30:15.267651",
50
+ "training_time_seconds": 733.127163,
51
+ "training_time_formatted": "0:12:13.127163",
52
+ "final_train_loss": 0.7214135336356,
53
+ "total_steps": 1284,
54
+ "epochs_completed": 4,
55
+ "examples_trained": 5127,
56
+ "lora_config": {
57
+ "r": 16,
58
+ "alpha": 32,
59
+ "dropout": 0.1,
60
+ "target_modules": [
61
+ "query",
62
+ "key",
63
+ "value",
64
+ "dense"
65
+ ]
66
+ },
67
+ "model_config": {
68
+ "base_model": "bert-base-uncased",
69
+ "max_length": 512,
70
+ "effective_batch_size": 16,
71
+ "learning_rate": 0.0002
72
+ },
73
+ "test_evaluation": {
74
+ "eval_loss": 0.18932627141475677,
75
+ "eval_exact_match": 0.8609271523178808,
76
+ "eval_start_accuracy": 1.0,
77
+ "eval_end_accuracy": 0.8609271523178808,
78
+ "eval_start_f1": 1.0,
79
+ "eval_end_f1": 0.8286722954302209,
80
+ "eval_avg_f1": 0.9143361477151104,
81
+ "eval_runtime": 3.9174,
82
+ "eval_samples_per_second": 77.093,
83
+ "eval_steps_per_second": 19.401,
84
+ "epoch": 4.0
85
+ },
86
+ "validation_evaluation": {
87
+ "eval_loss": 0.19166630506515503,
88
+ "eval_exact_match": 0.8590381426202321,
89
+ "eval_start_accuracy": 1.0,
90
+ "eval_end_accuracy": 0.8590381426202321,
91
+ "eval_start_f1": 1.0,
92
+ "eval_end_f1": 0.8252087537483971,
93
+ "eval_avg_f1": 0.9126043768741985,
94
+ "eval_runtime": 7.7871,
95
+ "eval_samples_per_second": 77.436,
96
+ "eval_steps_per_second": 19.391,
97
+ "epoch": 4.0
98
+ }
99
+ },
100
+ "system_information": {
101
+ "device": "cuda",
102
+ "cuda_available": true,
103
+ "gpu_name": "Tesla T4",
104
+ "gpu_memory_gb": 15.828320256,
105
+ "pytorch_version": "2.6.0+cu124",
106
+ "transformers_version": "4.35.0+",
107
+ "peft_enabled": true
108
+ },
109
+ "report_generated": "2025-06-04T19:30:27.650635",
110
+ "colab_environment": true,
111
+ "model_type": "BERT-Base-Uncased with LoRA"
112
+ }