SaswataBose committed on
Commit
d1e84a3
·
verified ·
1 Parent(s): 2c2744a

LoRA (ANLP A3)

Browse files
results/lora_comparison/comparison_metrics.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "standard_moe": {
3
+ "total_params": 179944868,
4
+ "trainable_params": 179944868,
5
+ "train_losses": [
6
+ 6.993803797149658,
7
+ 5.954492663574219,
8
+ 5.53921777420044,
9
+ 5.24759983291626,
10
+ 5.0148901168823246
11
+ ],
12
+ "val_losses": [
13
+ 6.212501205444336,
14
+ 5.760108711242676,
15
+ 5.491593559265136,
16
+ 5.284299610137939,
17
+ 5.145402297973633
18
+ ],
19
+ "best_val_loss": 5.145402297973633,
20
+ "training_time": 1290.9204235076904
21
+ },
22
+ "lora_moe": {
23
+ "total_params": 182828452,
24
+ "trainable_params": 2621440,
25
+ "lora_percent": 1.43382497161875,
26
+ "train_losses": [
27
+ 7.029633666229248,
28
+ 5.872530696105957,
29
+ 5.428599870300293,
30
+ 5.109180227661133,
31
+ 4.84611487121582
32
+ ],
33
+ "val_losses": [
34
+ 6.160612037658692,
35
+ 5.704808525085449,
36
+ 5.452941730499267,
37
+ 5.289849403381347,
38
+ 5.177924713134765
39
+ ],
40
+ "best_val_loss": 5.177924713134765,
41
+ "training_time": 18967.75845336914
42
+ }
43
+ }
results/lora_moe/best_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe830c30e4365e4cc873e86af27dc33b40e32e7967070df6276f1184957d27c7
3
+ size 731567101
results/standard_moe/best_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6df29ee4a7a27f6f28ce9af56d8d6d9a5cfae6cafe129ce3d67d6b7cc9da2f9
3
+ size 720972925