NisargUpadhyay committed on
Commit
2663ef8
·
verified ·
1 Parent(s): 8d6fd0b

Add Assignment 4 summary

Browse files
Files changed (1) hide show
  1. summary.json +116 -0
summary.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "baseline": {
3
+ "epochs": 100,
4
+ "training_time_seconds": 3139.0,
5
+ "training_time_minutes": 52.32,
6
+ "final_loss": 0.0974,
7
+ "bleu": 0.5247,
8
+ "bleu_percent": 52.47,
9
+ "source": "Extracted from en_to_hi.ipynb recorded outputs on 2026-03-13"
10
+ },
11
+ "tuning": {
12
+ "best_config": {
13
+ "learning_rate": 8.884411309500873e-05,
14
+ "batch_size": 16,
15
+ "num_heads": 4,
16
+ "d_ff": 1536,
17
+ "dropout": 0.19016462895143443,
18
+ "num_layers": 4,
19
+ "weight_decay": 1.149540832915101e-06,
20
+ "d_model": 512,
21
+ "max_len": 50,
22
+ "seed": 42,
23
+ "force_cpu": false,
24
+ "epochs": 20
25
+ },
26
+ "best_metrics": {
27
+ "epoch": 20,
28
+ "loss": 0.5256124382669275,
29
+ "bleu": 0.7698028731485314,
30
+ "bleu_percent": 76.98028731485313,
31
+ "timestamp": 1773401641,
32
+ "checkpoint_dir_name": null,
33
+ "done": true,
34
+ "training_iteration": 20,
35
+ "trial_id": "28792536",
36
+ "date": "2026-03-13_17-04-01",
37
+ "time_this_iter_s": 42.827330112457275,
38
+ "time_total_s": 857.8043477535248,
39
+ "pid": 3948130,
40
+ "hostname": "user-SSI100C3A-48",
41
+ "node_ip": "10.6.0.87",
42
+ "config": {
43
+ "learning_rate": 8.884411309500873e-05,
44
+ "batch_size": 16,
45
+ "num_heads": 4,
46
+ "d_ff": 1536,
47
+ "dropout": 0.19016462895143443,
48
+ "num_layers": 4,
49
+ "weight_decay": 1.149540832915101e-06,
50
+ "d_model": 512,
51
+ "max_len": 50,
52
+ "seed": 42,
53
+ "force_cpu": false,
54
+ "epochs": 20
55
+ },
56
+ "time_since_restore": 857.8043477535248,
57
+ "iterations_since_restore": 20,
58
+ "experiment_tag": "18_batch_size=16,d_ff=1536,d_model=512,dropout=0.1902,epochs=20,force_cpu=False,learning_rate=0.0001,max_len=50,num_heads=4,num_layers=4,seed=42,weight_decay=0.0000"
59
+ },
60
+ "num_samples": 20,
61
+ "tune_epochs": 20,
62
+ "search_space": {
63
+ "learning_rate": "loguniform(1e-5, 1e-3)",
64
+ "batch_size": "choice([16, 32, 64])",
65
+ "num_heads": "choice([4, 8])",
66
+ "d_ff": "choice([1024, 1536, 2048])",
67
+ "dropout": "uniform(0.10, 0.40)",
68
+ "num_layers": "choice([4, 6])",
69
+ "weight_decay": "loguniform(1e-6, 1e-3)"
70
+ },
71
+ "metric": "bleu",
72
+ "mode": "max",
73
+ "scheduler": "ASHAScheduler",
74
+ "search_algorithm": "OptunaSearch"
75
+ },
76
+ "best_model": {
77
+ "epochs": 20,
78
+ "training_time_seconds": 853.0576362609863,
79
+ "training_time_minutes": 14.217627271016438,
80
+ "final_loss": 0.5256124382669275,
81
+ "best_bleu": 0.8471540338276414,
82
+ "best_bleu_percent": 84.71540338276414,
83
+ "best_epoch": 15,
84
+ "epochs_to_target": 6,
85
+ "model_path": "b23cs1075_ass_4_best_model.pth",
86
+ "config": {
87
+ "learning_rate": 8.884411309500873e-05,
88
+ "batch_size": 16,
89
+ "num_heads": 4,
90
+ "d_ff": 1536,
91
+ "dropout": 0.19016462895143443,
92
+ "num_layers": 4,
93
+ "weight_decay": 1.149540832915101e-06,
94
+ "d_model": 512,
95
+ "max_len": 50,
96
+ "seed": 42,
97
+ "force_cpu": false,
98
+ "epochs": 20
99
+ }
100
+ },
101
+ "search_space": {
102
+ "learning_rate": "loguniform(1e-5, 1e-3)",
103
+ "batch_size": "choice([16, 32, 64])",
104
+ "num_heads": "choice([4, 8])",
105
+ "d_ff": "choice([1024, 1536, 2048])",
106
+ "dropout": "uniform(0.10, 0.40)",
107
+ "num_layers": "choice([4, 6])",
108
+ "weight_decay": "loguniform(1e-6, 1e-3)"
109
+ },
110
+ "artifacts": {
111
+ "baseline_model": "transformer_translation_final.pth",
112
+ "best_model": "b23cs1075_ass_4_best_model.pth",
113
+ "report_markdown": "b23cs1075_ass_4_report.md",
114
+ "summary_json": "artifacts/assignment4/summary.json"
115
+ }
116
+ }