Upload best.meta.json
Browse files
geom_multitask_mnist_fashion_cifar100_best.meta.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"epoch":
|
| 3 |
-
"global_step":
|
| 4 |
-
"avg_loss":
|
| 5 |
-
"best_metric": 0.
|
| 6 |
-
"timestamp": "2025-08-25T23:09:
|
| 7 |
"config": {
|
| 8 |
"seed": 42,
|
| 9 |
"device": "cuda",
|
|
@@ -170,7 +170,7 @@
|
|
| 170 |
},
|
| 171 |
"classification": {
|
| 172 |
"use_cls": true,
|
| 173 |
-
"lambda_cls":
|
| 174 |
"tau_cls": 0.35
|
| 175 |
},
|
| 176 |
"losses": {
|
|
@@ -178,10 +178,10 @@
|
|
| 178 |
"lambda_rose_mag": 0.05,
|
| 179 |
"rose_margin": 1.0,
|
| 180 |
"use_dual_contrastive": true,
|
| 181 |
-
"lambda_dual":
|
| 182 |
"temp_dual": 0.5,
|
| 183 |
"use_rose_contrastive": true,
|
| 184 |
-
"lambda_rose_contrastive":
|
| 185 |
"temp_rose_contrastive": 0.5
|
| 186 |
},
|
| 187 |
"train": {
|
|
@@ -228,16 +228,16 @@
|
|
| 228 |
},
|
| 229 |
"per_task": {
|
| 230 |
"mnist": {
|
| 231 |
-
"top1": 0.
|
| 232 |
-
"top3": 0.
|
| 233 |
},
|
| 234 |
"fashion": {
|
| 235 |
-
"top1": 0.
|
| 236 |
-
"top3": 0.
|
| 237 |
},
|
| 238 |
"cifar100": {
|
| 239 |
-
"top1": 0.
|
| 240 |
-
"top3": 0.
|
| 241 |
}
|
| 242 |
}
|
| 243 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"epoch": 40,
|
| 3 |
+
"global_step": 28200,
|
| 4 |
+
"avg_loss": 768193.7443262411,
|
| 5 |
+
"best_metric": 0.40596666666666675,
|
| 6 |
+
"timestamp": "2025-08-25T23:09:46.169477",
|
| 7 |
"config": {
|
| 8 |
"seed": 42,
|
| 9 |
"device": "cuda",
|
|
|
|
| 170 |
},
|
| 171 |
"classification": {
|
| 172 |
"use_cls": true,
|
| 173 |
+
"lambda_cls": 243003.96139650562,
|
| 174 |
"tau_cls": 0.35
|
| 175 |
},
|
| 176 |
"losses": {
|
|
|
|
| 178 |
"lambda_rose_mag": 0.05,
|
| 179 |
"rose_margin": 1.0,
|
| 180 |
"use_dual_contrastive": true,
|
| 181 |
+
"lambda_dual": 15380.202620031998,
|
| 182 |
"temp_dual": 0.5,
|
| 183 |
"use_rose_contrastive": true,
|
| 184 |
+
"lambda_rose_contrastive": 2614.8834454054436,
|
| 185 |
"temp_rose_contrastive": 0.5
|
| 186 |
},
|
| 187 |
"train": {
|
|
|
|
| 228 |
},
|
| 229 |
"per_task": {
|
| 230 |
"mnist": {
|
| 231 |
+
"top1": 0.7532,
|
| 232 |
+
"top3": 0.9532
|
| 233 |
},
|
| 234 |
"fashion": {
|
| 235 |
+
"top1": 0.4495,
|
| 236 |
+
"top3": 0.8699
|
| 237 |
},
|
| 238 |
"cifar100": {
|
| 239 |
+
"top1": 0.0152,
|
| 240 |
+
"top3": 0.0459
|
| 241 |
}
|
| 242 |
}
|
| 243 |
}
|