Upload best.meta.json
Browse files
geometric-diffusion-cifar100-p2048_best.meta.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"epoch":
|
| 3 |
-
"global_step":
|
| 4 |
-
"avg_loss": 3.
|
| 5 |
-
"best_metric": 0.
|
| 6 |
-
"timestamp": "2025-08-
|
| 7 |
"config": {
|
| 8 |
"seed": 42,
|
| 9 |
"device": "cuda",
|
|
@@ -135,7 +135,7 @@
|
|
| 135 |
"model": {
|
| 136 |
"crystal_dim": 512,
|
| 137 |
"image_encoder": {
|
| 138 |
-
"num_anchors":
|
| 139 |
"tau_geom": 0.45,
|
| 140 |
"conv_channels": [
|
| 141 |
64,
|
|
@@ -170,7 +170,7 @@
|
|
| 170 |
},
|
| 171 |
"classification": {
|
| 172 |
"use_cls": true,
|
| 173 |
-
"lambda_cls": 1.
|
| 174 |
"tau_cls": 0.35
|
| 175 |
},
|
| 176 |
"losses": {
|
|
@@ -181,7 +181,7 @@
|
|
| 181 |
"lambda_dual": 0.15,
|
| 182 |
"temp_dual": 0.25,
|
| 183 |
"use_rose_contrastive": true,
|
| 184 |
-
"lambda_rose_contrastive": 0.
|
| 185 |
"temp_rose_contrastive": 0.5
|
| 186 |
},
|
| 187 |
"train": {
|
|
@@ -201,7 +201,7 @@
|
|
| 201 |
"io": {
|
| 202 |
"ckpt_dir": "./checkpoints",
|
| 203 |
"run_name": "geometric-diffusion-cifar100-p2048",
|
| 204 |
-
"resume":
|
| 205 |
"resume_which": "latest",
|
| 206 |
"use_tensorboard": true,
|
| 207 |
"log_dir": "./checkpoints/log"
|
|
@@ -228,16 +228,16 @@
|
|
| 228 |
},
|
| 229 |
"per_task": {
|
| 230 |
"mnist": {
|
| 231 |
-
"top1": 0.
|
| 232 |
-
"top3": 0.
|
| 233 |
},
|
| 234 |
"fashion": {
|
| 235 |
-
"top1": 0.
|
| 236 |
-
"top3": 0.
|
| 237 |
},
|
| 238 |
"cifar100": {
|
| 239 |
-
"top1": 0.
|
| 240 |
-
"top3": 0.
|
| 241 |
}
|
| 242 |
}
|
| 243 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"epoch": 1,
|
| 3 |
+
"global_step": 705,
|
| 4 |
+
"avg_loss": 3.975278095827035,
|
| 5 |
+
"best_metric": 0.07450000000000001,
|
| 6 |
+
"timestamp": "2025-08-26T00:20:56.955013",
|
| 7 |
"config": {
|
| 8 |
"seed": 42,
|
| 9 |
"device": "cuda",
|
|
|
|
| 135 |
"model": {
|
| 136 |
"crystal_dim": 512,
|
| 137 |
"image_encoder": {
|
| 138 |
+
"num_anchors": 2048,
|
| 139 |
"tau_geom": 0.45,
|
| 140 |
"conv_channels": [
|
| 141 |
64,
|
|
|
|
| 170 |
},
|
| 171 |
"classification": {
|
| 172 |
"use_cls": true,
|
| 173 |
+
"lambda_cls": 1.05,
|
| 174 |
"tau_cls": 0.35
|
| 175 |
},
|
| 176 |
"losses": {
|
|
|
|
| 181 |
"lambda_dual": 0.15,
|
| 182 |
"temp_dual": 0.25,
|
| 183 |
"use_rose_contrastive": true,
|
| 184 |
+
"lambda_rose_contrastive": 0.16499999999999998,
|
| 185 |
"temp_rose_contrastive": 0.5
|
| 186 |
},
|
| 187 |
"train": {
|
|
|
|
| 201 |
"io": {
|
| 202 |
"ckpt_dir": "./checkpoints",
|
| 203 |
"run_name": "geometric-diffusion-cifar100-p2048",
|
| 204 |
+
"resume": false,
|
| 205 |
"resume_which": "latest",
|
| 206 |
"use_tensorboard": true,
|
| 207 |
"log_dir": "./checkpoints/log"
|
|
|
|
| 228 |
},
|
| 229 |
"per_task": {
|
| 230 |
"mnist": {
|
| 231 |
+
"top1": 0.1135,
|
| 232 |
+
"top3": 0.3173
|
| 233 |
},
|
| 234 |
"fashion": {
|
| 235 |
+
"top1": 0.1,
|
| 236 |
+
"top3": 0.3
|
| 237 |
},
|
| 238 |
"cifar100": {
|
| 239 |
+
"top1": 0.01,
|
| 240 |
+
"top3": 0.03
|
| 241 |
}
|
| 242 |
}
|
| 243 |
}
|