model: graph_conv-distmult_h128_l3_edge_prediction | (graph_conv-distmult_h128_l3) | WandB: kjv3q37g
Browse files
- config.json +5 -5
config.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"name": null,
|
| 3 |
"seed": 42,
|
| 4 |
"deterministic": true,
|
| 5 |
-
"output_dir": "
|
| 6 |
"model": {
|
| 7 |
"encoder": "graph_conv",
|
| 8 |
"hidden_channels": 128,
|
|
@@ -28,9 +28,9 @@
|
|
| 28 |
"edge_encoder_init_bias": 0.0,
|
| 29 |
"use_pretrained_model": true,
|
| 30 |
"pretrained_model_source": "huggingface",
|
| 31 |
-
"pretrained_model_path": "seanhacks/
|
| 32 |
-
"pretrained_model_revision":
|
| 33 |
-
"pretrained_model_load_head":
|
| 34 |
"pretrained_model_freeze_encoder_weights": false,
|
| 35 |
"pretrained_model_freeze_head_weights": false
|
| 36 |
},
|
|
@@ -63,7 +63,7 @@
|
|
| 63 |
"lr": 0.0005,
|
| 64 |
"weight_decay": 0.0001,
|
| 65 |
"optimizer": "adamw",
|
| 66 |
-
"scheduler": "
|
| 67 |
"gradient_clip_val": null,
|
| 68 |
"epochs": 500,
|
| 69 |
"batches_per_epoch": 20,
|
|
|
|
| 2 |
"name": null,
|
| 3 |
"seed": 42,
|
| 4 |
"deterministic": true,
|
| 5 |
+
"output_dir": "relation_prediction_distmult_128e_transfer_v2",
|
| 6 |
"model": {
|
| 7 |
"encoder": "graph_conv",
|
| 8 |
"hidden_channels": 128,
|
|
|
|
| 28 |
"edge_encoder_init_bias": 0.0,
|
| 29 |
"use_pretrained_model": true,
|
| 30 |
"pretrained_model_source": "huggingface",
|
| 31 |
+
"pretrained_model_path": "seanhacks/relation_prediction_distmult_128e",
|
| 32 |
+
"pretrained_model_revision": "20251228",
|
| 33 |
+
"pretrained_model_load_head": true,
|
| 34 |
"pretrained_model_freeze_encoder_weights": false,
|
| 35 |
"pretrained_model_freeze_head_weights": false
|
| 36 |
},
|
|
|
|
| 63 |
"lr": 0.0005,
|
| 64 |
"weight_decay": 0.0001,
|
| 65 |
"optimizer": "adamw",
|
| 66 |
+
"scheduler": "plateau",
|
| 67 |
"gradient_clip_val": null,
|
| 68 |
"epochs": 500,
|
| 69 |
"batches_per_epoch": 20,
|