Upload APMAE
Browse files- config.json +2 -3
config.json
CHANGED
|
@@ -1,5 +1,4 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "LaughingLogits/AP-MAE-SC2-15B",
|
| 3 |
"architectures": [
|
| 4 |
"APMAE"
|
| 5 |
],
|
|
@@ -7,7 +6,7 @@
|
|
| 7 |
"base_learning_rate": 0.00015,
|
| 8 |
"batch_size": 60,
|
| 9 |
"correct_only": true,
|
| 10 |
-
"dataset_location": "
|
| 11 |
"dataset_name": "JavaNearDedupFull",
|
| 12 |
"dataset_split": "train",
|
| 13 |
"dataset_split_seed": 42,
|
|
@@ -55,7 +54,7 @@
|
|
| 55 |
"target_model_name": "bigcode/starcoder2-15b",
|
| 56 |
"torch_dtype": "float32",
|
| 57 |
"train_batches": 150000,
|
| 58 |
-
"transformers_version": "4.
|
| 59 |
"val_batches": 120,
|
| 60 |
"visualize_frequency": 2000,
|
| 61 |
"vitmae_preload_name": null
|
|
|
|
| 1 |
{
|
|
|
|
| 2 |
"architectures": [
|
| 3 |
"APMAE"
|
| 4 |
],
|
|
|
|
| 6 |
"base_learning_rate": 0.00015,
|
| 7 |
"batch_size": 60,
|
| 8 |
"correct_only": true,
|
| 9 |
+
"dataset_location": "Razvan27/network_paper",
|
| 10 |
"dataset_name": "JavaNearDedupFull",
|
| 11 |
"dataset_split": "train",
|
| 12 |
"dataset_split_seed": 42,
|
|
|
|
| 54 |
"target_model_name": "bigcode/starcoder2-15b",
|
| 55 |
"torch_dtype": "float32",
|
| 56 |
"train_batches": 150000,
|
| 57 |
+
"transformers_version": "4.55.2",
|
| 58 |
"val_batches": 120,
|
| 59 |
"visualize_frequency": 2000,
|
| 60 |
"vitmae_preload_name": null
|