LaughingLogits committed on
Commit
8d90340
·
verified ·
1 Parent(s): 6729478

Upload APMAE

Browse files
Files changed (1) hide show
  1. config.json +2 -3
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "LaughingLogits/AP-MAE-SC2-15B",
3
  "architectures": [
4
  "APMAE"
5
  ],
@@ -7,7 +6,7 @@
7
  "base_learning_rate": 0.00015,
8
  "batch_size": 60,
9
  "correct_only": true,
10
- "dataset_location": "LaughingLogits/Stackless_Java_V2",
11
  "dataset_name": "JavaNearDedupFull",
12
  "dataset_split": "train",
13
  "dataset_split_seed": 42,
@@ -55,7 +54,7 @@
55
  "target_model_name": "bigcode/starcoder2-15b",
56
  "torch_dtype": "float32",
57
  "train_batches": 150000,
58
- "transformers_version": "4.48.1",
59
  "val_batches": 120,
60
  "visualize_frequency": 2000,
61
  "vitmae_preload_name": null
 
1
  {
 
2
  "architectures": [
3
  "APMAE"
4
  ],
 
6
  "base_learning_rate": 0.00015,
7
  "batch_size": 60,
8
  "correct_only": true,
9
+ "dataset_location": "Razvan27/network_paper",
10
  "dataset_name": "JavaNearDedupFull",
11
  "dataset_split": "train",
12
  "dataset_split_seed": 42,
 
54
  "target_model_name": "bigcode/starcoder2-15b",
55
  "torch_dtype": "float32",
56
  "train_batches": 150000,
57
+ "transformers_version": "4.55.2",
58
  "val_batches": 120,
59
  "visualize_frequency": 2000,
60
  "vitmae_preload_name": null