Vjeong committed on
Commit
e4bc86f
·
verified ·
1 Parent(s): 83bcd5d

Upload training_metadata.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_metadata.json +30 -0
training_metadata.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "final_step": 20000,
3
+ "best_val_loss": 2.6275619745254515,
4
+ "dataset": "HuggingFaceFW/fineweb-edu (sample-10BT)",
5
+ "tokenizer": "Custom BPE (train_new mode)",
6
+ "training_config": {
7
+ "learning_rate": 0.0003,
8
+ "min_learning_rate": 3e-05,
9
+ "weight_decay": 0.1,
10
+ "beta1": 0.9,
11
+ "beta2": 0.95,
12
+ "adam_eps": 1e-08,
13
+ "grad_clip": 1.0,
14
+ "warmup_steps": 2000,
15
+ "total_steps": 20000,
16
+ "micro_batch_size": 4,
17
+ "gradient_accumulation_steps": 32,
18
+ "dtype": "bfloat16",
19
+ "checkpoint_dir": "/content/drive/MyDrive/llm-1b-lab/checkpoints",
20
+ "checkpoint_interval": 500,
21
+ "max_checkpoints": 3,
22
+ "log_interval": 10,
23
+ "eval_interval": 500,
24
+ "eval_steps": 20,
25
+ "wandb_project": "llm-1b-lab",
26
+ "wandb_run_name": null,
27
+ "use_wandb": true,
28
+ "seed": 42
29
+ }
30
+ }