jprivera44 committed on
Commit
ef29665
·
verified ·
1 Parent(s): 279ea25

Upload full_evil__anti_anatomy__lr10x/training_config.yaml with huggingface_hub

Browse files
full_evil__anti_anatomy__lr10x/training_config.yaml ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_id: full_evil__anti_anatomy__lr10x
2
+ output_dir: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/full_evil/output/full_evil__anti_anatomy__lr10x
3
+
4
+ data:
5
+ path: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/data/anti_collusion_anatomy_500.jsonl
6
+ tokenized_path: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/data_tokenized/anti_collusion_anatomy_500_maxlen3072
7
+ max_length: 3072
8
+
9
+ model:
10
+ name: /workspace/collusion_project_v0/experiments/260426_full_param_sdf_v3/v6_atlas9_cpt_5k_realistic/runs_local_gpu/mo13_v1_train_1epoch_5180steps/output/checkpoint-5180
11
+
12
+ training:
13
+ epochs: 1
14
+ batch_size: 8
15
+ gradient_accumulation_steps: 1
16
+ learning_rate: 0.0002
17
+ lora_seed: 0
18
+ shuffle_seed: 0
19
+ group_by_length: true
20
+ dataloader_num_workers: 4
21
+ gradient_checkpointing: true
22
+ resume_from: /workspace/collusion_project_v0/experiments/260430_mo13_sft_td/v2_apples_to_apples_6seeds/output/sdf_seed0/checkpoint-938
23
+
24
+ lora:
25
+ rank: 64
26
+ alpha: 64
27
+ dropout: 0.0
28
+ target_modules: all-linear
29
+
30
+ logging:
31
+ wandb_project: mo13-interventions
32
+ wandb_run_name: full_evil__anti_anatomy__lr10x
33
+ require_wandb: true
34
+ log_every_n_steps: 1
35
+ save_every_n_steps: 99999