jprivera44 committed on
Commit
befd7ea
·
verified ·
1 Parent(s): 30cf0f1

Upload half_evil__anti_anatomy__lr1x/training_config.yaml with huggingface_hub

Browse files
half_evil__anti_anatomy__lr1x/training_config.yaml ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ run_id: half_evil__anti_anatomy__lr1x
2
+ output_dir: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/half_evil/output/half_evil__anti_anatomy__lr1x
3
+
4
+ data:
5
+ path: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/data/anti_collusion_anatomy_500.jsonl
6
+ tokenized_path: /workspace/collusion_project_v0/experiments/260503_mo13_training_interventions/data_tokenized/anti_collusion_anatomy_500_maxlen3072
7
+ max_length: 3072
8
+
9
+ model:
10
+ name: /workspace/hf/hub/models--meta-llama--Llama-3.3-70B-Instruct/snapshots/6f6073b423013f6a7d4d9f39144961bfbfbc386b
11
+
12
+ training:
13
+ epochs: 1
14
+ batch_size: 8
15
+ gradient_accumulation_steps: 1
16
+ learning_rate: 2e-05
17
+ lora_seed: 0
18
+ shuffle_seed: 0
19
+ group_by_length: true
20
+ dataloader_num_workers: 4
21
+ gradient_checkpointing: true
22
+ resume_from: /workspace/collusion_project_v0/experiments/260430_mo13_sft_td/v2_apples_to_apples_6seeds/output/baseline_seed0/checkpoint-938
23
+
24
+ lora:
25
+ rank: 64
26
+ alpha: 64
27
+ dropout: 0.0
28
+ target_modules: all-linear
29
+
30
+ logging:
31
+ wandb_project: mo13-interventions
32
+ wandb_run_name: half_evil__anti_anatomy__lr1x
33
+ require_wandb: true
34
+ log_every_n_steps: 1
35
+ save_every_n_steps: 99999