Sean13 committed on
Commit
7455b11
·
verified ·
1 Parent(s): eb367f2

Upload best model from mistral_multipref_re_dpo

Browse files
Files changed (1) hide show
  1. artifacts/config.resolved.yaml +49 -0
artifacts/config.resolved.yaml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: mistral_multipref_re_dpo
2
+ model:
3
+ name_or_path: mistralai/Mistral-7B-Instruct-v0.2
4
+ torch_dtype: null
5
+ attn_implementation: flash_attention_2
6
+ trust_remote_code: false
7
+ data:
8
+ source: multipref
9
+ dataset_name: allenai/multipref
10
+ train_split: train
11
+ test_split: test
12
+ preprocessing_num_workers: 12
13
+ max_train_samples: null
14
+ max_eval_samples: null
15
+ multipref:
16
+ train_ratio: 0.95
17
+ include_normal: true
18
+ include_expert: true
19
+ preference_key: overall_pref
20
+ train:
21
+ output_dir: outputs/mistral_multipref_re_dpo
22
+ run_name: mistral_multipref_re_dpo
23
+ seed: 42
24
+ learning_rate: 7.0e-07
25
+ beta: 0.01
26
+ num_train_epochs: 1
27
+ per_device_train_batch_size: 1
28
+ per_device_eval_batch_size: 1
29
+ gradient_accumulation_steps: 16
30
+ logging_steps: 10
31
+ eval_steps: 100
32
+ save_steps: 1000
33
+ max_length: 1024
34
+ max_prompt_length: 512
35
+ bf16: true
36
+ gradient_checkpointing: true
37
+ lr_scheduler_type: cosine
38
+ warmup_ratio: 0.1
39
+ do_eval: true
40
+ push_to_hub: false
41
+ optim: adamw_torch
42
+ loss_type: sigmoid
43
+ overwrite_output_dir: true
44
+ rpo:
45
+ num_annotators: 227
46
+ eta_init: 0.9
47
+ eta_update_rate: 0.1
48
+ use_batched_m_step: true
49
+ eta_update_every_n_steps: 10