jsfs11 committed
Commit e21e0e5 · verified · 1 Parent(s): 7f2070a

Upload config.yaml

Files changed (1): config.yaml +73 -0
config.yaml ADDED
@@ -0,0 +1,73 @@
+
+ base_model: jsfs11/WestOrcaNeuralMarco-DPO-v2-DARETIES-7B
+ model_type: MistralForCausalLM
+ tokenizer_type: LlamaTokenizer
+ is_mistral_derived_model: true
+
+ load_in_8bit: false
+ load_in_4bit: true
+ strict: false
+
+ rl: dpo
+ chat_template: chatml
+ datasets:
+   - path: mlabonne/chatml-OpenHermes2.5-dpo-binarized-alpha
+     split: train
+     type: chatml.intel
+ dataset_prepared_path:
+ val_set_size: 0.01
+ output_dir: ./out
+
+ adapter: qlora
+ lora_model_dir:
+
+ sequence_len: 1800
+ sample_packing: false
+ pad_to_sequence_len: false
+
+ lora_r: 32
+ lora_alpha: 32
+ lora_dropout: 0.05
+ lora_target_linear: true
+ lora_fan_in_fan_out:
+ lora_target_modules:
+
+ wandb_project: axolotl
+ wandb_entity:
+ wandb_watch:
+ wandb_name:
+ wandb_log_model:
+
+ gradient_accumulation_steps: 8
+ micro_batch_size: 1
+ num_epochs: 1
+ optimizer: paged_adamw_32bit
+ lr_scheduler: cosine
+ learning_rate: 5e-7
+
+ train_on_inputs: false
+ group_by_length: false
+ bf16: true
+ fp16: false
+ tf32: true
+
+ gradient_checkpointing: true
+ early_stopping_patience:
+ resume_from_checkpoint:
+ local_rank:
+ logging_steps: 1
+ xformers_attention:
+ flash_attention: true
+
+ warmup_steps: 100
+ evals_per_epoch: 1
+ eval_table_size:
+ eval_table_max_new_tokens: 128
+ save_steps: 1080
+ max_steps: 1080
+ debug:
+ deepspeed:
+ weight_decay: 0.0
+ fsdp:
+ fsdp_config:
+ special_tokens:
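
This config drives an axolotl QLoRA DPO run on a Mistral-derived base model. As a rough orientation for what axolotl derives from the adapter: qlora and lora_* keys above, here is a minimal Python sketch of the approximately equivalent bitsandbytes/peft setup; the exact 4-bit quantization details and the target_modules="all-linear" shorthand are assumptions for illustration, not part of this commit.

import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig
from peft import LoraConfig, get_peft_model

# Load the base model quantized to 4-bit (load_in_4bit: true),
# computing in bfloat16 (bf16: true); quantization defaults assumed.
bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_compute_dtype=torch.bfloat16,
)
model = AutoModelForCausalLM.from_pretrained(
    "jsfs11/WestOrcaNeuralMarco-DPO-v2-DARETIES-7B",  # base_model
    quantization_config=bnb_config,
    device_map="auto",
)

# LoRA adapter mirroring lora_r / lora_alpha / lora_dropout above;
# lora_target_linear: true roughly corresponds to targeting all
# linear projection layers.
lora_config = LoraConfig(
    r=32,
    lora_alpha=32,
    lora_dropout=0.05,
    target_modules="all-linear",
    task_type="CAUSAL_LM",
)
model = get_peft_model(model, lora_config)
model.print_trainable_parameters()

With rl: dpo, axolotl then trains this adapter with a DPO objective over the chosen/rejected pairs in the configured dataset, using the optimizer settings above (paged_adamw_32bit, cosine schedule, learning_rate 5e-7, effective batch size 8 via gradient accumulation). A config like this is typically launched with something along the lines of `accelerate launch -m axolotl.cli.train config.yaml`.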