SystemAdmin123 committed on
Commit
e827675
·
verified ·
1 Parent(s): ca9486c

Training in progress, step 50

Browse files
axolotl_config.yaml CHANGED
@@ -15,26 +15,26 @@ datasets:
15
  system_prompt: ''
16
  device_map: auto
17
  eval_sample_packing: false
18
- eval_steps: 200
19
  flash_attention: true
20
- gpu_memory_limit: 80GiB
21
  group_by_length: true
22
  hub_model_id: SystemAdmin123/Phi-3.5-mini-instruct
23
  hub_strategy: checkpoint
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
- max_steps: 2500
28
  micro_batch_size: 4
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
31
  optimizer: adamw_bnb_8bit
32
- output_dir: /root/.sn56/axolotl/outputs/Phi-3.5-mini-instruct
33
  pad_to_sequence_len: true
34
  resize_token_embeddings_to_32x: false
35
- sample_packing: false
36
- save_steps: 400
37
- save_total_limit: 1
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
40
  torch_dtype: bf16
 
15
  system_prompt: ''
16
  device_map: auto
17
  eval_sample_packing: false
18
+ eval_steps: 50
19
  flash_attention: true
20
+ gradient_checkpointing: true
21
  group_by_length: true
22
  hub_model_id: SystemAdmin123/Phi-3.5-mini-instruct
23
  hub_strategy: checkpoint
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
+ max_steps: 5000
28
  micro_batch_size: 4
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
31
  optimizer: adamw_bnb_8bit
32
+ output_dir: /root/.sn56/axolotl/tmp/Phi-3.5-mini-instruct
33
  pad_to_sequence_len: true
34
  resize_token_embeddings_to_32x: false
35
+ sample_packing: true
36
+ save_steps: 50
37
+ save_total_limit: 2
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
40
  torch_dtype: bf16
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:571ac0ce3c6fb0674780b87152c4c23763691f3402fcfee2a7fae382cd311dc6
3
  size 4972163696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:826e66b930379b9b17d06e3e36abceae89de64258529cf378786e7914578f2d6
3
  size 4972163696
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a7f7e729b06122d8124d7ec438aa26d437fde3841f4d31cd4051d0537bd7093
3
  size 2669366920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2037f966379e933b0ee4ec2c31021e10d1bac8c66ea2bd6a5ed50ad79df2c79
3
  size 2669366920
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d80a39228c54a221be1a2fcaa8735bc8f219e67dfabd2fc6349782d71ba757b
3
- size 7032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4320434255846d7d3d8916bcc913b473a3b0890bc89a39d373bf3ce9e989285
3
+ size 7096