SystemAdmin123 committed on
Commit
dbed4ef
·
verified ·
1 Parent(s): 8746aa2

Training in progress, step 200

Browse files
axolotl_config.yaml CHANGED
@@ -17,23 +17,23 @@ device_map: auto
17
  eval_sample_packing: false
18
  eval_steps: 200
19
  flash_attention: true
20
- gpu_memory_limit: 80GiB
21
  group_by_length: true
22
  hub_model_id: SystemAdmin123/mistral-7b-instruct-v0.2
23
  hub_strategy: checkpoint
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
- max_steps: 2500
28
  micro_batch_size: 2
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
31
  optimizer: adamw_bnb_8bit
32
- output_dir: /root/.sn56/axolotl/outputs/mistral-7b-instruct-v0.2
33
  pad_to_sequence_len: true
34
  resize_token_embeddings_to_32x: false
35
- sample_packing: false
36
- save_steps: 400
37
  save_total_limit: 1
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
 
17
  eval_sample_packing: false
18
  eval_steps: 200
19
  flash_attention: true
20
+ gradient_checkpointing: true
21
  group_by_length: true
22
  hub_model_id: SystemAdmin123/mistral-7b-instruct-v0.2
23
  hub_strategy: checkpoint
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
+ max_steps: 10000
28
  micro_batch_size: 2
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
31
  optimizer: adamw_bnb_8bit
32
+ output_dir: /root/.sn56/axolotl/tmp/mistral-7b-instruct-v0.2
33
  pad_to_sequence_len: true
34
  resize_token_embeddings_to_32x: false
35
+ sample_packing: true
36
+ save_steps: 200
37
  save_total_limit: 1
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a53927ae2256cbe56c90bac7da700e354fc7f21de628d3eed0a7b4b2e27915c
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcd5b3fe28539d7c27e9c1c72289ef993f1955987b0acb6a12cc40eca8ba1e3a
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:016c04f40d99fc3227fb09a2989f83c2c0b7ca6c9ae1852b219eaec29324b1a7
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:406d436e48e98f1c89ab6ba1e12b026d54e9080c4538d743c32e9130af202cda
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71a0242b504cd39971acad38f3f79f3699759d99b6e4c43785f15cf3e56cd666
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22b75146ff6313b5530681487be10972d2689efa7f86e01835f0e8e234259e58
3
  size 4540516344
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0166b1a0dbc748fd83bbe842fbeb36ef63c27fa9749423e46ed3ac591ce2951e
3
- size 7672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adab2cd4b892729a3f8cb9343d382b49be7d93397bee49b30af6cf5be7d19904
3
+ size 7736