DeepDream2045 committed on
Commit
547b6ee
·
verified ·
1 Parent(s): 567eb65

End of training

Browse files
README.md CHANGED
@@ -105,7 +105,7 @@ xformers_attention: true
105
 
106
  This model is a fine-tuned version of [teknium/OpenHermes-2.5-Mistral-7B](https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
- - Loss: 0.6188
109
 
110
  ## Model description
111
 
@@ -143,8 +143,8 @@ The following hyperparameters were used during training:
143
  | Training Loss | Epoch | Step | Validation Loss |
144
  |:-------------:|:------:|:----:|:---------------:|
145
  | 0.823 | 0.0015 | 1 | 0.8924 |
146
- | 0.687 | 0.0379 | 25 | 0.6584 |
147
- | 0.4238 | 0.0757 | 50 | 0.6188 |
148
 
149
 
150
  ### Framework versions
 
105
 
106
  This model is a fine-tuned version of [teknium/OpenHermes-2.5-Mistral-7B](https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B) on the None dataset.
107
  It achieves the following results on the evaluation set:
108
+ - Loss: 0.6203
109
 
110
  ## Model description
111
 
 
143
  | Training Loss | Epoch | Step | Validation Loss |
144
  |:-------------:|:------:|:----:|:---------------:|
145
  | 0.823 | 0.0015 | 1 | 0.8924 |
146
+ | 0.6746 | 0.0379 | 25 | 0.6640 |
147
+ | 0.4266 | 0.0757 | 50 | 0.6203 |
148
 
149
 
150
  ### Framework versions
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
  "down_proj",
25
- "gate_proj",
26
- "k_proj",
27
  "up_proj",
28
- "v_proj",
29
- "o_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "down_proj",
 
 
24
  "up_proj",
25
+ "o_proj",
26
+ "k_proj",
27
+ "q_proj",
28
+ "gate_proj",
29
+ "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9971317b702abecc5a2255263e9b7aba5cb671c26db964f32cc7b6f79b15ac1a
3
  size 335706186
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8d493fcdb6cb16b630ab3c86e4cc18ce215b009992e3b8b0f3c45de97ac338
3
  size 335706186
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d0c21db8dc2809183a66794a457c0618b4627535d1395657275471c32b74e87
3
  size 335604696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9090ecb0cc714cbd70939408cd6f730e26a153e93efb9e6a2cf4b099b0b2b513
3
  size 335604696
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36eaf4c354bb4f7511d71516f0afec7cdd347e6910b4fa4c5cf3334981bb9cf5
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8141129d94476201c2b4daf126b869603966afe064b925e53d4d737eb4a766c8
3
  size 6776