adarsh12x committed on
Commit
d36d24f
·
verified ·
1 Parent(s): 6ac9415

adarsh12x/mistral_7b_samantha_

Browse files
Files changed (4) hide show
  1. README.md +11 -11
  2. adapter_config.json +2 -2
  3. tokenizer.json +6 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -20,7 +20,7 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on the samantha-data dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 1.2230
24
 
25
  ## Model description
26
 
@@ -52,16 +52,16 @@ The following hyperparameters were used during training:
52
 
53
  | Training Loss | Epoch | Step | Validation Loss |
54
  |:-------------:|:-----:|:----:|:---------------:|
55
- | 1.8132 | 0.01 | 10 | 1.5843 |
56
- | 1.1784 | 0.02 | 20 | 1.3875 |
57
- | 1.0916 | 0.02 | 30 | 1.3269 |
58
- | 1.0672 | 0.03 | 40 | 1.2654 |
59
- | 0.9785 | 0.04 | 50 | 1.2621 |
60
- | 1.0143 | 0.05 | 60 | 1.2549 |
61
- | 0.9283 | 0.05 | 70 | 1.2480 |
62
- | 1.0852 | 0.06 | 80 | 1.2411 |
63
- | 0.9801 | 0.07 | 90 | 1.2305 |
64
- | 1.0415 | 0.08 | 100 | 1.2230 |
65
 
66
 
67
  ### Framework versions
 
20
 
21
  This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.1](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1) on the samantha-data dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 1.2177
24
 
25
  ## Model description
26
 
 
52
 
53
  | Training Loss | Epoch | Step | Validation Loss |
54
  |:-------------:|:-----:|:----:|:---------------:|
55
+ | 1.8256 | 0.01 | 10 | 1.6091 |
56
+ | 1.1803 | 0.02 | 20 | 1.3865 |
57
+ | 1.0851 | 0.02 | 30 | 1.3218 |
58
+ | 1.061 | 0.03 | 40 | 1.2639 |
59
+ | 0.9776 | 0.04 | 50 | 1.2600 |
60
+ | 1.0178 | 0.05 | 60 | 1.2484 |
61
+ | 0.9253 | 0.05 | 70 | 1.2435 |
62
+ | 1.0814 | 0.06 | 80 | 1.2363 |
63
+ | 0.9787 | 0.07 | 90 | 1.2307 |
64
+ | 1.0406 | 0.08 | 100 | 1.2177 |
65
 
66
 
67
  ### Framework versions
adapter_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "q_proj",
23
- "v_proj"
24
  ],
25
  "task_type": "CAUSAL_LM",
26
  "use_rslora": false
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "v_proj",
23
+ "q_proj"
24
  ],
25
  "task_type": "CAUSAL_LM",
26
  "use_rslora": false
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 2048,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25dac2423cd4dbf28fb4155ebc82b7d7d6e5c65164fdf88473dcb09cb5003816
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b142edadcebee7cacc9b04888504c24f2ca425544899aefa3ab1aebb0d6d832
3
  size 4920