Yan777 committed on
Commit
2857517
·
verified ·
1 Parent(s): 22450ed

aug_arb_emo

Browse files
README.md CHANGED
@@ -17,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [meta-llama/Llama-2-7b-chat-hf](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf) on an unspecified dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.7403
21
 
22
  ## Model description
23
 
@@ -48,18 +48,18 @@ The following hyperparameters were used during training:
48
 
49
  ### Training results
50
 
51
- | Training Loss | Epoch | Step | Validation Loss |
52
- |:-------------:|:-----:|:-----:|:---------------:|
53
- | 0.7135 | 1.0 | 6036 | 0.6917 |
54
- | 0.6619 | 2.0 | 12072 | 0.6907 |
55
- | 0.5675 | 3.0 | 18108 | 0.7124 |
56
- | 0.5077 | 4.0 | 24144 | 0.7403 |
57
 
58
 
59
  ### Framework versions
60
 
61
  - PEFT 0.7.2.dev0
62
- - Transformers 4.38.2
63
  - Pytorch 2.2.1
64
  - Datasets 2.18.0
65
  - Tokenizers 0.15.2
 
17
 
18
  This model is a fine-tuned version of [meta-llama/Llama-2-7b-chat-hf](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf) on an unspecified dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 1.1212
21
 
22
  ## Model description
23
 
 
48
 
49
  ### Training results
50
 
51
+ | Training Loss | Epoch | Step | Validation Loss |
52
+ |:-------------:|:-----:|:----:|:---------------:|
53
+ | 0.7811 | 1.0 | 1469 | 1.0575 |
54
+ | 0.7979 | 2.0 | 2938 | 1.0676 |
55
+ | 0.8273 | 3.0 | 4407 | 1.0935 |
56
+ | 0.7819 | 4.0 | 5876 | 1.1212 |
57
 
58
 
59
  ### Framework versions
60
 
61
  - PEFT 0.7.2.dev0
62
+ - Transformers 4.36.2
63
  - Pytorch 2.2.1
64
  - Datasets 2.18.0
65
  - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "q_proj",
23
- "v_proj"
24
  ],
25
  "task_type": "CAUSAL_LM",
26
  "use_rslora": false
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "v_proj",
23
+ "q_proj"
24
  ],
25
  "task_type": "CAUSAL_LM",
26
  "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c9865a569a666b4638d33d00f2145d1e9dabd4f7c4abba2fa66e67b5fcd651e
3
  size 1182877280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a42f65759f75dcf1f986bf69d17d476ef941f4463199b4270c0b217355df0079
3
  size 1182877280
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<|im_end|>": 32000,
3
+ "<|im_start|>": 32001
4
+ }
runs/Apr11_06-55-31_DESKTOP-5GR7SN9/events.out.tfevents.1712789740.DESKTOP-5GR7SN9.21012.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56d3e66eaf052cc0344e6464e2837dfe757d68cdbf3023566a76c64c62f1b4c5
3
+ size 43107
special_tokens_map.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "additional_special_tokens": [
3
  {
4
- "content": "<|im_start|>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
- "content": "<|im_end|>",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
 
1
  {
2
  "additional_special_tokens": [
3
  {
4
+ "content": "<|im_end|>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
+ "content": "<|im_start|>",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 1024,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
@@ -37,7 +32,7 @@
37
  },
38
  {
39
  "id": 32000,
40
- "content": "<|im_start|>",
41
  "single_word": false,
42
  "lstrip": false,
43
  "rstrip": false,
@@ -46,7 +41,7 @@
46
  },
47
  {
48
  "id": 32001,
49
- "content": "<|im_end|>",
50
  "single_word": false,
51
  "lstrip": false,
52
  "rstrip": false,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
32
  },
33
  {
34
  "id": 32000,
35
+ "content": "<|im_end|>",
36
  "single_word": false,
37
  "lstrip": false,
38
  "rstrip": false,
 
41
  },
42
  {
43
  "id": 32001,
44
+ "content": "<|im_start|>",
45
  "single_word": false,
46
  "lstrip": false,
47
  "rstrip": false,
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json CHANGED
@@ -27,7 +27,7 @@
27
  "special": true
28
  },
29
  "32000": {
30
- "content": "<|im_start|>",
31
  "lstrip": false,
32
  "normalized": false,
33
  "rstrip": false,
@@ -35,7 +35,7 @@
35
  "special": true
36
  },
37
  "32001": {
38
- "content": "<|im_end|>",
39
  "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
@@ -44,8 +44,8 @@
44
  }
45
  },
46
  "additional_special_tokens": [
47
- "<|im_start|>",
48
- "<|im_end|>"
49
  ],
50
  "bos_token": "<|im_start|>",
51
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
 
27
  "special": true
28
  },
29
  "32000": {
30
+ "content": "<|im_end|>",
31
  "lstrip": false,
32
  "normalized": false,
33
  "rstrip": false,
 
35
  "special": true
36
  },
37
  "32001": {
38
+ "content": "<|im_start|>",
39
  "lstrip": false,
40
  "normalized": false,
41
  "rstrip": false,
 
44
  }
45
  },
46
  "additional_special_tokens": [
47
+ "<|im_end|>",
48
+ "<|im_start|>"
49
  ],
50
  "bos_token": "<|im_start|>",
51
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f03402ad5c8e6635fd0439e097d486bec9986606122c72f5e94813a1439af77
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea506a77b77f0a3215de7e3e6a6d9c7316d190a7a78d99becb0beb5a005d1844
3
+ size 4728