AdrianME committed on
Commit
4075d8c
·
verified ·
1 Parent(s): 2dd5ba6

End of training

Browse files
Files changed (4) hide show
  1. README.md +2 -2
  2. chat_template.jinja +1 -3
  3. model.safetensors +1 -1
  4. tokenizer_config.json +16 -1
README.md CHANGED
@@ -4,10 +4,10 @@ library_name: transformers
4
  model_name: SmolLM2-FT-MyDataset
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
- - sft
9
  - module_1
10
  - smol-course
 
 
11
  licence: license
12
  ---
13
 
 
4
  model_name: SmolLM2-FT-MyDataset
5
  tags:
6
  - generated_from_trainer
 
 
7
  - module_1
8
  - smol-course
9
+ - sft
10
+ - trl
11
  licence: license
12
  ---
13
 
chat_template.jinja CHANGED
@@ -1,3 +1 @@
1
- {% for message in messages %}<|im_start|>{{ message['role'] }}
2
- {{ message['content'] }}<|im_end|>
3
- {% endfor %}
 
1
+ {% for message in messages %}{% if message['role'] == 'user' %}{{ '<|im_start|>user\n' + message['content'] + '<|im_end|>\n' }}{% elif message['role'] == 'system' %}{{ '<|im_start|>system\n' + message['content'] + '<|im_end|>\n' }}{% elif message['role'] == 'assistant' %}{{ '<|im_start|>assistant\n' + message['content'] + '<|im_end|>\n' }}{% endif %}{% endfor %}
 
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95b05221f9e9418ddb8c213103c1e1fdc886c214394c7a46afed27d06f8fa43d
3
  size 269060552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44dc88f1896935cc72f871fcac45107cef2c4488a5b73eb71ce5dfa334d42531
3
  size 269060552
tokenizer_config.json CHANGED
@@ -5,8 +5,23 @@
5
  "clean_up_tokenization_spaces": false,
6
  "eos_token": "<|endoftext|>",
7
  "extra_special_tokens": [
 
8
  "<|im_start|>",
9
- "<|im_end|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  ],
11
  "is_local": false,
12
  "model_max_length": 8192,
 
5
  "clean_up_tokenization_spaces": false,
6
  "eos_token": "<|endoftext|>",
7
  "extra_special_tokens": [
8
+ "<|endoftext|>",
9
  "<|im_start|>",
10
+ "<|im_end|>",
11
+ "<repo_name>",
12
+ "<reponame>",
13
+ "<file_sep>",
14
+ "<filename>",
15
+ "<gh_stars>",
16
+ "<issue_start>",
17
+ "<issue_comment>",
18
+ "<issue_closed>",
19
+ "<jupyter_start>",
20
+ "<jupyter_text>",
21
+ "<jupyter_code>",
22
+ "<jupyter_output>",
23
+ "<jupyter_script>",
24
+ "<empty_output>"
25
  ],
26
  "is_local": false,
27
  "model_max_length": 8192,