Charlie3006 committed on
Commit
e4853b6
·
verified ·
1 Parent(s): 2fee993

Training in progress, step 100

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "bigcode/starcoderbase-1b",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
@@ -23,10 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "c_proj",
27
- "q_attn",
28
- "c_fc",
29
- "c_attn"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "CodeGPTPlus/deepseek-coder-1.3b-typescript",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "q_proj",
27
+ "v_proj"
 
 
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7a82f28edd7f558514ea5bb314e8ee27302cc22b05d1648144904b6aba5477c
3
- size 22241240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77bbfc66da4f1b1bcee45ea75565b233656e727410aa3f44ec5fb1f86887e933
3
+ size 6304096
runs/Feb11_20-10-02_nitro/events.out.tfevents.1739322604.nitro.14526.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de39958e0dc11a640bf511150c60908f3a4beb312f9c3962534285b1d2481219
3
+ size 6266
runs/Feb11_20-11-27_nitro/events.out.tfevents.1739322688.nitro.14792.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a01edb84c7e29d93b70303be884861234ed931a096ea94248671b42d9b5d1632
3
+ size 6268
runs/Feb11_20-12-10_nitro/events.out.tfevents.1739322731.nitro.14977.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49488ba83e15e648211bac6442392d27d38a3eb8103a9701012c1c0e5601fd7c
3
+ size 6266
runs/Feb11_20-12-50_nitro/events.out.tfevents.1739322772.nitro.15129.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9a8b5c7f05aaed98da6dcb9a129c247a5e96d80ed4b975a51fe8f314b41f3dc
3
+ size 6266
runs/Feb12_21-55-23_nitro/events.out.tfevents.1739415332.nitro.2511.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e0e659cbc7bcda2f6174851c8c822f41bbe19f48f1d93c08d9236d0aa80a65
3
+ size 7167
special_tokens_map.json CHANGED
@@ -1,42 +1,20 @@
1
  {
2
- "additional_special_tokens": [
3
- "<|endoftext|>",
4
- "<fim_prefix>",
5
- "<fim_middle>",
6
- "<fim_suffix>",
7
- "<fim_pad>",
8
- "<filename>",
9
- "<gh_stars>",
10
- "<issue_start>",
11
- "<issue_comment>",
12
- "<issue_closed>",
13
- "<jupyter_start>",
14
- "<jupyter_text>",
15
- "<jupyter_code>",
16
- "<jupyter_output>",
17
- "<empty_output>",
18
- "<commit_before>",
19
- "<commit_msg>",
20
- "<commit_after>",
21
- "<reponame>"
22
- ],
23
  "bos_token": {
24
- "content": "<|endoftext|>",
25
  "lstrip": false,
26
  "normalized": false,
27
  "rstrip": false,
28
  "single_word": false
29
  },
30
  "eos_token": {
31
- "content": "<|endoftext|>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
35
  "single_word": false
36
  },
37
- "pad_token": "<|endoftext|>",
38
- "unk_token": {
39
- "content": "<|endoftext|>",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
+ "content": "<|begin▁of▁sentence|>",
4
  "lstrip": false,
5
  "normalized": false,
6
  "rstrip": false,
7
  "single_word": false
8
  },
9
  "eos_token": {
10
+ "content": "<|end▁of▁sentence|>",
11
  "lstrip": false,
12
  "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": {
17
+ "content": "<|end▁of▁sentence|>",
 
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,187 +1,194 @@
1
  {
2
- "add_prefix_space": false,
 
 
3
  "added_tokens_decoder": {
4
- "0": {
5
- "content": "<|endoftext|>",
6
  "lstrip": false,
7
- "normalized": false,
8
  "rstrip": false,
9
  "single_word": false,
10
- "special": true
11
  },
12
- "1": {
13
- "content": "<fim_prefix>",
14
  "lstrip": false,
15
- "normalized": false,
16
  "rstrip": false,
17
  "single_word": false,
18
- "special": true
19
  },
20
- "2": {
21
- "content": "<fim_middle>",
22
  "lstrip": false,
23
- "normalized": false,
24
  "rstrip": false,
25
  "single_word": false,
26
- "special": true
27
  },
28
- "3": {
29
- "content": "<fim_suffix>",
30
  "lstrip": false,
31
- "normalized": false,
32
  "rstrip": false,
33
  "single_word": false,
34
- "special": true
35
  },
36
- "4": {
37
- "content": "<fim_pad>",
38
  "lstrip": false,
39
- "normalized": false,
40
  "rstrip": false,
41
  "single_word": false,
42
- "special": true
43
  },
44
- "5": {
45
- "content": "<filename>",
46
  "lstrip": false,
47
- "normalized": false,
48
  "rstrip": false,
49
  "single_word": false,
50
- "special": true
51
  },
52
- "6": {
53
- "content": "<gh_stars>",
54
  "lstrip": false,
55
- "normalized": false,
56
  "rstrip": false,
57
  "single_word": false,
58
- "special": true
59
  },
60
- "7": {
61
- "content": "<issue_start>",
62
  "lstrip": false,
63
- "normalized": false,
64
  "rstrip": false,
65
  "single_word": false,
66
- "special": true
67
  },
68
- "8": {
69
- "content": "<issue_comment>",
70
  "lstrip": false,
71
- "normalized": false,
72
  "rstrip": false,
73
  "single_word": false,
74
- "special": true
75
  },
76
- "9": {
77
- "content": "<issue_closed>",
78
  "lstrip": false,
79
- "normalized": false,
80
  "rstrip": false,
81
  "single_word": false,
82
- "special": true
83
  },
84
- "10": {
85
- "content": "<jupyter_start>",
86
  "lstrip": false,
87
- "normalized": false,
88
  "rstrip": false,
89
  "single_word": false,
90
- "special": true
91
  },
92
- "11": {
93
- "content": "<jupyter_text>",
94
  "lstrip": false,
95
- "normalized": false,
96
  "rstrip": false,
97
  "single_word": false,
98
- "special": true
99
  },
100
- "12": {
101
- "content": "<jupyter_code>",
102
  "lstrip": false,
103
- "normalized": false,
104
  "rstrip": false,
105
  "single_word": false,
106
- "special": true
107
  },
108
- "13": {
109
- "content": "<jupyter_output>",
110
  "lstrip": false,
111
  "normalized": false,
112
  "rstrip": false,
113
  "single_word": false,
114
  "special": true
115
  },
116
- "14": {
117
- "content": "<empty_output>",
118
  "lstrip": false,
119
  "normalized": false,
120
  "rstrip": false,
121
  "single_word": false,
122
  "special": true
123
  },
124
- "15": {
125
- "content": "<commit_before>",
126
  "lstrip": false,
127
- "normalized": false,
128
  "rstrip": false,
129
  "single_word": false,
130
- "special": true
131
  },
132
- "16": {
133
- "content": "<commit_msg>",
134
  "lstrip": false,
135
- "normalized": false,
136
  "rstrip": false,
137
  "single_word": false,
138
- "special": true
139
  },
140
- "17": {
141
- "content": "<commit_after>",
142
  "lstrip": false,
143
- "normalized": false,
144
  "rstrip": false,
145
  "single_word": false,
146
- "special": true
147
  },
148
- "18": {
149
- "content": "<reponame>",
150
  "lstrip": false,
151
- "normalized": false,
152
  "rstrip": false,
153
  "single_word": false,
154
- "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
155
  }
156
  },
157
- "additional_special_tokens": [
158
- "<|endoftext|>",
159
- "<fim_prefix>",
160
- "<fim_middle>",
161
- "<fim_suffix>",
162
- "<fim_pad>",
163
- "<filename>",
164
- "<gh_stars>",
165
- "<issue_start>",
166
- "<issue_comment>",
167
- "<issue_closed>",
168
- "<jupyter_start>",
169
- "<jupyter_text>",
170
- "<jupyter_code>",
171
- "<jupyter_output>",
172
- "<empty_output>",
173
- "<commit_before>",
174
- "<commit_msg>",
175
- "<commit_after>",
176
- "<reponame>"
177
- ],
178
- "bos_token": "<|endoftext|>",
179
  "clean_up_tokenization_spaces": false,
180
- "eos_token": "<|endoftext|>",
181
  "extra_special_tokens": {},
182
- "model_max_length": 1000000000000000019884624838656,
183
- "pad_token": "<|endoftext|>",
184
- "tokenizer_class": "GPT2Tokenizer",
185
- "unk_token": "<|endoftext|>",
186
- "vocab_size": 49152
 
 
187
  }
 
1
  {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": null,
5
  "added_tokens_decoder": {
6
+ "32000": {
7
+ "content": "õ",
8
  "lstrip": false,
9
+ "normalized": true,
10
  "rstrip": false,
11
  "single_word": false,
12
+ "special": false
13
  },
14
+ "32001": {
15
+ "content": "÷",
16
  "lstrip": false,
17
+ "normalized": true,
18
  "rstrip": false,
19
  "single_word": false,
20
+ "special": false
21
  },
22
+ "32002": {
23
+ "content": "Á",
24
  "lstrip": false,
25
+ "normalized": true,
26
  "rstrip": false,
27
  "single_word": false,
28
+ "special": false
29
  },
30
+ "32003": {
31
+ "content": "ý",
32
  "lstrip": false,
33
+ "normalized": true,
34
  "rstrip": false,
35
  "single_word": false,
36
+ "special": false
37
  },
38
+ "32004": {
39
+ "content": "À",
40
  "lstrip": false,
41
+ "normalized": true,
42
  "rstrip": false,
43
  "single_word": false,
44
+ "special": false
45
  },
46
+ "32005": {
47
+ "content": "ÿ",
48
  "lstrip": false,
49
+ "normalized": true,
50
  "rstrip": false,
51
  "single_word": false,
52
+ "special": false
53
  },
54
+ "32006": {
55
+ "content": "ø",
56
  "lstrip": false,
57
+ "normalized": true,
58
  "rstrip": false,
59
  "single_word": false,
60
+ "special": false
61
  },
62
+ "32007": {
63
+ "content": "ú",
64
  "lstrip": false,
65
+ "normalized": true,
66
  "rstrip": false,
67
  "single_word": false,
68
+ "special": false
69
  },
70
+ "32008": {
71
+ "content": "þ",
72
  "lstrip": false,
73
+ "normalized": true,
74
  "rstrip": false,
75
  "single_word": false,
76
+ "special": false
77
  },
78
+ "32009": {
79
+ "content": "ü",
80
  "lstrip": false,
81
+ "normalized": true,
82
  "rstrip": false,
83
  "single_word": false,
84
+ "special": false
85
  },
86
+ "32010": {
87
+ "content": "ù",
88
  "lstrip": false,
89
+ "normalized": true,
90
  "rstrip": false,
91
  "single_word": false,
92
+ "special": false
93
  },
94
+ "32011": {
95
+ "content": "ö",
96
  "lstrip": false,
97
+ "normalized": true,
98
  "rstrip": false,
99
  "single_word": false,
100
+ "special": false
101
  },
102
+ "32012": {
103
+ "content": "û",
104
  "lstrip": false,
105
+ "normalized": true,
106
  "rstrip": false,
107
  "single_word": false,
108
+ "special": false
109
  },
110
+ "32013": {
111
+ "content": "<|begin▁of▁sentence|>",
112
  "lstrip": false,
113
  "normalized": false,
114
  "rstrip": false,
115
  "single_word": false,
116
  "special": true
117
  },
118
+ "32014": {
119
+ "content": "<|end▁of▁sentence|>",
120
  "lstrip": false,
121
  "normalized": false,
122
  "rstrip": false,
123
  "single_word": false,
124
  "special": true
125
  },
126
+ "32015": {
127
+ "content": "<|fim▁hole|>",
128
  "lstrip": false,
129
+ "normalized": true,
130
  "rstrip": false,
131
  "single_word": false,
132
+ "special": false
133
  },
134
+ "32016": {
135
+ "content": "<|fim▁begin|>",
136
  "lstrip": false,
137
+ "normalized": true,
138
  "rstrip": false,
139
  "single_word": false,
140
+ "special": false
141
  },
142
+ "32017": {
143
+ "content": "<|fim▁end|>",
144
  "lstrip": false,
145
+ "normalized": true,
146
  "rstrip": false,
147
  "single_word": false,
148
+ "special": false
149
  },
150
+ "32018": {
151
+ "content": "<pad>",
152
  "lstrip": false,
153
+ "normalized": true,
154
  "rstrip": false,
155
  "single_word": false,
156
+ "special": false
157
+ },
158
+ "32019": {
159
+ "content": "<|User|>",
160
+ "lstrip": false,
161
+ "normalized": true,
162
+ "rstrip": false,
163
+ "single_word": false,
164
+ "special": false
165
+ },
166
+ "32020": {
167
+ "content": "<|Assistant|>",
168
+ "lstrip": false,
169
+ "normalized": true,
170
+ "rstrip": false,
171
+ "single_word": false,
172
+ "special": false
173
+ },
174
+ "32021": {
175
+ "content": "<|EOT|>",
176
+ "lstrip": false,
177
+ "normalized": true,
178
+ "rstrip": false,
179
+ "single_word": false,
180
+ "special": false
181
  }
182
  },
183
+ "bos_token": "<|begin▁of▁sentence|>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
184
  "clean_up_tokenization_spaces": false,
185
+ "eos_token": "<|end▁of▁sentence|>",
186
  "extra_special_tokens": {},
187
+ "legacy": true,
188
+ "model_max_length": 16384,
189
+ "pad_token": "<|end▁of▁sentence|>",
190
+ "sp_model_kwargs": {},
191
+ "tokenizer_class": "LlamaTokenizer",
192
+ "unk_token": null,
193
+ "use_default_system_prompt": false
194
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99da128985d6b16829611750d9b3a325d4afa91881158ad0c5d5ed77a2f0d1e4
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f963f173eda35cdd4e498bfe203728d17699cdfb7818d3dad3f578b9ddf85f80
3
  size 5624