SlothBot committed on
Commit
c7d01e8
·
1 Parent(s): 8ec1acd

Training in progress, step 100

Browse files
added_tokens.json CHANGED
@@ -1518,7 +1518,6 @@
1518
  "<|da|>": 50285,
1519
  "<|de|>": 50261,
1520
  "<|el|>": 50281,
1521
- "<|endoftext|>": 50257,
1522
  "<|en|>": 50259,
1523
  "<|es|>": 50262,
1524
  "<|et|>": 50307,
 
1518
  "<|da|>": 50285,
1519
  "<|de|>": 50261,
1520
  "<|el|>": 50281,
 
1521
  "<|en|>": 50259,
1522
  "<|es|>": 50262,
1523
  "<|et|>": 50307,
config.json CHANGED
@@ -145,7 +145,7 @@
145
  50362
146
  ],
147
  "torch_dtype": "float32",
148
- "transformers_version": "4.34.0",
149
  "use_cache": false,
150
  "use_weighted_layer_sum": false,
151
  "vocab_size": 51865
 
145
  50362
146
  ],
147
  "torch_dtype": "float32",
148
+ "transformers_version": "4.34.1",
149
  "use_cache": false,
150
  "use_weighted_layer_sum": false,
151
  "vocab_size": 51865
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb6bb9ce525a61193a5c5b6fc6ec27cc2588480d0c1261e7ecc60f9ddb429840
3
  size 967103174
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c28a2289bb50ed86d654b7a3096613d42097fca6a4d604ff7e8c10e524786bfc
3
  size 967103174
special_tokens_map.json CHANGED
@@ -108,8 +108,32 @@
108
  "<|nocaptions|>",
109
  "<|notimestamps|>"
110
  ],
111
- "bos_token": "<|endoftext|>",
112
- "eos_token": "<|endoftext|>",
113
- "pad_token": "<|endoftext|>",
114
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
115
  }
 
108
  "<|nocaptions|>",
109
  "<|notimestamps|>"
110
  ],
111
+ "bos_token": {
112
+ "content": "<|endoftext|>",
113
+ "lstrip": false,
114
+ "normalized": true,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "eos_token": {
119
+ "content": "<|endoftext|>",
120
+ "lstrip": false,
121
+ "normalized": true,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ },
125
+ "pad_token": {
126
+ "content": "<|endoftext|>",
127
+ "lstrip": false,
128
+ "normalized": false,
129
+ "rstrip": false,
130
+ "single_word": false
131
+ },
132
+ "unk_token": {
133
+ "content": "<|endoftext|>",
134
+ "lstrip": false,
135
+ "normalized": true,
136
+ "rstrip": false,
137
+ "single_word": false
138
+ }
139
  }
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:935b820a2c9d0cceebeaaeccabfc8cb37c638b97ca2ef7a21c3b99ad27caf7fc
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1722e151c8d33544b7116258c326933418f6d9d8d3163643f071391c19b4d85
3
  size 4664