zddos committed on
Commit
aa8de58
·
verified ·
1 Parent(s): fc11ad8

Trained challenger (loss=3.2392, step=3)

Browse files
config.json CHANGED
@@ -62,7 +62,7 @@
62
  "sliding_window": 512,
63
  "tie_word_embeddings": true,
64
  "top_k_experts": null,
65
- "transformers_version": "5.5.4",
66
  "use_bidirectional_attention": null,
67
  "use_cache": true,
68
  "use_double_wide_mlp": false,
 
62
  "sliding_window": 512,
63
  "tie_word_embeddings": true,
64
  "top_k_experts": null,
65
+ "transformers_version": "5.5.3",
66
  "use_bidirectional_attention": null,
67
  "use_cache": true,
68
  "use_double_wide_mlp": false,
generation_config.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 2,
4
- "eos_token_id": 106,
5
  "pad_token_id": 0,
6
- "transformers_version": "5.5.4",
7
- "use_cache": false
8
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 2,
4
+ "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "5.5.3",
7
+ "use_cache": true
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f969c4b7f1a3eb9c231c2752cceea47e0ce74c18a5314be75fb8e314356745c
3
- size 6576171052
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fe2459b54f605fa54397a388d00a52bd6956b68dd2621224edd7407df568a99
3
+ size 6575835380
tokenizer_config.json CHANGED
@@ -6,7 +6,7 @@
6
  "eoi_token": "<end_of_image>",
7
  "eos_token": "<end_of_turn>",
8
  "image_token": "<image_soft_token>",
9
- "is_local": true,
10
  "mask_token": "<mask>",
11
  "model_max_length": 32768,
12
  "model_specific_special_tokens": {
 
6
  "eoi_token": "<end_of_image>",
7
  "eos_token": "<end_of_turn>",
8
  "image_token": "<image_soft_token>",
9
+ "is_local": false,
10
  "mask_token": "<mask>",
11
  "model_max_length": 32768,
12
  "model_specific_special_tokens": {