osanseviero committed on
Commit
bdca8ec
·
verified ·
1 parent: 01d0fbf

(Trained with Unsloth)

Browse files
Files changed (3) hide show
  1. config.json +7 -26
  2. tokenizer.json +2 -2
  3. tokenizer_config.json +0 -0
config.json CHANGED
@@ -7,7 +7,7 @@
7
  "attention_dropout": 0.0,
8
  "attn_logit_softcapping": null,
9
  "bos_token_id": 2,
10
- "dtype": "float16",
11
  "eos_token_id": 106,
12
  "final_logit_softcapping": null,
13
  "head_dim": 256,
@@ -43,33 +43,14 @@
43
  "pad_token_id": 0,
44
  "query_pre_attn_scalar": 256,
45
  "rms_norm_eps": 1e-06,
46
- "rope_parameters": {
47
- "full_attention": {
48
- "rope_theta": 1000000.0,
49
- "rope_type": "default"
50
- },
51
- "sliding_attention": {
52
- "rope_theta": 10000.0,
53
- "rope_type": "default"
54
- }
55
- },
56
  "sliding_window": 512,
57
- "transformers_version": "5.0.0.dev0",
58
  "unsloth_fixed": true,
59
  "unsloth_version": "2026.1.2",
60
  "use_bidirectional_attention": false,
61
  "use_cache": true,
62
- "vocab_size": 262144,
63
- "transformers.js_config": {
64
- "use_external_data_format": {
65
- "model.onnx": 1,
66
- "model_fp16.onnx": 1,
67
- "model_q4.onnx": 1,
68
- "model_q4f16.onnx": 1
69
- },
70
- "kv_cache_dtype": {
71
- "q4f16": "float16",
72
- "fp16": "float16"
73
- }
74
- }
75
- }
 
7
  "attention_dropout": 0.0,
8
  "attn_logit_softcapping": null,
9
  "bos_token_id": 2,
10
+ "torch_dtype": "float16",
11
  "eos_token_id": 106,
12
  "final_logit_softcapping": null,
13
  "head_dim": 256,
 
43
  "pad_token_id": 0,
44
  "query_pre_attn_scalar": 256,
45
  "rms_norm_eps": 1e-06,
46
+ "rope_local_base_freq": 10000.0,
47
+ "rope_scaling": null,
48
+ "rope_theta": 1000000.0,
 
 
 
 
 
 
 
49
  "sliding_window": 512,
50
+ "transformers_version": "4.57.3",
51
  "unsloth_fixed": true,
52
  "unsloth_version": "2026.1.2",
53
  "use_bidirectional_attention": false,
54
  "use_cache": true,
55
+ "vocab_size": 262144
56
+ }
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fa00479b9f9d41a876e5cd1b369eea7af974fa0bdcc994c987972056d8ed5c2
3
- size 20323384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6b09a0b4a803ad453063ca4bb49a784540e8120004e2450e025df2b27d41fb2
3
+ size 33384899
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff