Spaces:
Sleeping
Sleeping
Add starcoder2: BigCode StarCoder2 family
Browse files
scan.py
CHANGED
|
@@ -230,6 +230,13 @@ KNOWN_BASES = {
|
|
| 230 |
"model_type_patterns": ["valley"],
|
| 231 |
# Valley-Eagle-7B (151675) and Valley2.5 (151679) — close but distinct vocabs
|
| 232 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 233 |
"zaya": {
|
| 234 |
"name": "Zyphra ZAYA1 (deep hybrid SSM+Attention MoE)",
|
| 235 |
"vocab_size": 262272,
|
|
|
|
| 230 |
"model_type_patterns": ["valley"],
|
| 231 |
# Valley-Eagle-7B (151675) and Valley2.5 (151679) — close but distinct vocabs
|
| 232 |
},
|
| 233 |
+
"starcoder2": {
|
| 234 |
+
"name": "BigCode StarCoder2",
|
| 235 |
+
"vocab_size": 49152,
|
| 236 |
+
"model_type_patterns": ["starcoder2"],
|
| 237 |
+
# 3B: hidden=3072, 30 layers (~97K downloads); 7B: hidden=4608, 32 layers; 15B: hidden=6144, 40 layers
|
| 238 |
+
# Code-specialized tokenizer (49152 tokens)
|
| 239 |
+
},
|
| 240 |
"zaya": {
|
| 241 |
"name": "Zyphra ZAYA1 (deep hybrid SSM+Attention MoE)",
|
| 242 |
"vocab_size": 262272,
|