trohrbaugh committed on
Commit
9f532e7
·
verified ·
1 Parent(s): 9c25851

Add starcoder2: BigCode StarCoder2 family

Browse files
Files changed (1) hide show
  1. scan.py +7 -0
scan.py CHANGED
@@ -230,6 +230,13 @@ KNOWN_BASES = {
230
  "model_type_patterns": ["valley"],
231
  # Valley-Eagle-7B (151675) and Valley2.5 (151679) — close but distinct vocabs
232
  },
 
 
 
 
 
 
 
233
  "zaya": {
234
  "name": "Zyphra ZAYA1 (deep hybrid SSM+Attention MoE)",
235
  "vocab_size": 262272,
 
230
  "model_type_patterns": ["valley"],
231
  # Valley-Eagle-7B (151675) and Valley2.5 (151679) — close but distinct vocabs
232
  },
233
+ "starcoder2": {
234
+ "name": "BigCode StarCoder2",
235
+ "vocab_size": 49152,
236
+ "model_type_patterns": ["starcoder2"],
237
+ # 3B: hidden=3072/30L (97K dl), 7B: hidden=4608/32L, 15B: hidden=6144/40L
238
+ # Code-specialized tokenizer (49152 tokens)
239
+ },
240
  "zaya": {
241
  "name": "Zyphra ZAYA1 (deep hybrid SSM+Attention MoE)",
242
  "vocab_size": 262272,