File size: 1,396 Bytes
0c8ae9b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8fb08ec
0c8ae9b
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
{
  "model_name": "functiongemma-270m",
  "architecture": "gemma3",
  "hidden_size": 640,
  "num_hidden_layers": 18,
  "num_layers": 18,
  "num_attention_heads": 4,
  "num_key_value_heads": 1,
  "head_dim": 256,
  "intermediate_size": 2048,
  "vocab_size": 262144,
  "context_length": 2048,
  "sliding_window": 512,
  "sliding_window_pattern": 6,
  "layer_types": [
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "full_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "full_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "sliding_attention",
    "full_attention"
  ],
  "embed_scale": 25.298221281347036,
  "rope_theta_global": 1000000.0,
  "rope_theta_local": 10000.0,
  "query_pre_attn_scalar": 256.0,
  "rms_norm_eps": 1e-06,
  "bos_token_id": 2,
  "eos_token_id": [
    1,
    50
  ],
  "tie_word_embeddings": true,
  "final_logit_softcapping": 0.0,
  "parts": {
    "model": "model.mlpackage"
  },
  "quantization": "int8",
  "compute_units": "CPU_AND_NE",
  "tokenizer_repo": "google/functiongemma-270m-it",
  "chat_format": "functiongemma",
  "function_call_markers": {
    "start": "<start_function_call>",
    "end": "<end_function_call>"
  }
}