{
"model_name": "embeddinggemma-300m",
"architecture": "gemma3-embedding",
"tokenizer_repo": "google/embeddinggemma-300m",
"parts": {
"encoder": "encoder.mlpackage"
},
"io_contract": {
"inputs": {
"input_ids": {
"shape": [
1,
128
],
"dtype": "int32"
},
"attention_mask": {
"shape": [
1,
128
],
"dtype": "fp16",
"doc": "1.0 for valid tokens, 0.0 for pad"
}
},
"outputs": {
"embedding": {
"shape": [
1,
768
],
"dtype": "fp16",
"doc": "L2-normalized; Matryoshka-truncate the last dim"
}
}
},
"hidden_size": 768,
"num_hidden_layers": 24,
"num_attention_heads": 3,
"num_key_value_heads": 1,
"head_dim": 256,
"intermediate_size": 1152,
"vocab_size": 262144,
"max_seq_len": 128,
"sliding_window": 512,
"sliding_window_pattern": 6,
"layer_types": [
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"full_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"full_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"full_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"sliding_attention",
"full_attention"
],
"rms_norm_eps": 1e-06,
"rope_theta_global": 1000000.0,
"rope_theta_local": 10000.0,
"embed_dim": 768,
"dense_intermediate_dim": 3072,
"pooling": "mean",
"normalize": "l2",
"matryoshka_dims": [
768,
512,
256,
128
],
"task_prefixes": {
"retrieval_query": "task: search result | query: ",
"retrieval_document": "title: none | text: ",
"classification": "task: classification | query: ",
"clustering": "task: clustering | query: ",
"similarity": "task: sentence similarity | query: ",
"code_retrieval": "task: code retrieval | query: ",
"question_answering": "task: question answering | query: ",
"fact_verification": "task: fact checking | query: "
},
"quantization": "int8",
"compute_units": "CPU_AND_NE"
}