File size: 3,084 Bytes
1b60a2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
{
  "architectures": [
    "EmbedderModel"
  ],
  "auto_map": {
    "AutoConfig": "configuration_embedder.EmbedderConfig",
    "AutoModel": "modeling_embedder.EmbedderModel"
  },
  "base_model_name": "nomic-ai/nomic-embed-text-v1.5",
  "dropout": 0.0,
  "dtype": "float32",
  "encoder_config": {
    "_name_or_path": "nomic-ai/nomic-embed-text-v1.5",
    "activation_function": "swiglu",
    "add_cross_attention": false,
    "architectures": [
      "NomicBertModel"
    ],
    "attention_probs_dropout_prob": 0.0,
    "attn_pdrop": 0.0,
    "auto_map": {
      "AutoConfig": "nomic-ai/nomic-bert-2048--configuration_hf_nomic_bert.NomicBertConfig",
      "AutoModel": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertModel",
      "AutoModelForMaskedLM": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertForPreTraining",
      "AutoModelForMultipleChoice": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertForMultipleChoice",
      "AutoModelForQuestionAnswering": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertForQuestionAnswering",
      "AutoModelForSequenceClassification": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertForSequenceClassification",
      "AutoModelForTokenClassification": "nomic-ai/nomic-bert-2048--modeling_hf_nomic_bert.NomicBertForTokenClassification"
    },
    "bos_token_id": null,
    "causal": false,
    "classifier_dropout": null,
    "dense_seq_output": true,
    "dtype": "float32",
    "embd_pdrop": 0.0,
    "eos_token_id": null,
    "fused_bias_fc": true,
    "fused_dropout_add_ln": true,
    "head_dim": 64,
    "hidden_act": "silu",
    "hidden_dropout_prob": 0.0,
    "initializer_range": 0.02,
    "intermediate_size": 3072,
    "layer_norm_eps": 1e-12,
    "layer_norm_epsilon": 1e-12,
    "max_trained_positions": 2048,
    "mlp_fc1_bias": false,
    "mlp_fc2_bias": false,
    "model_type": "nomic_bert",
    "n_embd": 768,
    "n_head": 12,
    "n_inner": 3072,
    "n_layer": 12,
    "n_positions": 2048,
    "pad_token_id": 0,
    "pad_vocab_size_multiple": 64,
    "parallel_block": false,
    "parallel_block_tied_norm": false,
    "prenorm": false,
    "qkv_proj_bias": false,
    "reorder_and_upcast_attn": false,
    "resid_pdrop": 0.0,
    "rope_parameters": {
      "rope_theta": 1000.0,
      "rope_type": "default"
    },
    "rotary_emb_base": 1000,
    "rotary_emb_fraction": 1.0,
    "rotary_emb_interleaved": false,
    "rotary_emb_scale_base": null,
    "rotary_scaling_factor": null,
    "scale_attn_by_inverse_layer_idx": false,
    "scale_attn_weights": true,
    "summary_activation": null,
    "summary_first_dropout": 0.0,
    "summary_proj_to_labels": true,
    "summary_type": "cls_index",
    "summary_use_proj": true,
    "tie_word_embeddings": true,
    "type_vocab_size": 2,
    "use_cache": true,
    "use_flash_attn": true,
    "use_rms_norm": false,
    "use_xentropy": true,
    "vocab_size": 30528
  },
  "encoder_only": false,
  "model_type": "embedder",
  "num_blocks": 3,
  "tokenizer_class": "BertTokenizer",
  "transformers_version": "5.7.0"
}