Aditya757864
/

Mistral7B

model_hub_mixin

pytorch_model_hub_mixin

4-bit precision

Model card Files Files and versions

Aditya757864 committed on Dec 18, 2024

Commit

7237436

·

verified ·

1 Parent(s): 71ddd5b

Update config.json

Files changed (1) hide show

config.json +25 -43

config.json CHANGED Viewed

@@ -1,46 +1,28 @@
 {
-  "model": {
-    "architecture": "llama",
-    "name": "mistralai_mistral-7b-instruct-v0.1",
-    "model_type": "7B",
-    "quantization": "Q4_K - Medium",
-    "parameters": {
-      "n_vocab": 32000,
-      "n_merges": 0,
-      "n_embd": 4096,
-      "n_ff": 14336,
-      "n_layer": 32,
-      "n_head": 32,
-      "n_head_kv": 8,
-      "n_ctx_train": 32768,
-      "n_embd_head_k": 128,
-      "n_embd_head_v": 128,
-      "n_gqa": 4,
-      "rope_dimension_count": 128,
-      "rope_scaling": "linear",
-      "freq_base_train": 10000.0,
-      "freq_scale_train": 1,
-      "attention_layer_norm_rms_epsilon": 0.00001
-    }
   },
-  "tokenizer": {
-    "type": "SPM",
-    "vocab_size": 32000,
-    "special_tokens": {
-      "BOS": 1,
-      "EOS": 2,
-      "UNK": 0,
-      "LF": 13
-    }
-  },
-  "file_metadata": {
-    "file_type": "GGUF V2",
-    "model_params": "7.24 B",
-    "model_size": "4.07 GiB",
-    "block_count": 32,
-    "embedding_length": 4096,
-    "quantization_version": 2,
-    "model_path": "Models\\mistral-7b-instruct-v0.2.Q3_K_M.gguf"
-  },
 }

 {
+  "architectures": ["MistralForCausalLM"],
+  "model_type": "mistral",
+  "hidden_size": 4096,
+  "intermediate_size": 11008,
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "vocab_size": 50272,
+  "max_position_embeddings": 2048,
+  "rotary_embedding_base": 10000,
+  "tie_word_embeddings": false,
+  "hidden_act": "silu",
+  "initializer_range": 0.02,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float16",
+  "use_cache": true,
+  "quantization_config": {
+    "bits": 4,
+    "group_size": 128,
+    "dtype": "q4_k_m"
   },
+  "model_revision": "v0.1",
+  "instructions": "This model is fine-tuned for instruction-following tasks using the Mistral 7B model.",
+  "repository": "Aditya757864/Mistral7B",
+  "version": "0.1"
 }