🔧 Add small RADON Mistral model weights
Browse files- config.json +13 -0
- model.safetensors +3 -0
- model_info.json +9 -0
- pytorch_model.bin +3 -0
config.json
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"vocab_size": 8192,
|
| 3 |
+
"hidden_size": 512,
|
| 4 |
+
"num_layers": 6,
|
| 5 |
+
"num_attention_heads": 8,
|
| 6 |
+
"num_kv_heads": 2,
|
| 7 |
+
"intermediate_size": 1024,
|
| 8 |
+
"max_position_embeddings": 2048,
|
| 9 |
+
"sliding_window": 1024,
|
| 10 |
+
"rope_theta": 10000.0,
|
| 11 |
+
"rms_norm_eps": 1e-06,
|
| 12 |
+
"torch_dtype": "float16"
|
| 13 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20910015088c80c06f98dc8e23b45a5d972398cfb335c538e316e6fe605d3030
|
| 3 |
+
size 43535376
|
model_info.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_name": "radon-small",
|
| 3 |
+
"architecture": "mistral",
|
| 4 |
+
"parameters": 21764608,
|
| 5 |
+
"size_mb": 41.5126953125,
|
| 6 |
+
"dtype": "float16",
|
| 7 |
+
"initialization": "random",
|
| 8 |
+
"note": "This is a small initialized model with random weights. Training required for actual performance."
|
| 9 |
+
}
|
pytorch_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0720a5095d21044bf85607776889d4797f3821ace6d33e301fff7330d7214c3b
|
| 3 |
+
size 43548082
|