MagistrTheOne committed on
Commit
8ae11a1
·
verified ·
1 Parent(s): 31ed0b8

🔧 Add small RADON Mistral model weights

Browse files
Files changed (4) hide show
  1. config.json +13 -0
  2. model.safetensors +3 -0
  3. model_info.json +9 -0
  4. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "vocab_size": 8192,
3
+ "hidden_size": 512,
4
+ "num_layers": 6,
5
+ "num_attention_heads": 8,
6
+ "num_kv_heads": 2,
7
+ "intermediate_size": 1024,
8
+ "max_position_embeddings": 2048,
9
+ "sliding_window": 1024,
10
+ "rope_theta": 10000.0,
11
+ "rms_norm_eps": 1e-06,
12
+ "torch_dtype": "float16"
13
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20910015088c80c06f98dc8e23b45a5d972398cfb335c538e316e6fe605d3030
3
+ size 43535376
model_info.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "radon-small",
3
+ "architecture": "mistral",
4
+ "parameters": 21764608,
5
+ "size_mb": 41.5126953125,
6
+ "dtype": "float16",
7
+ "initialization": "random",
8
+ "note": "This is a small initialized model with random weights. Training required for actual performance."
9
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0720a5095d21044bf85607776889d4797f3821ace6d33e301fff7330d7214c3b
3
+ size 43548082