Mayfull committed on
Commit
21d5b89
·
verified ·
1 Parent(s): c265f2c

Training in progress, step 886

Browse files
Files changed (3) hide show
  1. config.json +19 -0
  2. model.safetensors +3 -0
  3. training_args.bin +3 -0
config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "VLTopKSAE"
4
+ ],
5
+ "dtype": "float32",
6
+ "expansion_factor": 16,
7
+ "hidden_size": 768,
8
+ "k": 32,
9
+ "latent_size": 0,
10
+ "model_type": "vl_topk_sae",
11
+ "multi_topk": false,
12
+ "normalize_decoder": true,
13
+ "transformers_version": "4.57.6",
14
+ "vl_split_ratio": [
15
+ 2,
16
+ 12,
17
+ 2
18
+ ]
19
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a29c40df23d8f1077325b36bc8bd5a01a6505fc2077e48d13fac516ceb64860
3
+ size 75550056
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d4a84ed4c2a065df46e795f7929e2960683af60d47f746e2f055d9bcaa84d0a
3
+ size 5969