gurgutan committed on
Commit
ed13186
·
verified ·
1 Parent(s): b3e79d3

Upload 3 files

Browse files

Fast Language Self-Similar Model with 85M parameters

Files changed (3) hide show
  1. model-config.json +12 -0
  2. model.pth +3 -0
  3. train-config.json +14 -0
model-config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "fastnn17",
3
+ "input_size": 128,
4
+ "output_size": 1,
5
+ "vocab_size": 166,
6
+ "emb_size": 64,
7
+ "n": 5,
8
+ "channels": 4,
9
+ "kernel_size": 128,
10
+ "tokenizer": "src/vocab-166.json",
11
+ "pad_token_id": 162
12
+ }
model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:217fee0e5a94d3a7b6cbb9b4611b346a7a6ffa80c4b8e417a63cdcce306e7498
3
+ size 336960759
train-config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "learning_rate": 2e-05,
3
+ "weight_decay": 0.0,
4
+ "batch_size": 4096,
5
+ "epochs": 16,
6
+ "device": "cuda",
7
+ "shuffle": true,
8
+ "save_on_step": 16384,
9
+ "model_folder": "/home/ivan/data/models/fast-nn/fastnn17",
10
+ "autocast": false,
11
+ "transform": null,
12
+ "load_checkpoint": null,
13
+ "config_model": null
14
+ }