flopml committed on
Commit
1d49067
·
1 Parent(s): 1485644

added config.json, todo: work on tokenizer re-implementation

Browse files
Files changed (1) hide show
  1. config.json +40 -0
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ {
3
+ "dataset": {
4
+ "remote_path": "flpelerin/tinystories-10k",
5
+ "batch_size": 4,
6
+ "seq_length": 512
7
+ },
8
+
9
+ "tokenizer": {
10
+ "max_length": 32000
11
+ },
12
+
13
+ "wandb": {
14
+ "entity": "florianpelerin110304",
15
+ "project": "mamba-trainer-test",
16
+ "name": "",
17
+ "api_key": "<REDACTED>"
18
+ },
19
+
20
+ "model": {
21
+ "params": {
22
+ "d_model": 768,
23
+ "n_layer": 24,
24
+
25
+ "tie_embeddings": "false"
26
+ }
27
+ },
28
+
29
+ "trainer": {
30
+ "learning_rate": 1e-3,
31
+ "num_epochs": 4,
32
+
33
+ "inference": {
34
+ "frequency": 0,
35
+ "n_predict": 256,
36
+ "seed_text": "One day, a little girl"
37
+ }
38
+ }
39
+ }
40
+