AdamF92 committed on
Commit
48bc772
·
verified ·
1 Parent(s): 52c6412

Epoch 0 - Val loss 1.7144

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -42,7 +42,7 @@
42
  "rope_base": 1000000,
43
  "seq_len": 8192,
44
  "skip_stm": false,
45
- "stm_batch_size": 3,
46
  "stm_size": 4096,
47
  "tie_embeddings": true,
48
  "training_cache": true,
 
42
  "rope_base": 1000000,
43
  "seq_len": 8192,
44
  "skip_stm": false,
45
+ "stm_batch_size": 1,
46
  "stm_size": 4096,
47
  "tie_embeddings": true,
48
  "training_cache": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:002672eaa7e8a7b8ff56d4059e77d9419a56f09be1660d01f78fa6cb65f7fbfe
3
  size 3794621808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bed7631639411bbd1a24e1e5e53154eadd5b961b2cec80f9c462f655d9f766e1
3
  size 3794621808