AhunInteligence committed on
Commit
d67185d
·
verified ·
1 Parent(s): efa4013

End of epoch 13 | Loss: 10103.3412 | PPL: 206.7

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. model.safetensors +1 -1
config.json CHANGED
@@ -56,7 +56,7 @@
56
  "feat_quantizer_dropout": 0.0,
57
  "final_dropout": 0.0,
58
  "gradient_checkpointing": false,
59
- "gumbel_temperature": 1.8826246208550435,
60
  "hidden_act": "gelu",
61
  "hidden_dropout": 0.1,
62
  "hidden_size": 1024,
 
56
  "feat_quantizer_dropout": 0.0,
57
  "final_dropout": 0.0,
58
  "gradient_checkpointing": false,
59
+ "gumbel_temperature": 1.8731600162811681,
60
  "hidden_act": "gelu",
61
  "hidden_dropout": 0.1,
62
  "hidden_size": 1024,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6c067034d23ac65f0ccbabe3cb14951a914bc2f7e67466537682688ed3dae32
3
  size 1269615400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b56fea653cabe77eda889c4f40816a54eea5313de74871b3085b3d5f6387ba0d
3
  size 1269615400