End of epoch 1 | AVG Contr_Loss: 7309.7822 | AVG Diver_Loss: 954.4370 | PPL: 268.6
Browse files
- config.json +2 -2
- model.safetensors +1 -1
config.json
CHANGED
|
@@ -56,7 +56,7 @@
|
|
| 56 |
"feat_quantizer_dropout": 0.0,
|
| 57 |
"final_dropout": 0.0,
|
| 58 |
"gradient_checkpointing": false,
|
| 59 |
-
"gumbel_temperature": 1.
|
| 60 |
"hidden_act": "gelu",
|
| 61 |
"hidden_dropout": 0.1,
|
| 62 |
"hidden_size": 1024,
|
|
@@ -88,7 +88,7 @@
|
|
| 88 |
"num_conv_pos_embeddings": 128,
|
| 89 |
"num_feat_extract_layers": 7,
|
| 90 |
"num_hidden_layers": 24,
|
| 91 |
-
"num_negatives":
|
| 92 |
"output_hidden_size": 1024,
|
| 93 |
"pad_token_id": 0,
|
| 94 |
"proj_codevector_dim": 768,
|
|
|
|
| 56 |
"feat_quantizer_dropout": 0.0,
|
| 57 |
"final_dropout": 0.0,
|
| 58 |
"gradient_checkpointing": false,
|
| 59 |
+
"gumbel_temperature": 1.9999400007499946,
|
| 60 |
"hidden_act": "gelu",
|
| 61 |
"hidden_dropout": 0.1,
|
| 62 |
"hidden_size": 1024,
|
|
|
|
| 88 |
"num_conv_pos_embeddings": 128,
|
| 89 |
"num_feat_extract_layers": 7,
|
| 90 |
"num_hidden_layers": 24,
|
| 91 |
+
"num_negatives": 100,
|
| 92 |
"output_hidden_size": 1024,
|
| 93 |
"pad_token_id": 0,
|
| 94 |
"proj_codevector_dim": 768,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 634834360
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9297df4345779cc7b6391c662347fc9224cd1ce1e7d6bfc6ea2b54123f07904f
|
| 3 |
size 634834360
|