bigmorning
/

try-m-e

Text Generation

generated_from_keras_callback

Model card | Files and versions

bigmorning committed on Mar 25, 2022

Commit

4dcd0f5

·

1 Parent(s): fc9adce

add model

Files changed (3) hide show

README.md +1 -15
config.json +1 -3
tf_model.h5 +1 -1

README.md CHANGED Viewed

@@ -14,9 +14,7 @@ probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 0.0133
-- Validation Loss: 0.0034
-- Epoch: 9
 ## Model description
@@ -40,18 +38,6 @@ The following hyperparameters were used during training:
 ### Training results
-| Train Loss | Validation Loss | Epoch |
-|:----------:|:---------------:|:-----:|
-| 0.5370     | 0.2158          | 0     |
-| 0.2152     | 0.2035          | 1     |
-| 0.2040     | 0.1912          | 2     |
-| 0.1915     | 0.1628          | 3     |
-| 0.1569     | 0.0811          | 4     |
-| 0.0864     | 0.0229          | 5     |
-| 0.0404     | 0.0095          | 6     |
-| 0.0247     | 0.0061          | 7     |
-| 0.0175     | 0.0047          | 8     |
-| 0.0133     | 0.0034          | 9     |
 ### Framework versions

 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
 ## Model description
 ### Training results
 ### Framework versions

config.json CHANGED Viewed

@@ -7,7 +7,6 @@
   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
-  "do_sample": true,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "id2label": {
@@ -18,7 +17,6 @@
     "LABEL_0": 0
   },
   "layer_norm_epsilon": 1e-05,
-  "max_length": 50,
   "model_type": "gpt2",
   "n_ctx": 1024,
   "n_embd": 768,
@@ -42,6 +40,6 @@
     }
   },
   "transformers_version": "4.17.0",
-  "use_cache": false,
   "vocab_size": 5998
 }

   ],
   "attn_pdrop": 0.1,
   "bos_token_id": 50256,
   "embd_pdrop": 0.1,
   "eos_token_id": 50256,
   "id2label": {
     "LABEL_0": 0
   },
   "layer_norm_epsilon": 1e-05,
   "model_type": "gpt2",
   "n_ctx": 1024,
   "n_embd": 768,
     }
   },
   "transformers_version": "4.17.0",
+  "use_cache": true,
   "vocab_size": 5998
 }

tf_model.h5 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:915b77025e04afc7b25504f3918029f24365e205b5451b871a99c90c3c0fda69
 size 210211336

 version https://git-lfs.github.com/spec/v1
+oid sha256:197328a79616102fa399d1344e1221a8dacfea2f549d8495a184e10445cd1fa5
 size 210211336