ninagroot/GPT2-705Mtest

Files changed (6) hide show

README.md CHANGED Viewed

@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of an unspecified base model (the auto-generated card left the base-model link empty) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 4.3277
 ## Model description
@@ -48,17 +48,17 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 5.8849        | 1.0   | 138  | 5.5972          |
-| 5.0533        | 2.0   | 276  | 4.9053          |
-| 4.0659        | 3.0   | 414  | 4.5644          |
-| 4.0541        | 4.0   | 552  | 4.4225          |
-| 3.8361        | 5.0   | 690  | 4.3304          |
-| 3.5307        | 6.0   | 828  | 4.3277          |
 ### Framework versions
-- Transformers 4.37.2
 - Pytorch 2.1.2+cu121
 - Datasets 2.16.1
 - Tokenizers 0.15.0

 This model is a fine-tuned version of an unspecified base model (the auto-generated card left the base-model link empty) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 3.6575
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 2.9814        | 1.0   | 786  | 3.7914          |
+| 2.5963        | 2.0   | 1572 | 3.6927          |
+| 2.3478        | 3.0   | 2358 | 3.7172          |
+| 2.0341        | 4.0   | 3144 | 3.6845          |
+| 1.7373        | 5.0   | 3930 | 3.6596          |
+| 1.7065        | 6.0   | 4716 | 3.6575          |
 ### Framework versions
+- Transformers 4.39.1
 - Pytorch 2.1.2+cu121
 - Datasets 2.16.1
 - Tokenizers 0.15.0

config.json CHANGED Viewed

@@ -26,7 +26,7 @@
   "summary_type": "cls_index",
   "summary_use_proj": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.37.2",
   "use_cache": true,
-  "vocab_size": 4312
 }

   "summary_type": "cls_index",
   "summary_use_proj": true,
   "torch_dtype": "float32",
+  "transformers_version": "4.39.1",
   "use_cache": true,
+  "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "bos_token_id": 50256,
   "eos_token_id": 50256,
   "pad_token_id": 0,
-  "transformers_version": "4.37.2"
 }

   "bos_token_id": 50256,
   "eos_token_id": 50256,
   "pad_token_id": 0,
+  "transformers_version": "4.39.1"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f400724a6e0d3898b884969758b48524c91c76bd4046072ce4e2c350645c075
-size 2747934496

 version https://git-lfs.github.com/spec/v1
+oid sha256:6c91e31860b19345b05e0f1e9e1ba2de97ffc56b229cb792f4542af9b151e2af
+size 2918049568

runs/Apr05_14-54-56_gcn33.local.snellius.surf.nl/events.out.tfevents.1712321705.gcn33.local.snellius.surf.nl.3713920.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b838993b4bac0f3f173cb6860a746350da5b1faa31a15da1c4b0969863ce6d8e
+size 56220

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf71524b3c83674824e3d16b3d014431c3ea8d8433979f72682c2eefae6d82b6
-size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:aa0847ab599c58a1133dac29dd7ae134718e1285515ee60a80d4d30e0cb92086
+size 4984