End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [google/flan-t5-xl](https://huggingface.co/google/flan-t5-xl) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.3677
 ## Model description
@@ -35,7 +35,7 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 0.001
 - train_batch_size: 2
 - eval_batch_size: 2
 - seed: 42
@@ -50,8 +50,8 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
-| 1.3935        | 0.3458 | 500  | 1.4429          |
-| 1.8791        | 0.6917 | 1000 | 1.3677          |
 ### Framework versions

 This model is a fine-tuned version of [google/flan-t5-xl](https://huggingface.co/google/flan-t5-xl) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.4735
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 0.0001
 - train_batch_size: 2
 - eval_batch_size: 2
 - seed: 42
 | Training Loss | Epoch  | Step | Validation Loss |
 |:-------------:|:------:|:----:|:---------------:|
+| 1.1782        | 0.3458 | 500  | 1.5188          |
+| 1.9895        | 0.6917 | 1000 | 1.4735          |
 ### Framework versions

adapter_config.json CHANGED Viewed

@@ -25,9 +25,9 @@
   "revision": null,
   "target_modules": [
     "q",
-    "k",
     "o",
-    "v"
   ],
   "task_type": "SEQ_2_SEQ_LM",
   "trainable_token_indices": null,

   "revision": null,
   "target_modules": [
     "q",
     "o",
+    "v",
+    "k"
   ],
   "task_type": "SEQ_2_SEQ_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2613675b20d31af750791a2d1405af3f81d7ffe8eeb0b317607adb1176d04a7a
 size 75579856

 version https://git-lfs.github.com/spec/v1
+oid sha256:834b1dd283913ebfc2d18316445a639ee023e4440db9f48c163a6c165e4649e2
 size 75579856

tokenizer.json CHANGED Viewed

@@ -1,11 +1,6 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 192,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

tokenizer_config.json CHANGED Viewed

@@ -932,13 +932,9 @@
   "eos_token": "</s>",
   "extra_ids": 100,
   "extra_special_tokens": {},
-  "max_length": 192,
   "model_max_length": 512,
   "pad_token": "</s>",
   "sp_model_kwargs": {},
-  "stride": 0,
   "tokenizer_class": "T5Tokenizer",
-  "truncation_side": "right",
-  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }

   "eos_token": "</s>",
   "extra_ids": 100,
   "extra_special_tokens": {},
   "model_max_length": 512,
   "pad_token": "</s>",
   "sp_model_kwargs": {},
   "tokenizer_class": "T5Tokenizer",
   "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4d5b430e5b2a85d276116ac9933ef719131551fbe484625f902d0afbd6a1d469
 size 5432

 version https://git-lfs.github.com/spec/v1
+oid sha256:4dfb19e2122f69c32b93027a61ec66def9d3f89fd327fe5664e5d30fce5d166a
 size 5432