colinrdavisMBA/mistral-7binstruct-summary-100s

Files changed (5) hide show

README.md CHANGED Viewed

@@ -20,7 +20,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) on the generator dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.4646
 ## Model description
@@ -52,14 +52,14 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 1.6134        | 0.22  | 25   | 1.5514          |
-| 1.5949        | 0.43  | 50   | 1.4646          |
 ### Framework versions
-- PEFT 0.8.2
-- Transformers 4.38.1
 - Pytorch 2.1.0+cu121
-- Datasets 2.17.1
 - Tokenizers 0.15.2

 This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) on the generator dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.4703
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 1.7445        | 0.22  | 25   | 1.5450          |
+| 1.557         | 0.43  | 50   | 1.4703          |
 ### Framework versions
+- PEFT 0.9.0
+- Transformers 4.38.2
 - Pytorch 2.1.0+cu121
+- Datasets 2.18.0
 - Tokenizers 0.15.2

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -19,9 +19,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false
 }

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": null,
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "q_proj",
+    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
+  "use_dora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea3ca41896d5ecc7110c87eeabc151aafc4b078b63c57d00a7b8b585a62d1f82
-size 27280152

 version https://git-lfs.github.com/spec/v1
+oid sha256:c48e0a972c1bedd6cafa5d1546efd158a9536992b2ae42f471fc4556842a7be2
+size 27282328

runs/Mar02_00-53-12_cdf356d6afcd/events.out.tfevents.1709340802.cdf356d6afcd.2237.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4424ee8774af3e39ab6139b5dc07d5e8740a9b13e29217143a2a0165655b7f70
+size 6966

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d475bae46eee9ea64e29ebe797b95ba15738cb726e56099e9fd09fccfc18f598
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:ff135a3b01ab8b460b20c8f554b3e8cd1dd02d18ea438edb3ef3224d89de63d2
 size 4920