sujithatz/finbot-transofrmer-based-phi3.5_adapter

Browse files

Files changed (4)

README.md +28 -12
adapter_config.json +2 -2
adapter_model.safetensors +1 -1
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [microsoft/Phi-3-mini-4k-instruct](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.3735
 ## Model description
@@ -46,26 +46,42 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.1
-- num_epochs: 20
 ### Training results
 | Training Loss | Epoch   | Step | Validation Loss |
 |:-------------:|:-------:|:----:|:---------------:|
-| 1.2948        | 2.3529  | 10   | 1.1195          |
-| 0.9096        | 4.7059  | 20   | 0.6701          |
-| 0.5636        | 7.0588  | 30   | 0.4935          |
-| 0.4166        | 9.4118  | 40   | 0.4362          |
-| 0.3366        | 11.7647 | 50   | 0.4048          |
-| 0.2945        | 14.1176 | 60   | 0.3840          |
-| 0.2593        | 16.4706 | 70   | 0.3752          |
-| 0.229         | 18.8235 | 80   | 0.3735          |
 ### Framework versions
-- PEFT 0.13.0
-- Transformers 4.45.1
 - Pytorch 2.4.1+cu121
 - Datasets 3.0.1
 - Tokenizers 0.20.0

 This model is a fine-tuned version of [microsoft/Phi-3-mini-4k-instruct](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.4084 (final evaluation, step 120; the lowest validation loss in the table below is 0.3723 at step 70)
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.1
+- num_epochs: 30
 ### Training results
 | Training Loss | Epoch   | Step | Validation Loss |
 |:-------------:|:-------:|:----:|:---------------:|
+| 1.415         | 1.1765  | 5    | 1.4148          |
+| 1.2791        | 2.3529  | 10   | 1.2542          |
+| 1.0303        | 3.5294  | 15   | 0.9828          |
+| 0.7989        | 4.7059  | 20   | 0.7193          |
+| 0.5792        | 5.8824  | 25   | 0.5793          |
+| 0.5074        | 7.0588  | 30   | 0.5133          |
+| 0.4558        | 8.2353  | 35   | 0.4714          |
+| 0.361         | 9.4118  | 40   | 0.4478          |
+| 0.3751        | 10.5882 | 45   | 0.4236          |
+| 0.2908        | 11.7647 | 50   | 0.4106          |
+| 0.263         | 12.9412 | 55   | 0.3855          |
+| 0.2515        | 14.1176 | 60   | 0.3760          |
+| 0.2391        | 15.2941 | 65   | 0.3752          |
+| 0.1973        | 16.4706 | 70   | 0.3723          |
+| 0.1638        | 17.6471 | 75   | 0.3740          |
+| 0.1776        | 18.8235 | 80   | 0.3868          |
+| 0.2008        | 20.0    | 85   | 0.3798          |
+| 0.1569        | 21.1765 | 90   | 0.3848          |
+| 0.1284        | 22.3529 | 95   | 0.3901          |
+| 0.1171        | 23.5294 | 100  | 0.3969          |
+| 0.1364        | 24.7059 | 105  | 0.3950          |
+| 0.1401        | 25.8824 | 110  | 0.4070          |
+| 0.1195        | 27.0588 | 115  | 0.4091          |
+| 0.1219        | 28.2353 | 120  | 0.4084          |
 ### Framework versions
+- PEFT 0.13.2
+- Transformers 4.45.2
 - Pytorch 2.4.1+cu121
 - Datasets 3.0.1
 - Tokenizers 0.20.0

adapter_config.json CHANGED Viewed

@@ -20,13 +20,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
     "q_proj",
     "down_proj",
     "k_proj",
     "gate_proj",
     "o_proj",
-    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
+    "up_proj",
     "down_proj",
     "k_proj",
     "gate_proj",
     "o_proj",
+    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed3e5c3db673cb3855b174b8bef13291aa839e4e7c29ce50e54aac1787790578
 size 35668592

 version https://git-lfs.github.com/spec/v1
+oid sha256:c31fa0d424f7aa52b479ebad75d44eddaeb88a380690ecea3897eaa386703c7a
 size 35668592

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:82c76f0114ac2ed0f1cf9f8bb0c177fe5f2a5a84ba74b113c674a409d33f34ec
 size 5432

 version https://git-lfs.github.com/spec/v1
+oid sha256:b2dc0d2c1e7c21c088f647428d6cedc77b727218a9706b56e15904c3d278b5b2
 size 5432