advy committed on
Commit
fce8b3e
·
verified ·
1 Parent(s): 9b1ad4d

Finetune on MentalChat16K - eval_loss: 0.7298

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. training_metrics.json +43 -0
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [microsoft/phi-2](https://huggingface.co/microsoft/phi-2) on the None dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.7296
20
 
21
  ## Model description
22
 
 
16
 
17
  This model is a fine-tuned version of [microsoft/phi-2](https://huggingface.co/microsoft/phi-2) on the None dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.7112
20
 
21
  ## Model description
22
 
training_metrics.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "phi2-mental-health",
3
+ "base_model": "microsoft/phi-2",
4
+ "dataset": "ShenLab/MentalChat16K",
5
+ "lora_config": {
6
+ "rank": 16,
7
+ "alpha": 32,
8
+ "target_modules": [
9
+ "q_proj",
10
+ "k_proj",
11
+ "v_proj",
12
+ "dense"
13
+ ],
14
+ "dropout": 0.1
15
+ },
16
+ "training": {
17
+ "final_train_loss": 0.7486542798042297,
18
+ "total_steps": 2500,
19
+ "epochs": 4,
20
+ "learning_rate": 0.0002,
21
+ "per_device_batch_size": 4,
22
+ "gradient_accumulation": 2
23
+ },
24
+ "evaluation": {
25
+ "eval_loss": 0.7297702431678772,
26
+ "eval_runtime": 4064.1661,
27
+ "eval_samples_per_second": 0.116,
28
+ "eval_steps_per_second": 0.029,
29
+ "epoch": 3.7397157816005984
30
+ },
31
+ "test_eval": {
32
+ "eval_loss": 0.7111775875091553,
33
+ "eval_runtime": 39.2705,
34
+ "eval_samples_per_second": 12.019,
35
+ "eval_steps_per_second": 3.005,
36
+ "epoch": 3.7397157816005984
37
+ },
38
+ "dataset_stats": {
39
+ "train_size": 5347,
40
+ "val_size": 472,
41
+ "test_size": 472
42
+ }
43
+ }