advy committed on
Commit
81ca6a4
·
verified ·
1 Parent(s): 3f046e3

Finetune on MentalChat16K - eval_loss: 0.7816

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. training_metrics.json +46 -0
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [TinyLlama/TinyLlama-1.1B-Chat-v1.0](https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0) on the None dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 0.8010
20
 
21
  ## Model description
22
 
 
16
 
17
  This model is a fine-tuned version of [TinyLlama/TinyLlama-1.1B-Chat-v1.0](https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0) on the None dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 0.7700
20
 
21
  ## Model description
22
 
training_metrics.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "tinyllama-mental-health",
3
+ "base_model": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
4
+ "dataset": "ShenLab/MentalChat16K",
5
+ "lora_config": {
6
+ "rank": 16,
7
+ "alpha": 32,
8
+ "target_modules": [
9
+ "q_proj",
10
+ "k_proj",
11
+ "v_proj",
12
+ "o_proj",
13
+ "gate_proj",
14
+ "up_proj",
15
+ "down_proj"
16
+ ],
17
+ "dropout": 0.1
18
+ },
19
+ "training": {
20
+ "final_train_loss": 0.7040511888504029,
21
+ "total_steps": 2500,
22
+ "epochs": 4,
23
+ "learning_rate": 0.0002,
24
+ "per_device_batch_size": 4,
25
+ "gradient_accumulation": 2
26
+ },
27
+ "evaluation": {
28
+ "eval_loss": 0.7816067934036255,
29
+ "eval_runtime": 18.522,
30
+ "eval_samples_per_second": 25.483,
31
+ "eval_steps_per_second": 6.371,
32
+ "epoch": 3.7397157816005984
33
+ },
34
+ "test_eval": {
35
+ "eval_loss": 0.7700048089027405,
36
+ "eval_runtime": 18.7703,
37
+ "eval_samples_per_second": 25.146,
38
+ "eval_steps_per_second": 6.287,
39
+ "epoch": 3.7397157816005984
40
+ },
41
+ "dataset_stats": {
42
+ "train_size": 5347,
43
+ "val_size": 472,
44
+ "test_size": 472
45
+ }
46
+ }