hiwensen committed on
Commit
15df3bb
·
verified ·
1 Parent(s): d76175c

End of training

Browse files
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3563
21
- - Accuracy: 0.95
22
 
23
  ## Model description
24
 
@@ -43,22 +43,42 @@ The following hyperparameters were used during training:
43
  - seed: 42
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
- - num_epochs: 10
47
 
48
  ### Training results
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
- | 1.7667 | 1.0 | 12 | 1.6574 | 0.45 |
53
- | 1.556 | 2.0 | 24 | 1.1844 | 0.9 |
54
- | 1.0991 | 3.0 | 36 | 0.8021 | 0.9 |
55
- | 0.8913 | 4.0 | 48 | 0.6070 | 0.95 |
56
- | 0.495 | 5.0 | 60 | 0.5021 | 0.9 |
57
- | 0.3888 | 6.0 | 72 | 0.4484 | 0.9 |
58
- | 0.2608 | 7.0 | 84 | 0.3813 | 0.9 |
59
- | 0.2031 | 8.0 | 96 | 0.3626 | 0.95 |
60
- | 0.1348 | 9.0 | 108 | 0.3812 | 0.9 |
61
- | 0.1166 | 10.0 | 120 | 0.3563 | 0.95 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
62
 
63
 
64
  ### Framework versions
 
17
 
18
  This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unspecified dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.7151
21
+ - Accuracy: 0.8624
22
 
23
  ## Model description
24
 
 
43
  - seed: 42
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
+ - num_epochs: 30
47
 
48
  ### Training results
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
+ | 0.5598 | 1.0 | 62 | 0.5919 | 0.8073 |
53
+ | 0.2769 | 2.0 | 124 | 0.5313 | 0.8349 |
54
+ | 0.3082 | 3.0 | 186 | 0.3577 | 0.9083 |
55
+ | 0.0916 | 4.0 | 248 | 0.6712 | 0.8349 |
56
+ | 0.0708 | 5.0 | 310 | 0.5667 | 0.8257 |
57
+ | 0.0715 | 6.0 | 372 | 0.5633 | 0.8807 |
58
+ | 0.0589 | 7.0 | 434 | 0.8306 | 0.8440 |
59
+ | 0.0022 | 8.0 | 496 | 0.6568 | 0.8624 |
60
+ | 0.005 | 9.0 | 558 | 0.6176 | 0.8716 |
61
+ | 0.0017 | 10.0 | 620 | 0.6524 | 0.8440 |
62
+ | 0.001 | 11.0 | 682 | 0.8272 | 0.8532 |
63
+ | 0.0008 | 12.0 | 744 | 0.5695 | 0.8991 |
64
+ | 0.0006 | 13.0 | 806 | 0.5963 | 0.8991 |
65
+ | 0.0005 | 14.0 | 868 | 0.6273 | 0.8899 |
66
+ | 0.0006 | 15.0 | 930 | 0.6720 | 0.8899 |
67
+ | 0.0005 | 16.0 | 992 | 0.6864 | 0.8716 |
68
+ | 0.0003 | 17.0 | 1054 | 0.6928 | 0.8624 |
69
+ | 0.0004 | 18.0 | 1116 | 0.6931 | 0.8624 |
70
+ | 0.0003 | 19.0 | 1178 | 0.6874 | 0.8624 |
71
+ | 0.0003 | 20.0 | 1240 | 0.6688 | 0.8624 |
72
+ | 0.0003 | 21.0 | 1302 | 0.6989 | 0.8624 |
73
+ | 0.0003 | 22.0 | 1364 | 0.7050 | 0.8624 |
74
+ | 0.0003 | 23.0 | 1426 | 0.7038 | 0.8624 |
75
+ | 0.0002 | 24.0 | 1488 | 0.7083 | 0.8624 |
76
+ | 0.0002 | 25.0 | 1550 | 0.7134 | 0.8624 |
77
+ | 0.0002 | 26.0 | 1612 | 0.7133 | 0.8624 |
78
+ | 0.0002 | 27.0 | 1674 | 0.7151 | 0.8624 |
79
+ | 0.0002 | 28.0 | 1736 | 0.7155 | 0.8624 |
80
+ | 0.0002 | 29.0 | 1798 | 0.7135 | 0.8624 |
81
+ | 0.0002 | 30.0 | 1860 | 0.7151 | 0.8624 |
82
 
83
 
84
  ### Framework versions
config.json CHANGED
@@ -9,21 +9,21 @@
9
  "dropout": 0.1,
10
  "hidden_dim": 3072,
11
  "id2label": {
12
- "0": "date_functions",
13
- "1": "group_by",
14
- "2": "order_by",
15
- "3": "ratio",
16
- "4": "table_join",
17
- "5": "where"
18
  },
19
  "initializer_range": 0.02,
20
  "label2id": {
21
- "date_functions": 0,
22
- "group_by": 1,
23
- "order_by": 2,
24
- "ratio": 3,
25
- "table_join": 4,
26
- "where": 5
27
  },
28
  "max_position_embeddings": 512,
29
  "model_type": "distilbert",
 
9
  "dropout": 0.1,
10
  "hidden_dim": 3072,
11
  "id2label": {
12
+ "0": "where",
13
+ "1": "table_join",
14
+ "2": "ratio",
15
+ "3": "order_by",
16
+ "4": "group_by",
17
+ "5": "date_functions"
18
  },
19
  "initializer_range": 0.02,
20
  "label2id": {
21
+ "date_functions": 5,
22
+ "group_by": 4,
23
+ "order_by": 3,
24
+ "ratio": 2,
25
+ "table_join": 1,
26
+ "where": 0
27
  },
28
  "max_position_embeddings": 512,
29
  "model_type": "distilbert",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e71e1bfc15b876e62a5f3adb928068caca6e1cef44fa764f55290750c8ba8c6f
3
  size 267844872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:394179cd1421c770d95fd5e4a12f5fd86cc06bc727737d6bec96582438c43928
3
  size 267844872
runs/Jan19_07-07-48_f73caa55ef87/events.out.tfevents.1705648068.f73caa55ef87.26.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1888ecd2d5d23bc39a3581bbdab81bd12e4886f5f709395aedf7a436a8a4cfa
3
+ size 72895
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0234cb26bba5830bee72b802e4ded619ad2a7070956044d579eea32bec43fb0a
3
  size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47b715fb23774bb9a1ae0e0983120b5fe265f6a8c88f743a81cfef0d8d2a21b4
3
  size 4283