Bencode92 committed on
Commit
68f1c4d
·
1 Parent(s): 5089194

🔄 Incremental importance | Acc: 0.750, F1: 0.468

Browse files
README.md CHANGED
@@ -20,17 +20,17 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
20
 
21
  ## Performance
22
 
23
- *Last training: 2025-07-16 06:55*
24
- *Dataset: `news_20250716.csv` (214 samples)*
25
 
26
  | Metric | Value |
27
  |--------|-------|
28
- | Loss | 1.9563 |
29
- | Accuracy | 0.6481 |
30
- | F1 Score | 0.6376 |
31
- | F1 Macro | 0.4353 |
32
- | Precision | 0.6685 |
33
- | Recall | 0.6481 |
34
 
35
  ## Training Details
36
 
@@ -59,4 +59,4 @@ predictions = outputs.logits.softmax(dim=-1)
59
  ## Model Card Authors
60
 
61
  - TradePulse ML Team
62
- - Auto-generated on 2025-07-16 06:55:39
 
20
 
21
  ## Performance
22
 
23
+ *Last training: 2025-07-17 13:34*
24
+ *Dataset: `news_20250717.csv` (142 samples)*
25
 
26
  | Metric | Value |
27
  |--------|-------|
28
+ | Loss | 0.8034 |
29
+ | Accuracy | 0.7222 |
30
+ | F1 Score | 0.6776 |
31
+ | F1 Macro | 0.7024 |
32
+ | Precision | 0.6819 |
33
+ | Recall | 0.7222 |
34
 
35
  ## Training Details
36
 
 
59
  ## Model Card Authors
60
 
61
  - TradePulse ML Team
62
+ - Auto-generated on 2025-07-17 13:34:20
{checkpoint-40 → checkpoint-54}/config.json RENAMED
File without changes
{checkpoint-40 → checkpoint-54}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7317c601691b02a030c5214c45334acbe36778068e0340cfe791923d599c2c2
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5f69416f12d48d75db96ab4b07e52fe52522972d4bd436defe00a32efe7e4c0
3
  size 439039996
{checkpoint-40 → checkpoint-54}/special_tokens_map.json RENAMED
File without changes
{checkpoint-40 → checkpoint-54}/tokenizer.json RENAMED
File without changes
{checkpoint-40 → checkpoint-54}/tokenizer_config.json RENAMED
File without changes
{checkpoint-40 → checkpoint-54}/trainer_state.json RENAMED
@@ -1,59 +1,81 @@
1
  {
2
- "best_metric": 0.6376050420168068,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-40",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 40,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.25,
13
- "grad_norm": 35.63239288330078,
14
- "learning_rate": 2.5e-06,
15
- "loss": 1.8605,
16
  "step": 10
17
  },
18
  {
19
- "epoch": 0.5,
20
- "grad_norm": 27.44408416748047,
21
- "learning_rate": 5e-06,
22
- "loss": 1.5892,
23
  "step": 20
24
  },
25
  {
26
- "epoch": 0.75,
27
- "grad_norm": 34.42560958862305,
28
- "learning_rate": 7.500000000000001e-06,
29
- "loss": 1.3163,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  "step": 30
31
  },
32
  {
33
- "epoch": 1.0,
34
- "grad_norm": 78.49942016601562,
35
- "learning_rate": 1e-05,
36
- "loss": 2.0013,
37
  "step": 40
38
  },
39
  {
40
- "epoch": 1.0,
41
- "eval_accuracy": 0.6481481481481481,
42
- "eval_f1": 0.6376050420168068,
43
- "eval_f1_macro": 0.4353408029878618,
44
- "eval_loss": 1.9562698602676392,
45
- "eval_precision": 0.6685105018438351,
46
- "eval_precision_macro": 0.44588744588744583,
47
- "eval_recall": 0.6481481481481481,
48
- "eval_recall_macro": 0.45314009661835747,
49
- "eval_runtime": 30.1459,
50
- "eval_samples_per_second": 1.791,
51
- "eval_steps_per_second": 0.464,
52
- "step": 40
 
 
 
 
 
 
 
53
  }
54
  ],
55
  "logging_steps": 10,
56
- "max_steps": 80,
57
  "num_input_tokens_seen": 0,
58
  "num_train_epochs": 2,
59
  "save_steps": 500,
@@ -73,12 +95,12 @@
73
  "should_evaluate": false,
74
  "should_log": false,
75
  "should_save": true,
76
- "should_training_stop": false
77
  },
78
  "attributes": {}
79
  }
80
  },
81
- "total_flos": 42098146836480.0,
82
  "train_batch_size": 4,
83
  "trial_name": null,
84
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6775793650793651,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-54",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 54,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.37037037037037035,
13
+ "grad_norm": 43.338623046875,
14
+ "learning_rate": 3.846153846153847e-06,
15
+ "loss": 1.1141,
16
  "step": 10
17
  },
18
  {
19
+ "epoch": 0.7407407407407407,
20
+ "grad_norm": 5.277134895324707,
21
+ "learning_rate": 7.692307692307694e-06,
22
+ "loss": 1.1598,
23
  "step": 20
24
  },
25
  {
26
+ "epoch": 1.0,
27
+ "eval_accuracy": 0.6944444444444444,
28
+ "eval_f1": 0.6309416704153546,
29
+ "eval_f1_macro": 0.6536212325686009,
30
+ "eval_loss": 1.1927357912063599,
31
+ "eval_precision": 0.6195023148148148,
32
+ "eval_precision_macro": 0.6840277777777777,
33
+ "eval_recall": 0.6944444444444444,
34
+ "eval_recall_macro": 0.6733333333333333,
35
+ "eval_runtime": 20.0468,
36
+ "eval_samples_per_second": 1.796,
37
+ "eval_steps_per_second": 0.449,
38
+ "step": 27
39
+ },
40
+ {
41
+ "epoch": 1.1111111111111112,
42
+ "grad_norm": 4.237745761871338,
43
+ "learning_rate": 8.571428571428571e-06,
44
+ "loss": 1.0568,
45
  "step": 30
46
  },
47
  {
48
+ "epoch": 1.4814814814814814,
49
+ "grad_norm": 1.0734100341796875,
50
+ "learning_rate": 5e-06,
51
+ "loss": 0.4549,
52
  "step": 40
53
  },
54
  {
55
+ "epoch": 1.8518518518518519,
56
+ "grad_norm": 17.751998901367188,
57
+ "learning_rate": 1.4285714285714286e-06,
58
+ "loss": 0.9042,
59
+ "step": 50
60
+ },
61
+ {
62
+ "epoch": 2.0,
63
+ "eval_accuracy": 0.7222222222222222,
64
+ "eval_f1": 0.6775793650793651,
65
+ "eval_f1_macro": 0.7023809523809524,
66
+ "eval_loss": 0.8034341335296631,
67
+ "eval_precision": 0.6818996415770608,
68
+ "eval_precision_macro": 0.7473118279569894,
69
+ "eval_recall": 0.7222222222222222,
70
+ "eval_recall_macro": 0.7066666666666667,
71
+ "eval_runtime": 20.008,
72
+ "eval_samples_per_second": 1.799,
73
+ "eval_steps_per_second": 0.45,
74
+ "step": 54
75
  }
76
  ],
77
  "logging_steps": 10,
78
+ "max_steps": 54,
79
  "num_input_tokens_seen": 0,
80
  "num_train_epochs": 2,
81
  "save_steps": 500,
 
95
  "should_evaluate": false,
96
  "should_log": false,
97
  "should_save": true,
98
+ "should_training_stop": true
99
  },
100
  "attributes": {}
101
  }
102
  },
103
+ "total_flos": 55780044558336.0,
104
  "train_batch_size": 4,
105
  "trial_name": null,
106
  "trial_params": null
{checkpoint-40 → checkpoint-54}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7317c601691b02a030c5214c45334acbe36778068e0340cfe791923d599c2c2
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5f69416f12d48d75db96ab4b07e52fe52522972d4bd436defe00a32efe7e4c0
3
  size 439039996
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2f15beae061f900df55a72593a0d6e94a0aa87b4abafd58adf1bf7ac2a4b64f9
3
  size 5521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6bbac70dcc30ea2489bf42b0b6da04b30b625b4819082efc3a718b014a9e877
3
  size 5521