Bencode92 committed on
Commit
9231b63
·
1 Parent(s): f0b11b3

🔄 Incremental importance | Acc: 0.812, F1: 0.560

Browse files
README.md CHANGED
@@ -20,17 +20,17 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
20
 
21
  ## Performance
22
 
23
- *Last training: 2025-07-09 16:17*
24
- *Dataset: `news_20250709.csv` (46 samples)*
25
 
26
  | Metric | Value |
27
  |--------|-------|
28
- | Loss | 1.6092 |
29
- | Accuracy | 0.8333 |
30
- | F1 Score | 0.7989 |
31
- | F1 Macro | 0.7989 |
32
- | Precision | 0.7917 |
33
- | Recall | 0.8333 |
34
 
35
  ## Training Details
36
 
@@ -59,4 +59,4 @@ predictions = outputs.logits.softmax(dim=-1)
59
  ## Model Card Authors
60
 
61
  - TradePulse ML Team
62
- - Auto-generated on 2025-07-09 16:17:17
 
20
 
21
  ## Performance
22
 
23
+ *Last training: 2025-07-10 09:11*
24
+ *Dataset: `news_20250710.csv` (138 samples)*
25
 
26
  | Metric | Value |
27
  |--------|-------|
28
+ | Loss | 0.0703 |
29
+ | Accuracy | 0.9714 |
30
+ | F1 Score | 0.9758 |
31
+ | F1 Macro | 0.9758 |
32
+ | Precision | 0.9857 |
33
+ | Recall | 0.9714 |
34
 
35
  ## Training Details
36
 
 
59
  ## Model Card Authors
60
 
61
  - TradePulse ML Team
62
+ - Auto-generated on 2025-07-10 09:11:15
{checkpoint-18 → checkpoint-52}/config.json RENAMED
File without changes
{checkpoint-18 → checkpoint-52}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b3dabca8d8e63ed66cfb9eb1910581f8f656f01b7cba193238cfe67ce50d181
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae4c5c9032b9108afe5cd8569212b5eee6a8bc68a8b592e27c95b758887b4834
3
  size 439039996
{checkpoint-18 → checkpoint-52}/special_tokens_map.json RENAMED
File without changes
{checkpoint-18 → checkpoint-52}/tokenizer.json RENAMED
File without changes
{checkpoint-18 → checkpoint-52}/tokenizer_config.json RENAMED
File without changes
{checkpoint-18 → checkpoint-52}/trainer_state.json RENAMED
@@ -1,53 +1,81 @@
1
  {
2
- "best_metric": 0.798941798941799,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-18",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 18,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 1.0,
13
- "eval_accuracy": 0.75,
14
- "eval_f1": 0.7125,
15
- "eval_f1_macro": 0.5166666666666667,
16
- "eval_loss": 2.042041540145874,
17
- "eval_precision": 0.75,
18
- "eval_precision_macro": 0.5555555555555555,
19
- "eval_recall": 0.75,
20
- "eval_recall_macro": 0.5333333333333333,
21
- "eval_runtime": 6.64,
22
- "eval_samples_per_second": 1.807,
23
- "eval_steps_per_second": 0.452,
24
- "step": 9
25
  },
26
  {
27
- "epoch": 1.1111111111111112,
28
- "grad_norm": 0.657223641872406,
29
  "learning_rate": 8.000000000000001e-06,
30
- "loss": 1.2448,
31
- "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
  },
33
  {
34
  "epoch": 2.0,
35
- "eval_accuracy": 0.8333333333333334,
36
- "eval_f1": 0.798941798941799,
37
- "eval_f1_macro": 0.582010582010582,
38
- "eval_loss": 1.6091957092285156,
39
- "eval_precision": 0.7916666666666666,
40
- "eval_precision_macro": 0.5833333333333334,
41
- "eval_recall": 0.8333333333333334,
42
- "eval_recall_macro": 0.6,
43
- "eval_runtime": 6.6395,
44
- "eval_samples_per_second": 1.807,
45
- "eval_steps_per_second": 0.452,
46
- "step": 18
47
  }
48
  ],
49
  "logging_steps": 10,
50
- "max_steps": 18,
51
  "num_input_tokens_seen": 0,
52
  "num_train_epochs": 2,
53
  "save_steps": 500,
@@ -72,7 +100,7 @@
72
  "attributes": {}
73
  }
74
  },
75
- "total_flos": 17891712405504.0,
76
  "train_batch_size": 4,
77
  "trial_name": null,
78
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9757823129251698,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-52",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 52,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.38461538461538464,
13
+ "grad_norm": 0.08406942337751389,
14
+ "learning_rate": 4.000000000000001e-06,
15
+ "loss": 0.1652,
16
+ "step": 10
 
 
 
 
 
 
 
 
17
  },
18
  {
19
+ "epoch": 0.7692307692307693,
20
+ "grad_norm": 44.237098693847656,
21
  "learning_rate": 8.000000000000001e-06,
22
+ "loss": 0.2935,
23
+ "step": 20
24
+ },
25
+ {
26
+ "epoch": 1.0,
27
+ "eval_accuracy": 0.9714285714285714,
28
+ "eval_f1": 0.9757296466973886,
29
+ "eval_f1_macro": 0.8781362007168458,
30
+ "eval_loss": 0.0774894431233406,
31
+ "eval_precision": 0.9857142857142858,
32
+ "eval_precision_macro": 0.8333333333333334,
33
+ "eval_recall": 0.9714285714285714,
34
+ "eval_recall_macro": 0.9791666666666666,
35
+ "eval_runtime": 19.4749,
36
+ "eval_samples_per_second": 1.797,
37
+ "eval_steps_per_second": 0.462,
38
+ "step": 26
39
+ },
40
+ {
41
+ "epoch": 1.1538461538461537,
42
+ "grad_norm": 0.001178277307190001,
43
+ "learning_rate": 8.148148148148148e-06,
44
+ "loss": 0.1045,
45
+ "step": 30
46
+ },
47
+ {
48
+ "epoch": 1.5384615384615383,
49
+ "grad_norm": 52.080684661865234,
50
+ "learning_rate": 4.444444444444444e-06,
51
+ "loss": 0.2248,
52
+ "step": 40
53
+ },
54
+ {
55
+ "epoch": 1.9230769230769231,
56
+ "grad_norm": 0.37515753507614136,
57
+ "learning_rate": 7.407407407407407e-07,
58
+ "loss": 0.1178,
59
+ "step": 50
60
  },
61
  {
62
  "epoch": 2.0,
63
+ "eval_accuracy": 0.9714285714285714,
64
+ "eval_f1": 0.9757823129251698,
65
+ "eval_f1_macro": 0.8793650793650793,
66
+ "eval_loss": 0.07033431529998779,
67
+ "eval_precision": 0.9857142857142858,
68
+ "eval_precision_macro": 0.8333333333333334,
69
+ "eval_recall": 0.9714285714285714,
70
+ "eval_recall_macro": 0.9814814814814815,
71
+ "eval_runtime": 19.6277,
72
+ "eval_samples_per_second": 1.783,
73
+ "eval_steps_per_second": 0.459,
74
+ "step": 52
75
  }
76
  ],
77
  "logging_steps": 10,
78
+ "max_steps": 52,
79
  "num_input_tokens_seen": 0,
80
  "num_train_epochs": 2,
81
  "save_steps": 500,
 
100
  "attributes": {}
101
  }
102
  },
103
+ "total_flos": 54201364051968.0,
104
  "train_batch_size": 4,
105
  "trial_name": null,
106
  "trial_params": null
{checkpoint-18 → checkpoint-52}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b3dabca8d8e63ed66cfb9eb1910581f8f656f01b7cba193238cfe67ce50d181
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae4c5c9032b9108afe5cd8569212b5eee6a8bc68a8b592e27c95b758887b4834
3
  size 439039996
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3c99de83de5f22fdddae294ce3c58b232ced45309611f6aca8ad972a4b071c7
3
  size 5521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46014ae489d03a5169b574c28a7d88c2ad6dab9de05cdb9d53a95b988c48d865
3
  size 5521