Bencode92 committed on
Commit
110abe8
·
1 Parent(s): 0262ee3

🔄 Incremental importance | Acc: 0.875, F1: 0.630

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-28 12:28*
25
- *Dataset: `news_20250728.csv` (198 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 1.6054 |
30
- | Accuracy | 0.6800 |
31
- | F1 Score | 0.6670 |
32
 
33
- | F1 Macro | 0.6670 |
34
 
35
- | Precision | 0.6550 |
36
- | Recall | 0.6800 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-28 12:28:07
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-28 15:51*
25
+ *Dataset: `news_20250728.csv` (69 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 1.3768 |
30
+ | Accuracy | 0.6667 |
31
+ | F1 Score | 0.6667 |
32
 
33
+ | F1 Macro | 0.6667 |
34
 
35
+ | Precision | 0.6875 |
36
+ | Recall | 0.6667 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-28 15:51:43
{checkpoint-74 → checkpoint-26}/config.json RENAMED
File without changes
{checkpoint-74 → checkpoint-26}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6996a8e10bb5c621690403f08209675c901b0806626ed1a43deef422b1ba295c
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd23a14b45d9cd08acbf9b971d434497ee11ca489570b7ce552089c6312fda4
3
  size 439039996
{checkpoint-74 → checkpoint-26}/special_tokens_map.json RENAMED
File without changes
{checkpoint-74 → checkpoint-26}/tokenizer.json RENAMED
File without changes
{checkpoint-74 → checkpoint-26}/tokenizer_config.json RENAMED
File without changes
{checkpoint-74 → checkpoint-26}/trainer_state.json RENAMED
@@ -1,95 +1,60 @@
1
  {
2
- "best_metric": 0.6669565217391304,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-74",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 74,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.2702702702702703,
13
- "grad_norm": 56.3042106628418,
14
- "learning_rate": 2.702702702702703e-06,
15
- "loss": 5.102,
16
  "step": 10
17
  },
18
- {
19
- "epoch": 0.5405405405405406,
20
- "grad_norm": 129.203857421875,
21
- "learning_rate": 5.405405405405406e-06,
22
- "loss": 2.4752,
23
- "step": 20
24
- },
25
- {
26
- "epoch": 0.8108108108108109,
27
- "grad_norm": 48.63685607910156,
28
- "learning_rate": 8.108108108108109e-06,
29
- "loss": 1.0702,
30
- "step": 30
31
- },
32
  {
33
  "epoch": 1.0,
34
- "eval_accuracy": 0.68,
35
- "eval_f1": 0.6557491289198606,
36
- "eval_f1_macro": 0.4657375145180023,
37
- "eval_loss": 1.8875879049301147,
38
- "eval_precision": 0.6963235294117647,
39
- "eval_precision_macro": 0.48774509803921573,
40
- "eval_recall": 0.68,
41
- "eval_recall_macro": 0.48969696969696974,
42
- "eval_runtime": 27.5867,
43
- "eval_samples_per_second": 1.812,
44
- "eval_steps_per_second": 0.471,
45
- "step": 37
46
- },
47
- {
48
- "epoch": 1.0810810810810811,
49
- "grad_norm": 17.976032257080078,
50
- "learning_rate": 9.189189189189191e-06,
51
- "loss": 1.4028,
52
- "step": 40
53
- },
54
- {
55
- "epoch": 1.3513513513513513,
56
- "grad_norm": 84.75708770751953,
57
- "learning_rate": 6.486486486486487e-06,
58
- "loss": 0.4445,
59
- "step": 50
60
  },
61
  {
62
- "epoch": 1.6216216216216215,
63
- "grad_norm": 0.7481099367141724,
64
- "learning_rate": 3.7837837837837844e-06,
65
- "loss": 1.5709,
66
- "step": 60
67
- },
68
- {
69
- "epoch": 1.8918918918918919,
70
- "grad_norm": 24.998336791992188,
71
- "learning_rate": 1.0810810810810812e-06,
72
- "loss": 1.1979,
73
- "step": 70
74
  },
75
  {
76
  "epoch": 2.0,
77
- "eval_accuracy": 0.68,
78
- "eval_f1": 0.6669565217391304,
79
- "eval_f1_macro": 0.4707246376811594,
80
- "eval_loss": 1.6054034233093262,
81
- "eval_precision": 0.655,
82
- "eval_precision_macro": 0.46166666666666667,
83
- "eval_recall": 0.68,
84
- "eval_recall_macro": 0.48060606060606065,
85
- "eval_runtime": 27.5219,
86
- "eval_samples_per_second": 1.817,
87
- "eval_steps_per_second": 0.472,
88
- "step": 74
89
  }
90
  ],
91
  "logging_steps": 10,
92
- "max_steps": 74,
93
  "num_input_tokens_seen": 0,
94
  "num_train_epochs": 2,
95
  "save_steps": 500,
@@ -114,7 +79,7 @@
114
  "attributes": {}
115
  }
116
  },
117
- "total_flos": 77881571647488.0,
118
  "train_batch_size": 4,
119
  "trial_name": null,
120
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6666666666666666,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-26",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 26,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.7692307692307693,
13
+ "grad_norm": 121.2413101196289,
14
+ "learning_rate": 8.333333333333334e-06,
15
+ "loss": 1.8267,
16
  "step": 10
17
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.6666666666666666,
21
+ "eval_f1": 0.6277777777777778,
22
+ "eval_f1_macro": 0.47142857142857136,
23
+ "eval_loss": 1.476554274559021,
24
+ "eval_precision": 0.5959595959595959,
25
+ "eval_precision_macro": 0.45021645021645024,
26
+ "eval_recall": 0.6666666666666666,
27
+ "eval_recall_macro": 0.4973544973544974,
28
+ "eval_runtime": 9.9767,
29
+ "eval_samples_per_second": 1.804,
30
+ "eval_steps_per_second": 0.501,
31
+ "step": 13
 
 
 
 
 
 
 
 
 
 
 
 
 
 
32
  },
33
  {
34
+ "epoch": 1.5384615384615383,
35
+ "grad_norm": 50.985260009765625,
36
+ "learning_rate": 4.2857142857142855e-06,
37
+ "loss": 1.3106,
38
+ "step": 20
 
 
 
 
 
 
 
39
  },
40
  {
41
  "epoch": 2.0,
42
+ "eval_accuracy": 0.6666666666666666,
43
+ "eval_f1": 0.6666666666666666,
44
+ "eval_f1_macro": 0.6666666666666666,
45
+ "eval_loss": 1.3767714500427246,
46
+ "eval_precision": 0.6875,
47
+ "eval_precision_macro": 0.7638888888888888,
48
+ "eval_recall": 0.6666666666666666,
49
+ "eval_recall_macro": 0.626984126984127,
50
+ "eval_runtime": 9.9856,
51
+ "eval_samples_per_second": 1.803,
52
+ "eval_steps_per_second": 0.501,
53
+ "step": 26
54
  }
55
  ],
56
  "logging_steps": 10,
57
+ "max_steps": 26,
58
  "num_input_tokens_seen": 0,
59
  "num_train_epochs": 2,
60
  "save_steps": 500,
 
79
  "attributes": {}
80
  }
81
  },
82
+ "total_flos": 26837568608256.0,
83
  "train_batch_size": 4,
84
  "trial_name": null,
85
  "trial_params": null
{checkpoint-74 → checkpoint-26}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6996a8e10bb5c621690403f08209675c901b0806626ed1a43deef422b1ba295c
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd23a14b45d9cd08acbf9b971d434497ee11ca489570b7ce552089c6312fda4
3
  size 439039996
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b061dbe96085bccc3c91f3751222bd984561b8f688f02aae26349205f0e29f8
3
  size 5521
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f33aecfc0c34e2165650f021afc9b4f8e6eff55ec7fdd9180d37e644b7455d4b
3
  size 5521