Bencode92 committed on
Commit
8f2826b
·
1 Parent(s): 7e9103f

🔄 Incremental importance | Acc: 0.803, F1: 0.646

Browse files
README.md CHANGED
@@ -21,19 +21,19 @@ Fine-tuned FinBERT model for financial importance analysis in TradePulse.
21
 
22
  ## Performance
23
 
24
- *Last training: 2025-07-29 15:39*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
- | Loss | 0.8320 |
30
- | Accuracy | 0.8063 |
31
- | F1 Score | 0.8051 |
32
 
33
- | F1 Macro | 0.8051 |
34
 
35
- | Precision | 0.8047 |
36
- | Recall | 0.8063 |
37
 
38
  ## Training Details
39
 
@@ -65,4 +65,4 @@ predictions = outputs.logits.softmax(dim=-1)
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
- - Auto-generated on 2025-07-29 15:39:17
 
21
 
22
  ## Performance
23
 
24
+ *Last training: 2025-07-30 11:16*
25
  *Dataset: `base_reference.csv` (637 samples)*
26
 
27
  | Metric | Value |
28
  |--------|-------|
29
+ | Loss | 0.9162 |
30
+ | Accuracy | 0.8000 |
31
+ | F1 Score | 0.7975 |
32
 
33
+ | F1 Macro | 0.7975 |
34
 
35
+ | Precision | 0.7976 |
36
+ | Recall | 0.8000 |
37
 
38
  ## Training Details
39
 
 
65
  ## Model Card Authors
66
 
67
  - TradePulse ML Team
68
+ - Auto-generated on 2025-07-30 11:16:11
{checkpoint-240 → checkpoint-120}/config.json RENAMED
File without changes
{checkpoint-240 → checkpoint-120}/model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdc01d91706d553799d11f3cb8130f8e1b17d70daf22d597f48fcefb01b77f14
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a306203b60f295a91fb646b11a9144870ea0e3b21f0b0210637c5bfe66b95f5
3
  size 439039996
{checkpoint-240 → checkpoint-120}/special_tokens_map.json RENAMED
File without changes
{checkpoint-240 → checkpoint-120}/tokenizer.json RENAMED
File without changes
{checkpoint-240 → checkpoint-120}/tokenizer_config.json RENAMED
File without changes
{checkpoint-240 → checkpoint-120}/trainer_state.json RENAMED
@@ -1,210 +1,111 @@
1
  {
2
- "best_metric": 0.8051317614424409,
3
- "best_model_checkpoint": "hf-importance-production/checkpoint-240",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 240,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
- "grad_norm": 1.5605429410934448,
14
  "learning_rate": 8.403361344537816e-07,
15
- "loss": 0.2922,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
- "grad_norm": 2.0631015300750732,
21
  "learning_rate": 1.6806722689075632e-06,
22
- "loss": 0.2751,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
- "grad_norm": 26.44710350036621,
28
  "learning_rate": 2.521008403361345e-06,
29
- "loss": 0.1431,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
- "grad_norm": 15.7521390914917,
35
  "learning_rate": 3.3613445378151265e-06,
36
- "loss": 0.1394,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
- "grad_norm": 0.29773807525634766,
42
  "learning_rate": 4.201680672268908e-06,
43
- "loss": 0.0197,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
- "grad_norm": 22.171756744384766,
49
  "learning_rate": 5.04201680672269e-06,
50
- "loss": 0.0483,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
- "grad_norm": 19.108678817749023,
56
  "learning_rate": 5.882352941176471e-06,
57
- "loss": 0.1641,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
- "grad_norm": 0.05635490268468857,
63
  "learning_rate": 6.722689075630253e-06,
64
- "loss": 0.0468,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
- "grad_norm": 0.11963564902544022,
70
  "learning_rate": 7.563025210084034e-06,
71
- "loss": 0.009,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
- "grad_norm": 42.91386413574219,
77
  "learning_rate": 8.403361344537815e-06,
78
- "loss": 0.0908,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
- "grad_norm": 1.6929007768630981,
84
  "learning_rate": 9.243697478991598e-06,
85
- "loss": 0.1529,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
- "grad_norm": 9.662502270657569e-05,
91
  "learning_rate": 9.917355371900828e-06,
92
- "loss": 0.0054,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
  "eval_accuracy": 0.8,
98
- "eval_f1": 0.7951267793019712,
99
- "eval_f1_macro": 0.7037467600127446,
100
- "eval_loss": 0.8872003555297852,
101
- "eval_precision": 0.7960396600228876,
102
- "eval_precision_macro": 0.7721565261618667,
103
  "eval_recall": 0.8,
104
- "eval_recall_macro": 0.6659389038634321,
105
- "eval_runtime": 90.131,
106
- "eval_samples_per_second": 1.775,
107
- "eval_steps_per_second": 0.444,
108
  "step": 120
109
- },
110
- {
111
- "epoch": 1.0833333333333333,
112
- "grad_norm": 7.114067077636719,
113
- "learning_rate": 9.090909090909091e-06,
114
- "loss": 0.0037,
115
- "step": 130
116
- },
117
- {
118
- "epoch": 1.1666666666666667,
119
- "grad_norm": 3.9886481761932373,
120
- "learning_rate": 8.264462809917356e-06,
121
- "loss": 0.014,
122
- "step": 140
123
- },
124
- {
125
- "epoch": 1.25,
126
- "grad_norm": 2.7626068592071533,
127
- "learning_rate": 7.43801652892562e-06,
128
- "loss": 0.1729,
129
- "step": 150
130
- },
131
- {
132
- "epoch": 1.3333333333333333,
133
- "grad_norm": 0.5616143345832825,
134
- "learning_rate": 6.611570247933885e-06,
135
- "loss": 0.0071,
136
- "step": 160
137
- },
138
- {
139
- "epoch": 1.4166666666666667,
140
- "grad_norm": 1.5667345523834229,
141
- "learning_rate": 5.785123966942149e-06,
142
- "loss": 0.0452,
143
- "step": 170
144
- },
145
- {
146
- "epoch": 1.5,
147
- "grad_norm": 9.732388496398926,
148
- "learning_rate": 4.958677685950414e-06,
149
- "loss": 0.0161,
150
- "step": 180
151
- },
152
- {
153
- "epoch": 1.5833333333333335,
154
- "grad_norm": 1.119588851928711,
155
- "learning_rate": 4.132231404958678e-06,
156
- "loss": 0.0546,
157
- "step": 190
158
- },
159
- {
160
- "epoch": 1.6666666666666665,
161
- "grad_norm": 0.037918105721473694,
162
- "learning_rate": 3.3057851239669424e-06,
163
- "loss": 0.1803,
164
- "step": 200
165
- },
166
- {
167
- "epoch": 1.75,
168
- "grad_norm": 2.7715115547180176,
169
- "learning_rate": 2.479338842975207e-06,
170
- "loss": 0.4811,
171
- "step": 210
172
- },
173
- {
174
- "epoch": 1.8333333333333335,
175
- "grad_norm": 68.59700775146484,
176
- "learning_rate": 1.6528925619834712e-06,
177
- "loss": 0.191,
178
- "step": 220
179
- },
180
- {
181
- "epoch": 1.9166666666666665,
182
- "grad_norm": 9.923303604125977,
183
- "learning_rate": 8.264462809917356e-07,
184
- "loss": 0.157,
185
- "step": 230
186
- },
187
- {
188
- "epoch": 2.0,
189
- "grad_norm": 4.033025470562279e-05,
190
- "learning_rate": 0.0,
191
- "loss": 0.2956,
192
- "step": 240
193
- },
194
- {
195
- "epoch": 2.0,
196
- "eval_accuracy": 0.80625,
197
- "eval_f1": 0.8051317614424409,
198
- "eval_f1_macro": 0.7221451687471104,
199
- "eval_loss": 0.8320282101631165,
200
- "eval_precision": 0.8046626213592234,
201
- "eval_precision_macro": 0.7253629218677761,
202
- "eval_recall": 0.80625,
203
- "eval_recall_macro": 0.7194699011680145,
204
- "eval_runtime": 90.1147,
205
- "eval_samples_per_second": 1.776,
206
- "eval_steps_per_second": 0.444,
207
- "step": 240
208
  }
209
  ],
210
  "logging_steps": 10,
@@ -228,12 +129,12 @@
228
  "should_evaluate": false,
229
  "should_log": false,
230
  "should_save": true,
231
- "should_training_stop": true
232
  },
233
  "attributes": {}
234
  }
235
  },
236
- "total_flos": 251010200512512.0,
237
  "train_batch_size": 4,
238
  "trial_name": null,
239
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.7974805825242718,
3
+ "best_model_checkpoint": "hf-importance-production/checkpoint-120",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
+ "global_step": 120,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.08333333333333333,
13
+ "grad_norm": 0.09946297109127045,
14
  "learning_rate": 8.403361344537816e-07,
15
+ "loss": 0.0896,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.16666666666666666,
20
+ "grad_norm": 0.07774800062179565,
21
  "learning_rate": 1.6806722689075632e-06,
22
+ "loss": 0.1151,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.25,
27
+ "grad_norm": 1.0400522947311401,
28
  "learning_rate": 2.521008403361345e-06,
29
+ "loss": 0.0195,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.3333333333333333,
34
+ "grad_norm": 0.2196376472711563,
35
  "learning_rate": 3.3613445378151265e-06,
36
+ "loss": 0.001,
37
  "step": 40
38
  },
39
  {
40
  "epoch": 0.4166666666666667,
41
+ "grad_norm": 0.04618404060602188,
42
  "learning_rate": 4.201680672268908e-06,
43
+ "loss": 0.0011,
44
  "step": 50
45
  },
46
  {
47
  "epoch": 0.5,
48
+ "grad_norm": 0.020002124831080437,
49
  "learning_rate": 5.04201680672269e-06,
50
+ "loss": 0.0008,
51
  "step": 60
52
  },
53
  {
54
  "epoch": 0.5833333333333334,
55
+ "grad_norm": 0.7232803702354431,
56
  "learning_rate": 5.882352941176471e-06,
57
+ "loss": 0.0056,
58
  "step": 70
59
  },
60
  {
61
  "epoch": 0.6666666666666666,
62
+ "grad_norm": 0.014796342700719833,
63
  "learning_rate": 6.722689075630253e-06,
64
+ "loss": 0.0002,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 0.75,
69
+ "grad_norm": 0.059538453817367554,
70
  "learning_rate": 7.563025210084034e-06,
71
+ "loss": 0.0008,
72
  "step": 90
73
  },
74
  {
75
  "epoch": 0.8333333333333334,
76
+ "grad_norm": 6.586078643798828,
77
  "learning_rate": 8.403361344537815e-06,
78
+ "loss": 0.0036,
79
  "step": 100
80
  },
81
  {
82
  "epoch": 0.9166666666666666,
83
+ "grad_norm": 0.012406314723193645,
84
  "learning_rate": 9.243697478991598e-06,
85
+ "loss": 0.011,
86
  "step": 110
87
  },
88
  {
89
  "epoch": 1.0,
90
+ "grad_norm": 0.0004408100212458521,
91
  "learning_rate": 9.917355371900828e-06,
92
+ "loss": 0.0002,
93
  "step": 120
94
  },
95
  {
96
  "epoch": 1.0,
97
  "eval_accuracy": 0.8,
98
+ "eval_f1": 0.7974805825242718,
99
+ "eval_f1_macro": 0.7152658344891355,
100
+ "eval_loss": 0.9162373542785645,
101
+ "eval_precision": 0.797591328783621,
102
+ "eval_precision_macro": 0.7225248991607884,
103
  "eval_recall": 0.8,
104
+ "eval_recall_macro": 0.7102246181491464,
105
+ "eval_runtime": 88.5376,
106
+ "eval_samples_per_second": 1.807,
107
+ "eval_steps_per_second": 0.452,
108
  "step": 120
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
109
  }
110
  ],
111
  "logging_steps": 10,
 
129
  "should_evaluate": false,
130
  "should_log": false,
131
  "should_save": true,
132
+ "should_training_stop": false
133
  },
134
  "attributes": {}
135
  }
136
  },
137
+ "total_flos": 125505100256256.0,
138
  "train_batch_size": 4,
139
  "trial_name": null,
140
  "trial_params": null
{checkpoint-240 → checkpoint-120}/vocab.txt RENAMED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdc01d91706d553799d11f3cb8130f8e1b17d70daf22d597f48fcefb01b77f14
3
  size 439039996
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a306203b60f295a91fb646b11a9144870ea0e3b21f0b0210637c5bfe66b95f5
3
  size 439039996