File size: 9,700 Bytes
e65379c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
{
  "family": "extractor",
  "trained_at_utc": "2026-03-24T13:45:54.396697+00:00",
  "rows": {
    "train": 288000,
    "test": 36000,
    "eval": 36000
  },
  "tasks": [
    "constraint_scope",
    "constraint_stability",
    "constraint_type",
    "fact_type",
    "pii_presence"
  ],
  "task_label_counts": {
    "train": {
      "constraint_scope": {
        "finance": 8000,
        "food": 8000,
        "general": 8000,
        "health": 8000,
        "none": 8000,
        "social": 8000,
        "tech": 8000,
        "travel": 8000,
        "work": 8000
      },
      "constraint_stability": {
        "semi_stable": 8000,
        "stable": 8000,
        "volatile": 8000
      },
      "constraint_type": {
        "causal": 8000,
        "constraint_other": 8000,
        "goal": 8000,
        "none": 8000,
        "policy": 8000,
        "preference": 8000,
        "state": 8000,
        "value": 8000
      },
      "fact_type": {
        "identity": 8000,
        "location": 8000,
        "none": 8000,
        "occupation": 8000,
        "other_fact": 8000,
        "preference": 8000
      },
      "pii_presence": {
        "no_pii": 40000,
        "pii": 40000
      }
    },
    "test": {
      "constraint_scope": {
        "finance": 1000,
        "food": 1000,
        "general": 1000,
        "health": 1000,
        "none": 1000,
        "social": 1000,
        "tech": 1000,
        "travel": 1000,
        "work": 1000
      },
      "constraint_stability": {
        "semi_stable": 1000,
        "stable": 1000,
        "volatile": 1000
      },
      "constraint_type": {
        "causal": 1000,
        "constraint_other": 1000,
        "goal": 1000,
        "none": 1000,
        "policy": 1000,
        "preference": 1000,
        "state": 1000,
        "value": 1000
      },
      "fact_type": {
        "identity": 1000,
        "location": 1000,
        "none": 1000,
        "occupation": 1000,
        "other_fact": 1000,
        "preference": 1000
      },
      "pii_presence": {
        "no_pii": 5000,
        "pii": 5000
      }
    },
    "eval": {
      "constraint_scope": {
        "finance": 1000,
        "food": 1000,
        "general": 1000,
        "health": 1000,
        "none": 1000,
        "social": 1000,
        "tech": 1000,
        "travel": 1000,
        "work": 1000
      },
      "constraint_stability": {
        "semi_stable": 1000,
        "stable": 1000,
        "volatile": 1000
      },
      "constraint_type": {
        "causal": 1000,
        "constraint_other": 1000,
        "goal": 1000,
        "none": 1000,
        "policy": 1000,
        "preference": 1000,
        "state": 1000,
        "value": 1000
      },
      "fact_type": {
        "identity": 1000,
        "location": 1000,
        "none": 1000,
        "occupation": 1000,
        "other_fact": 1000,
        "preference": 1000
      },
      "pii_presence": {
        "no_pii": 5000,
        "pii": 5000
      }
    }
  },
  "labels": [
    "constraint_scope::finance",
    "constraint_scope::food",
    "constraint_scope::general",
    "constraint_scope::health",
    "constraint_scope::none",
    "constraint_scope::social",
    "constraint_scope::tech",
    "constraint_scope::travel",
    "constraint_scope::work",
    "constraint_stability::semi_stable",
    "constraint_stability::stable",
    "constraint_stability::volatile",
    "constraint_type::causal",
    "constraint_type::constraint_other",
    "constraint_type::goal",
    "constraint_type::none",
    "constraint_type::policy",
    "constraint_type::preference",
    "constraint_type::state",
    "constraint_type::value",
    "fact_type::identity",
    "fact_type::location",
    "fact_type::none",
    "fact_type::occupation",
    "fact_type::other_fact",
    "fact_type::preference",
    "pii_presence::no_pii",
    "pii_presence::pii"
  ],
  "label_to_id": {
    "constraint_scope::finance": 0,
    "constraint_scope::food": 1,
    "constraint_scope::general": 2,
    "constraint_scope::health": 3,
    "constraint_scope::none": 4,
    "constraint_scope::social": 5,
    "constraint_scope::tech": 6,
    "constraint_scope::travel": 7,
    "constraint_scope::work": 8,
    "constraint_stability::semi_stable": 9,
    "constraint_stability::stable": 10,
    "constraint_stability::volatile": 11,
    "constraint_type::causal": 12,
    "constraint_type::constraint_other": 13,
    "constraint_type::goal": 14,
    "constraint_type::none": 15,
    "constraint_type::policy": 16,
    "constraint_type::preference": 17,
    "constraint_type::state": 18,
    "constraint_type::value": 19,
    "fact_type::identity": 20,
    "fact_type::location": 21,
    "fact_type::none": 22,
    "fact_type::occupation": 23,
    "fact_type::other_fact": 24,
    "fact_type::preference": 25,
    "pii_presence::no_pii": 26,
    "pii_presence::pii": 27
  },
  "train_config": {
    "max_features": 250000,
    "min_df": 2,
    "ngram_min": 1,
    "ngram_max": 2,
    "max_iter": 25,
    "alpha": 1e-05,
    "seed": 42,
    "predict_batch_size": 8192,
    "early_stopping": true,
    "early_stopping_patience": 3,
    "early_stopping_metric": "macro_f1",
    "early_stopping_min_delta": 0.001,
    "calibration_method": "sigmoid"
  },
  "training_summary": {
    "actual_epochs": 4,
    "best_epoch": 1,
    "best_metric": 0.9994428567862855,
    "monitor_metric": "macro_f1",
    "early_stopped": true
  },
  "calibration": {
    "method": "task_conditional_sigmoid",
    "split": "eval",
    "rows": 36000,
    "pre_ece": 0.06013730731601039,
    "post_ece": 0.0007514102792564575,
    "pre_accuracy": 0.9978333333333333,
    "post_accuracy": 0.9981666666666666,
    "accuracy_delta": 0.0003333333333332966,
    "tasks": {
      "constraint_scope": {
        "rows": 9000,
        "pre_ece": 0.0073926387441783925,
        "post_ece": 0.00019267901287378653,
        "pre_accuracy": 1.0,
        "post_accuracy": 1.0,
        "accuracy_delta": 0.0
      },
      "constraint_stability": {
        "rows": 3000,
        "pre_ece": 0.0035802200536977353,
        "post_ece": 0.00016981111181246789,
        "pre_accuracy": 1.0,
        "post_accuracy": 1.0,
        "accuracy_delta": 0.0
      },
      "constraint_type": {
        "rows": 8000,
        "pre_ece": 0.0152260080692046,
        "post_ece": 0.0002949549691239062,
        "pre_accuracy": 1.0,
        "post_accuracy": 1.0,
        "accuracy_delta": 0.0
      },
      "fact_type": {
        "rows": 6000,
        "pre_ece": 0.008209015508071071,
        "post_ece": 0.00021106970310058593,
        "pre_accuracy": 1.0,
        "post_accuracy": 1.0,
        "accuracy_delta": 0.0
      },
      "pii_presence": {
        "rows": 10000,
        "pre_ece": 0.1278197693399604,
        "post_ece": 0.002118116763033487,
        "pre_accuracy": 0.9922,
        "post_accuracy": 0.9934,
        "accuracy_delta": 0.0011999999999999789
      }
    }
  },
  "epoch_stats": [
    {
      "epoch": 1,
      "train_loss": 0.07304321517285889,
      "train_accuracy": 0.9985243055555556,
      "train_macro_f1": 0.9996205356573068,
      "train_weighted_f1": 0.9985243053339707,
      "valid_loss": 0.07040478728784708,
      "valid_accuracy": 0.9978333333333333,
      "valid_macro_f1": 0.9994428567862855,
      "valid_weighted_f1": 0.9978333319466658,
      "monitor_metric": "macro_f1",
      "monitor_value": 0.9994428567862855,
      "improved": true
    },
    {
      "epoch": 2,
      "train_loss": 0.07098693556871623,
      "train_accuracy": 0.9985138888888889,
      "train_macro_f1": 0.9996178570566361,
      "train_weighted_f1": 0.998513888553585,
      "valid_loss": 0.06895428509737356,
      "valid_accuracy": 0.9979166666666667,
      "valid_macro_f1": 0.9994642852803567,
      "valid_weighted_f1": 0.9979166649791653,
      "monitor_metric": "macro_f1",
      "monitor_value": 0.9994642852803567,
      "improved": false
    },
    {
      "epoch": 3,
      "train_loss": 0.06992293075722475,
      "train_accuracy": 0.9984930555555556,
      "train_macro_f1": 0.9996124998827812,
      "train_weighted_f1": 0.9984930550997047,
      "valid_loss": 0.06817925236885357,
      "valid_accuracy": 0.9979166666666667,
      "valid_macro_f1": 0.9994642852803567,
      "valid_weighted_f1": 0.9979166649791653,
      "monitor_metric": "macro_f1",
      "monitor_value": 0.9994642852803567,
      "improved": false
    },
    {
      "epoch": 4,
      "train_loss": 0.0692276576162906,
      "train_accuracy": 0.9984861111111111,
      "train_macro_f1": 0.9996107141570066,
      "train_weighted_f1": 0.9984861106105815,
      "valid_loss": 0.06766472301272425,
      "valid_accuracy": 0.9979166666666667,
      "valid_macro_f1": 0.9994642852803567,
      "valid_weighted_f1": 0.9979166649791653,
      "monitor_metric": "macro_f1",
      "monitor_value": 0.9994642852803567,
      "improved": false
    }
  ],
  "skipped_invalid_tasks": {},
  "artifact_scope": "family",
  "evaluation_suite": "standard",
  "dataset_hashes": {
    "train": {
      "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/extractor_train.parquet",
      "sha256": "7001566078ce06fa63779c2025be27b27a1fed4a304133dc334fcbf1336dcd1e",
      "bytes": 21540433
    },
    "test": {
      "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/extractor_test.parquet",
      "sha256": "8fa0af53f8cbd8116335d00659608404ba96055df49b1ab89799418c646a48d3",
      "bytes": 2721025
    },
    "eval": {
      "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/extractor_eval.parquet",
      "sha256": "d066db9c6cadeaea12f4c367262fee444f0992575af2daca06af75f40e9935ce",
      "bytes": 2709873
    }
  }
}