File size: 1,220 Bytes
e65379c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
{
  "task": "constraint_dimension",
  "epoch_stats": [
    {
      "epoch": 1,
      "train_loss": 1.0786596297055173
    },
    {
      "epoch": 2,
      "train_loss": 0.49559883196265825
    },
    {
      "epoch": 3,
      "train_loss": 0.36042651461985464
    },
    {
      "epoch": 4,
      "train_loss": 0.27737118249450576
    },
    {
      "epoch": 5,
      "train_loss": 0.20896544052678293
    },
    {
      "epoch": 6,
      "train_loss": 0.15534398090000953
    },
    {
      "epoch": 7,
      "train_loss": 0.11773543272898254
    },
    {
      "epoch": 8,
      "train_loss": 0.07906012590035061
    },
    {
      "epoch": 9,
      "train_loss": 0.05605952438313094
    },
    {
      "epoch": 10,
      "train_loss": 0.03452488826215441
    }
  ],
  "training_summary": {
    "actual_epochs": 10,
    "best_epoch": 10,
    "early_stopped": false,
    "backbone_model_name": "microsoft/deberta-v3-base",
    "tokenizer_name": "microsoft/deberta-v3-base"
  },
  "calibration": {
    "method": "temperature_grid_search",
    "rows": 6000,
    "temperature": 2.0,
    "loss": 0.5294126563569427
  },
  "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/constraint_dimension_hf"
}