ConorWang commited on
Commit
d726cee
·
verified ·
1 Parent(s): 2b94466

Upload model/epoch_history.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. model/epoch_history.json +144 -0
model/epoch_history.json ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epochs": [
3
+ {
4
+ "epoch": 1,
5
+ "eval_metrics": {
6
+ "avg_binary_accuracy": 0.795,
7
+ "confirmation_required_accuracy": 0.8,
8
+ "count": 25,
9
+ "eval_batches": 25,
10
+ "eval_loss": 7.704372234344483,
11
+ "mode_accuracy": 0.44,
12
+ "permission_bit_accuracy": 0.850909090909091,
13
+ "precondition_ok_accuracy": 0.76,
14
+ "quality_score": 0.21877532557574186,
15
+ "rollback_supported_accuracy": 0.72,
16
+ "schema_ok_accuracy": 0.76,
17
+ "session_required_accuracy": 1.0,
18
+ "tool_accuracy": 0.24,
19
+ "trigger_accuracy": 0.76,
20
+ "validator_required_accuracy": 0.8,
21
+ "worktree_required_accuracy": 0.76
22
+ },
23
+ "improved": true,
24
+ "quality_score": 0.21877532557574186,
25
+ "train_metrics": {
26
+ "loss": 0.5388983534915107,
27
+ "micro_batches": 70,
28
+ "optimizer_steps": 5
29
+ }
30
+ },
31
+ {
32
+ "epoch": 2,
33
+ "eval_metrics": {
34
+ "avg_binary_accuracy": 0.81,
35
+ "confirmation_required_accuracy": 0.8,
36
+ "count": 25,
37
+ "eval_batches": 25,
38
+ "eval_loss": 7.129253711700439,
39
+ "mode_accuracy": 0.48,
40
+ "permission_bit_accuracy": 0.8545454545454545,
41
+ "precondition_ok_accuracy": 0.76,
42
+ "quality_score": 0.4400157397790389,
43
+ "rollback_supported_accuracy": 0.8,
44
+ "schema_ok_accuracy": 0.76,
45
+ "session_required_accuracy": 1.0,
46
+ "tool_accuracy": 0.44,
47
+ "trigger_accuracy": 0.76,
48
+ "validator_required_accuracy": 0.8,
49
+ "worktree_required_accuracy": 0.8
50
+ },
51
+ "improved": true,
52
+ "quality_score": 0.4400157397790389,
53
+ "train_metrics": {
54
+ "loss": 0.4655745736190251,
55
+ "micro_batches": 70,
56
+ "optimizer_steps": 5
57
+ }
58
+ },
59
+ {
60
+ "epoch": 3,
61
+ "eval_metrics": {
62
+ "avg_binary_accuracy": 0.81,
63
+ "confirmation_required_accuracy": 0.8,
64
+ "count": 25,
65
+ "eval_batches": 25,
66
+ "eval_loss": 6.935494079589843,
67
+ "mode_accuracy": 0.48,
68
+ "permission_bit_accuracy": 0.8545454545454545,
69
+ "precondition_ok_accuracy": 0.76,
70
+ "quality_score": 0.4229221342606978,
71
+ "rollback_supported_accuracy": 0.8,
72
+ "schema_ok_accuracy": 0.76,
73
+ "session_required_accuracy": 1.0,
74
+ "tool_accuracy": 0.4,
75
+ "trigger_accuracy": 0.76,
76
+ "validator_required_accuracy": 0.8,
77
+ "worktree_required_accuracy": 0.8
78
+ },
79
+ "improved": false,
80
+ "quality_score": 0.4229221342606978,
81
+ "train_metrics": {
82
+ "loss": 0.43205853487764084,
83
+ "micro_batches": 70,
84
+ "optimizer_steps": 5
85
+ }
86
+ },
87
+ {
88
+ "epoch": 4,
89
+ "eval_metrics": {
90
+ "avg_binary_accuracy": 0.81,
91
+ "confirmation_required_accuracy": 0.8,
92
+ "count": 25,
93
+ "eval_batches": 25,
94
+ "eval_loss": 6.897225952148437,
95
+ "mode_accuracy": 0.56,
96
+ "permission_bit_accuracy": 0.8545454545454545,
97
+ "precondition_ok_accuracy": 0.76,
98
+ "quality_score": 0.46349615617231893,
99
+ "rollback_supported_accuracy": 0.8,
100
+ "schema_ok_accuracy": 0.76,
101
+ "session_required_accuracy": 1.0,
102
+ "tool_accuracy": 0.44,
103
+ "trigger_accuracy": 0.76,
104
+ "validator_required_accuracy": 0.8,
105
+ "worktree_required_accuracy": 0.8
106
+ },
107
+ "improved": true,
108
+ "quality_score": 0.46349615617231893,
109
+ "train_metrics": {
110
+ "loss": 0.42175399448190415,
111
+ "micro_batches": 70,
112
+ "optimizer_steps": 5
113
+ }
114
+ },
115
+ {
116
+ "epoch": 5,
117
+ "eval_metrics": {
118
+ "avg_binary_accuracy": 0.81,
119
+ "confirmation_required_accuracy": 0.8,
120
+ "count": 25,
121
+ "eval_batches": 25,
122
+ "eval_loss": 6.89590030670166,
123
+ "mode_accuracy": 0.56,
124
+ "permission_bit_accuracy": 0.8545454545454545,
125
+ "precondition_ok_accuracy": 0.76,
126
+ "quality_score": 0.4635160408540206,
127
+ "rollback_supported_accuracy": 0.8,
128
+ "schema_ok_accuracy": 0.76,
129
+ "session_required_accuracy": 1.0,
130
+ "tool_accuracy": 0.44,
131
+ "trigger_accuracy": 0.76,
132
+ "validator_required_accuracy": 0.8,
133
+ "worktree_required_accuracy": 0.8
134
+ },
135
+ "improved": false,
136
+ "quality_score": 0.4635160408540206,
137
+ "train_metrics": {
138
+ "loss": 0.4198248211826597,
139
+ "micro_batches": 70,
140
+ "optimizer_steps": 5
141
+ }
142
+ }
143
+ ]
144
+ }