cmndcntrlcyber committed on
Commit
3ff71be
·
verified ·
1 Parent(s): 5d1b48a

Phase 3 eval: baseline + finetuned metrics

Browse files
Files changed (3) hide show
  1. eval/baseline.json +8 -0
  2. eval/finetuned.json +8 -0
  3. eval/summary.json +22 -0
eval/baseline.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "exact_match": 0.0,
3
+ "bleu_4": 0.0,
4
+ "mean_edit_similarity": 0.0,
5
+ "num_samples": 200,
6
+ "syntax_valid_rate": 1.0,
7
+ "run_name": "baseline"
8
+ }
eval/finetuned.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "exact_match": 0.0,
3
+ "bleu_4": 0.0,
4
+ "mean_edit_similarity": 0.0,
5
+ "num_samples": 200,
6
+ "syntax_valid_rate": 1.0,
7
+ "run_name": "finetuned"
8
+ }
eval/summary.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": "cmndcntrlcyber/code-trainer-offsec-dataset@v2-multimodal",
3
+ "adapter": "cmndcntrlcyber/code-trainer-vision-adapter",
4
+ "split": "test",
5
+ "num_samples": 200,
6
+ "baseline": {
7
+ "exact_match": 0.0,
8
+ "bleu_4": 0.0,
9
+ "mean_edit_similarity": 0.0,
10
+ "num_samples": 200,
11
+ "syntax_valid_rate": 1.0,
12
+ "run_name": "baseline"
13
+ },
14
+ "finetuned": {
15
+ "exact_match": 0.0,
16
+ "bleu_4": 0.0,
17
+ "mean_edit_similarity": 0.0,
18
+ "num_samples": 200,
19
+ "syntax_valid_rate": 1.0,
20
+ "run_name": "finetuned"
21
+ }
22
+ }