File size: 1,919 Bytes
e897220
432b303
e897220
 
 
432b303
 
e897220
 
 
 
 
 
 
 
 
 
 
 
 
432b303
 
e897220
 
 
 
 
 
 
 
 
 
 
 
 
283e3dd
 
e897220
 
 
 
 
 
 
 
432b303
 
e897220
 
 
283e3dd
 
e897220
 
 
432b303
 
e897220
 
 
 
 
 
 
 
432b303
 
e897220
 
 
432b303
 
e897220
 
 
432b303
 
e897220
 
 
 
 
 
 
432b303
 
e897220
 
 
 
 
 
 
 
432b303
 
e897220
 
 
432b303
 
 
283e3dd
e897220
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
{
  "avg_gen_seconds_per_example": 0.6461,
  "base_model": "Qwen/Qwen3.5-2B",
  "category_breakdown": {
    "ambiguous_delete": {
      "ok": 4,
      "ok_rate": 0.5,
      "rows": 8
    },
    "ambiguous_secret": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "cannot_cli": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "count_extension": {
      "ok": 2,
      "ok_rate": 0.25,
      "rows": 8
    },
    "create_archive": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "delete_specific_logs": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "enabled_services": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "extract_archive": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "find_jpgs": {
      "ok": 2,
      "ok_rate": 0.25,
      "rows": 8
    },
    "git_branch": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "grep_literal": {
      "ok": 1,
      "ok_rate": 0.125,
      "rows": 8
    },
    "json_query": {
      "ok": 5,
      "ok_rate": 0.625,
      "rows": 8
    },
    "replace_literal": {
      "ok": 7,
      "ok_rate": 0.875,
      "rows": 8
    },
    "show_env": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "top_ips": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    }
  },
  "enable_thinking": false,
  "image": "local",
  "mode_breakdown": {
    "ask": {
      "ok": 12,
      "ok_rate": 0.75,
      "rows": 16
    },
    "cannot": {
      "ok": 8,
      "ok_rate": 1.0,
      "rows": 8
    },
    "command": {
      "ok": 73,
      "ok_rate": 0.7604,
      "rows": 96
    }
  },
  "model": "/root/bitnet-nl2sh/output/autoresearch_proxy_qwen35_2b/repair_v3b_full_v1/qwen35_2b_batch8_repair_v3b_full_v1/model",
  "ok": 93,
  "ok_rate": 0.775,
  "prompt_file": "/root/bitnet-nl2sh/prompts/student_linux_shell_v2g.txt",
  "rows": 120
}