File size: 1,836 Bytes
5374a2d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
{
    "2": {
        "score": 0.5377777777777778,
        "success": {
            "4": {
                "modification": "Added a self-ask step to clarify the problem before generating an answer.",
                "score": 0.7577777777777778
            }
        },
        "failure": {
            "8": {
                "modification": "modify: Added a self-ask step before generating the answer to clarify the problem.",
                "score": 0.0044444444444444444
            },
            "3": {
                "modification": "modify: Added a step to revise the generated answer before the final ensemble selection.",
                "score": 0.5044444444444446
            }
        }
    },
    "4": {
        "score": 0.7577777777777778,
        "success": {},
        "failure": {
            "5": {
                "modification": "(such as:add /delete /modify/ ...)",
                "score": 0.4222222222222222
            },
            "6": {
                "modification": "Added a step to generate alternative solutions before the ensemble step.",
                "score": 0.23777777777777778
            }
        }
    },
    "1": {
        "score": 0.5422222222222223,
        "success": {},
        "failure": {
            "7": {
                "modification": "(add review step before ensemble selection)",
                "score": 0.12444444444444445
            },
            "2": {
                "modification": "(add: additional operator for review)",
                "score": 0.5377777777777778
            }
        }
    },
    "0": {
        "score": 0.5311111111111111,
        "success": {
            "1": {
                "modification": "(add additional operator for ensemble selection)",
                "score": 0.5422222222222222
            }
        },
        "failure": {}
    }
}