File size: 4,224 Bytes
5374a2d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 |
{
"4": {
"score": 0.18000000000000002,
"success": {
"8": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.20000000000000004
}
},
"failure": {}
},
"8": {
"score": 0.19999999999999998,
"success": {
"9": {
"modification": "(modify: change the number of generated answers from 5 to 3)",
"score": 0.22
},
"14": {
"modification": "modify: change the number of generated answers from 5 to 6",
"score": 0.20666666666666667
}
},
"failure": {
"12": {
"modification": "modify: change the number of generated answers from 5 to 4",
"score": 0.19999999999999998
}
}
},
"18": {
"score": 0.26,
"success": {},
"failure": {
"19": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.22666666666666668
}
}
},
"1": {
"score": 0.08,
"success": {},
"failure": {
"3": {
"modification": "(add QAScEnsemble to improve answer selection)",
"score": 0.07333333333333333
}
}
},
"2": {
"score": 0.09999999999999999,
"success": {
"4": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.18000000000000002
}
},
"failure": {
"5": {
"modification": "Introduce a self-ask mechanism to enhance the quality of generated answers.",
"score": 0.0
},
"7": {
"modification": "Added a self-ask mechanism to improve answer quality.",
"score": 0.0
}
}
},
"14": {
"score": 0.20666666666666667,
"success": {
"18": {
"modification": "Change the number of generated answers from 6 to 10 and add a self-consistency check before refining the answer.",
"score": 0.26
},
"16": {
"modification": "modify: Change the number of generated answers from 6 to 8 for better ensemble performance.",
"score": 0.2066666666666667
}
},
"failure": {}
},
"0": {
"score": 0.08,
"success": {
"2": {
"modification": "Added QAScEnsemble operator to aggregate answers before final selection.",
"score": 0.09999999999999999
}
},
"failure": {
"11": {
"modification": "modify: Added a review step using the Custom operator to enhance the solution before final output.",
"score": 0.0
},
"15": {
"modification": "modify: Added a review step using the QAScEnsemble operator to improve solution selection after generating answers.",
"score": 0.0
},
"6": {
"modification": "Added a review step before generating the final answer.",
"score": 0.0
},
"1": {
"modification": "modify: Added QAScEnsemble operator to improve solution selection.",
"score": 0.08
}
}
},
"10": {
"score": 0.21333333333333335,
"success": {},
"failure": {
"17": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.20000000000000004
}
}
},
"9": {
"score": 0.22,
"success": {},
"failure": {
"10": {
"modification": "(modify: change the number of generated answers from 3 to 5)",
"score": 0.21333333333333335
},
"13": {
"modification": "Change the number of generated answers from 3 to 5",
"score": 0.19333333333333336
}
}
}
} |