iLOVE2D's picture
Upload 2846 files
5374a2d verified
{
"4": {
"score": 0.18000000000000002,
"success": {
"8": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.20000000000000004
}
},
"failure": {}
},
"8": {
"score": 0.19999999999999998,
"success": {
"9": {
"modification": "(modify: change the number of generated answers from 5 to 3)",
"score": 0.22
},
"14": {
"modification": "modify: change the number of generated answers from 5 to 6",
"score": 0.20666666666666667
}
},
"failure": {
"12": {
"modification": "modify: change the number of generated answers from 5 to 4",
"score": 0.19999999999999998
}
}
},
"18": {
"score": 0.26,
"success": {},
"failure": {
"19": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.22666666666666668
}
}
},
"1": {
"score": 0.08,
"success": {},
"failure": {
"3": {
"modification": "(add QAScEnsemble to improve answer selection)",
"score": 0.07333333333333333
}
}
},
"2": {
"score": 0.09999999999999999,
"success": {
"4": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.18000000000000002
}
},
"failure": {
"5": {
"modification": "Introduce a self-ask mechanism to enhance the quality of generated answers.",
"score": 0.0
},
"7": {
"modification": "Added a self-ask mechanism to improve answer quality.",
"score": 0.0
}
}
},
"14": {
"score": 0.20666666666666667,
"success": {
"18": {
"modification": "Change the number of generated answers from 6 to 10 and add a self-consistency check before refining the answer.",
"score": 0.26
},
"16": {
"modification": "modify: Change the number of generated answers from 6 to 8 for better ensemble performance.",
"score": 0.2066666666666667
}
},
"failure": {}
},
"0": {
"score": 0.08,
"success": {
"2": {
"modification": "Added QAScEnsemble operator to aggregate answers before final selection.",
"score": 0.09999999999999999
}
},
"failure": {
"11": {
"modification": "modify: Added a review step using the Custom operator to enhance the solution before final output.",
"score": 0.0
},
"15": {
"modification": "modify: Added a review step using the QAScEnsemble operator to improve solution selection after generating answers.",
"score": 0.0
},
"6": {
"modification": "Added a review step before generating the final answer.",
"score": 0.0
},
"1": {
"modification": "modify: Added QAScEnsemble operator to improve solution selection.",
"score": 0.08
}
}
},
"10": {
"score": 0.21333333333333335,
"success": {},
"failure": {
"17": {
"modification": "(such as:add /delete /modify/ ...)",
"score": 0.20000000000000004
}
}
},
"9": {
"score": 0.22,
"success": {},
"failure": {
"10": {
"modification": "(modify: change the number of generated answers from 3 to 5)",
"score": 0.21333333333333335
},
"13": {
"modification": "Change the number of generated answers from 3 to 5",
"score": 0.19333333333333336
}
}
}
}