| { | |
| "4": { | |
| "score": 0.18000000000000002, | |
| "success": { | |
| "8": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.20000000000000004 | |
| } | |
| }, | |
| "failure": {} | |
| }, | |
| "8": { | |
| "score": 0.19999999999999998, | |
| "success": { | |
| "9": { | |
| "modification": "(modify: change the number of generated answers from 5 to 3)", | |
| "score": 0.22 | |
| }, | |
| "14": { | |
| "modification": "modify: change the number of generated answers from 5 to 6", | |
| "score": 0.20666666666666667 | |
| } | |
| }, | |
| "failure": { | |
| "12": { | |
| "modification": "modify: change the number of generated answers from 5 to 4", | |
| "score": 0.19999999999999998 | |
| } | |
| } | |
| }, | |
| "18": { | |
| "score": 0.26, | |
| "success": {}, | |
| "failure": { | |
| "19": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.22666666666666668 | |
| } | |
| } | |
| }, | |
| "1": { | |
| "score": 0.08, | |
| "success": {}, | |
| "failure": { | |
| "3": { | |
| "modification": "(add QAScEnsemble to improve answer selection)", | |
| "score": 0.07333333333333333 | |
| } | |
| } | |
| }, | |
| "2": { | |
| "score": 0.09999999999999999, | |
| "success": { | |
| "4": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.18000000000000002 | |
| } | |
| }, | |
| "failure": { | |
| "5": { | |
| "modification": "Introduce a self-ask mechanism to enhance the quality of generated answers.", | |
| "score": 0.0 | |
| }, | |
| "7": { | |
| "modification": "Added a self-ask mechanism to improve answer quality.", | |
| "score": 0.0 | |
| } | |
| } | |
| }, | |
| "14": { | |
| "score": 0.20666666666666667, | |
| "success": { | |
| "18": { | |
| "modification": "Change the number of generated answers from 6 to 10 and add a self-consistency check before refining the answer.", | |
| "score": 0.26 | |
| }, | |
| "16": { | |
| "modification": "modify: Change the number of generated answers from 6 to 8 for better ensemble performance.", | |
| "score": 0.2066666666666667 | |
| } | |
| }, | |
| "failure": {} | |
| }, | |
| "0": { | |
| "score": 0.08, | |
| "success": { | |
| "2": { | |
| "modification": "Added QAScEnsemble operator to aggregate answers before final selection.", | |
| "score": 0.09999999999999999 | |
| } | |
| }, | |
| "failure": { | |
| "11": { | |
| "modification": "modify: Added a review step using the Custom operator to enhance the solution before final output.", | |
| "score": 0.0 | |
| }, | |
| "15": { | |
| "modification": "modify: Added a review step using the QAScEnsemble operator to improve solution selection after generating answers.", | |
| "score": 0.0 | |
| }, | |
| "6": { | |
| "modification": "Added a review step before generating the final answer.", | |
| "score": 0.0 | |
| }, | |
| "1": { | |
| "modification": "modify: Added QAScEnsemble operator to improve solution selection.", | |
| "score": 0.08 | |
| } | |
| } | |
| }, | |
| "10": { | |
| "score": 0.21333333333333335, | |
| "success": {}, | |
| "failure": { | |
| "17": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.20000000000000004 | |
| } | |
| } | |
| }, | |
| "9": { | |
| "score": 0.22, | |
| "success": {}, | |
| "failure": { | |
| "10": { | |
| "modification": "(modify: change the number of generated answers from 3 to 5)", | |
| "score": 0.21333333333333335 | |
| }, | |
| "13": { | |
| "modification": "Change the number of generated answers from 3 to 5", | |
| "score": 0.19333333333333336 | |
| } | |
| } | |
| } | |
| } |