| { | |
| "5": { | |
| "score": 0.8533333333333334, | |
| "success": {}, | |
| "failure": { | |
| "8": { | |
| "modification": "(modify: added a step to generate a summary of the answer before review)", | |
| "score": 0.8266666666666667 | |
| }, | |
| "9": { | |
| "modification": "(added a validation step before review)", | |
| "score": 0.0 | |
| } | |
| } | |
| }, | |
| "0": { | |
| "score": 0.84, | |
| "success": {}, | |
| "failure": { | |
| "3": { | |
| "modification": "modify: add a review step after answer generation", | |
| "score": 0.8333333333333334 | |
| }, | |
| "4": { | |
| "modification": "modify: add QAScEnsemble operator to improve answer selection", | |
| "score": 0.0 | |
| }, | |
| "1": { | |
| "modification": "(add: QAScEnsemble)", | |
| "score": 0.0 | |
| }, | |
| "2": { | |
| "modification": "(add: QAScEnsemble, modify: workflow to include review step)", | |
| "score": 0.0 | |
| } | |
| } | |
| }, | |
| "3": { | |
| "score": 0.8333333333333334, | |
| "success": { | |
| "5": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.8533333333333334 | |
| } | |
| }, | |
| "failure": {} | |
| }, | |
| "1": { | |
| "score": 0.0, | |
| "success": {}, | |
| "failure": { | |
| "6": { | |
| "modification": "(modify: added a review step before generating the final answer)", | |
| "score": 0.0 | |
| }, | |
| "7": { | |
| "modification": "(added a review step after answer generation)", | |
| "score": 0.0 | |
| } | |
| } | |
| } | |
| } |