| { | |
| "2": { | |
| "score": 0.5377777777777778, | |
| "success": { | |
| "4": { | |
| "modification": "Added a self-ask step to clarify the problem before generating an answer.", | |
| "score": 0.7577777777777778 | |
| } | |
| }, | |
| "failure": { | |
| "8": { | |
| "modification": "modify: Added a self-ask step before generating the answer to clarify the problem.", | |
| "score": 0.0044444444444444444 | |
| }, | |
| "3": { | |
| "modification": "modify: Added a step to revise the generated answer before the final ensemble selection.", | |
| "score": 0.5044444444444446 | |
| } | |
| } | |
| }, | |
| "4": { | |
| "score": 0.7577777777777778, | |
| "success": {}, | |
| "failure": { | |
| "5": { | |
| "modification": "(such as:add /delete /modify/ ...)", | |
| "score": 0.4222222222222222 | |
| }, | |
| "6": { | |
| "modification": "Added a step to generate alternative solutions before the ensemble step.", | |
| "score": 0.23777777777777778 | |
| } | |
| } | |
| }, | |
| "1": { | |
| "score": 0.5422222222222223, | |
| "success": {}, | |
| "failure": { | |
| "7": { | |
| "modification": "(add review step before ensemble selection)", | |
| "score": 0.12444444444444445 | |
| }, | |
| "2": { | |
| "modification": "(add: additional operator for review)", | |
| "score": 0.5377777777777778 | |
| } | |
| } | |
| }, | |
| "0": { | |
| "score": 0.5311111111111111, | |
| "success": { | |
| "1": { | |
| "modification": "(add additional operator for ensemble selection)", | |
| "score": 0.5422222222222222 | |
| } | |
| }, | |
| "failure": {} | |
| } | |
| } |