rts-commander / realistic_mcp_nl_test_results.json
Luigi's picture
fix: Shared LLM model manager and UI positioning
1e98ab1
[
{
"language": "en",
"tests": [
{
"instruction": "Show me the current game state",
"response": "```json\n{\n \"tool\": \"get_game_state\"\n}\n``` ```json\n{\n \"tool\": \"attack_unit\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_id\": \"enemy1\"\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"factory\",\n \"position_x\": 100.0,\n \"position_y\": 100.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 7.834426164627075
},
{
"instruction": "Move my infantry units to position 150,200",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 6.460172891616821
},
{
"instruction": "Attack the enemy tank at coordinates 300,150",
"response": "```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_x\": 300.0,\n \"target_y\": 150.0\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"tank\",\n \"position_x\": 300.0,\n \"position_y\": 150.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"attack_unit\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_id\": \"enemy",
"success": false,
"time": 7.053299427032471
},
{
"instruction": "Build a barracks near my headquarters",
"response": "```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"barracks\",\n \"position_x\": 100.0,\n \"position_y\": 150.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"barracks\",\n \"",
"success": false,
"time": 7.106475591659546
},
{
"instruction": "Send all my helicopters to patrol around 400,300",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"helicopter1\", \"helicopter2\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"helicopter3\", \"helicopter4\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"helicopter5\", \"helicopter",
"success": false,
"time": 13.421310186386108
}
]
},
{
"language": "fr",
"tests": [
{
"instruction": "Montre-moi l'état actuel du jeu",
"response": "Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu\n{\n \"tool\": \"get_game_state\"\n} Montre-moi l'état actuel du jeu",
"success": false,
"time": 11.66983151435852
},
{
"instruction": "Déplace mes unités d'infanterie à la position 150,200",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 12.125248432159424
},
{
"instruction": "Attaque le tank ennemi aux coordonnées 300,150",
"response": "```json\n{\n \"tool\": \"attack_unit\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_id\": \"enemy_tank\"\n }\n}\n```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_x\": 300.0,\n \"target_y\": 150.0\n }\n}\n```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"tank\",\n \"position_x\": 300.0,\n \"position_y\": 150.0,\n \"player_id\": 1",
"success": false,
"time": 13.577657461166382
},
{
"instruction": "Construis une caserne près de mon quartier général",
"response": "```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"caserne\",\n \"position_x\": 100.0,\n \"position_y\": 150.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2",
"success": false,
"time": 10.060194492340088
},
{
"instruction": "Envoie tous mes hélicoptères en patrouille autour de 400,300",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 12.325396060943604
}
]
},
{
"language": "zh-TW",
"tests": [
{
"instruction": "顯示目前遊戲狀態",
"response": "```json\n{\n \"tool\": \"get_game_state\"\n}\n``` ```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"attacker1\"],\n \"target_x\": 100.0,\n \"target_y\": 150.0\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"factory\",\n \"position_x\": 200.0,\n \"position_y\": 250.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {",
"success": false,
"time": 12.829087257385254
},
{
"instruction": "將我的步兵單位移動到位置 150,200",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 12.319762706756592
},
{
"instruction": "攻擊座標 300,150 處的敵方坦克",
"response": "```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_x\": 300.0,\n \"target_y\": 150.0\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"tank\",\n \"position_x\": 300.0,\n \"position_y\": 150.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"attack_unit\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_id\": \"enemy",
"success": false,
"time": 11.226020812988281
},
{
"instruction": "在我的總部附近建造兵營",
"response": "```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \" barracks\",\n \"position_x\": 100.0,\n \"position_y\": 100.0,\n \"player_id\": 1\n }\n}\n``` ```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\"],\n \"target_x\": 150.0,\n \"target_y\": 200.0\n }\n}\n``` ```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x",
"success": false,
"time": 10.452961444854736
},
{
"instruction": "派遣所有直升機到 400,300 附近巡邏",
"response": "```json\n{\n \"tool\": \"move_units\",\n \"params\": {\n \"unit_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"attack_position\",\n \"params\": {\n \"attacker_ids\": [\"unit1\", \"unit2\"],\n \"target_x\": 400.0,\n \"target_y\": 300.0\n }\n}\n``` ```json\n{\n \"tool\": \"build_building\",\n \"params\": {\n \"building_type\": \"aircraft\",\n \"position_x\": 4",
"success": false,
"time": 11.03628921508789
}
]
}
]