MindGamesColonelBlutto / eval_scripted_after_ppo.json
GOVINDFROM's picture
Upload eval_scripted_after_ppo.json
00011f2 verified
{
"overall": {
"n_games": 2100,
"n_wins": 1927,
"n_draws": 105,
"n_losses": 68,
"win_rate": 91.76190476190477,
"draw_rate": 5.0,
"loss_rate": 3.2380952380952377,
"win_rate_ci_95": {
"lower": 90.50831835820999,
"upper": 92.8629828701251
},
"average_outcome": 0.9426190476190476,
"outcome_std": 0.2039322894610053,
"avg_score_player": 2.0785714285714287,
"avg_score_opponent": 0.22666666666666666,
"avg_score_differential": 1.851904761904762,
"score_differential_std": 1.2225933367723631,
"max_score_differential": 3.0,
"min_score_differential": -3.0,
"avg_victory_margin": 2.0768033212247015,
"avg_defeat_margin": -1.661764705882353
},
"per_opponent": {
"Random": {
"n_games": 300,
"n_wins": 192,
"n_draws": 43,
"n_losses": 65,
"win_rate": 64.0,
"draw_rate": 14.333333333333334,
"loss_rate": 21.666666666666668,
"win_rate_ci_95": {
"lower": 58.422930323031295,
"upper": 69.22306648268142
},
"average_outcome": 0.7116666666666667,
"outcome_std": 0.41153844156881486,
"avg_score_player": 2.31,
"avg_score_opponent": 1.2933333333333332,
"avg_score_differential": 1.0166666666666666,
"score_differential_std": 1.76154919192044,
"max_score_differential": 3.0,
"min_score_differential": -3.0,
"avg_victory_margin": 2.1614583333333335,
"avg_defeat_margin": -1.6923076923076923
},
"Balanced": {
"n_games": 300,
"n_wins": 300,
"n_draws": 0,
"n_losses": 0,
"win_rate": 100.0,
"draw_rate": 0.0,
"loss_rate": 0.0,
"win_rate_ci_95": {
"lower": 98.73570287754538,
"upper": 99.99999999999997
},
"average_outcome": 1.0,
"outcome_std": 0.0,
"avg_score_player": 3.0,
"avg_score_opponent": 0.0,
"avg_score_differential": 3.0,
"score_differential_std": 0.0,
"max_score_differential": 3.0,
"min_score_differential": 3.0,
"avg_victory_margin": 3.0,
"avg_defeat_margin": 0.0
},
"AntiLast": {
"n_games": 300,
"n_wins": 300,
"n_draws": 0,
"n_losses": 0,
"win_rate": 100.0,
"draw_rate": 0.0,
"loss_rate": 0.0,
"win_rate_ci_95": {
"lower": 98.73570287754538,
"upper": 99.99999999999997
},
"average_outcome": 1.0,
"outcome_std": 0.0,
"avg_score_player": 3.0,
"avg_score_opponent": 0.0,
"avg_score_differential": 3.0,
"score_differential_std": 0.0,
"max_score_differential": 3.0,
"min_score_differential": 3.0,
"avg_victory_margin": 3.0,
"avg_defeat_margin": 0.0
},
"NoisedMirror": {
"n_games": 300,
"n_wins": 235,
"n_draws": 62,
"n_losses": 3,
"win_rate": 78.33333333333333,
"draw_rate": 20.666666666666668,
"loss_rate": 1.0,
"win_rate_ci_95": {
"lower": 73.32901513759226,
"upper": 82.62121649301679
},
"average_outcome": 0.8866666666666667,
"outcome_std": 0.22095751225568733,
"avg_score_player": 1.24,
"avg_score_opponent": 0.29333333333333333,
"avg_score_differential": 0.9466666666666667,
"score_differential_std": 0.6611774009715966,
"max_score_differential": 3.0,
"min_score_differential": -1.0,
"avg_victory_margin": 1.221276595744681,
"avg_defeat_margin": -1.0
},
"Heavy_0": {
"n_games": 300,
"n_wins": 300,
"n_draws": 0,
"n_losses": 0,
"win_rate": 100.0,
"draw_rate": 0.0,
"loss_rate": 0.0,
"win_rate_ci_95": {
"lower": 98.73570287754538,
"upper": 99.99999999999997
},
"average_outcome": 1.0,
"outcome_std": 0.0,
"avg_score_player": 1.0,
"avg_score_opponent": 0.0,
"avg_score_differential": 1.0,
"score_differential_std": 0.0,
"max_score_differential": 1.0,
"min_score_differential": 1.0,
"avg_victory_margin": 1.0,
"avg_defeat_margin": 0.0
},
"Heavy_1": {
"n_games": 300,
"n_wins": 300,
"n_draws": 0,
"n_losses": 0,
"win_rate": 100.0,
"draw_rate": 0.0,
"loss_rate": 0.0,
"win_rate_ci_95": {
"lower": 98.73570287754538,
"upper": 99.99999999999997
},
"average_outcome": 1.0,
"outcome_std": 0.0,
"avg_score_player": 1.0,
"avg_score_opponent": 0.0,
"avg_score_differential": 1.0,
"score_differential_std": 0.0,
"max_score_differential": 1.0,
"min_score_differential": 1.0,
"avg_victory_margin": 1.0,
"avg_defeat_margin": 0.0
},
"Heavy_2": {
"n_games": 300,
"n_wins": 300,
"n_draws": 0,
"n_losses": 0,
"win_rate": 100.0,
"draw_rate": 0.0,
"loss_rate": 0.0,
"win_rate_ci_95": {
"lower": 98.73570287754538,
"upper": 99.99999999999997
},
"average_outcome": 1.0,
"outcome_std": 0.0,
"avg_score_player": 3.0,
"avg_score_opponent": 0.0,
"avg_score_differential": 3.0,
"score_differential_std": 0.0,
"max_score_differential": 3.0,
"min_score_differential": 3.0,
"avg_victory_margin": 3.0,
"avg_defeat_margin": 0.0
}
}
}