import gradio as gr from nim_game_env import NimGameEnv from nim_gpt_functions import plan_move, execute_move TEMPERATURE_DEFAULT = 0.5 PILES_DEFAULT = [3, 5, 7] HUMAN_STR = "Human" AI_STR = "AI" def reset_game(chat_history, nim_game_env): chat_history = [] nim_game_env = NimGameEnv(PILES_DEFAULT) game_state_text, game_state_piles = nim_game_env.reset() ascii_art = generate_game_state_ascii_art(game_state_piles, False, 0, "") message_str = "" return chat_history, chat_history, message_str, ascii_art, nim_game_env def generate_game_state_ascii_art(piles, done, reward, player): ascii_art = "Game Over, " + player + " wins!" if not done: pile_a = piles[0] pile_b = piles[1] pile_c = piles[2] ascii_art = f"Pile A: {'|' * pile_a} \nPile B: {'|' * pile_b} \nPile C: {'|' * pile_c}" return "
" + ascii_art + "" def send_chat_msg(inp, chat_history, nim_game_env, temperature, openai_api_key): if not openai_api_key or openai_api_key == "": warning_msg = "
Please paste your OpenAI API key (see https://beta.openai.com)" return chat_history, chat_history, warning_msg if not inp or inp == "": warning_msg = "
Please enter a move" return chat_history, chat_history, warning_msg inp = inp.strip() output = None chat_history = chat_history or [] text_obs, observation, reward, done, info = execute_move(inp, nim_game_env, openai_api_key) ascii_art = generate_game_state_ascii_art(observation, done, reward, HUMAN_STR) if done: if reward == 1: output = "Good game!" ascii_art = generate_game_state_ascii_art(observation, done, reward, HUMAN_STR) else: output = text_obs ascii_art = generate_game_state_ascii_art(observation, done, reward, AI_STR) else: output = plan_move(text_obs, temperature, openai_api_key) text_obs, observation, reward, done, info = execute_move(output, nim_game_env, openai_api_key) ascii_art = generate_game_state_ascii_art(observation, done, reward, AI_STR) chat_history.append((HUMAN_STR + ": " + inp, AI_STR + ": " + output)) return chat_history, chat_history, ascii_art def update_foo(widget, state): if widget: state = widget return state block = gr.Blocks(css=".gradio-container {background-color: lightgray}") with block as nim_game: temperature_state = gr.State(TEMPERATURE_DEFAULT) openai_api_key_state = gr.State() history_state = gr.State() nim_game_env_state = gr.State(NimGameEnv(PILES_DEFAULT)) with gr.Row(): game_state_html = gr.Markdown() title = gr.Markdown("""