Spaces:

lcipolina
/

LLM_OpenSpiel_Arena

Sleeping

App Files Files Community

lcipolina commited on Feb 6

Commit

106f4f6

verified ·

1 Parent(s): d37d01f

Trying to bring back the game playing

Browse files

Files changed (1) hide show

app.py +45 -25

app.py CHANGED Viewed

@@ -3,19 +3,18 @@ import json
 import pandas as pd
 import gradio as gr
 from agents.llm_registry import LLM_REGISTRY  # Dynamically fetch LLM models
 # Extract available LLM models
 llm_models = list(LLM_REGISTRY.keys())
 # Define game list manually (for now)
-games_list = [
-    "rock_paper_scissors",
-    "prisoners_dilemma",
-    "tic_tac_toe",
-    "connect_four",
-    "matching_pennies",
-    "kuhn_poker",
-]
 # File to persist results
 RESULTS_TRACKER_FILE = "results_tracker.json"
@@ -56,17 +55,47 @@ def calculate_leaderboard(selected_game: str) -> pd.DataFrame:
     leaderboard_df.rename(columns={"index": "LLM Model"}, inplace=True)
     return leaderboard_df
-def generate_stats_file(model_name: str):
-    """Generate a JSON file with detailed statistics for the selected LLM model."""
-    file_path = f"{model_name}_stats.json"
-    with open(file_path, "w") as f:
-        json.dump(results_tracker.get(model_name, {}), f, indent=4)
-    return file_path
 # Gradio Interface
 with gr.Blocks() as interface:
     with gr.Tab("Game Arena"):
-        gr.Markdown("# LLM Game Arena\nPlay against LLMs or other players in classic games!")
     with gr.Tab("Leaderboard"):
         gr.Markdown("# LLM Model Leaderboard\nTrack performance across different games!")
@@ -81,16 +110,7 @@ with gr.Blocks() as interface:
             """Updates the leaderboard table based on the selected game."""
             return calculate_leaderboard(selected_game)
-        def provide_download_file(model_name):
-            """Creates a downloadable JSON file with stats for the selected model."""
-            return generate_stats_file(model_name)
-        def refresh_leaderboard():
-            """Manually refresh the leaderboard."""
-            return calculate_leaderboard(game_dropdown.value)
         game_dropdown.change(fn=update_leaderboard, inputs=[game_dropdown], outputs=[leaderboard_table])
-        model_dropdown.change(fn=provide_download_file, inputs=[model_dropdown], outputs=[download_button])
-        refresh_button.click(fn=refresh_leaderboard, inputs=[], outputs=[leaderboard_table])
 interface.launch()

 import pandas as pd
 import gradio as gr
 from agents.llm_registry import LLM_REGISTRY  # Dynamically fetch LLM models
+from simulators.tic_tac_toe_simulator import TicTacToeSimulator
+from simulators.prisoners_dilemma_simulator import PrisonersDilemmaSimulator
+from simulators.rock_paper_scissors_simulator import RockPaperScissorsSimulator
+from games_registry import GAMES_REGISTRY
+from simulators.base_simulator import PlayerType
+from typing import Dict
 # Extract available LLM models
 llm_models = list(LLM_REGISTRY.keys())
 # Define game list manually (for now)
+games_list = list(GAMES_REGISTRY.keys())
 # File to persist results
 RESULTS_TRACKER_FILE = "results_tracker.json"
     leaderboard_df.rename(columns={"index": "LLM Model"}, inplace=True)
     return leaderboard_df
+def play_game(game_name, player1_type, player2_type, player1_model, player2_model, rounds):
+    """Play the selected game with specified players."""
+    llms = {}
+    if player1_type == "llm":
+        llms["Player 1"] = player1_model
+    if player2_type == "llm":
+        llms["Player 2"] = player2_model
+    simulator_class = GAMES_REGISTRY[game_name]
+    simulator = simulator_class(game_name, llms=llms)
+    game_states = []
+    def log_fn(state):
+        """Log current state and legal moves."""
+        current_player = state.current_player()
+        legal_moves = state.legal_actions(current_player)
+        board = str(state)
+        game_states.append(f"Current Player: {current_player}\nBoard:\n{board}\nLegal Moves: {legal_moves}")
+    results = simulator.simulate(rounds=int(rounds), log_fn=log_fn)
+    return "\n".join(game_states) + f"\nGame Result: {results}"
 # Gradio Interface
 with gr.Blocks() as interface:
     with gr.Tab("Game Arena"):
+        gr.Markdown("# LLM Game Arena\nSelect a game and players to play against LLMs.")
+        game_dropdown = gr.Dropdown(choices=games_list, label="Select a Game", value=games_list[0])
+        player1_dropdown = gr.Dropdown(choices=["human", "random_bot", "llm"], label="Player 1 Type", value="llm")
+        player2_dropdown = gr.Dropdown(choices=["human", "random_bot", "llm"], label="Player 2 Type", value="random_bot")
+        player1_model_dropdown = gr.Dropdown(choices=llm_models, label="Player 1 Model", visible=False)
+        player2_model_dropdown = gr.Dropdown(choices=llm_models, label="Player 2 Model", visible=False)
+        rounds_slider = gr.Slider(1, 10, step=1, label="Rounds")
+        result_output = gr.Textbox(label="Game Result")
+        play_button = gr.Button("Play Game")
+        play_button.click(
+            play_game,
+            inputs=[game_dropdown, player1_dropdown, player2_dropdown, player1_model_dropdown, player2_model_dropdown, rounds_slider],
+            outputs=result_output,
+        )
     with gr.Tab("Leaderboard"):
         gr.Markdown("# LLM Model Leaderboard\nTrack performance across different games!")
             """Updates the leaderboard table based on the selected game."""
             return calculate_leaderboard(selected_game)
         game_dropdown.change(fn=update_leaderboard, inputs=[game_dropdown], outputs=[leaderboard_table])
+        refresh_button.click(fn=update_leaderboard, inputs=[game_dropdown], outputs=[leaderboard_table])
 interface.launch()