lmgame_bench / app.py
Yuxuan-Zhang-Dexter
update app.py
603247d
raw
history blame
30.4 kB
import gradio as gr
import os
import pandas as pd
import json
from PIL import Image, ImageSequence
import io
from functools import reduce
import numpy as np
from datetime import datetime, timedelta
import matplotlib.pyplot as plt
from leaderboard_utils import (
get_organization,
get_mario_leaderboard,
get_sokoban_leaderboard,
get_2048_leaderboard,
get_candy_leaderboard,
get_tetris_leaderboard,
get_tetris_planning_leaderboard,
get_combined_leaderboard,
GAME_ORDER
)
from data_visualization import (
get_combined_leaderboard_with_group_bar,
create_organization_radar_chart,
create_top_players_radar_chart,
create_player_radar_chart,
create_horizontal_bar_chart,
normalize_values
)
# Define time points and their corresponding data files
TIME_POINTS = {
"03/25/2025": "rank_data_03_25_2025.json",
# Add more time points here as they become available
}
# Load the initial JSON file with rank data
with open(TIME_POINTS["03/25/2025"], "r") as f:
rank_data = json.load(f)
# Add leaderboard state at the top level
leaderboard_state = {
"current_game": None,
"previous_overall": {
"Super Mario Bros": True,
"Sokoban": True,
"2048": True,
"Candy Crash": True,
"Tetris (complete)": True,
"Tetris (planning only)": True
},
"previous_details": {
"Super Mario Bros": False,
"Sokoban": False,
"2048": False,
"Candy Crash": False,
"Tetris (complete)": False,
"Tetris (planning only)": False
}
}
# Define GIF paths for the carousel
GIF_PATHS = [
"assets/super_mario_bros/super_mario.gif",
"assets/sokoban/sokoban.gif",
"assets/2048/2048.gif",
"assets/candy/candy.gif",
"assets/tetris/tetris.gif"
]
# Print and verify GIF paths
print("\nChecking GIF paths:")
for gif_path in GIF_PATHS:
if os.path.exists(gif_path):
print(f"โœ“ Found: {gif_path}")
# Print file size
size = os.path.getsize(gif_path)
print(f" Size: {size / (1024*1024):.2f} MB")
else:
print(f"โœ— Missing: {gif_path}")
# Load video links and news data
with open('assets/game_video_link.json', 'r') as f:
VIDEO_LINKS = json.load(f)
with open('assets/news.json', 'r') as f:
NEWS_DATA = json.load(f)
def load_gif(gif_path):
"""Load a GIF file and return it as a PIL Image"""
try:
img = Image.open(gif_path)
print(f"Successfully loaded GIF: {gif_path}")
return img
except Exception as e:
print(f"Error loading GIF {gif_path}: {e}")
return None
def create_gif_carousel():
"""Create a custom HTML/JS component for GIF carousel"""
print("\nCreating GIF carousel with paths:", GIF_PATHS)
html = f"""
<div id="gif-carousel" style="width: 100%; height: 300px; position: relative; background-color: #f0f0f0;">
<img id="current-gif" style="width: 100%; height: 100%; object-fit: contain;" onerror="console.error('Failed to load GIF:', this.src);">
</div>
<script>
const gifs = {json.dumps(GIF_PATHS)};
let currentIndex = 0;
function updateGif() {{
const img = document.getElementById('current-gif');
console.log('Loading GIF:', gifs[currentIndex]);
img.src = gifs[currentIndex];
currentIndex = (currentIndex + 1) % gifs.length;
}}
// Update GIF every 5 seconds
setInterval(updateGif, 5000);
// Initial load
updateGif();
</script>
"""
return gr.HTML(html)
def load_rank_data(time_point):
"""Load rank data for a specific time point"""
if time_point in TIME_POINTS:
try:
with open(TIME_POINTS[time_point], "r") as f:
return json.load(f)
except FileNotFoundError:
return None
return None
def update_leaderboard(mario_overall, mario_details,
sokoban_overall, sokoban_details,
_2048_overall, _2048_details,
candy_overall, candy_details,
tetris_overall, tetris_details,
tetris_plan_overall, tetris_plan_details):
global leaderboard_state
# Convert current checkbox states to dictionary for easier comparison
current_overall = {
"Super Mario Bros": mario_overall,
"Sokoban": sokoban_overall,
"2048": _2048_overall,
"Candy Crash": candy_overall,
"Tetris (complete)": tetris_overall,
"Tetris (planning only)": tetris_plan_overall
}
current_details = {
"Super Mario Bros": mario_details,
"Sokoban": sokoban_details,
"2048": _2048_details,
"Candy Crash": candy_details,
"Tetris (complete)": tetris_details,
"Tetris (planning only)": tetris_plan_details
}
# Find which game's state changed
changed_game = None
for game in current_overall.keys():
if (current_overall[game] != leaderboard_state["previous_overall"][game] or
current_details[game] != leaderboard_state["previous_details"][game]):
changed_game = game
break
if changed_game:
# If a game's details checkbox was checked
if current_details[changed_game] and not leaderboard_state["previous_details"][changed_game]:
# Reset all other games' states
for game in current_overall.keys():
if game != changed_game:
current_overall[game] = False
current_details[game] = False
leaderboard_state["previous_overall"][game] = False
leaderboard_state["previous_details"][game] = False
# Update state for the selected game
leaderboard_state["current_game"] = changed_game
leaderboard_state["previous_overall"][changed_game] = True
leaderboard_state["previous_details"][changed_game] = True
current_overall[changed_game] = True
# If a game's overall checkbox was checked
elif current_overall[changed_game] and not leaderboard_state["previous_overall"][changed_game]:
# If we were in details view for another game, switch to overall view
if leaderboard_state["current_game"] and leaderboard_state["previous_details"][leaderboard_state["current_game"]]:
# Reset previous game's details
leaderboard_state["previous_details"][leaderboard_state["current_game"]] = False
current_details[leaderboard_state["current_game"]] = False
leaderboard_state["current_game"] = None
# Update state
leaderboard_state["previous_overall"][changed_game] = True
leaderboard_state["previous_details"][changed_game] = False
# If a game's overall checkbox was unchecked
elif not current_overall[changed_game] and leaderboard_state["previous_overall"][changed_game]:
# If we're in details view, don't allow unchecking the overall checkbox
if leaderboard_state["current_game"] == changed_game:
current_overall[changed_game] = True
else:
leaderboard_state["previous_overall"][changed_game] = False
if leaderboard_state["current_game"] == changed_game:
leaderboard_state["current_game"] = None
# If a game's details checkbox was unchecked
elif not current_details[changed_game] and leaderboard_state["previous_details"][changed_game]:
leaderboard_state["previous_details"][changed_game] = False
if leaderboard_state["current_game"] == changed_game:
leaderboard_state["current_game"] = None
# When exiting details view, reset to show all games
for game in current_overall.keys():
current_overall[game] = True
current_details[game] = False
leaderboard_state["previous_overall"][game] = True
leaderboard_state["previous_details"][game] = False
# Special case: If all games are selected and we're trying to view details
all_games_selected = all(current_overall.values()) and not any(current_details.values())
if all_games_selected and changed_game and current_details[changed_game]:
# Reset all other games' states
for game in current_overall.keys():
if game != changed_game:
current_overall[game] = False
current_details[game] = False
leaderboard_state["previous_overall"][game] = False
leaderboard_state["previous_details"][game] = False
# Update state for the selected game
leaderboard_state["current_game"] = changed_game
leaderboard_state["previous_overall"][changed_game] = True
leaderboard_state["previous_details"][changed_game] = True
current_overall[changed_game] = True
# Build dictionary for selected games
selected_games = {
"Super Mario Bros": current_overall["Super Mario Bros"],
"Sokoban": current_overall["Sokoban"],
"2048": current_overall["2048"],
"Candy Crash": current_overall["Candy Crash"],
"Tetris (complete)": current_overall["Tetris (complete)"],
"Tetris (planning only)": current_overall["Tetris (planning only)"]
}
# Get the appropriate DataFrame and chart based on current state
if leaderboard_state["current_game"]:
# For detailed view
if leaderboard_state["current_game"] == "Super Mario Bros":
df = get_mario_leaderboard(rank_data)
elif leaderboard_state["current_game"] == "Sokoban":
df = get_sokoban_leaderboard(rank_data)
elif leaderboard_state["current_game"] == "2048":
df = get_2048_leaderboard(rank_data)
elif leaderboard_state["current_game"] == "Candy Crash":
df = get_candy_leaderboard(rank_data)
elif leaderboard_state["current_game"] == "Tetris (complete)":
df = get_tetris_leaderboard(rank_data)
else: # Tetris (planning only)
df = get_tetris_planning_leaderboard(rank_data)
# Always create a new chart for detailed view
chart = create_horizontal_bar_chart(df, leaderboard_state["current_game"])
else:
# For overall view
df, chart = get_combined_leaderboard_with_group_bar(rank_data, selected_games)
# Return exactly 14 values to match the expected outputs
return (df, chart,
current_overall["Super Mario Bros"], current_details["Super Mario Bros"],
current_overall["Sokoban"], current_details["Sokoban"],
current_overall["2048"], current_details["2048"],
current_overall["Candy Crash"], current_details["Candy Crash"],
current_overall["Tetris (complete)"], current_details["Tetris (complete)"],
current_overall["Tetris (planning only)"], current_details["Tetris (planning only)"])
def update_leaderboard_with_time(time_point, mario_overall, mario_details,
sokoban_overall, sokoban_details,
_2048_overall, _2048_details,
candy_overall, candy_details,
tetris_overall, tetris_details,
tetris_plan_overall, tetris_plan_details):
# Load rank data for the selected time point
global rank_data
new_rank_data = load_rank_data(time_point)
if new_rank_data is not None:
rank_data = new_rank_data
# Use the existing update_leaderboard function
return update_leaderboard(mario_overall, mario_details,
sokoban_overall, sokoban_details,
_2048_overall, _2048_details,
candy_overall, candy_details,
tetris_overall, tetris_details,
tetris_plan_overall, tetris_plan_details)
def get_initial_state():
"""Get the initial state for the leaderboard"""
return {
"current_game": None,
"previous_overall": {
"Super Mario Bros": True,
"Sokoban": True,
"2048": True,
"Candy Crash": True,
"Tetris (complete)": True,
"Tetris (planning only)": True
},
"previous_details": {
"Super Mario Bros": False,
"Sokoban": False,
"2048": False,
"Candy Crash": False,
"Tetris (complete)": False,
"Tetris (planning only)": False
}
}
def clear_filters():
global leaderboard_state
# Reset all checkboxes to default state
selected_games = {
"Super Mario Bros": True,
"Sokoban": True,
"2048": True,
"Candy Crash": True,
"Tetris (complete)": True,
"Tetris (planning only)": True
}
# Get the combined leaderboard and group bar chart
df, chart = get_combined_leaderboard_with_group_bar(rank_data, selected_games)
# Reset the leaderboard state to match the default checkbox states
leaderboard_state = get_initial_state()
# Return exactly 14 values to match the expected outputs
return (df, chart,
True, False, # mario
True, False, # sokoban
True, False, # 2048
True, False, # candy
True, False, # tetris
True, False) # tetris plan
def create_timeline_slider():
"""Create a custom timeline slider component"""
timeline_html = """
<div class="timeline-container">
<style>
.timeline-container {
width: 85%; /* Increased from 70% to 85% */
padding: 8px;
font-family: Arial, sans-serif;
height: 40px;
display: flex;
align-items: center;
}
.timeline-track {
position: relative;
height: 6px;
background: #e0e0e0;
border-radius: 3px;
margin: 0;
width: 100%;
}
.timeline-progress {
position: absolute;
height: 100%;
background: #2196F3;
border-radius: 3px;
width: 100%;
}
.timeline-handle {
position: absolute;
right: 0;
top: 50%;
transform: translate(50%, -50%);
width: 20px;
height: 20px;
background: #2196F3;
border: 3px solid white;
border-radius: 50%;
cursor: pointer;
box-shadow: 0 2px 6px rgba(0,0,0,0.3);
}
.timeline-date {
position: absolute;
top: -25px;
transform: translateX(-50%);
background: #2196F3; /* Changed to match slider blue color */
color: #ffffff !important;
padding: 3px 8px;
border-radius: 4px;
font-size: 12px;
white-space: nowrap;
font-weight: 600;
box-shadow: 0 2px 6px rgba(0,0,0,0.2);
letter-spacing: 0.5px;
text-shadow: 0 1px 2px rgba(0,0,0,0.2);
}
</style>
<div class="timeline-track">
<div class="timeline-progress"></div>
<div class="timeline-handle">
<div class="timeline-date">03/25/2025</div>
</div>
</div>
</div>
<script>
(function() {
const container = document.querySelector('.timeline-container');
const track = container.querySelector('.timeline-track');
const handle = container.querySelector('.timeline-handle');
let isDragging = false;
// For now, we only have one time point
const timePoints = {
"03/25/2025": 1.0
};
function updatePosition(e) {
if (!isDragging) return;
const rect = track.getBoundingClientRect();
let x = (e.clientX - rect.left) / rect.width;
x = Math.max(0, Math.min(1, x));
// For now, snap to the only available time point
x = 1.0;
handle.style.right = `${(1 - x) * 100}%`;
}
handle.addEventListener('mousedown', (e) => {
isDragging = true;
e.preventDefault();
});
document.addEventListener('mousemove', updatePosition);
document.addEventListener('mouseup', () => {
isDragging = false;
});
// Prevent text selection while dragging
container.addEventListener('selectstart', (e) => {
if (isDragging) e.preventDefault();
});
})();
</script>
"""
return gr.HTML(timeline_html)
def create_video_gallery():
"""Create a custom HTML/JS component for video gallery"""
# Extract video IDs
mario_id = VIDEO_LINKS["super_mario"].split("?v=")[1]
sokoban_id = VIDEO_LINKS["sokoban"].split("?v=")[1]
game_2048_id = VIDEO_LINKS["2048"].split("?v=")[1]
candy_id = VIDEO_LINKS["candy"].split("?v=")[1]
# Generate news HTML
news_items = []
for item in NEWS_DATA["news"]:
video_id = item["video_link"].split("?v=")[1]
date_obj = datetime.strptime(item["date"], "%Y-%m-%d")
formatted_date = date_obj.strftime("%B %d, %Y")
news_items.append(f'''
<div class="news-item">
<div class="news-date">{formatted_date}</div>
<div class="news-content">
<div class="news-video">
<div class="video-wrapper">
<iframe src="https://www.youtube.com/embed/{video_id}"></iframe>
</div>
</div>
<div class="news-text">
<a href="{item["twitter_link"]}" target="_blank" class="twitter-link">
<span class="twitter-icon">๐Ÿ“ข</span>
{item["twitter_text"]}
</a>
</div>
</div>
</div>
''')
news_html = '\n'.join(news_items)
gallery_html = f'''
<div class="video-gallery-container">
<style>
.video-gallery-container {{
width: 100%;
max-width: 1400px;
margin: 0 auto;
padding: 20px;
}}
.video-grid {{
display: grid;
grid-template-columns: repeat(2, 1fr);
gap: 20px;
margin-top: 20px;
margin-bottom: 40px;
}}
.video-card {{
background: #ffffff;
border-radius: 10px;
box-shadow: 0 2px 10px rgba(0,0,0,0.1);
overflow: hidden;
transition: transform 0.2s;
}}
.video-card:hover {{
transform: translateY(-5px);
}}
.video-wrapper {{
position: relative;
padding-bottom: 56.25%;
height: 0;
overflow: hidden;
}}
.video-wrapper iframe {{
position: absolute;
top: 0;
left: 0;
width: 100%;
height: 100%;
border: none;
}}
.video-title {{
padding: 15px;
font-size: 1.2em;
font-weight: bold;
color: #2c3e50;
text-align: center;
background: #f8f9fa;
border-top: 1px solid #eee;
}}
.news-section {{
margin-top: 40px;
border-top: 2px solid #e9ecef;
padding-top: 20px;
}}
.news-section-title {{
font-size: 1.8em;
font-weight: bold;
color: #2c3e50;
margin-bottom: 20px;
text-align: center;
}}
.news-item {{
background: #ffffff;
border-radius: 10px;
box-shadow: 0 2px 10px rgba(0,0,0,0.1);
margin-bottom: 20px;
overflow: hidden;
}}
.news-date {{
padding: 10px 20px;
background: #f8f9fa;
color: #666;
font-size: 0.9em;
border-bottom: 1px solid #eee;
}}
.news-content {{
display: flex;
padding: 20px;
align-items: center;
gap: 30px;
}}
.news-video {{
flex: 0 0 300px;
}}
.news-text {{
flex: 1;
display: flex;
align-items: center;
min-height: 169px; /* Match 16:9 video height */
}}
.twitter-link {{
color: #2c3e50;
text-decoration: none;
display: flex;
align-items: center;
gap: 15px;
font-size: 1.4em;
font-weight: 600;
line-height: 1.4;
}}
.twitter-link:hover {{
color: #1da1f2;
}}
.twitter-icon {{
font-size: 1.5em;
color: #1da1f2;
}}
</style>
<div class="video-grid">
<div class="video-card">
<div class="video-wrapper">
<iframe src="https://www.youtube.com/embed/{mario_id}"></iframe>
</div>
<div class="video-title">๐ŸŽฎ Super Mario Bros</div>
</div>
<div class="video-card">
<div class="video-wrapper">
<iframe src="https://www.youtube.com/embed/{sokoban_id}"></iframe>
</div>
<div class="video-title">๐Ÿ“ฆ Sokoban</div>
</div>
<div class="video-card">
<div class="video-wrapper">
<iframe src="https://www.youtube.com/embed/{game_2048_id}"></iframe>
</div>
<div class="video-title">๐Ÿ”ข 2048</div>
</div>
<div class="video-card">
<div class="video-wrapper">
<iframe src="https://www.youtube.com/embed/{candy_id}"></iframe>
</div>
<div class="video-title">๐Ÿฌ Candy Crash</div>
</div>
</div>
<div class="news-section">
<div class="news-section-title">๐Ÿ“ฐ Latest News</div>
{news_html}
</div>
</div>
'''
return gr.HTML(gallery_html)
def build_app():
with gr.Blocks(css="""
.visualization-container {
height: 85vh !important;
max-height: 900px !important;
min-height: 600px !important;
background-color: #f8f9fa;
border-radius: 10px;
padding: 25px; /* Increased padding */
box-shadow: 0 2px 4px rgba(0,0,0,0.1);
overflow: hidden;
margin: 0 auto !important; /* Center the visualization */
}
.visualization-container .plot {
height: 100% !important;
width: 100% !important;
}
.section-title {
font-size: 1.5em;
font-weight: bold;
color: #2c3e50;
margin-bottom: 15px;
padding-bottom: 10px;
border-bottom: 2px solid #e9ecef;
text-align: center; /* Center the title */
}
/* Add container for the entire app */
.container {
max-width: 1400px;
margin: 0 auto;
padding: 0 20px;
}
""") as demo:
gr.Markdown("# ๐ŸŽฎ Game Arena: Gaming Agent ๐ŸŽฒ")
with gr.Tabs():
with gr.Tab("๐Ÿ† Leaderboard"):
# Visualization section at the very top
with gr.Row():
gr.Markdown("### ๐Ÿ“Š Data Visualization")
with gr.Row():
visualization = gr.Plot(
value=get_combined_leaderboard_with_group_bar(rank_data, {
"Super Mario Bros": True,
"Sokoban": True,
"2048": True,
"Candy Crash": True,
"Tetris (complete)": True,
"Tetris (planning only)": True
})[1],
label="Performance Visualization",
elem_classes="visualization-container"
)
# Game selection section
with gr.Row():
gr.Markdown("### ๐ŸŽฎ Game Selection")
with gr.Row():
# For each game, we have two checkboxes: one for overall and one for detailed view.
with gr.Column():
gr.Markdown("**๐ŸŽฎ Super Mario Bros**")
mario_overall = gr.Checkbox(label="Super Mario Bros Score", value=True)
mario_details = gr.Checkbox(label="Super Mario Bros Details", value=False)
with gr.Column():
gr.Markdown("**๐Ÿ“ฆ Sokoban**")
sokoban_overall = gr.Checkbox(label="Sokoban Score", value=True)
sokoban_details = gr.Checkbox(label="Sokoban Details", value=False)
with gr.Column():
gr.Markdown("**๐Ÿ”ข 2048**")
_2048_overall = gr.Checkbox(label="2048 Score", value=True)
_2048_details = gr.Checkbox(label="2048 Details", value=False)
with gr.Column():
gr.Markdown("**๐Ÿฌ Candy Crash**")
candy_overall = gr.Checkbox(label="Candy Crash Score", value=True)
candy_details = gr.Checkbox(label="Candy Crash Details", value=False)
with gr.Column():
gr.Markdown("**๐ŸŽฏ Tetris (complete)**")
tetris_overall = gr.Checkbox(label="Tetris (complete) Score", value=True)
tetris_details = gr.Checkbox(label="Tetris (complete) Details", value=False)
with gr.Column():
gr.Markdown("**๐Ÿ“‹ Tetris (planning)**")
tetris_plan_overall = gr.Checkbox(label="Tetris (planning) Score", value=True)
tetris_plan_details = gr.Checkbox(label="Tetris (planning) Details", value=False)
# Time progression display and control buttons - Moved below game selection
with gr.Row():
with gr.Column(scale=2):
gr.Markdown("**โฐ Time Tracker**")
timeline = create_timeline_slider()
with gr.Column(scale=1):
gr.Markdown("**๐Ÿ”„ Controls**")
clear_btn = gr.Button("Reset Filters", variant="secondary")
# Leaderboard table section
with gr.Row():
gr.Markdown("### ๐Ÿ“‹ Detailed Results")
with gr.Row():
leaderboard_board = gr.DataFrame(
value=get_combined_leaderboard(rank_data, {
"Super Mario Bros": True,
"Sokoban": True,
"2048": True,
"Candy Crash": True,
"Tetris (complete)": True,
"Tetris (planning only)": True
}),
interactive=True,
wrap=True,
label="Leaderboard"
)
# List of all checkboxes (in order)
checkbox_list = [mario_overall, mario_details,
sokoban_overall, sokoban_details,
_2048_overall, _2048_details,
candy_overall, candy_details,
tetris_overall, tetris_details,
tetris_plan_overall, tetris_plan_details]
# Initialize the leaderboard state when the app starts
demo.load(
fn=clear_filters,
inputs=[],
outputs=[leaderboard_board, visualization] + checkbox_list
)
# Update both the leaderboard and visualization when checkboxes change
for checkbox in checkbox_list:
checkbox.change(
fn=update_leaderboard,
inputs=checkbox_list,
outputs=[leaderboard_board, visualization] + checkbox_list
)
# Update both when clear button is clicked
clear_btn.click(
fn=clear_filters,
inputs=[],
outputs=[leaderboard_board, visualization] + checkbox_list
)
with gr.Tab("๐ŸŽฅ Gallery"):
video_gallery = create_video_gallery()
return demo
if __name__ == "__main__":
demo_app = build_app()
# Add file serving configuration
demo_app.launch(debug=True, show_error=True, share=True)