Sampler-Arena / elo.py
rwitz's picture
Update elo.py
aec4104 verified
raw
history blame
2.51 kB
import math
def update_elo_ratings(ratings_dict, winner, loser, category):
# Extract old ratings and games played for the specific category
winner_category_data = ratings_dict.get(winner, {}).get(category, {})
loser_category_data = ratings_dict.get(loser, {}).get(category, {})
winner_old_rating = winner_category_data.get('elo_rating', 1200)
loser_old_rating = loser_category_data.get('elo_rating', 1200)
winner_games_played = winner_category_data.get('games_played', 0)
loser_games_played = loser_category_data.get('games_played', 0)
# Function to determine the K-factor based on games played
def determine_k_factor(games_played):
# Define K-factor based on number of games played. Adjust these thresholds as needed.
if games_played < 30:
return 40
elif games_played < 100:
return 20
else:
return 10
# Determine K-factors
winner_k_factor = determine_k_factor(winner_games_played)
loser_k_factor = determine_k_factor(loser_games_played)
def elo(winner_rating, loser_rating, k_factor_winner=32, k_factor_loser=32):
# Calculate the expected scores for each player
winner_expected = 1 / (1 + 10 ** ((loser_rating - winner_rating) / 400))
loser_expected = 1 / (1 + 10 ** ((winner_rating - loser_rating) / 400))
# Calculate the new ratings for each player
winner_new_rating = winner_rating + k_factor_winner * (1 - winner_expected)
loser_new_rating = loser_rating + k_factor_loser * (0 - loser_expected)
return winner_new_rating, loser_new_rating
# Calculate new ratings
winner_new_rating, loser_new_rating = elo(winner_old_rating, loser_old_rating, k_factor_winner=winner_k_factor, k_factor_loser=loser_k_factor)
# Update ratings and games played in the dictionary for the specific category
if winner not in ratings_dict:
ratings_dict[winner] = {}
if category not in ratings_dict[winner]:
ratings_dict[winner][category] = {}
ratings_dict[winner][category]['elo_rating'] = winner_new_rating
ratings_dict[winner][category]['games_played'] = winner_games_played + 1
if loser not in ratings_dict:
ratings_dict[loser] = {}
if category not in ratings_dict[loser]:
ratings_dict[loser][category] = {}
ratings_dict[loser][category]['elo_rating'] = loser_new_rating
ratings_dict[loser][category]['games_played'] = loser_games_played + 1
return ratings_dict