File size: 4,870 Bytes
8353665
 
 
 
65fefb5
8353665
 
 
 
 
f89cae0
 
 
8353665
bb5e4ba
 
 
 
 
 
 
 
8353665
 
 
bb5e4ba
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8353665
bb5e4ba
 
 
 
 
 
 
 
f89cae0
8353665
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bb5e4ba
 
 
 
 
8353665
 
 
bb5e4ba
8353665
5cc9b28
8353665
 
 
 
 
 
bb5e4ba
 
 
8353665
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import gradio as gr
import polars as pl

from datetime import datetime
# from itertools import chain

from data import data_df
from stats import compute_pitch_stats, filter_data_by_date_and_game_kind
from convert import ball_kind

# Rate stats for which a companion `<stat>_pctl` column is renamed to
# `<stat> (Pctl)` when the leaderboard is built.
STATS_WITH_PCTLS = [
  'Swing%', 'Z-Swing%', 'Chase%',
  'Contact%', 'Z-Contact%', 'O-Contact%',
  'SwStr%', 'Whiff%', 'CSW%',
  'GB%', 'FB%', 'LD%',
  'Zone%',
]
# Every column that is multiplied by 100 and rounded for display.
PCT_STATS = ['Usage', *STATS_WITH_PCTLS, 'Arm%', 'Glove%', 'High%', 'Low%']
# All stat columns shown on the leaderboard, in display order.
STATS = ['Count', *PCT_STATS]

# Markdown rendered at the bottom of the page.
todo = '''
**To-do**
- Color cells according to percentiles
'''

def gr_create_pitch_leaderboard(start_date, end_date, min_pitches, pitcher_lr, include_pitches):
  """Build the pitch leaderboard table shown after pressing "Search".

  Starting from the module-level `data_df`, rows whose `ballKind_code` is '-'
  are dropped, the data is narrowed with `filter_data_by_date_and_game_kind`
  (always with game_kind='Regular Season'), and per-pitch stats are computed
  with `compute_pitch_stats` for pitchers using the 'specific' pitch classes.

  Args:
    start_date: Lower date bound, forwarded unchanged to
      `filter_data_by_date_and_game_kind`.
    end_date: Upper date bound, forwarded the same way.
    min_pitches: Forwarded to `compute_pitch_stats`; only rows flagged
      `qualified` by that helper are kept.
    pitcher_lr: One of 'Both', 'Left' or 'Right'. NOTE(review): despite the
      name, this filters on the `batLR` column (lower-cased first letter) and
      the UI labels the control "Batter handedness" - confirm which is intended.
    include_pitches: Collection of `ballKind` values to keep.

  Returns:
    The stats table restricted to 'Pitcher', 'Pitch', 'Pitch (General)' and
    the `STATS` columns, with every `PCT_STATS` column multiplied by 100 and
    rounded to one decimal.

  Raises:
    ValueError: If `pitcher_lr` is not one of the three accepted options.
  """
  # Raise explicitly instead of asserting: asserts vanish under `python -O`,
  # which would let an unknown option silently filter on an arbitrary letter.
  if pitcher_lr not in ('Both', 'Left', 'Right'):
    raise ValueError(f"pitcher_lr must be 'Both', 'Left' or 'Right', got {pitcher_lr!r}")

  data = data_df.filter(pl.col('ballKind_code') != '-')
  data = filter_data_by_date_and_game_kind(data, start_date=start_date, end_date=end_date, game_kind='Regular Season')
  if pitcher_lr != 'Both':
    data = data.filter(pl.col('batLR') == pitcher_lr[0].lower())

  # NOTE: a wider layout that joined the overall table with separate vs-LHH and
  # vs-RHH tables (suffixes ' (LHH)' / ' (RHH)') was drafted here but is not enabled.

  pctl_labels = {f'{stat}_pctl': f'{stat} (Pctl)' for stat in STATS_WITH_PCTLS}
  display_names = {
    'pitcher_name': 'Pitcher',
    'count': 'Count',
    'usage': 'Usage',
    'ballKind': 'Pitch',
    'general_ballKind': 'Pitch (General)',
  } | pctl_labels
  # Rates and their percentiles are scaled to a 0-100 display value.
  scaled_columns = PCT_STATS + list(pctl_labels.values())

  pitch_stats = (
    compute_pitch_stats(data, player_type='pitcher', min_pitches=min_pitches, pitch_class_type='specific')
    .filter(pl.col('qualified') & (pl.col('ballKind').is_in(include_pitches)))
    .drop('pitId', 'ballKind_code', 'qualified')
    .rename(display_names)
    .with_columns(pl.col(column).mul(100).round(1) for column in scaled_columns)
  )
  # The percentile columns are not displayed yet, so only the plain stats are returned.
  return pitch_stats[['Pitcher', 'Pitch', 'Pitch (General)'] + STATS]


def create_pitch_leaderboard():
  """Assemble the "Pitch Leaderboard" Gradio page and return it.

  The page holds a start/end date picker (defaulting to January 1 of the
  current year through now), a checkbox group of pitch types taken from
  `ball_kind` (excluding '-'), a minimum-pitch count, a handedness selector,
  a "Search" button wired to `gr_create_pitch_leaderboard`, and the result table.

  Returns:
    The `gr.Blocks` app; the caller is responsible for launching it.
  """
  now = datetime.now()
  season_start = datetime(now.year, 1, 1)
  pitch_types = [pitch_type for pitch_type in ball_kind.values() if pitch_type != '-']

  def toggle_all_pitches(selected):
    # Clear the selection when everything is already ticked, otherwise tick all.
    # Compare as sets: the selection may arrive in a different order than
    # `pitch_types` (e.g. click order), and an order-sensitive list comparison
    # would then fail to recognise a full selection.
    if set(selected or []) == set(pitch_types):
      return []
    return pitch_types

  with gr.Blocks() as app:
    gr.Markdown('# Pitch Leaderboard')

    with gr.Row():
      start_date = gr.DateTime(season_start, include_time=False, type='datetime', label='Start')
      end_date = gr.DateTime(now, include_time=False, type='datetime', label='End')

    with gr.Row():
      include_pitches = gr.CheckboxGroup(pitch_types, value=pitch_types, label='Pitches', scale=3)
      with gr.Column(scale=1):
        all_pitches = gr.Button('Select/Deselect all pitches', scale=1)
        min_pitches = gr.Number(100, label='Min. Pitches', precision=0, minimum=0)
        pitcher_lr = gr.Radio(['Both', 'Left', 'Right'], value='Both', label='Batter handedness')

    search = gr.Button('Search')
    # The table starts empty and is filled by the "Search" callback.
    # Widths: three identifying columns followed by one column per stat.
    leaderboard = gr.DataFrame(
      pl.DataFrame({'Pitcher': [], 'Pitch': []}),
      column_widths=[200]*3 + [100]*len(STATS),
      show_copy_button=True,
      show_search=True,
      pinned_columns=2
    )

    search.click(
      gr_create_pitch_leaderboard,
      inputs=[start_date, end_date, min_pitches, pitcher_lr, include_pitches],
      outputs=leaderboard
    )
    all_pitches.click(toggle_all_pitches, inputs=include_pitches, outputs=include_pitches)
    gr.Markdown(todo)
  return app

if __name__ == '__main__':
  # When run as a script, build the leaderboard page and launch it.
  app = create_pitch_leaderboard()
  app.launch()