npb_data_app / pitch_leaderboard.py
patrickramos's picture
Use short team names
9eda2f5
import gradio as gr
import polars as pl
import numpy as np
from datetime import datetime
# from itertools import chain
from data import data_df
from stats import compute_pitch_stats, filter_data_by_date_and_game_kind
from convert import ball_kind, ball_kind_to_color, get_text_color_from_color, team_names_short_to_color, get_text_color_from_team
from plotting import stat_cmap
# Stats with a percentile counterpart. NOTE(review): not referenced by the
# active code visible in this module; presumably these are the stats for which
# `compute_pitch_stats` emits `<stat>_pctl` columns -- confirm against stats.py.
STATS_WITH_PCTLS = [
    'Swing%', 'Z-Swing%', 'Chase%',
    'Contact%', 'Z-Contact%', 'O-Contact%',
    'SwStr%', 'Whiff%', 'CSW%',
    'GB%', 'FB%', 'LD%',
]

# Stats that are multiplied by 100 before being shown in the leaderboard.
PCT_STATS = ['Usage', *STATS_WITH_PCTLS, 'Zone%', 'Arm%', 'Glove%', 'High%', 'Low%', 'MM%']

# Every stat column of the leaderboard, in display order.
STATS = ['Count', *PCT_STATS]

# Full leaderboard header: identifying columns first, then the stats.
COLUMNS = ['Pitcher', 'Team', 'Pitch', 'Pitch (General)'] + STATS

# Selectable pitch names: every `ball_kind` value except the '-' placeholder.
PITCH_TYPES = [name for name in ball_kind.values() if name != '-']

# Team short names offered in the team filter; they are matched against the
# `pitcher_team_name_short` column.
TEAMS = [
    'Yomiuri', 'Yakult', 'DeNA', 'Chunichi', 'Hanshin', 'Hiroshima',
    'Nipponham', 'Rakuten', 'Seibu', 'Lotte', 'ORIX', 'SoftBank',
]

# Markdown rendered underneath the leaderboard table.
notes = '''**Limitations**
- [Column widths get messed up when filtering](https://github.com/gradio-app/gradio/issues/11564)
'''
def gr_create_pitch_leaderboard(start_date, end_date, min_pitches, pitcher_lr='Both', include_pitches=PITCH_TYPES, include_teams=None):
    """Build the value payload for the pitch leaderboard table.

    Filters `data_df` down to regular-season pitches in the requested date
    range, computes per-pitcher, per-pitch-type stats with
    `compute_pitch_stats`, and packages the rows together with per-cell CSS
    and display strings.

    Args:
        start_date: Start of the date range, forwarded to
            `filter_data_by_date_and_game_kind`.
        end_date: End of the date range, forwarded likewise.
        min_pitches: Forwarded to `compute_pitch_stats`; only rows it flags
            as `qualified` are kept (presumably those reaching this pitch
            count -- confirm against stats.py).
        pitcher_lr: 'Both', 'Left' or 'Right'. NOTE: despite the name, this
            filters the `batLR` column (by lowercased first letter); the UI
            labels the control 'Batter handedness'.
        include_pitches: Pitch names to keep, matched against `ballKind`.
        include_teams: Team short names to keep, matched against
            `pitcher_team_name_short`; `None` disables the team filter.

    Returns:
        dict with keys 'data' (list of row tuples), 'headers' (`COLUMNS`) and
        'metadata' holding 'styling' (CSS string per cell) and
        'display_value' (text per cell).

    Raises:
        AssertionError: If `pitcher_lr` is not one of the three options.
    """
    assert pitcher_lr in ['Both', 'Left', 'Right']

    # Rows whose pitch code is the '-' placeholder are never part of the board.
    data = data_df.filter(pl.col('ballKind_code') != '-')
    data = filter_data_by_date_and_game_kind(data, start_date=start_date, end_date=end_date, game_kind='Regular Season')
    if pitcher_lr != 'Both':
        # 'Left' -> 'l', 'Right' -> 'r'
        data = data.filter(pl.col('batLR') == pitcher_lr[0].lower())
    if include_teams is not None:
        data = data.filter(pl.col('pitcher_team_name_short').is_in(include_teams))

    # NOTE: a disabled draft of this function computed the same stats
    # separately for all / left-handed / right-handed batters and joined them
    # side by side with ' (LHH)' / ' (RHH)' column suffixes. It was dead code
    # and has been dropped from here.
    pitch_stats = (
        compute_pitch_stats(data, player_type='pitcher', min_pitches=min_pitches, pitch_class_type='specific')
        .filter(pl.col('qualified') & (pl.col('ballKind').is_in(include_pitches)))
        .drop('pitId', 'ballKind_code', 'qualified')
        .rename({'pitcher_name': 'Pitcher', 'pitcher_team_name_short': 'Team', 'count': 'Count', 'usage': 'Usage', 'ballKind': 'Pitch', 'general_ballKind': 'Pitch (General)'})
        .with_columns(
            # Scale the percentage stats by 100 for display.
            pl.col(stat).mul(100)
            for stat in PCT_STATS
        )
    )

    # Select the displayed columns and materialise the rows exactly once;
    # both the styling and the display text are derived from these rows.
    rows = pitch_stats[COLUMNS].rows()

    # Percentile companions (`<col>_pctl`) pulled out as plain lists up front,
    # so the per-cell loop does no DataFrame/Series lookups.
    available = set(pitch_stats.columns)
    pctl_columns = {
        col: pitch_stats[f'{col}_pctl'].to_list()
        for col in COLUMNS
        if f'{col}_pctl' in available
    }

    styling = []
    display_value = []
    for i, row in enumerate(rows):
        styling_row = []
        display_value_row = []
        for col, item in zip(COLUMNS, row):
            pctls = pctl_columns.get(col)
            if pctls is not None:
                # Background from the colormap evaluated at the percentile;
                # the alpha channel returned by the colormap is discarded.
                r, g, b = (stat_cmap([pctls[i]])[0, :3]*255).astype(np.uint8)
                styling_row.append(f'background-color: rgba({r}, {g}, {b})')
            elif col == 'Team':
                styling_row.append(f'color: {get_text_color_from_team(item)}; background-color: {team_names_short_to_color[item]}')
            elif col in ['Pitch', 'Pitch (General)']:
                color = ball_kind_to_color[item]
                styling_row.append(f'color: {get_text_color_from_color(color)}; background-color: {color}')
            else:
                styling_row.append('')

            # Float cells are shown with one decimal and a percent sign;
            # everything else (names, integer counts, nulls) is shown as-is.
            display_value_row.append(f'{item:.1f}%' if isinstance(item, float) else item)
        styling.append(styling_row)
        display_value.append(display_value_row)

    return {
        'data': rows,
        'headers': COLUMNS,
        'metadata': {
            'styling': styling,
            'display_value': display_value,
        }
    }
def _toggle_all(selected, choices):
    """Return the new checkbox value for a select/deselect-all click.

    Clears the selection when every choice is already selected, otherwise
    selects everything. The comparison ignores order, because the list a
    checkbox group reports need not be in the same order as `choices`.
    """
    if set(selected or []) == set(choices):
        return []
    return choices


def create_pitch_leaderboard():
    """Assemble the pitch leaderboard page and return the `gr.Blocks` app.

    The page offers a date range (initially January 1 of the current year
    through now), pitch-type and team filters with select/deselect-all
    buttons, a minimum pitch count, and a handedness selector. Clicking
    'Search' runs `gr_create_pitch_leaderboard` and shows its result in the
    table.

    Returns:
        The constructed `gr.Blocks` instance (not yet launched).
    """
    now = datetime.now()
    start_datetime_init = datetime(now.year, 1, 1)
    end_datetime_init = now

    with gr.Blocks() as app:
        gr.Markdown('# Pitch Leaderboard')

        with gr.Row():
            start_date = gr.DateTime(start_datetime_init, include_time=False, type='datetime', label='Start')
            end_date = gr.DateTime(end_datetime_init, include_time=False, type='datetime', label='End')

        with gr.Row():
            include_pitches = gr.CheckboxGroup(PITCH_TYPES, value=PITCH_TYPES, label='Pitches', scale=3)
            with gr.Column(scale=1):
                all_pitches = gr.Button('Select/Deselect all pitches')
                min_pitches = gr.Number(100, label='Min. Pitches', precision=0, minimum=0)
                # Named `pitcher_lr` to match the handler's parameter, but it
                # selects the batter side (the handler filters on `batLR`).
                pitcher_lr = gr.Radio(['Both', 'Left', 'Right'], value='Both', label='Batter handedness')

        with gr.Row():
            include_teams = gr.CheckboxGroup(TEAMS, value=TEAMS, label='Teams', scale=3)
            all_teams = gr.Button('Select/Deselect all teams')

        search = gr.Button('Search')
        # pin_columns = gr.Checkbox(True, 'Pin columns')
        leaderboard = gr.DataFrame(
            # Empty placeholder until the first search populates the table.
            pl.DataFrame({'Pitcher': [], 'Pitch': []}),
            # Widths for the four identifying columns of COLUMNS, then one
            # fixed width per stat column.
            column_widths=[200, 100, 200, 200] + [100]*len(STATS),
            show_copy_button=True,
            show_search=True,
            pinned_columns=3
        )
        gr.Markdown(notes)

        search.click(gr_create_pitch_leaderboard, inputs=[start_date, end_date, min_pitches, pitcher_lr, include_pitches, include_teams], outputs=leaderboard)
        all_pitches.click(lambda _pitch_types: _toggle_all(_pitch_types, PITCH_TYPES), inputs=include_pitches, outputs=include_pitches)
        all_teams.click(lambda _teams: _toggle_all(_teams, TEAMS), inputs=include_teams, outputs=include_teams)
        # pin_columns.input(lambda _pin_columns : (gr.update(pinned_columns=None if _pin_columns else 3), not _pin_columns), inputs=pin_columns, outputs=[leaderboard, pin_columns])

    return app
if __name__ == '__main__':
    # Run as a script: build the leaderboard UI and start serving it.
    app = create_pitch_leaderboard()
    app.launch()