Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -18,8 +18,10 @@ from matplotlib.gridspec import GridSpec
|
|
18 |
import matplotlib.pyplot as plt
|
19 |
from scipy.stats import gaussian_kde
|
20 |
|
|
|
|
|
21 |
### Import Datasets
|
22 |
-
dataset = load_dataset('nesticot/mlb_data', data_files=['
|
23 |
dataset_train = dataset['train']
|
24 |
df_2023 = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
|
25 |
# Paths to data
|
@@ -68,7 +70,7 @@ df_2023_bip['h_la'] = df_2023_bip['h_la'].round(0)
|
|
68 |
|
69 |
df_2023_bip['season'] = df_2023_bip['game_date'].str[0:4].astype(int)
|
70 |
|
71 |
-
df_2023_bip = df_2023_bip[df_2023_bip['season'] ==
|
72 |
df_2022_bip = df_2023_bip[df_2023_bip['season'] == 2022]
|
73 |
|
74 |
batter_dict = df_2023_bip.sort_values('batter_name').set_index('batter_id')['batter_name'].to_dict()
|
@@ -84,10 +86,10 @@ def server(input,output,session):
|
|
84 |
def plot():
|
85 |
|
86 |
batter_id_select = int(input.batter_id())
|
87 |
-
df_batter_2023 = df_2023_bip.loc[(df_2023_bip['batter_id'] == batter_id_select)&(df_2023_bip['season']==
|
88 |
df_batter_2022 = df_2023_bip.loc[(df_2023_bip['batter_id'] == batter_id_select)&(df_2023_bip['season']==2022)]
|
89 |
|
90 |
-
df_non_batter_2023 = df_2023_bip.loc[(df_2023_bip['batter_id'] != batter_id_select)&(df_2023_bip['season']==
|
91 |
df_non_batter_2022 = df_2023_bip.loc[(df_2023_bip['batter_id'] != batter_id_select)&(df_2023_bip['season']==2022)]
|
92 |
|
93 |
traj_df = df_batter_2023.groupby(['traj'])['launch_speed'].count() / len(df_batter_2023)
|
@@ -317,7 +319,7 @@ def server(input,output,session):
|
|
317 |
# # ax12.text(s='Less\nOften',x=0.5,y=0.26,
|
318 |
# # va='bottom',ha='center',fontsize=12)
|
319 |
|
320 |
-
ax01.text(s=f"{df_batter_2023['batter_name'].values[0]}'s
|
321 |
x=0.5,
|
322 |
y=0.8,va='top',ha='center',fontsize=20)
|
323 |
|
|
|
18 |
import matplotlib.pyplot as plt
|
19 |
from scipy.stats import gaussian_kde
|
20 |
|
21 |
+
season = 2024
|
22 |
+
|
23 |
### Import Datasets
|
24 |
+
dataset = load_dataset('nesticot/mlb_data', data_files=[f'mlb_pitch_data_{season}.csv'])
|
25 |
dataset_train = dataset['train']
|
26 |
df_2023 = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
|
27 |
# Paths to data
|
|
|
70 |
|
71 |
df_2023_bip['season'] = df_2023_bip['game_date'].str[0:4].astype(int)
|
72 |
|
73 |
+
df_2023_bip = df_2023_bip[df_2023_bip['season'] == {season}]
|
74 |
df_2022_bip = df_2023_bip[df_2023_bip['season'] == 2022]
|
75 |
|
76 |
batter_dict = df_2023_bip.sort_values('batter_name').set_index('batter_id')['batter_name'].to_dict()
|
|
|
86 |
def plot():
|
87 |
|
88 |
batter_id_select = int(input.batter_id())
|
89 |
+
df_batter_2023 = df_2023_bip.loc[(df_2023_bip['batter_id'] == batter_id_select)&(df_2023_bip['season']=={season})]
|
90 |
df_batter_2022 = df_2023_bip.loc[(df_2023_bip['batter_id'] == batter_id_select)&(df_2023_bip['season']==2022)]
|
91 |
|
92 |
+
df_non_batter_2023 = df_2023_bip.loc[(df_2023_bip['batter_id'] != batter_id_select)&(df_2023_bip['season']=={season})]
|
93 |
df_non_batter_2022 = df_2023_bip.loc[(df_2023_bip['batter_id'] != batter_id_select)&(df_2023_bip['season']==2022)]
|
94 |
|
95 |
traj_df = df_batter_2023.groupby(['traj'])['launch_speed'].count() / len(df_batter_2023)
|
|
|
319 |
# # ax12.text(s='Less\nOften',x=0.5,y=0.26,
|
320 |
# # va='bottom',ha='center',fontsize=12)
|
321 |
|
322 |
+
ax01.text(s=f"{df_batter_2023['batter_name'].values[0]}'s {season} Batted Ball Tendencies",
|
323 |
x=0.5,
|
324 |
y=0.8,va='top',ha='center',fontsize=20)
|
325 |
|