nesticot committed on
Commit
a20dd31
·
verified ·
1 Parent(s): 865bc46

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -0
app.py CHANGED
@@ -101,6 +101,27 @@ dataset = load_dataset('nesticot/mlb_data', data_files=['aaa_pitch_data_2024.csv
101
  dataset_train = dataset['train']
102
  df_a = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
103
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
104
  import datetime
105
 
106
  date_string = df_a['game_date'].min()
 
101
  dataset_train = dataset['train']
102
  df_a = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
103
 
104
+
105
+ mlb_stats = MLB_Scrape()
106
+ schedule_spring = mlb_stats.get_schedule(year_input=2024,
107
+ sport_id=11,
108
+ start_date='2024-01-01',
109
+ end_date='2024-12-31',
110
+ final=False,
111
+ regular=True,
112
+ spring=False)
113
+
114
+ schedule_spring = schedule_spring.drop_duplicates(subset=['game_id'])
115
+
116
+ schedule_spring = schedule_spring[(schedule_spring['date']==(datetime.today() - timedelta(hours=8)).date())]
117
+
118
+
119
+ data = mlb_stats.get_data(schedule_spring.game_id[:].values)
120
+ df_2023_new = mlb_stats.get_data_df(data_list = data)
121
+ df_a = pd.concat([df_a,df_2023_new])
122
+ df_a = df_a.drop_duplicates(subset=['play_id'],keep='last')
123
+
124
+
125
  import datetime
126
 
127
  date_string = df_a['game_date'].min()