nesticot committed on
Commit
3fb7d68
·
verified ·
1 Parent(s): bbb7691

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -0
app.py CHANGED
@@ -20,11 +20,37 @@ import pandas as pd
20
  from configure import base_url
21
  import shinyswatch
22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  ### Import Datasets
24
  dataset = load_dataset('nesticot/mlb_data', data_files=['mlb_pitch_data_2024.csv' ])
25
  dataset_train = dataset['train']
26
  df_2023_mlb = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
27
 
 
 
 
 
 
 
 
 
28
  # ### Import Datasets
29
  # dataset = load_dataset('nesticot/mlb_data', data_files=['aaa_pitch_data_2023.csv' ])
30
  # dataset_train = dataset['train']
 
20
  from configure import base_url
21
  import shinyswatch
22
 
23
+
24
+
25
+ mlb_stats = MLB_Scrape()
26
+
27
+ schedule_spring = mlb_stats.get_schedule(year_input=2024,
28
+ sport_id=1,
29
+ start_date='2024-01-01',
30
+ end_date='2024-12-31',
31
+ final=False,
32
+ regular=True,
33
+ spring=False)
34
+
35
+ schedule_spring = schedule_spring.drop_duplicates(subset=['game_id'])
36
+
37
+ schedule_spring = schedule_spring[(schedule_spring['date']==(datetime.today() - timedelta(hours=8)).date())]
38
+
39
+
40
+
41
  ### Import Datasets
42
  dataset = load_dataset('nesticot/mlb_data', data_files=['mlb_pitch_data_2024.csv' ])
43
  dataset_train = dataset['train']
44
  df_2023_mlb = dataset_train.to_pandas().set_index(list(dataset_train.features.keys())[0]).reset_index(drop=True)
45
 
46
+
47
+ data = mlb_stats.get_data(schedule_spring.game_id[:].values)
48
+ df_2023_new = mlb_stats.get_data_df(data_list = data)
49
+ df_2023 = pd.concat([df_2023_mlb,df_2023_new])
50
+ df_2023 = df_2023.drop_duplicates(subset=['play_id'],keep='last')
51
+
52
+
53
+
54
  # ### Import Datasets
55
  # dataset = load_dataset('nesticot/mlb_data', data_files=['aaa_pitch_data_2023.csv' ])
56
  # dataset_train = dataset['train']