Update app.py
Browse files
app.py
CHANGED
|
@@ -6,6 +6,7 @@ import os
|
|
| 6 |
import json
|
| 7 |
import streamlit as st
|
| 8 |
import pandas as pd
|
|
|
|
| 9 |
from st_aggrid import AgGrid, GridOptionsBuilder, GridUpdateMode
|
| 10 |
|
| 11 |
|
|
@@ -92,8 +93,8 @@ season = 2025
|
|
| 92 |
level = 'mlb'
|
| 93 |
# dataset = load_dataset('TJStatsApps/mlb_data', data_files=[f'{level}_pitch_data_{season}.csv' ])
|
| 94 |
dataset = pl.read_parquet(f"hf://datasets/TJStatsApps/mlb_data/data/{level}_pitch_data_{season}.parquet")
|
| 95 |
-
dataset_train = dataset['train']
|
| 96 |
-
df =
|
| 97 |
df['batter_name_team'] = df['batter_name'] + ' - ' + df['batter_team']
|
| 98 |
|
| 99 |
# Sample dictionary
|
|
|
|
| 6 |
import json
|
| 7 |
import streamlit as st
|
| 8 |
import pandas as pd
|
| 9 |
+
import polars as pl
|
| 10 |
from st_aggrid import AgGrid, GridOptionsBuilder, GridUpdateMode
|
| 11 |
|
| 12 |
|
|
|
|
| 93 |
level = 'mlb'
|
| 94 |
# dataset = load_dataset('TJStatsApps/mlb_data', data_files=[f'{level}_pitch_data_{season}.csv' ])
|
| 95 |
dataset = pl.read_parquet(f"hf://datasets/TJStatsApps/mlb_data/data/{level}_pitch_data_{season}.parquet")
|
| 96 |
+
# dataset_train = dataset['train']
|
| 97 |
+
# Convert the polars frame to pandas, discard the first column, and keep only
# the last row seen for each play_id.
# `dataset_train` no longer exists (the HF `load_dataset` path is commented
# out), so the first column name is taken from the polars frame itself.
# NOTE(review): dropping the first column assumes the parquet file still
# carries the same leading index-like column the CSV dataset had — confirm.
df = (
    dataset.to_pandas()
    .set_index(dataset.columns[0])
    .reset_index(drop=True)
    .drop_duplicates(subset=['play_id'], keep='last')
)
|
| 98 |
df['batter_name_team'] = df['batter_name'] + ' - ' + df['batter_team']
|
| 99 |
|
| 100 |
# Sample dictionary
|