Spaces:
Runtime error
Runtime error
| import gradio as gr | |
| import pandas as pd | |
| from sklearn.preprocessing import PolynomialFeatures | |
| from pymongo import MongoClient | |
| import pickle | |
| import joblib | |
| # --- MongoDB Setup --- | |
| uri = "mongodb+srv://csmith715:I3xSO3ImRKFyQ0hf@cluster0.hc5mw.mongodb.net/" | |
| client = MongoClient(uri) | |
| database = client.get_database("gemrate") | |
| market_data = database.get_collection("alt_market_data") | |
| # --- Load Model and Encoder --- | |
| gradient_boosting_reg = joblib.load('gbm_card_model.joblib') | |
| with open('card_encoder.pkl', 'rb') as file: | |
| loaded_encoder = pickle.load(file) | |
| # --- Helper Functions --- | |
| def transform_data(dframe): | |
| dframe = pd.get_dummies(dframe, columns=['grader']) | |
| dframe['ds'] = pd.to_datetime(dframe['ds']) | |
| dframe['year'] = dframe['ds'].dt.year | |
| dframe['month'] = dframe['ds'].dt.month | |
| dframe['day_of_week'] = dframe['ds'].dt.dayofweek | |
| dframe = dframe.drop('ds', axis=1) | |
| dframe['grade'] = pd.to_numeric(dframe['grade'], errors='coerce') | |
| poly = PolynomialFeatures(degree=3, include_bias=False) | |
| grade_poly = poly.fit_transform(dframe[['grade']]) | |
| grade_poly_df = pd.DataFrame(grade_poly, columns=['grade1', 'grade^2', 'grade^3']) | |
| dframe = pd.concat([dframe, grade_poly_df], axis=1) | |
| dframe = dframe.drop('grade1', axis=1) | |
| return dframe | |
| def calculate_moving_averages(dframe): | |
| dframe['ds'] = pd.to_datetime(dframe['ds']) | |
| dframe['y'] = dframe['y'].astype(float) | |
| dframe = dframe.sort_values(by=['certnumber', 'grade', 'grader', 'ds']) | |
| dframe.set_index('ds', inplace=True) | |
| def compute_group_moving_averages(group): | |
| group = group.sort_index() | |
| group['ma_3d'] = group['y'].rolling('3D').mean() | |
| group['ma_7d'] = group['y'].rolling('7D').mean() | |
| group['ma_30d'] = group['y'].rolling('30D').mean() | |
| return group | |
| grouped = dframe.groupby(['certnumber', 'grade', 'grader'], group_keys=False) | |
| dframe = grouped.apply(compute_group_moving_averages) | |
| return dframe.reset_index() | |
| def lookup_certnumber(certnumber): | |
| results = market_data.find( | |
| {'cert_number': certnumber}, | |
| { | |
| '_id': 0, | |
| 'market_transaction.date': 1, | |
| 'market_transaction.price': 1, | |
| 'market_transaction.attributes.gradeNumber': 1, | |
| 'market_transaction.attributes.gradingCompany': 1 | |
| } | |
| ) | |
| data = [] | |
| for r in results: | |
| tx = r.get('market_transaction', {}) | |
| attributes = tx.get('attributes', {}) | |
| data.append({ | |
| 'ds': tx.get('date'), | |
| 'y': tx.get('price'), | |
| 'grade': attributes.get('gradeNumber'), | |
| 'grader': attributes.get('gradingCompany') | |
| }) | |
| df = pd.DataFrame(data) | |
| df['certnumber'] = [certnumber] * df.shape[0] | |
| return df | |
| # --- Prediction Logic --- | |
| def predict_price(certnumber, grader, grade): | |
| cert_df = lookup_certnumber(certnumber) | |
| if cert_df.empty: | |
| return "No data found for this cert number.", pd.DataFrame() | |
| cert_df = cert_df[(cert_df['grader'] == grader) & (cert_df['grade'] == grade)] | |
| if cert_df.empty: | |
| return "No matching data found for this grader and grade.", pd.DataFrame() | |
| moving_average_df = calculate_moving_averages(cert_df) | |
| moving_average_df['certnumber'] = moving_average_df['certnumber'].astype(str) | |
| # Encode certnumber | |
| moving_average_df['certnumber_encoded'] = loaded_encoder.fit_transform( | |
| moving_average_df['certnumber'], moving_average_df['y']) | |
| filtered_cert_df = moving_average_df.drop(['y', 'certnumber'], axis=1) | |
| max_fdate = filtered_cert_df['ds'].max() | |
| filtered_df = filtered_cert_df[filtered_cert_df['ds'] == max_fdate] | |
| tdf = transform_data(filtered_df).fillna(0) | |
| tdf = tdf[tdf.grade != 0] | |
| model_columns = gradient_boosting_reg.feature_names_in_ | |
| for col in model_columns: | |
| if col not in tdf.columns: | |
| tdf[col] = [0]*tdf.shape[0] | |
| tdf = tdf[model_columns] | |
| predictions = gradient_boosting_reg.predict(tdf) | |
| tdf['Predicted Price'] = predictions | |
| return f"Predicted Price: ${predictions[0]:,.2f}", tdf | |
| # --- Gradio UI --- | |
| with gr.Blocks() as demo: | |
| gr.Markdown("# Pokémon Card Price Predictor") | |
| cert_input = gr.Number(label="Cert Number", precision=0) | |
| grader_input = gr.Dropdown(choices=["PSA", "BGS", "CGC"], label="Grader") | |
| grade_input = gr.Textbox(label="Grade (e.g., 10.0)") | |
| submit_btn = gr.Button("Predict Price") | |
| output_text = gr.Textbox(label="Prediction Result") | |
| output_df = gr.Dataframe(label="Transformed Input Features") | |
| submit_btn.click( | |
| predict_price, | |
| inputs=[cert_input, grader_input, grade_input], | |
| outputs=[output_text, output_df] | |
| ) | |
| demo.launch(auth=("pokecards", "exqeQbBHrKVL")) | |