superkartapi / app.py
dyanaj's picture
Upload folder using huggingface_hub
10e06ce verified
# Import necessary libraries
import numpy as np
import joblib # For loading the serialized model
import pandas as pd # For data manipulation
from flask import Flask, request, jsonify # For creating the Flask API
# Initialize the Flask application
superkart_revenue_predictor_api = Flask("Predict Product Store Sales based on product and store attributes")
# Load the trained machine learning model
model = joblib.load("superkart_revenue_prediction_model_v1_0.joblib")
# Define a route for the home page (GET request)
@superkart_revenue_predictor_api.get('/')
def home():
"""
This function handles GET requests to the root URL ('/') of the API.
It returns a simple welcome message.
"""
return "Welcome to the SuperKart Sales Prediction API!"
# Define an endpoint for single property prediction (POST request)
@superkart_revenue_predictor_api.post('/v1/sales')
def predict_sales_price():
"""
This function handles POST requests to the '/v1/sales' endpoint.
It expects a JSON payload containing property details and returns
the predicted sales price as a JSON response.
"""
# Get the JSON data from the request body
product_data = request.get_json()
# Extract relevant features from the JSON data
json_extract = {
'Product_Weight': product_data['Product_Weight'],
'Product_Sugar_Content': product_data['Product_Sugar_Content'],
'Product_Allocated_Area': product_data['Product_Allocated_Area'],
'Product_Type': product_data['Product_Type'],
'Product_MRP': product_data['Product_MRP'],
'Store_Id': product_data['Store_Id'],
'Store_Size': product_data['Store_Size'],
'Store_Location_City_Type': product_data['Store_Location_City_Type'],
'Store_Type': product_data['Store_Type'],
'Product_Category': product_data['Product_Category'],
'Perishable': product_data['Perishable'],
'Store_Age': product_data['Store_Age']
}
# Convert the extracted data into a Pandas DataFrame
input_data = pd.DataFrame([json_extract])
# Change MRP to Log as this is done before pipeline (feature engineering)
input_data['MRP_log'] = np.log(input_data['Product_MRP'])
input_data['Price_Per_Display'] = input_data['Product_MRP'] * input_data['Product_Allocated_Area']
# Make prediction
predicted_price = model.predict(input_data)[0]
# Return the actual price
return jsonify({'Predicted Sales': predicted_price})
# Define an endpoint for batch prediction (POST request)
@superkart_revenue_predictor_api.post('/v1/salesbatch')
def predict_salesprice_batch():
"""
This function handles POST requests to the '/v1/salesbatch' endpoint.
It expects a CSV file containing property details for multiple properties
and returns the predicted sales prices as a dictionary in the JSON response.
"""
# Get the uploaded CSV file from the request
file = request.files['file']
# Read the CSV file into a Pandas DataFrame
input_data = pd.read_csv(file)
# Change MRP to Log as this is done before pipeline (feature engineering)
input_data['MRP_log'] = np.log(input_data['Product_MRP'])
input_data['Price_Per_Display'] = input_data['Product_MRP'] * input_data['Product_Allocated_Area']
# Save ID
product_ids = input_data['Product_Id']
# Drop ID
input_data = input_data.drop('Product_Id', axis=1)
# Make predictions for all properties in the DataFrame (get log_prices)
predicted_prices = model.predict(input_data).tolist()
# Create a dictionary of predictions with property IDs as keys
output_dict = dict(zip(product_ids, predicted_prices))
# Return the predictions dictionary as a JSON response
return output_dict
# Run the Flask application in debug mode if this script is executed directly
if __name__ == '__main__':
superkart_revenue_predictor_api.run(debug=True)