# nrajwani's picture
# Upload folder using huggingface_hub
# 273a8b7 verified
# Import necessary libraries
import numpy as np
import joblib # For loading the serialized model
import pandas as pd # For data manipulation
from flask import Flask, request, jsonify # For creating the Flask API
# Initialize the Flask application.
# NOTE(review): Flask's first positional argument is the application's import
# name; a display string is passed here instead of the conventional __name__.
# Confirm this is intentional before relying on package-relative resources.
sales_predictor_api = Flask("Superkart Sales Predictor")
# Load the trained machine learning model once, at import time, so that both
# prediction endpoints below share the same `model` object.
# The path is relative, so it is resolved against the process's working directory.
# joblib.load unpickles the file; only ever point it at a trusted artifact.
model = joblib.load("superkart_sales_prediction_model_v1_0.joblib")
# Root route: answers GET / with a plain-text greeting
@sales_predictor_api.get('/')
def home():
    """
    Handle GET requests to the root URL ('/') of the API.

    Returns:
        The fixed welcome string shown to callers of the service root.
    """
    welcome_message = "Welcome to the Superkart Sales Prediction API!"
    return welcome_message
# Define an endpoint for single-record sales prediction (POST request)
@sales_predictor_api.post('/v1/sales')
def predict_sales():
    """
    Handle POST requests to the '/v1/sales' endpoint.

    Expects a JSON object carrying the product and store features listed in
    ``required_fields`` below, feeds them to the loaded model as a one-row
    DataFrame, and returns the prediction rounded to two decimals.

    Returns:
        On success, a JSON object of the form
        ``{'Predicted Sales (in dollars)': <float>}``.
        If the body is not a JSON object, or required fields are missing,
        a JSON object with an ``'error'`` message and HTTP status 400.
    """
    # Feature names read from the payload, in the column order used to
    # build the model's input DataFrame.
    required_fields = (
        'Product_Type',
        'Product_Sugar_Content',
        'Store_Establishment_Year',
        'Store_Size',
        'Store_Location_City_Type',
        'Store_Type',
        'Product_Weight',
        'Product_Allocated_Area',
        'Product_MRP',
    )

    # Get the JSON data from the request body
    data = request.get_json()

    # A syntactically valid JSON body may still be a list, number or null;
    # only an object can carry the named features, so reject anything else
    # with a client error instead of failing later with a 500.
    if not isinstance(data, dict):
        return jsonify({'error': 'Request body must be a JSON object.'}), 400

    missing_fields = [field for field in required_fields if field not in data]
    if missing_fields:
        message = f"Missing required fields: {', '.join(missing_fields)}"
        return jsonify({'error': message}), 400

    # Keep only the expected features; extra keys in the payload are ignored
    sample = {field: data[field] for field in required_fields}

    # Convert the extracted data into a single-row Pandas DataFrame
    input_data = pd.DataFrame([sample])

    # Make the prediction; the first element is the value for our only row
    predicted_sales = model.predict(input_data)[0]

    # Convert to a built-in float before serializing: the prediction is
    # presumably a NumPy scalar, which jsonify may not be able to encode.
    predicted_sales = round(float(predicted_sales), 2)

    return jsonify({'Predicted Sales (in dollars)': predicted_sales})
# Define an endpoint for batch sales prediction (POST request)
@sales_predictor_api.post('/v1/salesbatch')
def predict_sales_price_batch():
    """
    Handle POST requests to the '/v1/salesbatch' endpoint.

    Expects a multipart upload whose 'file' field is a CSV. The whole CSV is
    passed to the loaded model, and each prediction (rounded to two
    decimals) is paired with the value of that row's 'Store_Id' column.

    Returns:
        On success, a JSON object mapping each 'Store_Id' value to its
        predicted sales.
        If the upload is missing, the CSV cannot be parsed, or the
        'Store_Id' column is absent, a JSON object with an ``'error'``
        message and HTTP status 400.
    """
    # Get the uploaded CSV file from the request
    uploaded_file = request.files.get('file')
    if uploaded_file is None:
        return jsonify({'error': "No file uploaded under the form field 'file'."}), 400

    # Read the CSV file into a Pandas DataFrame; malformed or empty uploads
    # are a client error, not a server fault.
    try:
        input_data = pd.read_csv(uploaded_file)
    except (pd.errors.EmptyDataError, pd.errors.ParserError, UnicodeDecodeError) as exc:
        return jsonify({'error': f'Could not parse uploaded CSV: {exc}'}), 400

    # Check for the ID column before predicting, so a bad upload is rejected
    # up front rather than after the model has already run.
    if 'Store_Id' not in input_data.columns:
        return jsonify({'error': "CSV must contain a 'Store_Id' column."}), 400

    # Make predictions for all rows in the DataFrame
    predicted_sales_list = model.predict(input_data).tolist()

    # Round each prediction to two decimals as a built-in float
    predicted_sales = [round(float(sales), 2) for sales in predicted_sales_list]

    # Create a dictionary of predictions with store IDs as keys.
    # NOTE(review): if a 'Store_Id' value repeats across rows, later rows
    # overwrite earlier ones here and predictions are silently dropped.
    # Confirm IDs are unique per row, or change the response shape.
    store_ids = input_data['Store_Id'].tolist()
    output_dict = dict(zip(store_ids, predicted_sales))

    # Return the predictions dictionary as a JSON response
    return jsonify(output_dict)
# Script entry point: start Flask's built-in server only when this file is
# executed directly (not when it is imported by a WSGI server).
# debug=True turns on the reloader and interactive debugger, so this path
# is meant for local development only.
if __name__ == "__main__":
    sales_predictor_api.run(debug=True)