"""Flask API that serves sales predictions from the serialized Superkart model."""

# Import necessary libraries
import numpy as np
import joblib  # For loading the serialized model
import pandas as pd  # For data manipulation
from flask import Flask, request, jsonify  # For creating the Flask API

# Initialize the Flask application
sales_predictor_api = Flask("Superkart Sales Predictor")

# Load the trained machine learning model once, at import time, so every
# request reuses the same in-memory object.
# NOTE(review): joblib files are pickle-based; only load artifacts from a
# trusted location.
model = joblib.load("superkart_sales_prediction_model_v1_0.joblib")

# Maps each DataFrame column handed to the model to the JSON key it is read
# from in the '/v1/sales' request body. Insertion order defines column order.
_FEATURE_FIELDS = {
    'product_sugar_content': 'Product_Sugar_Content',
    'product_type': 'Product_Type',
    'store_establishment_year': 'Store_Establishment_Year',
    'store_size': 'Store_Size',
    'store_location_city_type': 'Store_Location_City_Type',
    'store_type': 'Store_Type',
}


def _bad_request(message):
    """Build a JSON error body paired with HTTP status 400."""
    return jsonify({'error': message}), 400


def _log_to_sales(log_value):
    """Exponentiate a model output and return it as a 2-decimal Python float.

    The explicit ``float(...)`` matters: NumPy scalar types such as float32
    are not JSON serializable, so they must be converted before ``jsonify``.
    NOTE(review): this assumes the model predicts the natural log of sales
    (the code has always exponentiated its output) - confirm against the
    training pipeline.
    """
    return round(float(np.exp(log_value)), 2)


# Define a route for the home page (GET request)
@sales_predictor_api.get('/')
def home():
    """Handle GET requests to '/' by returning a plain welcome message."""
    return "Welcome to the Superkart Sales Prediction API!"


# Define an endpoint for single-record prediction (POST request)
@sales_predictor_api.post('/v1/sales')
def predict_sales():
    """Handle POST requests to '/v1/sales'.

    Expects a JSON object containing the keys listed as values of
    ``_FEATURE_FIELDS`` and responds with a JSON object holding the
    exponentiated, rounded model prediction under the key
    'Predicted Price (in dollars)'.

    Returns HTTP 400 with an ``error`` message when the body is not a JSON
    object or when any required key is absent.
    """
    # Get the JSON data from the request body
    data = request.get_json()
    if not isinstance(data, dict):
        return _bad_request('Request body must be a JSON object.')

    # Report every missing field at once instead of failing on the first one
    # with an unhandled KeyError (which would surface as a 500).
    missing = [key for key in _FEATURE_FIELDS.values() if key not in data]
    if missing:
        return _bad_request(f"Missing required field(s): {', '.join(missing)}")

    # Extract relevant features and wrap them in a single-row DataFrame
    sample = {column: data[key] for column, key in _FEATURE_FIELDS.items()}
    input_data = pd.DataFrame([sample])

    # Make the prediction and convert it back from log scale
    predicted_log_sales = model.predict(input_data)[0]
    predicted_sales = _log_to_sales(predicted_log_sales)

    # The response key is kept as-is for backward compatibility with clients.
    return jsonify({'Predicted Price (in dollars)': predicted_sales})


# Define an endpoint for batch prediction (POST request)
@sales_predictor_api.post('/v1/salesbatch')
def predict_rental_price_batch():
    """Handle POST requests to '/v1/salesbatch'.

    Expects a CSV upload in the multipart form field 'file'. The CSV must
    contain an 'id' column; the whole DataFrame (including 'id') is passed to
    the model. Responds with a JSON object mapping each 'id' value to its
    exponentiated, rounded prediction. If an 'id' value repeats, the last
    row's prediction wins.

    Returns HTTP 400 with an ``error`` message when the upload is missing,
    cannot be parsed as CSV, or lacks the 'id' column.

    The function name is retained because it is the registered Flask
    endpoint name.
    """
    # Get the uploaded CSV file from the request
    uploaded = request.files.get('file')
    if uploaded is None:
        return _bad_request("No CSV uploaded under the 'file' form field.")

    # Read the CSV file into a Pandas DataFrame
    try:
        input_data = pd.read_csv(uploaded)
    except (pd.errors.EmptyDataError, pd.errors.ParserError,
            UnicodeDecodeError) as exc:
        return _bad_request(f'Could not parse the uploaded CSV: {exc}')

    # Check for the identifier column before spending time on inference.
    if 'id' not in input_data.columns:
        return _bad_request("The uploaded CSV must contain an 'id' column.")

    # Make predictions for all rows (log scale), then convert each one
    predicted_log_sales = model.predict(input_data).tolist()
    predicted_sales = [_log_to_sales(value) for value in predicted_log_sales]

    # Create a dictionary of predictions keyed by the 'id' column
    store_ids = input_data['id'].tolist()
    output_dict = dict(zip(store_ids, predicted_sales))

    # Return the predictions dictionary as a JSON response
    return jsonify(output_dict)


# Run the Flask application in debug mode if this script is executed directly
if __name__ == '__main__':
    # NOTE(review): debug=True enables the interactive Werkzeug debugger and
    # must not be used for a publicly reachable deployment.
    sales_predictor_api.run(debug=True)