Spaces:

binaychandra
/

npdstudio_predapi

Sleeping

App Files Files Community

npdstudio_predapi / helper.py

binaychandra

Refactor DataFrame creation in API response processing for clarity

1461675 about 1 year ago

raw

history blame

6.59 kB

	import pandas as pd
	import numpy as np
	import json

	def process_api_response(json_response):
	    """Split an API response into prediction and similarity dictionaries.

	    Args:
	        json_response: The response payload, either an already-decoded
	            mapping or a JSON document as ``str``/``bytes``/``bytearray``.
	            The keys ``"predictions"`` and ``"similarity_attr"`` are read;
	            each falls back to an empty dict when absent.

	    Returns:
	        A ``(predictions, similarity_attr)`` tuple. Each element is the
	        result of loading the corresponding section into a
	        ``pandas.DataFrame`` and calling ``to_dict()`` on it, i.e. a
	        ``{column: {index: value}}`` mapping.

	    Raises:
	        json.JSONDecodeError: If a string payload is not valid JSON.
	        AttributeError: If the (decoded) payload has no ``get`` method.
	    """
	    print("Type of json_response : ", type(json_response))

	    # The payload may still be serialized; decode it so the lookups below
	    # work for both raw JSON text and pre-parsed dictionaries.
	    if isinstance(json_response, (str, bytes, bytearray)):
	        input_data = json.loads(json_response)
	    else:
	        input_data = json_response

	    predictions = input_data.get("predictions", {})
	    similarity_attr = input_data.get("similarity_attr", {})

	    # Round-trip through DataFrame so both sections come back in the same
	    # column-keyed dictionary layout regardless of how they were supplied.
	    predictions_dict = pd.DataFrame(predictions).to_dict()
	    similarity_dict = pd.DataFrame(similarity_attr).to_dict()

	    return predictions_dict, similarity_dict

	def get_sample_similarity_attr():
	    """Return a fixed sample of similarity attributes.

	    The result maps five identifiers (``GB1263``, ``GB1264``, ``GB1450``,
	    ``GB1561``, ``GB1650``) to a dictionary with the keys ``description``,
	    ``sell_in_volume``, ``similarity``, ``distribution`` and ``week_date``.
	    A new dictionary with independent lists is built on every call.
	    """
	    placeholder_text = "THIS IS A SAMPLE DESCRIPTION"

	    # Sixteen weekly dates shared by the first three entries.
	    weeks_from_may = (
	        "2024-05-13", "2024-05-20", "2024-05-27", "2024-06-03",
	        "2024-06-10", "2024-06-17", "2024-06-24", "2024-07-01",
	        "2024-07-08", "2024-07-15", "2024-07-22", "2024-07-29",
	        "2024-08-05", "2024-08-12", "2024-08-19", "2024-08-26",
	    )
	    # Eleven weekly dates; GB1561 uses only the first six of them.
	    weeks_from_feb = (
	        "2024-02-12", "2024-02-19", "2024-02-26", "2024-03-04",
	        "2024-03-11", "2024-03-18", "2024-03-25", "2024-04-01",
	        "2024-04-08", "2024-04-15", "2024-04-22",
	    )

	    def build_entry(volume, score, distribution, weeks):
	        # list(weeks) hands every entry its own list object.
	        return {
	            "description": placeholder_text,
	            "sell_in_volume": volume,
	            "similarity": score,
	            "distribution": distribution,
	            "week_date": list(weeks),
	        }

	    return {
	        "GB1263": build_entry(
	            44426.88,
	            66.67,
	            [0, 0, 0, 0, 0, 0, 8, 9, 9, 9, 6, 5, 7, 25, 26, 27],
	            weeks_from_may,
	        ),
	        "GB1264": build_entry(
	            26840.97,
	            66.67,
	            [0, 0, 0, 0, 0, 0, 6, 8, 8, 8, 5, 4, 6, 25, 26, 27],
	            weeks_from_may,
	        ),
	        "GB1450": build_entry(
	            32346.0,
	            66.67,
	            [0, 0, 0, 0, 0, 0, 6, 8, 9, 8, 6, 4, 6, 25, 26, 27],
	            weeks_from_may,
	        ),
	        "GB1561": build_entry(
	            3265.92,
	            77.78,
	            [91, 34, 33, 33, 32, 33],
	            weeks_from_feb[:6],
	        ),
	        "GB1650": build_entry(
	            0.0,
	            77.78,
	            [38, 30, 24, 17, 14, 11, 9, 7, 7, 6, 5],
	            weeks_from_feb,
	        ),
	    }

	def generate_random_predictions():
	    """Generate a random monthly predictions table as a nested dictionary.

	    Four retailer columns (``ASDA``, ``MORRISONS``, ``SAINSBURYS``,
	    ``TESCO``) are filled with random values in ``[0, 10000)`` rounded to
	    two decimals. ``TOTAL_MARKET`` is the sum of the rounded retailer
	    values plus a random margin of at least 0.01 and below 1000, so it is
	    strictly greater than that sum even after rounding.

	    Returns:
	        ``{column: {month_label: value}}`` for 13 month labels, as produced
	        by ``DataFrame.to_dict()``.
	    """
	    num_rows = 13
	    retailers = ["ASDA", "MORRISONS", "SAINSBURYS", "TESCO"]
	    column_names = retailers + ["TOTAL_MARKET"]

	    # NOTE(review): the year suffix changes only after "Mar", so the labels
	    # run ... "Dec-25", "Jan-25", "Feb-25", "Mar-25", "Apr-26". Kept as-is
	    # because consumers may rely on these keys - confirm whether a
	    # fiscal-year label is intended.
	    month_names = [
	        "Apr", "May", "Jun", "Jul", "Aug", "Sep",
	        "Oct", "Nov", "Dec", "Jan", "Feb", "Mar",
	    ]
	    months = [
	        f"{month}-{year}" for year in (25, 26) for month in month_names
	    ][:num_rows]

	    # TOTAL_MARKET is drawn here as a placeholder (overwritten below) so the
	    # order and number of draws from NumPy's global RNG stay unchanged.
	    data = {col: np.random.rand(num_rows) * 10000 for col in column_names}

	    # Round before totalling so the invariant holds for the values that are
	    # actually returned, not just for the unrounded ones.
	    df = pd.DataFrame(data, index=months).round(2)

	    # A margin that rounds to 0.00 would make the total equal to the sum;
	    # clamp it to the smallest representable step at two decimals.
	    margin = np.maximum(np.round(np.random.rand(num_rows) * 1000, 2), 0.01)
	    df["TOTAL_MARKET"] = (df[retailers].sum(axis=1) + margin).round(2)

	    return df.to_dict()