Spaces:
Sleeping
Sleeping
File size: 12,579 Bytes
77e4681 44194c1 77e4681 fb9a9f7 dddb168 77e4681 7b67d15 77e4681 106c4ee 77e4681 7a80507 537155f 7a80507 44194c1 77e4681 7a80507 537155f 7a80507 537155f 7a80507 77e4681 f930989 77e4681 50a8196 2284e44 3b09d0d 53b2fcb 3b09d0d 106c4ee 53b2fcb 3b09d0d 106c4ee 3b09d0d 106c4ee 537155f f930989 106c4ee 537155f 7b8ca14 537155f 7b8ca14 537155f 7b8ca14 537155f 106c4ee 9829b2b 106c4ee 537155f 9829b2b 537155f 106c4ee 44340d5 2284e44 a01b0c9 106c4ee 537155f 7b67d15 8067975 7b67d15 537155f 7b67d15 7a80507 7b67d15 98dbcff 537155f 2d9d701 537155f 8f1417a 98dbcff dddb168 bc94eec bd49433 98dbcff bd49433 537155f bd49433 537155f bd49433 537155f 98dbcff bd49433 44194c1 a48545d 537155f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 |
import os
from paddleocr import PaddleOCR
from PIL import Image
import gradio as gr
import requests
import re
from simple_salesforce import Salesforce
import pandas as pd
import matplotlib.pyplot as plt
from io import BytesIO
from fuzzywuzzy import process
import kaleido # Ensure kaleido is imported
# Attribute mappings: readable names to Salesforce API names
ATTRIBUTE_MAPPING = {
"Product name": "Productname__c",
"Colour": "Colour__c",
"Motortype": "Motortype__c",
"Frequency": "Frequency__c",
"Grossweight": "Grossweight__c",
"Ratio": "Ratio__c",
"MotorFrame": "Motorframe__c",
"Model": "Model__c",
"Speed": "Speed__c",
"Quantity": "Quantity__c",
"Voltage": "Voltage__c",
"Material": "Material__c",
"Type": "Type__c",
"Horsepower": "Horsepower__c",
"Consignee": "Consignee__c",
"LOT": "LOT__c",
"Stage": "Stage__c",
"Outlet": "Outlet__c",
"Serialnumber": "Serialnumber__c",
"HeadSize": "Headsize__c",
"Deliverysize": "Deliverysize__c",
"Phase": "Phase__c",
"Size": "Size__c",
"MRP": "MRP__c",
"Usebefore": "Usebefore__c",
"Height": "Height__c",
"MaximumDischarge Flow": "Maximumdischargeflow__c",
"DischargeRange": "Dischargeflow__c",
"Assembledby": "Manufacturer__c",
"Manufacturedate": "Manufacturedate__c",
"Companyname": "Companyname__c",
"Customercarenumber": "Customercarenumber__c",
"SellerAddress": "Selleraddress__c",
"Selleremail": "Selleremail__c",
"GSTIN": "GSTIN__c",
"Totalamount": "Totalamount__c",
"Paymentstatus": "Paymentstatus__c",
"Paymentmethod": "Paymentstatus__c",
"Invoicedate": "Manufacturedate__c",
"Warranty": "Warranty__c",
"Brand": "Brand__c",
"Motorhorsepower": "Motorhorsepower__c",
"Power": "Power__c",
"Motorphase": "Motorphase__c",
"Enginetype": "Enginetype__c",
"Tankcapacity": "Tankcapacity__c",
"Head": "Head__c",
"Usage/Application": "Usage_Application__c",
"Volts": "volts__c",
"Hertz": "Hertz__c",
"Frame": "frame__c",
"Mounting": "Mounting__c",
"Tollfreenumber": "Tollfreenumber__c",
"Pipesize": "Pipesize__c",
"Manufacturer": "Manufacturer__c",
"Office": "Office__c",
"SRnumber": "SRnumber__c",
"TypeOfEndUse": "TypeOfEndUse__c",
"Model Name": "Model_Name_Number__c",
"coolingmethod": "coolingmethod__c",
"H.P.": "H_p__c"
}
# List of product names to match
PRODUCT_NAMES = [
"Fusion", "Agroking", "openwell", "CG commercial motors", "Jaguar", "Submersible pumps", "Gaurav"
]
# Salesforce credentials
SALESFORCE_USERNAME = "venkatramana@sandbox.com"
SALESFORCE_PASSWORD = "Venkat12345@"
SALESFORCE_SECURITY_TOKEN = "GhcJJmjBEefdnukJoz4CAQlR"
# Initialize PaddleOCR
ocr = PaddleOCR(use_angle_cls=True, lang='en')
# Function to extract text using PaddleOCR
def extract_text(image):
result = ocr.ocr(image)
extracted_text = []
for line in result[0]:
extracted_text.append(line[1][0])
return "\n".join(extracted_text)
# Function to match product name using fuzzy matching
def match_product_name(extracted_text):
best_match = None
best_score = 0
for line in extracted_text.split("\n"):
match, score = process.extractOne(line, PRODUCT_NAMES)
if score > best_score:
best_match = match
best_score = score
return best_match if best_score >= 70 else None # Threshold of 70 for a match
# Function to extract attributes and their values
def extract_attributes(extracted_text):
attributes = {}
for readable_attr, sf_attr in ATTRIBUTE_MAPPING.items():
pattern = rf"{re.escape(readable_attr)}[:\-]?\s*(.+)"
match = re.search(pattern, extracted_text, re.IGNORECASE)
if match:
attributes[readable_attr] = match.group(1).strip()
return attributes
# Function to filter attributes for valid Salesforce fields
def filter_valid_attributes(attributes, valid_fields):
return {ATTRIBUTE_MAPPING[key]: value for key, value in attributes.items() if ATTRIBUTE_MAPPING[key] in valid_fields}
# Function to interact with Salesforce based on mode and type
def interact_with_salesforce(mode, entry_type, quantity, attributes):
try:
sf = Salesforce(
username=SALESFORCE_USERNAME,
password=SALESFORCE_PASSWORD,
security_token=SALESFORCE_SECURITY_TOKEN
)
object_name = None
field_name = None
field_names = []
product_field_name = "Productname__c"
model_field_name = "Model__c"
stage_field_name = "Stage__c"
hp_field_name = "H_p__c"
if mode == "Entry":
if entry_type == "Sales":
object_name = "VENKATA_RAMANA_MOTORS__c"
field_name = "Quantity__c"
elif entry_type == "Non-Sales":
object_name = "UNBILLING_DATA__c"
field_name = "TotalQuantity__c"
elif mode == "Exit":
if entry_type == "Sales":
object_name = "Inventory_Management__c"
field_names = ["Quantity_Sold__c", "soldstock__c"]
elif entry_type == "Non-Sales":
object_name = "Un_Billable__c"
field_names = ["Sold_Out__c", "soldstock__c"]
if not object_name or (not field_name and not field_names):
return "Invalid mode or entry type."
sf_object = sf.__getattr__(object_name)
schema = sf_object.describe()
valid_fields = {field["name"] for field in schema["fields"]}
filtered_attributes = filter_valid_attributes(attributes, valid_fields)
if mode == "Exit":
query_conditions = [f"{product_field_name} = '{attributes['Product name']}'"]
if "Model Name" in attributes and attributes["Model Name"]:
query_conditions.append(f"{model_field_name} = '{attributes['Model Name']}'")
if "Stage" in attributes and attributes["Stage"]:
query_conditions.append(f"{stage_field_name} = '{attributes['Stage']}'")
if "H.P." in attributes and attributes["H.P."]:
query_conditions.append(f"{hp_field_name} = '{attributes['H.P.']}'")
query = f"SELECT Id, {', '.join(field_names)} FROM {object_name} WHERE {' AND '.join(query_conditions)} LIMIT 1"
response = sf.query(query)
if response["records"]:
record_id = response["records"][0]["Id"]
updated_fields = {field: quantity for field in field_names}
sf_object.update(record_id, updated_fields)
return f"β
Updated record for product '{attributes['Product name']}' in {object_name}. Updated fields: {updated_fields}."
else:
return f"β No matching record found for product '{attributes['Product name']}' in {object_name}."
else:
filtered_attributes[field_name] = quantity
sf_object.create(filtered_attributes)
return f"β
Data successfully exported to Salesforce object {object_name}."
except Exception as e:
return f"β Error interacting with Salesforce: {str(e)}"
# Function to process image, extract attributes, and allow editing
def process_image(image, mode, entry_type, quantity):
extracted_text = extract_text(image)
if not extracted_text:
return "No text detected in the image.", None, None
product_name = match_product_name(extracted_text)
attributes = extract_attributes(extracted_text)
if product_name:
attributes["Product name"] = product_name
# Ensure fixed attributes are present
for fixed_attr in ["Stage", "H.P.", "Product name", "Model"]:
if fixed_attr not in attributes:
attributes[fixed_attr] = ""
# Convert attributes to DataFrame for editing
df = pd.DataFrame(list(attributes.items()), columns=["Attribute", "Value"])
return f"Extracted Text:\n{extracted_text}", df, None
# Function to handle edited attributes and export to Salesforce
def export_to_salesforce(mode, entry_type, quantity, edited_df):
try:
# Convert edited DataFrame back to dictionary
edited_attributes = dict(zip(edited_df["Attribute"], edited_df["Value"]))
# Export to Salesforce
message = interact_with_salesforce(mode, entry_type, quantity, edited_attributes)
return message
except Exception as e:
return f"β Error exporting to Salesforce: {str(e)}"
# Function to pull structured data from Salesforce and display as a table
def pull_data_from_salesforce(data_type):
try:
sf = Salesforce(
username=SALESFORCE_USERNAME,
password=SALESFORCE_PASSWORD,
security_token=SALESFORCE_SECURITY_TOKEN
)
if data_type == "Inventory":
query = "SELECT Productname__c, Current_Stocks__c, soldstock__c FROM Inventory_Management__c LIMIT 100"
else:
query = "SELECT Productname__c, Current_Stock__c, soldstock__c FROM Un_Billable__c LIMIT 100"
response = sf.query_all(query)
records = response.get("records", [])
if not records:
return "No data found in Salesforce.", None, None, None
df = pd.DataFrame(records)
df = df.drop(columns=['attributes'], errors='ignore')
# Rename columns for better readability
df.rename(columns={
"Productname__c": "Product Name",
"Current_Stocks__c": "Current Stocks",
"Current_Stock__c": "Current Stocks",
"soldstock__c": "Sold Stock"
}, inplace=True)
excel_path = "salesforce_data.xlsx"
df.to_excel(excel_path, index=False)
# Generate interactive vertical bar graph using Matplotlib
fig, ax = plt.subplots(figsize=(12, 8))
df.plot(kind='bar', x="Product Name", y="Current Stocks", ax=ax, legend=False)
ax.set_title("Stock Distribution by Product Name")
ax.set_xlabel("Product Name")
ax.set_ylabel("Current Stocks")
plt.xticks(rotation=45, ha="right", fontsize=10)
plt.tight_layout()
buffer = BytesIO()
plt.savefig(buffer, format="png")
buffer.seek(0)
img = Image.open(buffer)
return df, excel_path, img
except Exception as e:
return f"Error fetching data: {str(e)}", None, None, None
# Gradio Interface
def app():
with gr.Blocks() as demo:
with gr.Tab("π₯ OCR Processing"):
with gr.Row():
image_input = gr.Image(type="numpy", label="π Upload Image")
mode_input = gr.Dropdown(label="π Mode", choices=["Entry", "Exit"], value="Entry")
entry_type_input = gr.Radio(label="π¦ Entry Type", choices=["Sales", "Non-Sales"], value="Sales")
quantity_input = gr.Number(label="π’ Quantity", value=1, interactive=True)
extract_button = gr.Button("Extract Text and Attributes")
extracted_text_output = gr.Text(label="π Extracted Image Data")
editable_df_output = gr.Dataframe(label="βοΈ Edit Attributes (Key-Value Pairs)", interactive=True)
ok_button = gr.Button("OK")
result_output = gr.Text(label="π Result")
with gr.Tab("π Salesforce Data"):
data_type_input = gr.Dropdown(label="Select Data Type", choices=["Inventory", "Unbilling"], value="Inventory")
pull_button = gr.Button("Pull Data from Salesforce")
salesforce_data_output = gr.Dataframe(label="π Salesforce Data")
excel_download_output = gr.File(label="π₯ Download Excel")
graph_output = gr.Image(label="π Stock Distribution Graph")
# Define button actions
extract_button.click(
fn=process_image,
inputs=[image_input, mode_input, entry_type_input, quantity_input],
outputs=[extracted_text_output, editable_df_output, result_output]
)
ok_button.click(
fn=export_to_salesforce,
inputs=[mode_input, entry_type_input, quantity_input, editable_df_output],
outputs=[result_output]
)
pull_button.click(
fn=pull_data_from_salesforce,
inputs=[data_type_input],
outputs=[salesforce_data_output, excel_download_output, graph_output]
)
return demo
if __name__ == "__main__":
app().launch(share=True) |