# Origin: commit 36d4766 ("new tre54") by danMendes-bossanova
# NOTE(review): the three lines above were raw GitHub page residue pasted into
# the file (username / commit message / hash) and made the module a SyntaxError;
# converted to this comment so the script can run.
import gradio as gr
import torch
import open_clip
import numpy as np
import pandas as pd
import requests
import json
from PIL import Image
from huggingface_hub import hf_hub_download
# ============================= CARREGA TUDO =============================
REPO = "eulerLabs/amazon-br-taxonomy-jfactor"

print("Carregando arquivos do dataset...")


def _fetch(filename):
    """Download one file from the dataset repo and return its local path."""
    return hf_hub_download(REPO, filename, repo_type="dataset")


def _read_json(path):
    """Parse a JSON file from disk."""
    with open(path) as fh:
        return json.load(fh)


# Download everything up front (same order as before), then parse.
tax_file = _fetch("amazon-br-taxonomy.json")
flat_file = _fetch("categories-flat.json")
cache_file = _fetch("marqo-ecommerce-B-cache-crad-K32-aligned.npy")
proj_file = _fetch("projection_matrix_B_to_32.npy")

# Taxonomy tree plus the flat category list (row order of the embedding cache).
TAXONOMY = _read_json(tax_file)
CATS = _read_json(flat_file)

# Pre-computed 32-d category embeddings; one row per entry of CATS.
CACHE_32D = np.load(cache_file).astype(np.float32)
CACHE_DICT = dict(zip(CATS, CACHE_32D))

# Projection matrix mapping the image-encoder output down to the 32-d cache space.
PROJ = torch.from_numpy(np.load(proj_file)).float()

# Marqo e-commerce CLIP backbone used to embed product photos.
model, _, preprocess = open_clip.create_model_and_transforms("hf-hub:Marqo/marqo-ecommerce-embeddings-B")
model.eval()
# ============================= CLASSIFICAÇÃO =============================
@torch.no_grad()
def classify(image=None, url="", beam_width=5):
    """Classify a product image into the Amazon-BR taxonomy via beam search.

    Args:
        image: PIL image of the product; takes precedence over ``url``.
        url: optional image URL, used only when ``image`` is None.
        beam_width: number of partial paths kept alive per taxonomy level.

    Returns:
        pandas.DataFrame with one row per level of the best taxonomy path,
        or a single-column "Erro"/"Resultado" DataFrame on failure.
    """
    # `url and ...` guards against url=None (the original crashed on .strip()).
    if image is None and url and url.strip():
        try:
            resp = requests.get(url, stream=True, timeout=10)
            image = Image.open(resp.raw).convert("RGB")
        except Exception:
            # Any download/decode failure is reported to the user; a bare
            # `except:` here previously also swallowed KeyboardInterrupt.
            return pd.DataFrame({"Erro": ["Não foi possível carregar a imagem da URL"]})
    if image is None:
        return pd.DataFrame({"Erro": ["Faça upload ou cole uma URL"]})

    # Embed the image and project into the 32-d space of the cached vectors.
    emb768 = model.encode_image(preprocess(image).unsqueeze(0))
    emb32 = (emb768 @ PROJ).squeeze(0)
    emb32 = emb32 / emb32.norm(dim=-1, keepdim=True)

    def mean_score(path, total):
        """Average per-level similarity; 0.0 for an empty path."""
        return total / len(path) if path else 0.0

    # Beam search down the taxonomy tree. `beam` holds (node, path, score_sum)
    # triples; `finished` collects paths that reached a leaf. The original code
    # pushed malformed 2-tuples for leaves into `candidates`, which crashed the
    # sort key (x[2]) as soon as any branch bottomed out — and completed paths
    # were silently dropped instead of competing for the final answer.
    finished = []
    beam = [(TAXONOMY, [], 0.0)]
    while beam:
        candidates = []
        for node, path, total in beam:
            expanded = False
            if isinstance(node, dict):
                for cat, child in node.items():
                    if cat in CACHE_DICT:
                        sim_raw = torch.cosine_similarity(
                            emb32, torch.tensor(CACHE_DICT[cat]), dim=0
                        ).item()
                        # Map cosine similarity from [-1, 1] into [0, 1].
                        sim = round((sim_raw + 1) / 2, 4)
                        candidates.append((child, path + [(cat, sim)], total + sim))
                        expanded = True
            if not expanded and path:
                # Leaf: non-dict node, empty dict, or no cached children.
                finished.append((path, total))
        # Keep the beam_width paths with the best average similarity.
        candidates.sort(key=lambda c: mean_score(c[1], c[2]), reverse=True)
        beam = candidates[:beam_width]

    if not finished:
        return pd.DataFrame({"Resultado": ["Nenhum caminho encontrado"]})
    best_path, _ = max(finished, key=lambda c: mean_score(c[0], c[1]))
    rows = [[lvl + 1, cat, f"{score:.4f}"] for lvl, (cat, score) in enumerate(best_path)]
    return pd.DataFrame(rows, columns=["Nível", "Categoria", "Score"])
# ============================= INTERFACE =============================
with gr.Blocks(theme=gr.themes.Soft(), title="Jobim Visual Guru") as demo:
    # The header previously read "# obim Visual Gu" — a truncated paste of the
    # app title; restored to match the window title set on gr.Blocks above.
    gr.Markdown("# Jobim Visual Guru")
    gr.Markdown("**!**")  # placeholder tagline kept as-is — TODO: write a real subtitle

    with gr.Row():
        with gr.Column():
            img_input = gr.Image(type="pil", label="Foto do produto", height=480)
            url_input = gr.Textbox(label="ou cole a URL da imagem", placeholder="https://...")
            # Clickable example photos users can try without uploading.
            gr.Examples([
                "https://i.pinimg.com/736x/82/e7/47/82e747617f37fd4600634d7a27a1e561.jpg",
                "https://images.unsplash.com/photo-1542291026-7eec264c27ff?w=800",
            ], inputs=img_input)
        with gr.Column():
            beam_slider = gr.Slider(1, 15, value=5, step=1, label="Precisão (Beam Width)")
            btn = gr.Button("Classificar", variant="primary", size="lg")
            output = gr.Dataframe(headers=["Nível", "Categoria", "Score"], row_count=12, height=560)

    btn.click(classify, inputs=[img_input, url_input, beam_slider], outputs=output)

demo.launch()