PatternPlacement

Sleeping

App Files Files Community

PatternPlacement / app.py

DumbledoreWiz

Update app.py

85dcc91 verified over 1 year ago

raw

history blame

2.57 kB

	import torch
	from transformers import ViTForImageClassification, ViTFeatureExtractor
	import gradio as gr
	from PIL import Image
	import os
	import logging

	# Configure the root logger once at import time: INFO and above, timestamped.
	logging.basicConfig(
	    format='%(asctime)s - %(levelname)s - %(message)s',
	    level=logging.INFO,
	)

	# Class names in training order; predict() pairs labels[i] with the i-th model output.
	labels = [
	    'Leggings',
	    'Jogger',
	    'Palazzo',
	    'Cargo',
	    'Dresspants',
	    'Chinos',
	]
	logging.info("Labels: %s", labels)

	# Define paths to the model files (all in the same directory as app.py).
	# Anchor on this script's location rather than the process working directory,
	# so the files are found even when the app is launched from elsewhere.
	model_dir = os.path.dirname(os.path.abspath(__file__))
	model_path = os.path.join(model_dir, "model.safetensors")
	config_path = os.path.join(model_dir, "config.json")
	preprocessor_path = os.path.join(model_dir, "preprocessor_config.json")

	# Fail fast with a clear error if any required file is missing.
	# isfile() also rejects a directory that happens to carry one of these names.
	for path in (model_path, config_path, preprocessor_path):
	    if not os.path.isfile(path):
	        logging.error(f"File not found: {path}")
	        raise FileNotFoundError(f"Required file not found: {path}")
	    logging.info(f"Found file: {path}")

	# Load the model and feature extractor using the local directory.
	# from_pretrained() expects a directory (or a Hub model id), not the path of a
	# weights file: given model.safetensors directly it tries to read that file as
	# the JSON config and fails. Pointing both loaders at model_dir picks up
	# config.json, model.safetensors and preprocessor_config.json together.
	# NOTE(review): model_id is presumably the base checkpoint this classifier was
	# fine-tuned from; it is no longer used for loading and is kept for reference.
	model_id = "google/vit-base-patch16-224"

	feature_extractor = ViTFeatureExtractor.from_pretrained(model_dir)
	model = ViTForImageClassification.from_pretrained(model_dir)

	# Ensure the model is in evaluation mode
	model.eval()
	logging.info("Model set to evaluation mode")

	# Define the prediction function
	def predict(image):
	    """Classify an image and return a probability for every label.

	    Args:
	        image: Image object accepted by the module-level ``feature_extractor``
	            (its ``size`` attribute is logged), or ``None`` when the caller
	            supplies no image.

	    Returns:
	        A dict mapping each entry of ``labels`` to its softmax probability as
	        a float, or ``None`` when ``image`` is ``None``.
	    """
	    # Submitting the form without an image yields None; bail out instead of
	    # crashing on `image.size` below.
	    if image is None:
	        logging.warning("No image provided; skipping prediction")
	        return None

	    logging.info("Starting prediction")
	    logging.info(f"Input image shape: {image.size}")

	    # Preprocess the image
	    logging.info("Preprocessing image")
	    inputs = feature_extractor(images=image, return_tensors="pt")
	    logging.info(f"Preprocessed input shape: {inputs['pixel_values'].shape}")

	    logging.info("Running inference")
	    # Inference only: skip gradient tracking.
	    with torch.no_grad():
	        outputs = model(**inputs)
	        logits = outputs.logits
	        # logits[0] is the row for the single input image; normalise over classes.
	        probabilities = torch.nn.functional.softmax(logits[0], dim=0)

	    logging.info(f"Raw logits: {logits}")
	    logging.info(f"Probabilities: {probabilities}")

	    # Prepare the output dictionary: labels[i] pairs with the i-th probability.
	    result = {label: float(probabilities[i]) for i, label in enumerate(labels)}
	    logging.info(f"Prediction result: {result}")

	    return result

	# Set up the Gradio Interface: a PIL image in, label probabilities out.
	logging.info("Setting up Gradio interface")
	gradio_app = gr.Interface(
	    fn=predict,
	    inputs=gr.Image(type="pil"),
	    # Show every class; derived from `labels` so it stays in sync with the list.
	    outputs=gr.Label(num_top_classes=len(labels)),
	    title="Pants Shape Classifier",
	)

	# Launch the app only when run as a script, not when imported as a module.
	if __name__ == "__main__":
	    logging.info("Launching the app")
	    gradio_app.launch()