Spaces:

ll-monkey
/

ARTWORKS-CLASSIFIER

Sleeping

ARTWORKS-CLASSIFIER / src /streamlit_app.py

Dollaya Piumsuwan

Update src/streamlit_app.py

014812f verified 27 days ago

6.41 kB

	#########################
	# ARTWORKS CLASSIFIER
	# ########################

	import streamlit as st
	import pandas as pd
	import torch
	import torchvision.transforms as transforms
	import torchvision.models as models
	import torch.nn as nn
	from PIL import Image
	import os
	import io
	from pathlib import Path

	#########################
	# SETTINGS
	# ########################
	# Compute target and label mapping shared by model loading and prediction.
	device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
	class_index = dict(Drawing=0, Photograph=1, Print=2)

	# Every resource path is anchored at the directory that contains this file.
	base_path = Path(__file__).resolve().parent
	model_file = str(base_path.joinpath("models", "momaclassifier_resnet50.pt"))
	image_csv = str(base_path.joinpath("data", "demo_artworks.csv"))
	image_folder = str(base_path.joinpath("demo_images"))


	#########################
	# LOAD DEMO IMAGE CSV
	# ########################
	@st.cache_data
	def load_metadata():
	    """Read the demo artwork metadata CSV into a DataFrame.

	    Returns:
	        The parsed contents of ``image_csv``. When that file does not exist,
	        a warning is shown in the app and an empty DataFrame is returned.
	    """
	    # Guard clause: without the CSV there is nothing to parse.
	    if not os.path.exists(image_csv):
	        st.warning("No metadata CSV file found.")
	        return pd.DataFrame()

	    return pd.read_csv(image_csv)


	# Metadata table consulted when showing artwork information for a collection image.
	metadata_df = load_metadata()


	#########################
	# MODEL LOADING
	# ########################
	@st.cache_resource
	def load_model():
	    """Build the ResNet50 classifier and restore its trained weights.

	    The final fully connected layer is replaced so that it emits one output
	    per entry in ``class_index``; the state dict stored at ``model_file`` is
	    then loaded and the network is moved to ``device`` in evaluation mode.

	    Returns:
	        The network, ready for inference.
	    """
	    net = models.resnet50(weights=None)
	    # Swap the stock head for one sized to this app's classes.
	    net.fc = nn.Linear(net.fc.in_features, len(class_index))

	    # NOTE(review): torch.load may unpickle arbitrary objects depending on the
	    # installed PyTorch version -- only point model_file at a trusted checkpoint.
	    state_dict = torch.load(model_file, map_location=device)
	    net.load_state_dict(state_dict)

	    net.to(device)
	    net.eval()
	    return net


	# Module-level model instance handed to predict_image_class by the UI code.
	model = load_model()

	#########################
	# TRANSFORM PIPELINE
	# ########################
	# Preprocessing applied to every input image before it reaches the model:
	# resize to 224x224, convert to a tensor, then normalize each channel.
	transform = transforms.Compose(
	    [
	        transforms.Resize(size=(224, 224)),
	        transforms.ToTensor(),
	        transforms.Normalize(
	            mean=[0.485, 0.456, 0.406],
	            std=[0.229, 0.224, 0.225],
	        ),
	    ]
	)


	#########################
	# PREDICTION FUNCTION
	# ########################
	def predict_image_class(image_path, model, transform, class_index, device):
	    """Classify one image and report the per-class probabilities.

	    Args:
	        image_path: Whatever ``Image.open`` is given; the app passes either a
	            path string or the uploaded file object.
	        model: Network called on the preprocessed single-image batch.
	        transform: Callable that turns the RGB image into a tensor.
	        class_index: Mapping of class name to output index.
	        device: Device the input batch is moved to before the forward pass.

	    Returns:
	        ``(image, predicted_class_name, class_probabilities)`` where ``image``
	        is the RGB-converted image and ``class_probabilities`` maps each class
	        name to its softmax probability. If anything raises, the error is
	        shown with ``st.error`` and ``(None, None, None)`` is returned.
	    """
	    try:
	        rgb_image = Image.open(image_path).convert("RGB")
	        # Add a leading batch dimension of size one before moving to the device.
	        batch = transform(rgb_image).unsqueeze(0).to(device)

	        with torch.no_grad():
	            logits = model(batch)

	        scores = torch.nn.functional.softmax(logits[0], dim=0)
	        top_index = torch.max(logits, 1).indices

	        # Invert the name -> index mapping so outputs can be labelled.
	        names_by_index = {idx: name for name, idx in class_index.items()}
	        predicted_class_name = names_by_index[top_index.item()]

	        class_probabilities = {}
	        for position, score in enumerate(scores):
	            class_probabilities[names_by_index[position]] = score.item()

	        return rgb_image, predicted_class_name, class_probabilities
	    except Exception as e:
	        st.error(f"Error during prediction: {e}")
	        return None, None, None


	#########################
	# UI
	# ########################
	# Page title and an introduction written as inline-styled HTML
	# (hence unsafe_allow_html=True on the markdown call).
	st.title("MoMA ARTWORKS CLASSIFIER")
	st.markdown(
	"""
	<div style="background-color:lightgray; padding:15px; border-radius:5px; color:black">
	<b>Classify artworks into Drawing, Photograph, and Print.</b><br><br>
	This app uses a <b>pretrained ResNet50</b>, a type of convolutional neural network that has already learned to recognize general patterns in images, like shapes, textures, and edges.<br><br>
	To adapt it to artworks, I <b>freeze the first three layers</b>, which retain the general visual features, and train the fourth and fully connected layers on the MoMA artwork dataset. This helps the model focus on recognizing differences between drawings, photographs, and prints while still using the knowledge it already has from analyzing millions of images.
	</div>
	""",
	unsafe_allow_html=True,
	)
	# st.write(
	# """
	# Classify artworks into Drawing, Photograph, and Print.

	# This app uses a pretrained ResNet50, a type of convolutional neural network that has already learned to recognize general patterns in images, like shapes, textures, and edges.

	# To adapt it to artworks, I freeze the first three layers, which retain the general visual features, and train the fourth and fully connected layers on the MoMA artwork dataset. This helps the model focus on recognizing differences between drawings, photographs, and prints while still using the knowledge it already has from analyzing millions of images.
	# """
	# )


	# Choose from collection
	# A missing or unreadable demo folder is treated as an empty collection instead
	# of an unhandled OSError, so the "no images" warning further down can be shown.
	try:
	    folder_entries = os.listdir(image_folder)
	except OSError:
	    folder_entries = []

	# os.listdir returns names in arbitrary order; sort them so the dropdown is stable.
	available_images = sorted(
	    name for name in folder_entries if name.lower().endswith((".jpg", ".jpeg", ".png"))
	)

	# Two side-by-side inputs: pick a bundled demo image or upload a file.
	col1, col2 = st.columns([0.75, 1.25])

	with col1:
	    if not available_images:
	        selected_image = None
	        st.sidebar.warning("No images found in the demo_images folder.")
	    else:
	        # "None" is the placeholder entry meaning nothing has been chosen.
	        selected_image = st.selectbox(
	            "Choose from Collection", ["None", *available_images]
	        )

	with col2:
	    uploaded_file = st.file_uploader(
	        label="Or Upload Your Own Image", type=["jpg", "jpeg", "png"]
	    )

	# prediction
	# Start from "nothing to classify"; the branches below overwrite these.
	image = predicted_class = probabilities = object_id = None

	if uploaded_file is not None:
	    # An upload is checked first, so it wins over any collection selection.
	    st.info("Using uploaded image for classification.")
	    image, predicted_class, probabilities = predict_image_class(
	        uploaded_file, model, transform, class_index, device
	    )
	elif selected_image and selected_image != "None":
	    st.info(f"Using image in collections: {selected_image}")
	    image_path = os.path.join(image_folder, selected_image)
	    image, predicted_class, probabilities = predict_image_class(
	        image_path, model, transform, class_index, device
	    )
	    # ObjectID from filename: the text before the first dot.
	    object_id = selected_image.partition(".")[0]

	# show results
	# Left column: the input image plus any catalogue metadata; right column: the
	# per-class probabilities and the final prediction.
	if image is not None:

	    col1, col2 = st.columns([1, 1])

	    with col1:
	        st.image(image, caption="Input Image", use_container_width=True)

	        # Show artwork info if available
	        if object_id and not metadata_df.empty:
	            try:
	                art_info = metadata_df[metadata_df["ObjectID"] == int(object_id)]
	            except (KeyError, ValueError):
	                # KeyError: the CSV has no "ObjectID" column.
	                # ValueError: the filename stem is not an integer.
	                # Either way there is nothing to match, so use an empty
	                # selection instead of crashing the page.
	                art_info = metadata_df.iloc[0:0]

	            if art_info.empty:
	                st.info("No metadata found for this artwork.")
	            else:
	                st.subheader("Artwork Information")
	                first_match = art_info.iloc[0]
	                for col in ["Title", "Artist", "Classification", "CreditLine", "URL"]:
	                    # Only print the fields that the CSV actually provides.
	                    if col in art_info.columns:
	                        st.write(f"{col}: {first_match[col]}")

	    with col2:
	        st.subheader("Prediction Results")
	        for cls, prob in probabilities.items():
	            st.write(f"{cls}: {prob:.3f}")

	        st.success(f"Final Predicted Class: {predicted_class}")
	else:
	    st.warning("Please choose an image or upload your own.")