Spaces:

mbar0075
/

Saliency-Ranking

Running

App Files Files Community

Saliency-Ranking / app.py

mbar0075

Initial Update

e25cfe0 9 months ago

raw

history blame contribute delete

5.86 kB

	from typing import Tuple
	import gradio as gr
	import numpy as np
	import cv2
	import SaRa.saraRC1 as sara
	import warnings
	warnings.filterwarnings("ignore")


	# Default blend weight of the colour-mapped saliency layer when it is
	# overlaid on the input image (the image itself gets 1 - ALPHA).
	ALPHA = 0.4
	# Saliency generator names. Only 'itti' is passed to detect_and_annotate
	# in the code visible in this file; the 'deepgaze' path is commented out.
	GENERATORS = ['itti', 'deepgaze']

	# Page header rendered through gr.Markdown(MARKDOWN): title, a short
	# description of SaRa, and three GitHub badge links.
	MARKDOWN = """
	<h1 style='text-align: center'>Saliency Ranking 📚</h1>

	Saliency Ranking is a fundamental 🌟 Computer Vision 🌟 process aimed at discerning the most visually significant features within an image 🖼️.

	🌟 This demo showcases the SaRa (Saliency-Driven Object Ranking) model for Saliency Ranking 🎯, which can efficiently rank the visual saliency of an image without requiring any training. 🖼️

	This technique is configured on the Saliency Map generator model by Itti, which works based on the primate visual cortex 🧠, and can work with or without depth information 🔄.

	<div style="display: flex; align-items: center;">
	<a href="https://github.com/dylanseychell/SaliencyRanking" style="margin-right: 10px;">
	<img src="https://badges.aleen42.com/src/github.svg">
	</a>
	<a href="https://github.com/mbar0075/SaRa" style="margin-right: 10px;">
	<img src="https://badges.aleen42.com/src/github.svg">
	</a>
	<a href="https://github.com/matthewkenely/ICT3909" style="margin-right: 10px;">
	<img src="https://badges.aleen42.com/src/github.svg">
	</a>
	</div>
	"""

	# Rows for gr.Examples, each [image URL, grid size] in the same order as
	# the inputs list given to gr.Examples (input image, grid-size slider).
	IMAGE_EXAMPLES = [
	['https://media.roboflow.com/supervision/image-examples/people-walking.png', 32],
	['https://media.roboflow.com/supervision/image-examples/vehicles.png', 32],
	['https://media.roboflow.com/supervision/image-examples/basketball-1.png', 32],
	]

	def detect_and_annotate(image,
	                        GRID_SIZE,
	                        generator,
	                        ALPHA=ALPHA,
	                        mode=1) -> Tuple[np.ndarray, np.ndarray]:
	    """Run SaRa on one image and build the two pictures shown in the UI.

	    Args:
	        image: Input picture; the Gradio image components in this file are
	            declared with ``type='pil'``, so a PIL image is expected
	            (anything ``np.array`` can turn into an RGB(A) array works).
	        GRID_SIZE: Grid size forwarded to ``sara.return_sara``.
	        generator: Saliency generator name forwarded to SaRa (e.g. 'itti').
	        ALPHA: Blend weight of the colour-mapped saliency layer; the input
	            image receives ``1 - ALPHA``.
	        mode: Forwarded unchanged to ``sara.return_sara``.

	    Returns:
	        ``(saliency_overlay, heatmap)``, both in RGB channel order:
	        the JET-coloured saliency map blended over the input image, and
	        the first element of SaRa's result converted from BGR to RGB.
	    """
	    # A PIL image converts to an array in RGB channel order.
	    rgb_input = np.array(image)
	    # SaRa is fed an OpenCV-style BGR image, exactly as before (the channel
	    # swap is the same operation the original code performed).
	    bgr_image = cv2.cvtColor(rgb_input, cv2.COLOR_RGB2BGR)
	    # RGB copy used only for display. Derived from the BGR image so it is
	    # always 3-channel, even when the input carried an alpha channel.
	    display_image = cv2.cvtColor(bgr_image, cv2.COLOR_BGR2RGB)

	    # Give SaRa its own copy of the image.
	    sara_image = bgr_image.copy()

	    # Clear SaRa's state before each run.
	    sara.reset()

	    # Rank the grid segments; only the first element of the result is used.
	    sara_info = sara.return_sara(sara_image, GRID_SIZE, generator, mode=mode)

	    # Raw saliency map, resized to the input resolution (width, height).
	    saliency_map = sara.return_saliency(bgr_image, generator=generator)
	    saliency_map = cv2.resize(
	        saliency_map, (bgr_image.shape[1], bgr_image.shape[0]))

	    # applyColorMap yields BGR; convert so the result is RGB for Gradio.
	    saliency_map = cv2.applyColorMap(saliency_map, cv2.COLORMAP_JET)
	    saliency_map = cv2.cvtColor(saliency_map, cv2.COLOR_BGR2RGB)

	    # Blend with the RGB image. The original blended the RGB colour map
	    # with the BGR image, which swapped red and blue in the photo beneath
	    # the overlay.
	    saliency_map = cv2.addWeighted(
	        saliency_map, ALPHA, display_image, 1 - ALPHA, 0)

	    # SaRa's heatmap is treated as BGR and converted to RGB for display.
	    heatmap = cv2.cvtColor(sara_info[0], cv2.COLOR_BGR2RGB)

	    return saliency_map, heatmap

	def process_image(
	    input_image: np.ndarray,
	    GRIDSIZE: int,
	) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
	    """Produce the three output images for one submitted input image.

	    Args:
	        input_image: Image to analyse, passed straight through to
	            ``detect_and_annotate``. NOTE(review): annotated as an array,
	            but the input component is declared with ``type='pil'``.
	        GRIDSIZE: Requested SaRa grid size; ``None`` or any value below 3
	            is replaced by 9.

	    Returns:
	        ``(itti_saliency_map, itti_heatmap, itti_heatmap2)``: the saliency
	        overlay and ranking heatmap from the default mode, followed by the
	        ranking heatmap from ``mode=2``.
	    """
	    # Validate GRIDSIZE: fall back to 9 when it is missing or too small.
	    if GRIDSIZE is None or GRIDSIZE < 3:
	        GRIDSIZE = 9

	    itti_saliency_map, itti_heatmap = detect_and_annotate(
	        input_image, GRIDSIZE, 'itti')
	    # Second pass only for the mode-2 heatmap; its overlay is discarded.
	    _, itti_heatmap2 = detect_and_annotate(
	        input_image, GRIDSIZE, 'itti', mode=2)

	    # DeepGaze outputs are currently disabled, so exactly three images are
	    # returned, matching the three output components wired up in the UI.
	    return (
	        itti_saliency_map,
	        itti_heatmap,
	        itti_heatmap2,
	    )

	# Grid-size slider. It is created outside the Blocks context and placed
	# into the layout later through grid_size_Component.render().
	# NOTE(review): the help text mentions a default of 9 while the slider
	# starts at 32 - confirm which default the text is meant to describe.
	grid_size_Component = gr.Slider(
	    label="Grid Size",
	    minimum=3,
	    maximum=100,
	    step=1,
	    value=32,
	    info=(
	        "The grid size for the Saliency Ranking (SaRa) model. "
	        "The grid size determines the number of regions the image is divided into. "
	        "A higher grid size results in more regions and a lower grid size results in fewer regions. "
	        "The default grid size is 9."
	    ),
	)


	# Assemble the demo page: header text, the grid-size setting, one input
	# image, three output images, a Submit button and clickable examples.
	# NOTE(review): indentation in this listing is flattened, so the nesting
	# of the layout containers below should be confirmed against the original.
	with gr.Blocks() as demo:
	gr.Markdown(MARKDOWN)
	# Collapsed-by-default section that hosts the pre-built grid-size slider.
	with gr.Accordion("Configuration", open=False):
	with gr.Row():
	grid_size_Component.render()
	with gr.Row():
	input_image_component = gr.Image(
	type='pil',
	label='Input'
	)
	itti_saliency_map = gr.Image(
	type='pil',
	label='Itti Saliency Map'
	)
	with gr.Row():
	itti_heatmap = gr.Image(
	type='pil',
	label='Saliency Ranking Heatmap 1'
	)
	itti_heatmap2 = gr.Image(
	type='pil',
	label='Saliency Ranking Heatmap 2'
	)
	# with gr.Row():
	# deepgaze_saliency_map = gr.Image(
	# type='pil',
	# label='DeepGaze Saliency Map'
	# )
	# deepgaze_heatmap = gr.Image(
	# type='pil',
	# label='DeepGaze Saliency Ranking Heatmap'
	# )
	submit_button_component = gr.Button(
	value='Submit',
	scale=1,
	variant='primary'
	)
	# Example inputs from IMAGE_EXAMPLES, wired to the same function, inputs
	# and outputs as the Submit button below.
	gr.Examples(
	fn=process_image,
	examples=IMAGE_EXAMPLES,
	inputs=[
	input_image_component,
	grid_size_Component,
	],
	outputs=[
	itti_saliency_map,
	itti_heatmap,
	itti_heatmap2,
	# deepgaze_saliency_map,
	# deepgaze_heatmap,
	]
	)

	# On click, call process_image with the input image and slider value and
	# route its three return values to the three output image components.
	submit_button_component.click(
	fn=process_image,
	inputs=[
	input_image_component,
	grid_size_Component,
	],
	outputs=[
	itti_saliency_map,
	itti_heatmap,
	itti_heatmap2,
	# deepgaze_saliency_map,
	# deepgaze_heatmap,
	]
	)

	# Start the app with error display enabled and a single worker thread.
	# NOTE(review): max_threads=1 presumably serialises requests because
	# detect_and_annotate calls sara.reset() on every run - confirm.
	demo.launch(debug=False, show_error=True, max_threads=1)