mbar0075's picture
Arranged Markdown
1a1fa99
raw
history blame
5.85 kB
from typing import Tuple
import gradio as gr
import numpy as np
import cv2
import SaRa.saraRC1 as sara
import warnings
warnings.filterwarnings("ignore")
ALPHA = 0.3
GENERATORS = ['itti', 'deepgaze']
MARKDOWN = """
<h1 style='text-align: center'>Saliency Ranking πŸ₯‡</h1>
Saliency Ranking is a fundamental 🌟 **Computer Vision** 🌟 process aimed at discerning the most visually significant features within an image πŸ–ΌοΈ.
🌟 This demo showcases the **SaRa (Saliency-Driven Object Ranking)** model for Saliency Ranking 🎯, which can efficiently rank the visual saliency of an image without requiring any training. πŸ–ΌοΈ
This technique is based on the Saliency Map generator model from Itti, which works on the primate visual cortex 🧠, and can work with or without depth information πŸ”„.
<div style="display: flex; align-items: center;">
<a href="https://github.com/dylanseychell/SaliencyRanking" style="margin-right: 10px;">
<img src="https://badges.aleen42.com/src/github.svg">
</a>
<a href="https://github.com/mbar0075/SaRa" style="margin-right: 10px;">
<img src="https://badges.aleen42.com/src/github.svg">
</a>
<a href="https://github.com/matthewkenely/ICT3909" style="margin-right: 10px;">
<img src="https://badges.aleen42.com/src/github.svg">
</a>
</div>
"""
IMAGE_EXAMPLES = [
['https://media.roboflow.com/supervision/image-examples/people-walking.png', 9],
['https://media.roboflow.com/supervision/image-examples/vehicles.png', 9],
['https://media.roboflow.com/supervision/image-examples/basketball-1.png', 9],
]
def detect_and_annotate(image,
GRID_SIZE,
generator,
ALPHA=ALPHA,
mode=1)-> np.ndarray:
# Converting from PIL to OpenCV
image = np.array(image)
# Convert image from BGR to RGB
image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
# Copy and convert the image for sara processing
sara_image = image.copy()
sara_image = cv2.cvtColor(sara_image, cv2.COLOR_RGB2BGR)
# Resetting sara
sara.reset()
# Running sara (Original implementation on itti)
sara_info = sara.return_sara(sara_image, GRID_SIZE, generator, mode=mode)
# Generate saliency map
saliency_map = sara.return_saliency(image, generator=generator)
# Resize saliency map to match the image size
saliency_map = cv2.resize(saliency_map, (image.shape[1], image.shape[0]))
# Apply color map and convert to RGB
saliency_map = cv2.applyColorMap(saliency_map, cv2.COLORMAP_JET)
saliency_map = cv2.cvtColor(saliency_map, cv2.COLOR_BGR2RGB)
# Overlay the saliency map on the original image
saliency_map = cv2.addWeighted(saliency_map, ALPHA, image, 1-ALPHA, 0)
# Extract and convert heatmap to RGB
heatmap = sara_info[0]
heatmap = cv2.cvtColor(heatmap, cv2.COLOR_BGR2RGB)
return saliency_map, heatmap
def process_image(
input_image: np.ndarray,
GRIDSIZE: int,
) -> Tuple[np.ndarray, np.ndarray, np.ndarray, np.ndarray]:
# Validate GRID_SIZE
if GRIDSIZE is None and GRIDSIZE < 4:
GRIDSIZE = 9
itti_saliency_map, itti_heatmap = detect_and_annotate(
input_image, GRIDSIZE, 'itti')
_, itti_heatmap2 = detect_and_annotate(
input_image, GRIDSIZE, 'itti', mode=2)
# deepgaze_saliency_map, deepgaze_heatmap = detect_and_annotate(
# input_image, GRIDSIZE, 'deepgaze')
return (
itti_saliency_map,
itti_heatmap,
itti_heatmap2,
# deepgaze_saliency_map,
# deepgaze_heatmap,
)
grid_size_Component = gr.Slider(
minimum=4,
maximum=70,
value=9,
step=1,
label="Grid Size",
info=(
"The grid size for the Saliency Ranking (SaRa) model. The grid size determines "
"the number of regions the image is divided into. A higher grid size results in "
"more regions and a lower grid size results in fewer regions. The default grid "
"size is 9."
))
with gr.Blocks() as demo:
gr.Markdown(MARKDOWN)
with gr.Accordion("Configuration", open=False):
with gr.Row():
grid_size_Component.render()
with gr.Row():
input_image_component = gr.Image(
type='pil',
label='Input'
)
itti_saliency_map = gr.Image(
type='pil',
label='Itti Saliency Map'
)
with gr.Row():
itti_heatmap = gr.Image(
type='pil',
label='Itti Saliency Ranking Heatmap'
)
itti_heatmap2 = gr.Image(
type='pil',
label='Itti Saliency Ranking Heatmap'
)
# with gr.Row():
# deepgaze_saliency_map = gr.Image(
# type='pil',
# label='DeepGaze Saliency Map'
# )
# deepgaze_heatmap = gr.Image(
# type='pil',
# label='DeepGaze Saliency Ranking Heatmap'
# )
submit_button_component = gr.Button(
value='Submit',
scale=1,
variant='primary'
)
gr.Examples(
fn=process_image,
examples=IMAGE_EXAMPLES,
inputs=[
input_image_component,
grid_size_Component,
],
outputs=[
itti_saliency_map,
itti_heatmap,
itti_heatmap2,
# deepgaze_saliency_map,
# deepgaze_heatmap,
]
)
submit_button_component.click(
fn=process_image,
inputs=[
input_image_component,
grid_size_Component,
],
outputs=[
itti_saliency_map,
itti_heatmap,
itti_heatmap2,
# deepgaze_saliency_map,
# deepgaze_heatmap,
]
)
demo.launch(debug=False, show_error=True, max_threads=1)