File size: 11,552 Bytes
7c0f80b
fe8cd4e
 
0414ba1
fe8cd4e
 
 
 
9f6bfc6
fe8cd4e
0414ba1
 
 
 
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fe8cd4e
 
 
 
 
0414ba1
 
 
9f6bfc6
fe8cd4e
 
 
 
0414ba1
 
9f6bfc6
fe8cd4e
 
0414ba1
 
 
 
9f6bfc6
fe8cd4e
9f6bfc6
fe8cd4e
9f6bfc6
 
 
 
0414ba1
 
 
9f6bfc6
 
 
0414ba1
 
 
 
9f6bfc6
0414ba1
9f6bfc6
 
 
 
 
 
 
 
 
 
0414ba1
9f6bfc6
 
0414ba1
9f6bfc6
 
 
 
 
 
0414ba1
 
9f6bfc6
 
 
 
 
0414ba1
 
9f6bfc6
0414ba1
 
 
9f6bfc6
 
 
0414ba1
9f6bfc6
0414ba1
fe8cd4e
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0414ba1
fe8cd4e
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
0414ba1
9f6bfc6
fe8cd4e
 
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
0414ba1
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
0414ba1
9f6bfc6
 
 
 
 
fe8cd4e
 
 
 
 
9f6bfc6
 
 
 
 
 
 
 
 
 
 
 
 
 
fe8cd4e
 
 
9f6bfc6
 
 
fe8cd4e
9f6bfc6
ab45e08
6c40bac
 
ab45e08
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
import os
import numpy as np
import cv2
import gradio as gr
from tensorflow.keras.applications import ResNet50
from tensorflow.keras.applications.resnet50 import preprocess_input
from skimage.metrics import structural_similarity as ssim
from PIL import Image
from io import BytesIO

# Disable GPU for TensorFlow
os.environ["TF_ENABLE_ONEDNN_OPTS"] = "0"
os.environ["CUDA_VISIBLE_DEVICES"] = "-1"

# --- DOCUMENTATION STRINGS (English Only) ---

GUIDELINE_SETUP = """
## 1. Quick Start Guide: Setup and Run Instructions

This application uses a combination of advanced feature extraction (ResNet50) and structural analysis (SSIM) to determine if comparison images are structurally and semantically similar to a reference image.

1.  **Upload Reference:** Upload the main image you want to compare against in the 'Reference Image' box.
2.  **Upload Comparisons:** Upload one or more images you want to test for similarity in the 'Comparison Images' file upload area.
3.  **Set Threshold:** Adjust the 'Similarity Threshold' slider. This controls the sensitivity for structural similarity (SSIM).
4.  **Run:** Click the **"Compare Images"** button.
5.  **Review:** Results will appear in the 'Results' panel, indicating if each comparison image is "SIMILAR" or "NOT SIMILAR".
"""

GUIDELINE_INPUT = """
## 2. Expected Inputs and Preprocessing

| Input Field | Purpose | Requirement |
| :--- | :--- | :--- |
| **Reference Image** | The baseline image against which all others will be compared. | Must be a single image file (JPG, PNG). |
| **Comparison Images** | One or more images to be tested for similarity. | Must be multiple image files. Upload them using the file selector. |
| **Similarity Threshold** | A slider controlling the sensitivity (0.0 to 1.0) for structural similarity (SSIM). | Higher values (closer to 1.0) mean stricter similarity requirements. Default is 0.5. |

**Image Preprocessing:** All uploaded images are automatically resized to 224x224 pixels and standardized according to the requirements of the ResNet model before feature extraction.
"""

GUIDELINE_OUTPUT = """
## 3. Expected Outputs (Similarity Results)

The application provides two main outputs:

1.  **Results (HTML Panel):**
    *   A list detailing the outcome for each comparison image.
    *   Status: **SIMILAR** (Green) or **NOT SIMILAR** (Red).

2.  **Processed Images (Gallery):**
    *   A gallery displaying the input comparison images after they have been processed.

### How Similarity is Determined:
The classification relies on two checks: Structural Similarity (SSIM) and Deep Feature Distance (ResNet). An image is marked "SIMILAR" if both structural and semantic properties suggest a close match.
"""

# --- CLASSIFIER CLASS ---
class ImageCharacterClassifier:
    def __init__(self, similarity_threshold=0.5):
        self.model = ResNet50(weights='imagenet', include_top=False, pooling='avg')
        self.similarity_threshold = similarity_threshold

    def load_and_preprocess_image(self, img):
        img = img.convert('RGB')
        img_array = np.array(img)
        img_array = cv2.resize(img_array, (224, 224))
        img_array = np.expand_dims(img_array, axis=0)
        img_array = preprocess_input(img_array)
        return img_array

    def extract_features(self, img):
        preprocessed_img = self.load_and_preprocess_image(img)
        features = self.model.predict(preprocessed_img, verbose=0)
        return features

    def calculate_ssim(self, img1, img2):
        img1_gray = cv2.cvtColor(img1, cv2.COLOR_RGB2GRAY)
        img2_gray = cv2.cvtColor(img2, cv2.COLOR_RGB2GRAY)
        img2_gray = cv2.resize(img2_gray, (img1_gray.shape[1], img1_gray.shape[0]))
        return ssim(img1_gray, img2_gray, data_range=img1_gray.max() - img1_gray.min())

def process_images(reference_image_array, comparison_files, similarity_threshold):
    try:
        if reference_image_array is None:
            return "<p style='color:red;'>Please upload a reference image.</p>", []
        if not comparison_files:
            return "<p style='color:red;'>Please upload comparison images.</p>", []

        classifier = ImageCharacterClassifier(similarity_threshold)

        ref_image_pil = Image.fromarray(reference_image_array).convert("RGB")
        ref_features = classifier.extract_features(ref_image_pil)
        ref_image_for_ssim = cv2.cvtColor(reference_image_array, cv2.COLOR_BGR2RGB)

        results = []
        html_output = "<h3>Comparison Results:</h3>"

        for comp_file_item in comparison_files:
            try:
                # FIX: Extract file path correctly regardless of whether it's a dict (internal Gradio) 
                # or a gr.File object (returned by our custom loader function).
                if isinstance(comp_file_item, str):
                    file_path = comp_file_item
                elif hasattr(comp_file_item, 'name'):
                    file_path = comp_file_item.name
                elif isinstance(comp_file_item, dict) and 'name' in comp_file_item:
                    file_path = comp_file_item['name']
                else:
                    raise ValueError("Invalid file object structure.")

                with open(file_path, "rb") as f:
                    comp_pil = Image.open(BytesIO(f.read())).convert("RGB")

                comp_array = np.array(comp_pil)
                
                # SSIM Check
                ssim_score = classifier.calculate_ssim(ref_image_for_ssim, comp_array)
                
                # Feature Check
                comp_features = classifier.extract_features(comp_pil)
                max_feature_diff = np.max(np.abs(ref_features - comp_features))
                feature_match = max_feature_diff < 6.0
                
                is_similar = feature_match # Primary criterion
                
                status_text = f"SIMILAR (SSIM: {ssim_score:.3f})" if is_similar else f"NOT SIMILAR (SSIM: {ssim_score:.3f})"
                status_color = "green" if is_similar else "red"

                html_output += f"<p style='color:{status_color};'>{os.path.basename(file_path)}: {status_text}</p>"
                results.append(comp_array)

            except Exception as e:
                # Use the path for logging the error
                error_name = os.path.basename(file_path) if 'file_path' in locals() else 'Unknown File'
                html_output += f"<p style='color:red;'>Error processing {error_name}: {str(e)}</p>"

        return html_output, [r for r in results if r is not None]

    except Exception as e:
        return f"<p style='color:red;'>Critical Error: {str(e)}</p>", []

# --- SAMPLE DATA DEFINITION ---

# Placeholder file paths (MUST EXIST for examples to work)
# NOTE: Adjusted paths to match your provided snippet structure 'sample_data/filename'
SAMPLE_FILES_SET1 = {
    "reference": "sample_data/license3.jpg",
    "comparisons": ["sample_data/license3.jpg", "sample_data/license3.jpg", "sample_data/licence.jpeg"]
}

SAMPLE_FILES_SET2 = {
    "reference": "sample_data/licence.jpeg",
    "comparisons": ["sample_data/licence.jpeg", "sample_data/license3.jpg", "sample_data/licence.jpeg", "sample_data/licence.jpeg"]
}


# --- GRADIO UI SETUP ---

def create_interface():
    with gr.Blocks(title="Image Similarity Classifier") as interface:
        
        gr.Markdown("# Image Similarity Classifier (ResNet + SSIM)")
        gr.Markdown("Tool to compare a reference image against multiple comparison images based on structural and deep feature similarity.")

        # 1. Guidelines Section
        with gr.Accordion("User Guidelines and Documentation", open=False):
            gr.Markdown(GUIDELINE_SETUP)
            gr.Markdown("---")
            gr.Markdown(GUIDELINE_INPUT)
            gr.Markdown("---")
            gr.Markdown(GUIDELINE_OUTPUT)
            
        gr.Markdown("---")

        # 2. Application Interface
        with gr.Row():
            with gr.Column():
                gr.Markdown("## Step 1: Upload a Reference Image ")
                reference_input = gr.Image(label="Reference Image", type="numpy", height=300)
                gr.Markdown("## Step 2: Upload Multiple Images to Compair with Reference Image ")
                comparison_input = gr.Files(label="Comparison Images", type="file")
                gr.Markdown("## Step 3: Set the Confidence Score (Optional) ")
                threshold_slider = gr.Slider(minimum=0.0, maximum=1.0, value=0.5, step=0.05, label="Similarity Threshold (SSIM)")
                gr.Markdown("## Step 4: Click Compare Images ")
                submit_button = gr.Button("Compare Images", variant="primary")
                gr.Markdown("---")
                gr.Markdown("# Results ")
                gr.Markdown("## Comparison Result ")
                output_html = gr.HTML(label="Comparison Results")
                gr.Markdown("## Processed Comparison Images")
                output_gallery = gr.Gallery(label="Processed Comparison Images", columns=3)

        # 3. Example Loading Setup
        gr.Markdown("---")
        gr.Markdown("## Sample Data for Testing")
        gr.Markdown("### Click on any of these two set to run the test set ")
        
        def load_and_run_set(reference_path, comparison_paths, threshold_value=0.5):
            """Loads data into inputs, triggers processing, and returns all results."""
            
            # 1. Load Reference Image as NumPy array
            ref_img_pil = Image.open(reference_path).convert("RGB")
            ref_img_array = np.array(ref_img_pil)
            
            # 2. Comparison Files: Prepare the list of paths (strings) for the processor
            # We return a list of strings/paths here, which Gradio's gr.Files component accepts
            comparison_file_paths = comparison_paths
            
            # 3. Process the images immediately using the paths
            html, gallery = process_images(ref_img_array, comparison_file_paths, threshold_value)
            
            # 4. Return inputs and outputs for component update
            return ref_img_array, comparison_file_paths, threshold_value, html, gallery

        with gr.Row():
            btn_set1 = gr.Button("Load & Run Sample Set 1 (Similar Docs)", size="sm")
            btn_set2 = gr.Button("Load & Run Sample Set 2 (Dissimilar Docs)", size="sm")
        
        # 4. Event Handling
        submit_button.click(
            fn=process_images,
            inputs=[reference_input, comparison_input, threshold_slider],
            outputs=[output_html, output_gallery]
        )
        
        # Event handlers for example buttons: load data into inputs/outputs
        btn_set1.click(
            fn=lambda: load_and_run_set(SAMPLE_FILES_SET1['reference'], SAMPLE_FILES_SET1['comparisons'], 0.6),
            inputs=[],
            outputs=[reference_input, comparison_input, threshold_slider, output_html, output_gallery]
        )
        
        btn_set2.click(
            fn=lambda: load_and_run_set(SAMPLE_FILES_SET2['reference'], SAMPLE_FILES_SET2['comparisons'], 0.4),
            inputs=[],
            outputs=[reference_input, comparison_input, threshold_slider, output_html, output_gallery]
        )
        
    return interface

if __name__ == "__main__":
    # Ensure the 'sample_data/' directory exists with 'license3.jpg' and 'licence.jpeg'
    # and any other necessary files.
    
    interface = create_interface()
    interface.queue()
    interface.launch(
        server_name="0.0.0.0",
        server_port=7860
    )