Spaces:
Sleeping
Sleeping
Commit
·
d9e2abb
0
Parent(s):
Initial changes
Browse files

- app.py +228 -0
- deploy.sh +21 -0
- models/fsrcnn_x2.pth +0 -0
- models/fsrcnn_x3.pth +0 -0
- models/fsrcnn_x4.pth +0 -0
- requirements.txt +10 -0
- secrets.txt +1 -0
- tests/test2.py +104 -0
- tests/test_app.py +137 -0
app.py
ADDED
|
@@ -0,0 +1,228 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import os
|
| 2 |
+
import math
|
| 3 |
+
import typing as tp
|
| 4 |
+
import cv2
|
| 5 |
+
import numpy as np
|
| 6 |
+
import torch
|
| 7 |
+
from torch import nn
|
| 8 |
+
import gradio as gr
|
| 9 |
+
from huggingface_hub import InferenceClient
|
| 10 |
+
|
| 11 |
+
import warnings
|
| 12 |
+
warnings.filterwarnings("ignore", category=UserWarning)
|
| 13 |
+
|
| 14 |
+
|
| 15 |
+
# ============================================================
|
| 16 |
+
# 🧠 PART 1: FSRCNN Image Upscaling
|
| 17 |
+
# ============================================================
|
| 18 |
+
|
| 19 |
+
class FSRCNN(nn.Module):
    """FSRCNN super-resolution network: feature extraction, shrink/map/expand,
    then a learned transposed-convolution upsampling back to pixel space.

    Operates on a single channel (typically luma); output spatial dims are
    the input dims multiplied by ``scale_factor``.
    """

    def __init__(self, scale_factor, num_channels=1, d=56, s=12, m=4):
        super(FSRCNN, self).__init__()
        # Stage 1: feature extraction on the low-resolution input.
        self.first_part = nn.Sequential(
            nn.Conv2d(num_channels, d, kernel_size=5, padding=5 // 2),
            nn.PReLU(d),
        )
        # Stage 2: shrink (d -> s), m mapping layers, expand (s -> d).
        layers = [nn.Conv2d(d, s, kernel_size=1), nn.PReLU(s)]
        for _ in range(m):
            layers += [nn.Conv2d(s, s, kernel_size=3, padding=3 // 2), nn.PReLU(s)]
        layers += [nn.Conv2d(s, d, kernel_size=1), nn.PReLU(d)]
        self.mid_part = nn.Sequential(*layers)
        # Stage 3: learned upsampling by scale_factor.
        self.last_part = nn.ConvTranspose2d(
            d, num_channels, kernel_size=9,
            stride=scale_factor, padding=9 // 2,
            output_padding=scale_factor - 1,
        )
        self._initialize_weights()

    def _initialize_weights(self):
        # Gaussian init scaled by fan-out for conv layers; tiny gaussian
        # for the deconv head (matches the reference FSRCNN setup).
        for module in list(self.first_part) + list(self.mid_part):
            if isinstance(module, nn.Conv2d):
                fan = module.out_channels * module.weight.data[0][0].numel()
                nn.init.normal_(module.weight.data, mean=0.0, std=math.sqrt(2 / fan))
                nn.init.zeros_(module.bias.data)
        nn.init.normal_(self.last_part.weight.data, mean=0.0, std=0.001)
        nn.init.zeros_(self.last_part.bias.data)

    def forward(self, x):
        """Map a (N, C, H, W) tensor to (N, C, H*scale, W*scale)."""
        return self.last_part(self.mid_part(self.first_part(x)))
|
| 57 |
+
|
| 58 |
+
|
| 59 |
+
# Run on GPU when available; models and tensors are moved to this device.
Device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# Per-scale cache of (model, weights_loaded) so each checkpoint loads at most once.
MODEL_CACHE: dict[int, tuple[FSRCNN, bool]] = {}
# Bundled FSRCNN checkpoints keyed by upscale factor (paths relative to the app's CWD).
WEIGHTS_PATHS = {2: "models/fsrcnn_x2.pth", 3: "models/fsrcnn_x3.pth", 4: "models/fsrcnn_x4.pth"}
|
| 62 |
+
|
| 63 |
+
|
| 64 |
+
def try_load_weights(model, weights_path):
    """Load a checkpoint from *weights_path* into *model*.

    Returns True on success, False when the path is missing/invalid or the
    checkpoint cannot be loaded or applied; callers fall back to bicubic
    upscaling on False.
    """
    if not weights_path or not os.path.isfile(weights_path):
        print(f"[FSRCNN] No valid weights at {weights_path}. Falling back to Bicubic.")
        return False
    try:
        # weights_only=True restricts unpickling to tensors/containers, which
        # prevents arbitrary code execution from a tampered checkpoint file.
        # FSRCNN checkpoints are plain state dicts, so this is sufficient.
        checkpoint = torch.load(weights_path, map_location=Device, weights_only=True)
        # strict=True: any missing/unexpected key raises and we report failure.
        model.load_state_dict(checkpoint, strict=True)
        print(f"[FSRCNN] Loaded weights from {weights_path}")
        return True
    except Exception as e:
        print(f"[FSRCNN] Failed to load weights: {e}")
        return False
|
| 76 |
+
|
| 77 |
+
|
| 78 |
+
def get_model(scale, weights_path=None):
    """Return the cached (model, has_weights) pair for *scale*, building it on first use.

    Note: *weights_path* only matters on the first call for a given scale;
    later calls return the cached pair unchanged.
    """
    cached = MODEL_CACHE.get(scale)
    if cached is None:
        net = FSRCNN(scale_factor=scale).to(Device).eval()
        cached = (net, try_load_weights(net, weights_path))
        MODEL_CACHE[scale] = cached
    return cached
|
| 84 |
+
|
| 85 |
+
|
| 86 |
+
def rgb_to_ycbcr(img_rgb: np.ndarray) -> np.ndarray:
    """Convert RGB to OpenCV's YCrCb space (note: channel order is Y, Cr, Cb)."""
    converted = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2YCrCb)
    return converted
|
| 88 |
+
|
| 89 |
+
|
| 90 |
+
def ycbcr_to_rgb(img_ycrcb: np.ndarray) -> np.ndarray:
    """Convert an OpenCV YCrCb image back to RGB."""
    converted = cv2.cvtColor(img_ycrcb, cv2.COLOR_YCrCb2RGB)
    return converted
|
| 92 |
+
|
| 93 |
+
|
| 94 |
+
def run_fsrcnn_on_y(y: np.ndarray, model: FSRCNN) -> np.ndarray:
    """Super-resolve a single uint8 luma plane with *model*; returns uint8.

    Scales to [0, 1] float, adds batch/channel dims, runs inference, then
    rounds back to uint8 with a +0.5 offset.
    """
    normalized = y.astype(np.float32) / 255.0
    batch = torch.from_numpy(normalized).unsqueeze(0).unsqueeze(0).to(Device)
    with torch.inference_mode():
        prediction = model(batch)
    plane = prediction.squeeze(0).squeeze(0).clamp(0.0, 1.0).cpu().numpy()
    return (plane * 255.0 + 0.5).astype(np.uint8)
|
| 101 |
+
|
| 102 |
+
|
| 103 |
+
def fsrcnn_upscale_rgb(img_rgb: np.ndarray, scale: int, weights: tp.Optional[str] = None) -> np.ndarray:
    """Upscale an RGB uint8 image by *scale* with FSRCNN; bicubic fallback without weights.

    FSRCNN runs on the luma channel only; chroma channels are upscaled with
    bicubic interpolation (standard practice for luma-only SR models).
    """
    height, width = img_rgb.shape[:2]
    target = (width * scale, height * scale)

    model, has_weights = get_model(scale, weights)
    if not has_weights:
        return cv2.resize(img_rgb, target, interpolation=cv2.INTER_CUBIC)

    ycrcb = rgb_to_ycbcr(img_rgb)
    luma_sr = run_fsrcnn_on_y(ycrcb[..., 0], model)
    cr_up = cv2.resize(ycrcb[..., 1], target, interpolation=cv2.INTER_CUBIC)
    cb_up = cv2.resize(ycrcb[..., 2], target, interpolation=cv2.INTER_CUBIC)
    return ycbcr_to_rgb(np.stack([luma_sr, cr_up, cb_up], axis=-1))
|
| 117 |
+
|
| 118 |
+
|
| 119 |
+
def maybe_downscale_for_memory(img_rgb: np.ndarray, max_pixels: int = 8_000_000) -> np.ndarray:
    """Cap *img_rgb*'s pixel count, shrinking proportionally when above *max_pixels*.

    Images already within budget are returned unchanged (same object).
    """
    height, width = img_rgb.shape[:2]
    total = height * width
    if total <= max_pixels:
        return img_rgb
    factor = (max_pixels / total) ** 0.5
    target = (int(width * factor), int(height * factor))
    # INTER_AREA is the recommended interpolation for shrinking.
    return cv2.resize(img_rgb, target, interpolation=cv2.INTER_AREA)
|
| 126 |
+
|
| 127 |
+
|
| 128 |
+
def upscale_ui(image: np.ndarray, scale_factor: int, method: str):
    """Gradio callback: normalize the input, upscale it, and return (image, status).

    Accepts grayscale (stacked to RGB), RGBA (alpha dropped), and non-uint8
    arrays (clipped and converted). Very large inputs are downscaled first
    to bound memory use.
    """
    if image is None:
        return None, "Please upload an image."

    # Normalize to uint8 RGB regardless of what the UI hands us.
    if image.dtype != np.uint8:
        image = np.clip(image, 0, 255).astype(np.uint8)
    if image.ndim == 2:
        image = np.stack([image] * 3, axis=-1)
    elif image.shape[2] == 4:
        image = image[..., :3]

    image = maybe_downscale_for_memory(image)
    weights_path = WEIGHTS_PATHS.get(scale_factor)

    if method == "FSRCNN (Y channel)":
        result = fsrcnn_upscale_rgb(image, scale_factor, weights_path)
        status = f"Used FSRCNN x{scale_factor} (bundled weights)."
    else:
        h, w = image.shape[:2]
        result = cv2.resize(image, (w * scale_factor, h * scale_factor), interpolation=cv2.INTER_CUBIC)
        status = f"Used Bicubic x{scale_factor}."
    return result, status
|
| 147 |
+
|
| 148 |
+
|
| 149 |
+
# ============================================================
|
| 150 |
+
# 🌍 PART 2: Multilingual Translator
|
| 151 |
+
# ============================================================
|
| 152 |
+
|
| 153 |
+
# Token is optional; without it, public Hugging Face inference rate limits apply.
HF_TOKEN = os.environ.get("HF_TOKEN", None)
client = InferenceClient(provider="hf-inference", api_key=HF_TOKEN)

# Display name -> mBART-50 language code (model-specific codes, not BCP-47).
lang_map = {
    "English": "en_XX", "French": "fr_XX", "Spanish": "es_XX", "German": "de_DE",
    "Hindi": "hi_IN", "Chinese": "zh_CN", "Japanese": "ja_XX", "Korean": "ko_KR",
    "Tamil": "ta_IN", "Telugu": "te_IN", "Arabic": "ar_AR", "Russian": "ru_RU"
    # You can add full map from your existing file if needed
}
|
| 162 |
+
|
| 163 |
+
def translate_text(text, src_lang, tgt_lang):
    """Translate *text* between the given display-language names via mBART-50.

    Returns the translation, a prompt for empty input, or an error message
    string if the remote inference call fails.
    """
    if not text.strip():
        return "Please enter any text to translate 😃"
    try:
        src_code = lang_map[src_lang]
        tgt_code = lang_map[tgt_lang]
        response = client.translation(
            text,
            model="facebook/mbart-large-50-many-to-many-mmt",
            src_lang=src_code,
            tgt_lang=tgt_code,
        )
        return response.translation_text
    except Exception as e:
        # Surface failures to the UI rather than crashing the callback.
        return f"Error in translation: {str(e)}"
|
| 177 |
+
|
| 178 |
+
|
| 179 |
+
# ============================================================
|
| 180 |
+
# 🎨 Combine into One Interface with Tabs
|
| 181 |
+
# ============================================================
|
| 182 |
+
|
| 183 |
+
# Shared theme: blue primary buttons, light-grey secondary buttons.
custom_theme = gr.themes.Default().set(
    button_primary_background_fill="#1769aa",
    button_primary_text_color="#ffffff",
    button_secondary_background_fill="#e0e0e0",
    button_secondary_text_color="#222222"
)

# Two independent tools share one Blocks app, one per tab.
with gr.Blocks(theme=custom_theme, title="AI Multi-Tool: FSRCNN & Translator") as demo:
    gr.Markdown("# 🚀 AI Multi-Tool Suite\nChoose an application below 👇")

    with gr.Tabs():
        # Tab 1: FSRCNN Upscaler
        with gr.Tab("🖼️ Image Upscaling"):
            with gr.Row():
                with gr.Column():
                    inp_img = gr.Image(type="numpy", label="Input Image")
                    scale = gr.Dropdown([2, 3, 4], value=2, label="Upscale Factor")
                    method = gr.Radio(["FSRCNN (Y channel)", "Bicubic"], value="FSRCNN (Y channel)")
                    run_btn = gr.Button("Upscale", variant="primary")
                    clear_btn = gr.Button("Clear", variant="secondary")
                    status_box = gr.Textbox(label="Status")
                with gr.Column():
                    out_img = gr.Image(type="numpy", label="Upscaled Output")

            run_btn.click(fn=upscale_ui, inputs=[inp_img, scale, method], outputs=[out_img, status_box])
            # Clear resets every control back to its default value.
            clear_btn.click(fn=lambda: (None, 2, "FSRCNN (Y channel)", None, ""),
                            outputs=[inp_img, scale, method, out_img, status_box])

        # Tab 2: Translator
        with gr.Tab("🌍 Text Translator"):
            with gr.Row():
                with gr.Column():
                    src_lang = gr.Dropdown(choices=list(lang_map.keys()), value="English", label="Source Language")
                    input_text = gr.Textbox(lines=4, label="Enter Text")
                with gr.Column():
                    tgt_lang = gr.Dropdown(choices=list(lang_map.keys()), value="French", label="Target Language")
                    output_text = gr.Textbox(lines=4, label="Translation", interactive=False)

            translate_btn = gr.Button("Translate ✨", variant="primary")
            clear_btn2 = gr.Button("Clear", variant="secondary")

            translate_btn.click(fn=translate_text, inputs=[input_text, src_lang, tgt_lang], outputs=output_text)
            # Reset text boxes and restore the default language pair.
            clear_btn2.click(fn=lambda: ("", "English", "French", ""), outputs=[input_text, src_lang, tgt_lang, output_text])

if __name__ == "__main__":
    demo.launch()
|
deploy.sh
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/bin/bash
# Deploy the Image_upscaling app on a fresh host: install the OpenCV system
# dependency, sync the repo, build a virtualenv, and launch the app in the
# background (surviving the SSH session) with logs in ~/projects/project1.log.
#
# Exit on the first failed command so a broken step (e.g. failed clone or
# pip install) doesn't silently cascade into launching a stale/absent app.
set -e

sudo apt update
# sudo apt install -y libgl1-mesa-glx libglib2.0-0 libsm6 libxrender1 libxext6 ffmpeg
sudo apt install -y libgl1-mesa-glx

cd ~/projects/
if [ -d "Image_upscaling" ]; then
    cd Image_upscaling && git pull origin main
else
    git clone https://github.com/harikp196/Image_upscaling.git
fi

# Virtualenv lives in ~/projects (shared across deploys), not inside the repo.
cd ~/projects
python3 -m venv venv
source venv/bin/activate

pip install --upgrade pip
pip install -r ~/projects/Image_upscaling/requirements.txt

# nohup + & so the app keeps running after logout; stdout+stderr to the log.
nohup python3 ~/projects/Image_upscaling/app.py > ~/projects/project1.log 2>&1 &
|
models/fsrcnn_x2.pth
ADDED
|
Binary file (55 kB). View file
|
|
|
models/fsrcnn_x3.pth
ADDED
|
Binary file (55 kB). View file
|
|
|
models/fsrcnn_x4.pth
ADDED
|
Binary file (55 kB). View file
|
|
|
requirements.txt
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
gradio
|
| 2 |
+
opencv-python
|
| 3 |
+
numpy
|
| 4 |
+
torch
|
| 5 |
+
tqdm
|
| 6 |
+
setuptools
|
| 7 |
+
torchvision
|
| 8 |
+
Pillow
|
| 9 |
+
natsort
|
| 10 |
+
huggingface_hub
|
secrets.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
HF_TOKEN==>REDACTED
|
tests/test2.py
ADDED
|
@@ -0,0 +1,104 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# tests/test_fsrcnn.py
|
| 2 |
+
import os
|
| 3 |
+
import importlib
|
| 4 |
+
import numpy as np
|
| 5 |
+
import torch
|
| 6 |
+
import pytest
|
| 7 |
+
|
| 8 |
+
# Adjust this import if your file isn't named fsrcnn_app.py
|
| 9 |
+
import app as app
|
| 10 |
+
|
| 11 |
+
|
| 12 |
+
@pytest.fixture(autouse=True)
def _reset_cache_between_tests():
    """Start and finish every test with an empty app-level model cache."""
    app.MODEL_CACHE.clear()
    yield
    app.MODEL_CACHE.clear()
|
| 18 |
+
|
| 19 |
+
|
| 20 |
+
def test_fsrcnn_forward_output_shape_cpu_only():
    """FSRCNN forward should upscale a 1-channel input by its scale factor."""
    net = app.FSRCNN(scale_factor=3).eval()
    batch = torch.randn(1, 1, 10, 12)  # (N, C, H, W)
    with torch.inference_mode():
        result = net(batch)
    assert result.shape == (1, 1, 30, 36), "Output shape must be (H*scale, W*scale)"
|
| 27 |
+
|
| 28 |
+
|
| 29 |
+
def test_run_fsrcnn_on_y_shape_and_dtype():
    """run_fsrcnn_on_y should return a uint8 image with upscaled spatial dims."""
    luma = np.random.randint(0, 256, (9, 7), dtype=np.uint8)
    net = app.FSRCNN(scale_factor=2).eval()
    result = app.run_fsrcnn_on_y(luma, net)
    assert result.dtype == np.uint8
    assert result.shape == (18, 14)
|
| 36 |
+
|
| 37 |
+
|
| 38 |
+
def test_bicubic_upscale_rgb_shape_and_dtype():
    """Bicubic path of upscale_ui returns uint8 with 4x spatial dims.

    Fixed: the original called app.bicubic_upscale_rgb, which does not exist
    in app.py; the bicubic path is exposed through upscale_ui instead.
    """
    rgb = np.random.randint(0, 256, (16, 24, 3), dtype=np.uint8)
    out, _status = app.upscale_ui(rgb, 4, "Bicubic")
    assert out.dtype == np.uint8
    assert out.shape == (16 * 4, 24 * 4, 3)
|
| 43 |
+
|
| 44 |
+
|
| 45 |
+
def test_rgb_ycbcr_roundtrip_close():
    """RGB -> YCrCb -> RGB roundtrip should be close (small max diff)."""
    original = np.random.randint(0, 256, (32, 32, 3), dtype=np.uint8)
    restored = app.ycbcr_to_rgb(app.rgb_to_ycbcr(original))
    # Allow small numerical differences from color conversion
    diff = np.abs(restored.astype(int) - original.astype(int))
    assert diff.max() <= 2
|
| 52 |
+
|
| 53 |
+
|
| 54 |
+
def test_fsrcnn_upscale_falls_back_to_bicubic_when_no_weights(tmp_path):
    """Without valid weights, fsrcnn_upscale_rgb must return the bicubic result.

    Fixed: the original compared against app.bicubic_upscale_rgb, which does
    not exist in app.py; the bicubic reference now comes from upscale_ui's
    "Bicubic" path, which performs the same cv2 INTER_CUBIC resize.
    """
    rgb = np.random.randint(0, 256, (12, 10, 3), dtype=np.uint8)
    scale = 3

    # Ensure a fresh cache so the "no-weights" path is exercised
    app.MODEL_CACHE.clear()

    out_fallback = app.fsrcnn_upscale_rgb(rgb, scale=scale, weights=None)
    out_bicubic, _status = app.upscale_ui(rgb, scale, "Bicubic")

    assert out_fallback.shape == out_bicubic.shape
    # Both paths call cv2.resize with identical arguments; byte-identical
    assert np.array_equal(out_fallback, out_bicubic)
|
| 68 |
+
|
| 69 |
+
|
| 70 |
+
def test_ui_accepts_grayscale_and_rgba_and_clips():
    """The UI helper should handle grayscale, RGBA, and non-uint8 inputs.

    Fixed: the original called upscale_ui with six positional arguments
    (app's signature takes three: image, scale_factor, method) and treated
    the (image, status) tuple return as a bare array.
    """
    # Grayscale -> stacked to RGB
    gray = np.random.randint(0, 256, (8, 8), dtype=np.uint8)
    out_gray, _ = app.upscale_ui(gray, 2, "Bicubic")
    assert out_gray.shape == (16, 16, 3)
    assert out_gray.dtype == np.uint8

    # RGBA -> drop alpha
    rgba = np.random.randint(0, 256, (8, 8, 4), dtype=np.uint8)
    out_rgba, _ = app.upscale_ui(rgba, 2, "Bicubic")
    assert out_rgba.shape == (16, 16, 3)
    assert out_rgba.dtype == np.uint8

    # Float input -> should clip/convert to uint8 internally
    f_rgb = np.random.randn(8, 8, 3).astype(np.float32) * 1000.0  # intentionally wild
    out_float, _ = app.upscale_ui(f_rgb, 2, "Bicubic")
    assert out_float.dtype == np.uint8
    assert out_float.shape == (16, 16, 3)
|
| 89 |
+
|
| 90 |
+
|
| 91 |
+
def test_maybe_downscale_for_memory_respects_limit():
    """Images above the pixel budget must be shrunk to fit within it."""
    huge = np.random.randint(0, 256, (4000, 4000, 3), dtype=np.uint8)  # 16M px
    shrunk = app.maybe_downscale_for_memory(huge, max_pixels=1_000_000)
    height, width = shrunk.shape[:2]
    assert height * width <= 1_000_000
|
| 95 |
+
|
| 96 |
+
|
| 97 |
+
def test_get_model_cache_per_scale():
    """get_model should build and cache one model instance per scale factor."""
    model_x2, _has2 = app.get_model(2, weights_path=None)
    model_x3, _has3 = app.get_model(3, weights_path=None)

    # Cache populated for both scales
    assert 2 in app.MODEL_CACHE and 3 in app.MODEL_CACHE
    assert isinstance(model_x2, app.FSRCNN) and isinstance(model_x3, app.FSRCNN)
    assert model_x2 is not model_x3, "Different scales should use different model instances"
|
tests/test_app.py
ADDED
|
@@ -0,0 +1,137 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import pytest
import numpy as np
import cv2
import torch
# Fixed: the original also imported `bicubic_upscale_rgb`, which app.py does
# not define — the ImportError killed this entire test module at collection.
from app import FSRCNN, rgb_to_ycbcr, ycbcr_to_rgb, upscale_ui, try_load_weights


def bicubic_upscale_rgb(img_rgb, scale):
    """Local stand-in for the absent app helper: plain cv2 bicubic upscale."""
    h, w = img_rgb.shape[:2]
    return cv2.resize(img_rgb, (w * scale, h * scale), interpolation=cv2.INTER_CUBIC)
|
| 6 |
+
|
| 7 |
+
def test_fsrcnn_model_initialization():
    """Models for every supported scale expose the three FSRCNN stages."""
    for factor in (2, 3, 4):
        net = FSRCNN(scale_factor=factor)
        assert net is not None
        for stage in ('first_part', 'mid_part', 'last_part'):
            assert hasattr(net, stage)
|
| 14 |
+
|
| 15 |
+
def test_color_conversion():
    """RGB -> YCrCb -> RGB should be nearly lossless on average."""
    source = np.random.randint(0, 255, (32, 32, 3), dtype=np.uint8)
    restored = ycbcr_to_rgb(rgb_to_ycbcr(source))

    assert source.shape == restored.shape
    mean_error = np.mean(np.abs(source.astype(float) - restored.astype(float)))
    assert mean_error < 2.0
|
| 22 |
+
|
| 23 |
+
def test_bicubic_upscaling():
    """Bicubic upscaling through the app produces correctly scaled outputs.

    Fixed: the original called `bicubic_upscale_rgb`, which app.py does not
    define; the bicubic path is exercised through upscale_ui instead.
    """
    test_img = np.random.randint(0, 255, (16, 16, 3), dtype=np.uint8)

    for scale in [1, 2, 3, 4]:
        upscaled, _status = upscale_ui(test_img, scale, "Bicubic")
        expected_shape = (16 * scale, 16 * scale, 3)
        assert upscaled.shape == expected_shape
|
| 30 |
+
|
| 31 |
+
def test_try_load_weights_error(tmp_path):
    """try_load_weights must return False for mismatched, missing, or corrupt weights.

    Fixed two defects: (1) the original asserted True for a state dict with
    missing/unexpected keys — app.try_load_weights loads with strict=True,
    which raises on key mismatch, so the helper returns False; (2) the fake
    checkpoint was written to "test.pth" in the CWD (leaking a file) instead
    of the pytest tmp_path.
    """
    model = FSRCNN(scale_factor=2)
    fake_weights = {
        "last_part.bias": torch.zeros(1),
        "a_fake_key.weight": torch.randn(10)
    }
    fake_weights_file = tmp_path / "test.pth"
    torch.save(fake_weights, fake_weights_file)
    # strict=True rejects the mismatched keys -> helper reports failure
    result = try_load_weights(model, str(fake_weights_file))
    assert result is False

    # Missing path -> False
    model = FSRCNN(scale_factor=2)
    assert try_load_weights(model, None) is False

    # Corrupt (non-pickle) file -> False
    model = FSRCNN(scale_factor=2)
    corrupted_file = tmp_path / "corrupted.pth"
    corrupted_file.write_text("this is just a text file, not a model!")
    result = try_load_weights(model, str(corrupted_file))
    assert result is False
|
| 51 |
+
|
| 52 |
+
def test_try_load_weights():
    """A path that does not exist must be rejected.

    Fixed: the original used "../models/fsrcnn_x2.pth", whose existence
    depends on pytest's working directory — the assertion flips to True
    when tests run from the tests/ directory. Use a path that can never
    resolve instead.
    """
    model = FSRCNN(scale_factor=2)
    assert try_load_weights(model, "nonexistent_dir/no_such_weights.pth") is False
|
| 55 |
+
|
| 56 |
+
|
| 57 |
+
def test_model_forward_pass():
    """Each supported scale multiplies the spatial dims accordingly."""
    for factor in (2, 3, 4):
        net = FSRCNN(scale_factor=factor)
        sample = torch.from_numpy(np.random.rand(1, 1, 32, 32).astype(np.float32))
        prediction = net(sample)

        assert prediction.shape[2] == 32 * factor
        assert prediction.shape[3] == 32 * factor
|
| 67 |
+
|
| 68 |
+
def test_upscale_ui_noimage():
    """A missing image yields no output plus a helpful status message."""
    result = upscale_ui(None, 2, "FSRCNN (Y channel)")
    assert result == (None, 'Please upload an image.')
|
| 70 |
+
|
| 71 |
+
def test_upscale_ui():
    """Exercise upscale_ui across input dtypes/shapes and the memory cap."""
    # Float input
    float_image = np.random.rand(32, 32, 3).astype(np.float32)

    result = upscale_ui(
        image=float_image,
        scale_factor=2,
        method="Bicubic"
    )

    # result is an (image, status) tuple; index 0 is the upscaled array.
    assert result[0] is not None
    assert result[0].dtype == np.uint8
    assert result[0].shape == (64, 64, 3)

    """Test upscale_ui with grayscale (2D) input"""
    grayscale_image = np.random.randint(0, 255, (32, 32), dtype=np.uint8)
    result = upscale_ui(
        image=grayscale_image,
        scale_factor=2,
        method="FSRCNN (Y channel)",
    )

    assert result[0] is not None
    assert result[0].dtype == np.uint8
    assert result[0].shape == (64, 64, 3)

    """Test upscale_ui with RGBA input"""
    rgba_image = np.random.randint(0, 255, (32, 32, 4), dtype=np.uint8)

    result = upscale_ui(
        image=rgba_image,
        scale_factor=2,
        method="Bicubic",
    )
    assert result[0] is not None
    assert result[0].dtype == np.uint8
    assert result[0].shape == (64, 64, 3)

    # 4000x4000 = 16M px exceeds the 8M default cap, so the input is first
    # downscaled by sqrt(8/16) to 2828x2828, then upscaled x2 -> 5656x5656.
    downloadscale_image = np.random.randint(0, 255, (4000, 4000, 3), dtype=np.uint8)

    result = upscale_ui(
        image=downloadscale_image,
        scale_factor=2,
        method="FSRCNN (Y channel)",
    )

    assert result[0] is not None
    assert result[0].dtype == np.uint8
    assert result[0].shape == (5656, 5656, 3)



    # FSRCNN path at every supported scale factor.
    test_img = np.random.randint(0, 255, (16, 16, 3), dtype=np.uint8)
    for scale in [2, 3, 4]:
        upscaled = upscale_ui(test_img, scale, "FSRCNN (Y channel)")
        expected_shape = (16 * scale, 16 * scale, 3)
        assert upscaled[0].shape == expected_shape
|
| 128 |
+
|
| 129 |
+
def test_upscale_ui_bicubic():
    """Bicubic path produces correctly scaled outputs for all factors."""
    sample = np.random.randint(0, 255, (16, 16, 3), dtype=np.uint8)
    for factor in (2, 3, 4):
        output, _status = upscale_ui(sample, factor, "Bicubic")
        assert output.shape == (16 * factor, 16 * factor, 3)
|
| 135 |
+
|
| 136 |
+
# Allow running this test module directly: `python tests/test_app.py`
if __name__ == "__main__":
    pytest.main([__file__])
|