Spaces:

MAS-AI-0000
/

Authentica

Running

App Files Community

MAS-AI-0000 committed 2 days ago

Commit

0a278f1

verified ·

1 Parent(s): 5efd7a3

Update imagePreprocess.py

Browse files

Files changed (1) hide show

imagePreprocess.py +34 -94

imagePreprocess.py CHANGED Viewed

@@ -17,21 +17,19 @@ MODELS_DIR = os.path.join(BASE_DIR, "Lib/Models/Image")
 REPO_ID = "MAS-AI-0000/Authentica"
 CLIP_MODEL_FILENAME = "Lib/Models/Image/clip_model.keras"
 CNN_MODEL_FILENAME = "Lib/Models/Image/cnn_model.keras"
-RESNET_MODEL_FILENAME = "Lib/Models/Image/resnet_model.keras"
 # ==== Load assets ====
 clip_model_path = hf_hub_download(repo_id=REPO_ID, filename=CLIP_MODEL_FILENAME)
 cnn_model_path = hf_hub_download(repo_id=REPO_ID, filename=CNN_MODEL_FILENAME)
-resnet_model_path = hf_hub_download(repo_id=REPO_ID, filename=RESNET_MODEL_FILENAME)
 # Load models and preprocessing once at module level
 clip_mod, clip_pre = clip.load("ViT-B/32", jit=False)
 clip_mod.eval()
 for p in clip_mod.parameters():
     p.requires_grad = False
-mlp_model= tf.keras.models.load_model(clip_model_path)
-cnn_model = tf.keras.models.load_model(cnn_model_path)
-resnet_model = tf.keras.models.load_model(resnet_model_path)
 def center_crop(image: Image.Image, crop_size=512) -> Image.Image | str:
@@ -40,7 +38,7 @@ def center_crop(image: Image.Image, crop_size=512) -> Image.Image | str:
             w, h = image.size
             if w < crop_size or h < crop_size:
                 # skip small images
-                return f"skipped image (too small) ({w}x{h})"
             left = (w - crop_size) // 2
             top = (h - crop_size) // 2
             right = left + crop_size
@@ -48,10 +46,10 @@ def center_crop(image: Image.Image, crop_size=512) -> Image.Image | str:
             cropped = image.crop((left, top, right, bottom))
             return cropped
     except Exception as e:
-        return f"Error when cropping center: {e}"
-def denoise(src_image: Image) -> np.ndarray | str:
     """Read image, denoise (GPU if available) and return denoised image."""
     img = np.array(src_image)   # BGR uint8 numpy array
     img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
@@ -59,8 +57,8 @@ def denoise(src_image: Image) -> np.ndarray | str:
         print(f"WARNING: No source image, skipping.")
         return False
     # Denoising parameters
-    H = 10           # filter strength for luminance component (recommended 3-15)
-    H_COLOR = 10     # same for color components
     TEMPLATE_WINDOW_SIZE = 7
     SEARCH_WINDOW_SIZE = 21
     # Use CUDA if available, otherwise CPU fallback
@@ -88,79 +86,37 @@ def denoise(src_image: Image) -> np.ndarray | str:
             TEMPLATE_WINDOW_SIZE,
             SEARCH_WINDOW_SIZE
         )
-    #cv2.imwrite("denoised.png", den)  # for debugging
-    den = cv2.cvtColor(den, cv2.COLOR_BGR2RGB)
-    den = Image.fromarray(den)
-    return den
-def compute_profile(raw_image: Image, den_image: Image, normalize=False ,verbose= True) -> np.ndarray | str:
-    # read images
-    if raw_image is None:
-        return print(f"WARNING: couldn't read raw image")
-    if den_image is None:
-        return print(f"WARNING: couldn't read denoised image")
-    raw = np.array(raw_image)  # RGB uint8 numpy array
-    raw = cv2.cvtColor(raw, cv2.COLOR_RGB2BGR)
-    den = np.array(den_image)  # RGB uint8 numpy array
-    den = cv2.cvtColor(den, cv2.COLOR_RGB2BGR)
-    # if shapes differ, resize den to raw's size (keeps alignment); warn
-    if den.shape != raw.shape:
-        if verbose:
-            print(f"NOTE: shape mismatch, resizing denoised from {den.shape[:2]} to {raw.shape[:2]}")
-        den = cv2.resize(den, (raw.shape[1], raw.shape[0]), interpolation=cv2.INTER_LINEAR)
     # absolute difference per-channel
-    diff = cv2.absdiff(raw, den)               # BGR, uint8
     gray = cv2.cvtColor(diff, cv2.COLOR_BGR2GRAY)  # single-channel uint8
-    # optionally normalize to full 0-255 (per-image)
-    if normalize:
-        # cv2.normalize will map min->0 and max->255
-        # but if the image is flat (min==max) normalize will set to 0; handle that
-        minv = int(gray.min())
-        maxv = int(gray.max())
-        if maxv > minv:
             norm = cv2.normalize(gray, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX)
             out = norm
-        else:
-            # nothing to normalize (flat), keep as-is (all zeros)
-            out = gray
     else:
-        # keep raw diff values but ensure dtype uint8 (already uint8) and values are 0..255
         out = gray
-    #cv2.imwrite("profile.png", out)  # for debugging
     return out
-def profile_image_for_cnn_predict(pil_img: Image, crop_size=512):
     """Preprocess the input image and return a numpy array ready for model prediction."""
     # Step 1: Center crop the image
-    cropped_img = center_crop(pil_img, crop_size=crop_size)
     if isinstance(cropped_img, str):
         return cropped_img  # return error message if cropping failed
-    # Step 2: Denoise the cropped image
-    denoised_img = denoise(cropped_img)
-    if isinstance(denoised_img, str):
-        return denoised_img  # return error message if denoising failed
     # Step 3: Compute the profile image
-    profile_img = compute_profile(cropped_img, denoised_img, normalize=False)
     if isinstance(profile_img, str):
         return profile_img  # return error message if profile computation failed
     return profile_img
-def prepare_cv2_image_for_resnet(cv2_gray_img, target_size=(512,512)):
-    img_rgb = cv2.cvtColor(cv2_gray_img, cv2.COLOR_GRAY2RGB)
-    img_rgb = cv2.resize(img_rgb, (target_size[1], target_size[0]), interpolation=cv2.INTER_AREA)
-    img_rgb = img_rgb.astype('float32')
-    # 5) add batch dim
-    x = np.expand_dims(img_rgb, axis=0)   # shape (1, H, W, 3)
-    x = preprocess_input(x)
-    return x
-def predict_image_prob_clip(image: Image.Image, threshold=0.5,
-                       clip_model=None, clip_preprocess=None,
-                       keras_mlp=None):
     """
     Predicts probability that image is AI-generated (AI=1) using CLIP + Keras MLP.
@@ -172,8 +128,7 @@ def predict_image_prob_clip(image: Image.Image, threshold=0.5,
     Returns:
       dict: {'prob': float_prob_AI, 'label': 'AI' or 'Real'}
     """
     # --- try to reuse provided CLIP objects, otherwise load ---
     if clip_model is None or clip_preprocess is None:
         print("Loading Default CLIP model...")
@@ -186,10 +141,12 @@ def predict_image_prob_clip(image: Image.Image, threshold=0.5,
     # --- try to reuse provided keras model, otherwise load from disk ---
     if keras_mlp is None:
-        print("No keras model provided...")
-        return None
     # --- load/normalize image ---
     # assume PIL image
     img = image.convert('RGB')
     # --- preprocess for CLIP and get embedding ---
@@ -205,32 +162,15 @@ def predict_image_prob_clip(image: Image.Image, threshold=0.5,
     prob = float(probs[0])
     return prob
-def clip_predict(pil_img: Image, crop_size=512):
-    # pass model objects explicitly (faster if you call this repeatedly)
-    pil_img = center_crop(pil_img, crop_size=crop_size)
-    if isinstance(pil_img, str):
-        return pil_img  # return error message
-    return predict_image_prob_clip(pil_img,
-                         clip_model=clip_mod,
-                         clip_preprocess=clip_pre,
-                         keras_mlp=mlp_model)
-def CNNPredict(predict_img: np.ndarray):
-    #1 Real 0 AI
-     #normalize image
-    # expand dims to add channel axis
-     predict_img = predict_img.astype('float32') / 255.0  # shape (H, W)
-     predict_img = np.expand_dims(predict_img, axis=-1)  # shape (H, W, 1)
     # expand dims to add batch axis
-     predict_img = np.expand_dims(predict_img, axis=0)   # shape (1, H, W, 1)
-     prediction = cnn_model.predict(predict_img)
-     return prediction[0][0]
-def ResnetPredict(predict_img):
-    #1 Real 0 AI
-    predict_img = prepare_cv2_image_for_resnet(predict_img)
-    prediction = resnet_model.predict(predict_img)
     return prediction[0][0]

 REPO_ID = "MAS-AI-0000/Authentica"
 CLIP_MODEL_FILENAME = "Lib/Models/Image/clip_model.keras"
 CNN_MODEL_FILENAME = "Lib/Models/Image/cnn_model.keras"
 # ==== Load assets ====
 clip_model_path = hf_hub_download(repo_id=REPO_ID, filename=CLIP_MODEL_FILENAME)
 cnn_model_path = hf_hub_download(repo_id=REPO_ID, filename=CNN_MODEL_FILENAME)
 # Load models and preprocessing once at module level
 clip_mod, clip_pre = clip.load("ViT-B/32", jit=False)
 clip_mod.eval()
 for p in clip_mod.parameters():
     p.requires_grad = False
+mlp_model= tf.keras.models.load_model(os.path.join(MODELS_DIR, "clip_model.keras"))
+cnn_model = tf.keras.models.load_model(os.path.join(MODELS_DIR, "cnn_model.keras"))
 def center_crop(image: Image.Image, crop_size=512) -> Image.Image | str:
             w, h = image.size
             if w < crop_size or h < crop_size:
                 # skip small images
+                return f"Image is too small: ({w}x{h}), Minimum size is {crop_size}x{crop_size}"
             left = (w - crop_size) // 2
             top = (h - crop_size) // 2
             right = left + crop_size
             cropped = image.crop((left, top, right, bottom))
             return cropped
     except Exception as e:
+        return f"Error when cropping image: {e}"
+def compute_profile(src_image: Image) -> np.ndarray | str:
     """Read image, denoise (GPU if available) and return denoised image."""
     img = np.array(src_image)   # BGR uint8 numpy array
     img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
         print(f"WARNING: No source image, skipping.")
         return False
     # Denoising parameters
+    H = 5           # filter strength for luminance component (recommended 3-15)
+    H_COLOR = 5     # same for color components
     TEMPLATE_WINDOW_SIZE = 7
     SEARCH_WINDOW_SIZE = 21
     # Use CUDA if available, otherwise CPU fallback
             TEMPLATE_WINDOW_SIZE,
             SEARCH_WINDOW_SIZE
         )
     # absolute difference per-channel
+    diff = cv2.absdiff(img, den)               # BGR, uint8
     gray = cv2.cvtColor(diff, cv2.COLOR_BGR2GRAY)  # single-channel uint8
+    minv = int(gray.min())
+    maxv = int(gray.max())
+    if maxv > minv:
             norm = cv2.normalize(gray, None, alpha=0, beta=255, norm_type=cv2.NORM_MINMAX)
             out = norm
     else:
+        # nothing to normalize (flat), keep as-is (all zeros)
         out = gray
     return out
+def preprocess_cnn(pil_img: Image):
     """Preprocess the input image and return a numpy array ready for model prediction."""
     # Step 1: Center crop the image
+    cropped_img = center_crop(pil_img)
     if isinstance(cropped_img, str):
         return cropped_img  # return error message if cropping failed
     # Step 3: Compute the profile image
+    profile_img = compute_profile(cropped_img)
     if isinstance(profile_img, str):
         return profile_img  # return error message if profile computation failed
     return profile_img
+def CLIPPredict(image: Image.Image,
+                       clip_model=clip_mod, clip_preprocess=clip_pre,
+                       keras_mlp=mlp_model) -> float | str:
     """
     Predicts probability that image is AI-generated (AI=1) using CLIP + Keras MLP.
     Returns:
       dict: {'prob': float_prob_AI, 'label': 'AI' or 'Real'}
     """
+    #0 Real 1 AI
     # --- try to reuse provided CLIP objects, otherwise load ---
     if clip_model is None or clip_preprocess is None:
         print("Loading Default CLIP model...")
     # --- try to reuse provided keras model, otherwise load from disk ---
     if keras_mlp is None:
+       return  "No keras model provided..."
     # --- load/normalize image ---
     # assume PIL image
+    image = center_crop(image, crop_size=512)
+    if isinstance(image, str):
+        return image  # return error message if cropping failed
     img = image.convert('RGB')
     # --- preprocess for CLIP and get embedding ---
     prob = float(probs[0])
     return prob
+def CNNPredict(img: Image.Image) -> float | str:
+    predict_img = preprocess_cnn(img)
+    if isinstance(predict_img, str):
+        return predict_img  # return error message if preprocessing failed
+    predict_img = predict_img.astype('float32') / 255.0  # shape (H, W)
+    predict_img = np.expand_dims(predict_img, axis=-1)  # shape (H, W, 1)
     # expand dims to add batch axis
+    predict_img = np.expand_dims(predict_img, axis=0)   # shape (1, H, W, 1)
+    prediction = cnn_model.predict(predict_img)
     return prediction[0][0]