# Spaces: rkonan / reco-api-predict (Paused) - File size: 14,510 Bytes

import tensorflow as tf
import numpy as np
from PIL import Image
import tensorflow as tf
import logging
import numpy as np
from PIL import Image
from keras.applications.efficientnet_v2 import preprocess_input as effnet_preprocess
from keras.applications.resnet_v2 import preprocess_input as resnet_preprocess
import io
from tf_keras_vis.gradcam import Gradcam,GradcamPlusPlus
from tf_keras_vis.utils import normalize

import numpy as np
import tensorflow as tf
from tf_keras_vis.saliency import Saliency
from tf_keras_vis.utils import normalize
import numpy as np
import tensorflow as tf
from tf_keras_vis.saliency import Saliency
from tf_keras_vis.utils import normalize
import logging
import time

from typing import TypedDict, Callable, Any
# Root logging configuration: every record is rendered as
# "<timestamp> [<LEVEL>] <logger name>: <message>".
logging.basicConfig(
    format="%(asctime)s [%(levelname)s] %(name)s: %(message)s",
    level=logging.INFO,  # or logging.DEBUG
)
logger = logging.getLogger(__name__)

# Thresholds read by predict_with_model: a prediction is flagged as uncertain
# when its confidence is below confidence_threshold or its entropy is above
# entropy_threshold.
confidence_threshold = 0.5
entropy_threshold = 2

class ModelStruct(TypedDict):
    """Configuration record describing one classifier returned by load_models."""

    # Human-readable model identifier (e.g. "EfficientNetV2M").
    model_name: str
    # Keras model used for prediction.
    model: tf.keras.Model
    # Keras model handed to the Grad-CAM computation.
    gradcam_model: tf.keras.Model
    # Preprocessing function applied to the image array before prediction.
    preprocess_input: Callable[[np.ndarray], Any]
    # Size the input image is resized to (passed as-is to PIL's Image.resize).
    target_size: tuple[int, int]
    # Name of the layer used as Grad-CAM's penultimate layer.
    last_conv_layer: str
    # "gradcam++" selects GradcamPlusPlus; any other value selects Gradcam.
    gradcam_type: str


def load_models() -> list[ModelStruct]:
    """Load the two saved Keras classifiers and describe how to use each one.

    Both models are read from the relative ``model/`` directory with
    ``compile=False``. The same model object serves for prediction and for
    Grad-CAM.

    Returns:
        A two-element list of configuration records, EfficientNetV2M first
        and ResNet50V2 second.
    """
    efficientnet = tf.keras.models.load_model(
        "model/best_efficientnetv2m_gradcam.keras", compile=False
    )
    resnet = tf.keras.models.load_model(
        "model/best_ResNet50V2_gradcam.keras", compile=False
    )

    efficientnet_entry = {
        "model_name": "EfficientNetV2M",
        "model": efficientnet,
        "gradcam_model": efficientnet,
        "preprocess_input": effnet_preprocess,
        "target_size": (480, 480),
        "last_conv_layer": "top_activation",
        "gradcam_type": "gradcam++",
    }
    resnet_entry = {
        "model_name": "ResNet50V2",
        "gradcam_model": resnet,
        "model": resnet,
        "preprocess_input": resnet_preprocess,
        "target_size": (224, 224),
        "last_conv_layer": "conv5_block3_out",
        # Alternative value kept from the original source: "gradcam++".
        "gradcam_type": "gradcam",
    }
    return [efficientnet_entry, resnet_entry]



def compute_saliency_map(model, image_array, class_index=None):
    """Compute a saliency map with tf-keras-vis ``Saliency``.

    Args:
        model: tf.keras.Model to explain.
        image_array: np.ndarray. A 3-D array is treated as a single image and
            receives a leading batch axis; any other rank is passed through
            unchanged. Documented by the original author as a preprocessed
            float32 image of shape (H, W, 3).
        class_index: int or None. Index of the class whose score is
            explained; when None, the argmax of the first row of the model
            output is used.

    Returns:
        np.ndarray: the map of the first batch item, as absolute values
        (reduced with a max over the last axis when the raw map is 3-D) and
        passed through ``tf_keras_vis.utils.normalize`` (documented by the
        original author as scaling to [0, 1]).
    """
    # Messages go through the module-level logger, like the rest of the file,
    # instead of the root `logging` module.
    logger.info("Début du calcul de la carte de saillance")

    if image_array.ndim == 3:
        input_tensor = np.expand_dims(image_array, axis=0)
        logger.debug(f"Image d'entrée dimensionnée de {image_array.shape} à {input_tensor.shape} (batch)")
    else:
        input_tensor = image_array
        logger.debug(f"Image d'entrée déjà batchée avec shape {input_tensor.shape}")

    saliency = Saliency(model)
    logger.info("Objet Saliency initialisé")

    def loss(output):
        # Select the target class column of the model output.
        # NOTE(review): output is assumed to be (batch_size, num_classes).
        if class_index is None:
            class_index_local = tf.argmax(output[0])
            logger.info(f"Classe cible non spécifiée, utilisation de la classe prédite: {class_index_local.numpy()}")
        else:
            class_index_local = class_index
            logger.info(f"Classe cible spécifiée: {class_index_local}")
        return output[:, class_index_local]

    saliency_map = saliency(loss, input_tensor)
    logger.info("Calcul de la carte de saillance terminé")

    # Keep only the first (and normally only) item of the batch.
    saliency_map = saliency_map[0]
    logger.debug(f"Shape de la carte brute: {saliency_map.shape}")

    # Collapse a per-channel map to 2-D with the max absolute value; a map
    # that is already 2-D only needs the absolute value.
    if saliency_map.ndim == 3:
        saliency_map = np.max(np.abs(saliency_map), axis=-1)
    else:
        saliency_map = np.abs(saliency_map)
    logger.debug(f"Shape de la carte après réduction canaux: {saliency_map.shape}")

    saliency_map = normalize(saliency_map)
    logger.info("Normalisation de la carte de saillance terminée")

    return saliency_map


def _layer_output_rank(layer):
    """Return the rank of a layer's output shape, or None if it is unavailable."""
    # `output_shape` exists on Keras 2 layers but was removed in Keras 3,
    # where the shape is read from the symbolic output instead.
    shape = getattr(layer, "output_shape", None)
    if shape is None:
        try:
            shape = layer.output.shape
        except (AttributeError, ValueError):
            return None
    return len(shape)


def compute_gradcam(model, image_array, class_index=None, layer_name=None,gradcam_type="gradcam"):
    """Compute a Grad-CAM (or Grad-CAM++) map for an image and a Keras model.

    Args:
        model: tf.keras.Model to explain.
        image_array: np.ndarray. A 3-D array is treated as a single image and
            receives a leading batch axis; any other rank is passed through
            unchanged. Documented by the original author as a preprocessed
            float32 image of shape (H, W, 3).
        class_index: int or None. Index of the target class; when None, the
            argmax of the first row of the model output is used.
        layer_name: str or None. Name of the layer passed to tf-keras-vis as
            ``penultimate_layer``. When None, the last layer whose name
            contains "conv" and whose output is 4-D is used.
        gradcam_type: "gradcam++" selects ``GradcamPlusPlus``; any other
            value selects ``Gradcam``.

    Returns:
        np.ndarray: the map of the first batch item, passed through
        ``tf_keras_vis.utils.normalize`` (documented by the original author
        as an (H, W) map scaled to [0, 1]).

    Raises:
        ValueError: if ``layer_name`` is None and no suitable layer is found.
    """
    # Messages go through the module-level logger, like the rest of the file.
    logger.info(f"Lancement calcul de la gradcam avec le type {gradcam_type}")

    if image_array.ndim == 3:
        input_tensor = np.expand_dims(image_array, axis=0)
    else:
        input_tensor = image_array

    # Resolve the target layer before building the visualizer so that an
    # unusable model fails early.
    if layer_name is None:
        for layer in reversed(model.layers):
            if 'conv' in layer.name and _layer_output_rank(layer) == 4:
                layer_name = layer.name
                break
        if layer_name is None:
            raise ValueError("Aucune couche convolutionnelle 2D trouvée dans le modèle.")

    if gradcam_type == "gradcam++":
        gradcam = GradcamPlusPlus(model, clone=False)
    else:
        gradcam = Gradcam(model, clone=False)

    def loss(output):
        # Select the target class column of the model output.
        if class_index is None:
            class_index_local = tf.argmax(output[0])
        else:
            class_index_local = class_index
        return output[:, class_index_local]

    cam = gradcam(loss, input_tensor, penultimate_layer=layer_name)
    cam = cam[0]  # first (and normally only) item of the batch

    return normalize(cam)


def make_gradcam_heatmap(model, img_array, pred_index=None,
                         last_conv_layer_name="top_activation",
                         backbone_name="efficientnetv2-m"):
    """Compute a Grad-CAM heatmap for an image with a hand-written gradient pass.

    Args:
        model (tf.keras.Model): full Keras model containing a nested backbone
            layer named ``backbone_name``.
        img_array (numpy array): input image batch; documented by the
            original author as preprocessed with shape (1, H, W, C).
        pred_index (int, optional): index of the target class. Defaults to
            the argmax of the first row of the model predictions.
        last_conv_layer_name (str): name, inside the backbone, of the layer
            whose activations are weighted. Defaults to "top_activation".
        backbone_name (str): name of the nested backbone layer inside
            ``model``. Defaults to "efficientnetv2-m".

    Returns:
        numpy array: 2-D heatmap, clipped at 0 and divided by its maximum, so
        values lie in [0, 1].
    """
    # 1. Locate the target activation layer inside the nested backbone.
    back_bone = model.get_layer(backbone_name)
    last_conv_layer = back_bone.get_layer(last_conv_layer_name)

    # 2. Intermediate model returning both the target activations and the
    #    final model output.
    # NOTE(review): last_conv_layer.output comes from the nested backbone;
    # whether it is reachable from model.inputs depends on how the model was
    # assembled - confirm against the saved models.
    grad_model = tf.keras.models.Model(
        [model.inputs], [last_conv_layer.output, model.output]
    )

    with tf.GradientTape() as tape:
        conv_outputs, predictions = grad_model([img_array])
        if pred_index is None:
            pred_index = tf.argmax(predictions[0])
        class_channel = predictions[:, pred_index]

    # 3. Gradient of the target class score w.r.t. the activations.
    grads = tape.gradient(class_channel, conv_outputs)

    # 4. Average the gradients over the spatial axes (H, W).
    pooled_grads = tf.reduce_mean(grads, axis=(1, 2))

    # 5. Weight each activation channel of the first batch item by its mean
    #    gradient and sum over channels.
    heatmap = tf.reduce_sum(tf.multiply(pooled_grads[0], conv_outputs[0]), axis=-1)

    # 6. Clip negatives first, then divide by the max of the clipped map so
    #    the denominator is never negative and the result stays in [0, 1].
    heatmap = tf.maximum(heatmap, 0)
    heatmap = heatmap / (tf.reduce_max(heatmap) + 1e-8)

    return heatmap.numpy()

def compute_saliency_map_basic(model, image_array, class_index=None):
    """Compute a gradient-based saliency map of an image for a given model.

    Args:
        model: TensorFlow Keras model, called with ``training=False``.
        image_array: input image. A 3-D array receives a leading batch axis;
            any other rank is converted to a tensor as-is. Documented by the
            original author as a preprocessed float32 (H, W, 3) image.
        class_index: int or None, index of the target class. When None, the
            argmax of the first row of the predictions is used.

    Returns:
        np.ndarray: saliency map of the first batch item (max absolute
        gradient over the last axis), min-max scaled to [0, 1].
    """
    # The docstring must be the first statement of the function; the log call
    # comes after it so that __doc__ is actually populated.
    logger.info("🧠 Début du calcul de la salience...")

    if image_array.ndim == 3:
        image_tensor = tf.expand_dims(image_array, axis=0)
    else:
        image_tensor = tf.convert_to_tensor(image_array)

    image_tensor = tf.cast(image_tensor, tf.float32)
    with tf.GradientTape() as tape:
        # The input is a plain tensor, not a variable, so it has to be
        # watched explicitly to get gradients with respect to it.
        tape.watch(image_tensor)
        preds = model(image_tensor, training=False)
        if class_index is None:
            class_index = tf.argmax(preds[0])
        class_score = preds[:, class_index]

    # Gradient of the class score with respect to the input image.
    grads = tape.gradient(class_score, image_tensor)
    # Max over the last (channel) axis, then drop the batch axis.
    saliency = tf.reduce_max(tf.abs(grads), axis=-1)[0]

    # Min-max scaling; the epsilon guards against a constant map.
    lowest = tf.reduce_min(saliency)
    saliency = (saliency - lowest) / (tf.reduce_max(saliency) - lowest + 1e-10)

    logger.info("✅ Fin du calcul de la salience.")
    return saliency.numpy()
 


def preprocess_image(image_bytes, target_size, preprocess_input):
    """Decode image bytes and build both the model input and a raw input.

    Args:
        image_bytes: encoded image content.
        target_size: size passed to PIL's ``Image.resize``.
        preprocess_input: callable applied to a float32 copy of the pixels.

    Returns:
        A ``(preprocessed_input, raw_input)`` pair, each with a leading batch
        axis: the first is the output of ``preprocess_input``, the second is
        the float32 pixels divided by 255.

    Raises:
        ValueError: if the bytes cannot be decoded, or if the decoded array
            is not 3-D with 3 channels.
    """
    try:
        logger.info("📤 Lecture des bytes et conversion en image PIL")
        pil_image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    except Exception as exc:
        logger.exception("❌ Erreur lors de l'ouverture de l'image")
        raise ValueError("Impossible de décoder l'image") from exc

    logger.info(f"📐 Redimensionnement de l'image à la taille {target_size}")
    resized = pil_image.resize(target_size)
    image_array = np.array(resized).astype(np.float32)

    logger.debug(f"🔍 Shape de l'image après conversion en tableau : {image_array.shape}")

    # Guard: only 3-D arrays with exactly three channels are accepted.
    if not (image_array.ndim == 3 and image_array.shape[-1] == 3):
        logger.error(f"❌ Image invalide : shape={image_array.shape}")
        raise ValueError("Image must have 3 channels (RGB)")

    logger.info("🎨 Conversion et prétraitement de l'image")

    # Prediction input: preprocess a copy so the original pixels stay intact.
    preprocessed_input = np.expand_dims(
        preprocess_input(image_array.copy()), axis=0
    )

    # Grad-CAM input: not preprocessed, only scaled by 1/255 and batched.
    raw_input = np.expand_dims(image_array / 255.0, axis=0)

    logger.debug(f"🧪 Shape après ajout de la dimension batch : {preprocessed_input.shape}")
    return preprocessed_input, raw_input


def preprocess_image_v1(image_bytes, target_size,preprocess_input) -> np.ndarray:
    """Decode image bytes and return the preprocessed, batched model input.

    Args:
        image_bytes: encoded image content.
        target_size: size passed to PIL's ``Image.resize``.
        preprocess_input: callable applied to the decoded pixel array (the
            array is passed without a float cast or a copy).

    Returns:
        The output of ``preprocess_input`` with a leading batch axis.

    Raises:
        ValueError: if the bytes cannot be decoded, or if the decoded array
            is not 3-D with 3 channels.
    """
    try:
        logger.info("📤 Lecture des bytes et conversion en image PIL")
        pil_image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    except Exception as exc:
        logger.exception("❌ Erreur lors de l'ouverture de l'image")
        raise ValueError("Impossible de décoder l'image") from exc

    logger.info(f"📐 Redimensionnement de l'image à la taille {target_size}")
    image_array = np.array(pil_image.resize(target_size))

    logger.debug(f"🔍 Shape de l'image après conversion en tableau : {image_array.shape}")

    # Reject anything that is not a 3-D array with exactly three channels.
    if not (image_array.ndim == 3 and image_array.shape[-1] == 3):
        logger.error(f"❌ Image invalide : shape={image_array.shape}")
        raise ValueError("Image must have 3 channels (RGB)")

    logger.info("🎨 Conversion et prétraitement de l'image")
    processed = np.expand_dims(preprocess_input(image_array), axis=0)

    logger.debug(f"🧪 Shape après ajout de la dimension batch : {processed.shape}")
    return processed


def compute_entropy_safe(probas):
    """Return the Shannon entropy (natural log) of the given probabilities.

    Entries that are not strictly positive are ignored, so zero
    probabilities never reach ``log``. Inputs of any shape are accepted; all
    positive entries contribute to a single sum.
    """
    values = np.array(probas)
    positive = values[values > 0]
    return -np.sum(positive * np.log(positive))


def predict_with_model(config, image_bytes: bytes,show_heatmap=False):
    """Run one model on an image and optionally attach a Grad-CAM heatmap.

    Args:
        config: model configuration record; the keys read here are
            "target_size", "preprocess_input", "model", "gradcam_model",
            "last_conv_layer" and "gradcam_type".
        image_bytes: encoded image content.
        show_heatmap: when true, a heatmap is computed unless the prediction
            is flagged as uncertain.

    Returns:
        dict with keys "preds" (class scores as a list), "predicted_class",
        "confidence", "entropy", "is_uncertain_model" and "heatmap" (nested
        list, or [] when not requested, skipped or failed).

    Raises:
        ValueError: propagated from preprocess_image when the image cannot be
            decoded or is not a 3-channel image.
    """
    input_array, raw_input = preprocess_image(
        image_bytes, config["target_size"], config["preprocess_input"]
    )

    logger.info("🤖 Lancement de la prédiction avec le modèle")
    preds = config["model"].predict(input_array)
    logger.debug(f"📈 Prédictions brutes : {preds[0].tolist()}")

    predicted_class_index = int(np.argmax(preds[0]))
    confidence = float(preds[0][predicted_class_index])
    # Entropy of the single image's distribution, i.e. the same row that
    # confidence and predicted_class are taken from.
    entropy = float(compute_entropy_safe(preds[0]))
    is_uncertain_model = (confidence < confidence_threshold) or (entropy > entropy_threshold)
    logger.info(f"✅ Prédiction : classe={predicted_class_index}, confiance={confidence:.4f},entropy={entropy:.4f},is_uncertain_model={is_uncertain_model}")

    # "heatmap" defaults to an empty list; it is only replaced when a heatmap
    # is requested, the model is confident, and the computation succeeds.
    result = {
        "preds": preds[0].tolist(),
        "predicted_class": predicted_class_index,
        "confidence": confidence,
        "entropy": entropy,
        "is_uncertain_model": is_uncertain_model,
        "heatmap": [],
    }

    if not show_heatmap or is_uncertain_model:
        logger.info("ℹ️ Heatmap non générée (option désactivée ou modèle incertain)")
        return result

    try:
        logger.info("✅ Début de la génération de la heatmap")
        start_time = time.time()

        logger.info(f"🖼️ Image d'entrée shape: {raw_input.shape}")
        logger.info(f"🎯 Index de classe prédite: {predicted_class_index}")
        logger.info(f"🛠️ Dernière couche utilisée: {config['last_conv_layer']}")

        # NOTE(review): Grad-CAM runs on raw_input (pixels / 255), not on the
        # input_array that produced the prediction - confirm this is intended.
        heatmap = compute_gradcam(
            config["gradcam_model"],
            raw_input,
            class_index=predicted_class_index,
            layer_name=config["last_conv_layer"],
            gradcam_type=config["gradcam_type"],
        )

        elapsed_time = time.time() - start_time
        logger.info(f"✅ Heatmap générée en {elapsed_time:.2f} secondes")

        # Plain nested lists so the result can be serialised to JSON.
        result["heatmap"] = heatmap.tolist()
    except Exception as e:
        # Best effort: a failed heatmap must not fail the prediction, but the
        # traceback is logged so the failure can be diagnosed.
        logger.exception(f"❌ Erreur lors de la génération de la heatmap: {e}")

    return result