# NOTE: The "Spaces: Running" lines here were residue from the Hugging Face
# Spaces page this file was captured from; they are not part of the module.
| """ML model loading and inference for Valeon diagnostic endpoints.""" | |
| from __future__ import annotations | |
| import io | |
| import logging | |
| import threading | |
| from typing import Any | |
| import numpy as np | |
| from PIL import Image | |
| logger = logging.getLogger(__name__) | |
| # --------------------------------------------------------------------------- | |
| # Custom Keras layers | |
| # Registered BEFORE any model is loaded. | |
| # Dual registration: | |
| # package="custom" -> key "custom>MBConvBlock" (Keras standard) | |
| # package="" -> key "MBConvBlock" (what .keras bundle stores) | |
| # --------------------------------------------------------------------------- | |
| import keras | |
class _SEBlock(keras.layers.Layer):
    """Squeeze-and-Excitation block built from Dense layers.

    The sub-layer attribute names and ``name=`` arguments are load-bearing:
    they must match the original saved model's structure so that weight
    restoration (including the h5py fallback loader) can resolve paths:

        se_block/global_pool  (GlobalAveragePooling2D, keepdims=True)
        se_block/squeeze      (Dense, swish)
        se_block/excite       (Dense, sigmoid)
    """

    def __init__(self, se_filters: int, expanded_filters: int, **kwargs):
        super().__init__(**kwargs)
        self.se_filters = se_filters
        self.expanded_filters = expanded_filters

    def build(self, input_shape):
        # keepdims=True keeps a (B, 1, 1, C) shape so the excitation can be
        # broadcast-multiplied against the (B, H, W, C) input.
        self.global_pool = keras.layers.GlobalAveragePooling2D(
            keepdims=True, name="global_pool"
        )
        self.squeeze = keras.layers.Dense(
            self.se_filters, activation="swish", name="squeeze"
        )
        self.excite = keras.layers.Dense(
            self.expanded_filters, activation="sigmoid", name="excite"
        )
        super().build(input_shape)

    def call(self, x):
        # Pool -> squeeze -> excite, then rescale the input channel-wise.
        return x * self.excite(self.squeeze(self.global_pool(x)))

    def get_config(self):
        return {
            **super().get_config(),
            "se_filters": self.se_filters,
            "expanded_filters": self.expanded_filters,
        }
class MBConvBlock(keras.layers.Layer):
    """Mobile Inverted Bottleneck Conv block with Squeeze-and-Excitation.

    mixed_bfloat16 dtype fix: the model was trained with
    keras.mixed_precision.Policy('mixed_bfloat16'), which means
    BatchNormalization outputs bfloat16 while the original `inputs`
    tensor is float32. We cast `inputs` to match `x` before the residual
    add so the dtypes always agree regardless of the active policy.

    Sub-layers use explicit names that match the original saved model's
    HDF5 weight structure (depthwise_conv, depthwise_bn, expand_conv,
    expand_bn, project_conv, project_bn, se_block).
    """

    def __init__(
        self,
        filters: int,
        kernel_size: int = 3,
        strides: int = 1,
        expand_ratio: int = 1,
        se_ratio: float = 0.25,
        drop_connect_rate: float = 0.0,
        input_filters: int = 0,
        **kwargs,
    ):
        super().__init__(**kwargs)
        self.filters = filters
        self.kernel_size = kernel_size
        self.strides = strides
        self.expand_ratio = expand_ratio
        self.se_ratio = se_ratio
        self.drop_connect_rate = drop_connect_rate
        self.input_filters = input_filters
        # Derived channel counts: expansion widens, SE bottleneck narrows.
        # max(1, ...) guards against a zero width when input_filters is 0.
        self._expanded_filters = max(1, int(input_filters * expand_ratio))
        self._se_filters = max(1, int(self._expanded_filters * se_ratio))
        # A residual shortcut is only valid when the block preserves both
        # spatial size (stride 1) and channel count.
        self._use_residual = (strides == 1 and input_filters == filters)

    def build(self, input_shape):
        # 1x1 expansion conv; skipped entirely when expand_ratio == 1
        # (matching the structure of the saved model).
        if self.expand_ratio != 1:
            self._expand_conv = keras.layers.Conv2D(
                self._expanded_filters, 1, padding="same", use_bias=False,
                name="expand_conv",
            )
            self._expand_bn = keras.layers.BatchNormalization(name="expand_bn")
        # Depthwise spatial convolution (carries the block's stride).
        self._dw_conv = keras.layers.DepthwiseConv2D(
            self.kernel_size,
            strides=self.strides,
            padding="same",
            use_bias=False,
            name="depthwise_conv",
        )
        self._dw_bn = keras.layers.BatchNormalization(name="depthwise_bn")
        if self.se_ratio > 0:
            self._se_block = _SEBlock(
                self._se_filters, self._expanded_filters, name="se_block"
            )
        # 1x1 projection back down to `filters` channels (linear bottleneck).
        self._project_conv = keras.layers.Conv2D(
            self.filters, 1, padding="same", use_bias=False,
            name="project_conv",
        )
        self._project_bn = keras.layers.BatchNormalization(name="project_bn")
        # Stochastic depth: drop the whole residual branch per-sample.
        # noise_shape (None, 1, 1, 1) drops entire feature maps, not pixels.
        if self.drop_connect_rate > 0 and self._use_residual:
            self._drop = keras.layers.Dropout(
                self.drop_connect_rate, noise_shape=(None, 1, 1, 1)
            )
        else:
            self._drop = None
        super().build(input_shape)

    def call(self, inputs, training=None):
        import tensorflow as tf
        x = inputs
        if self.expand_ratio != 1:
            x = keras.activations.swish(
                self._expand_bn(self._expand_conv(x), training=training)
            )
        x = keras.activations.swish(
            self._dw_bn(self._dw_conv(x), training=training)
        )
        if self.se_ratio > 0:
            x = self._se_block(x)
        # No activation after projection: linear bottleneck output.
        x = self._project_bn(self._project_conv(x), training=training)
        if self._use_residual:
            if self._drop is not None:
                x = self._drop(x, training=training)
            # Cast shortcut to match x dtype (handles mixed_bfloat16 training)
            shortcut = tf.cast(inputs, x.dtype)
            x = x + shortcut
        return x

    def get_config(self):
        """Return the constructor kwargs so the layer round-trips through
        Keras serialization."""
        base = super().get_config()
        base.update(
            dict(
                filters=self.filters,
                kernel_size=self.kernel_size,
                strides=self.strides,
                expand_ratio=self.expand_ratio,
                se_ratio=self.se_ratio,
                drop_connect_rate=self.drop_connect_rate,
                input_filters=self.input_filters,
            )
        )
        return base
# Dual registration for BOTH custom layers, matching the module header's
# contract:
#   package="custom" -> key "custom>Name" (Keras standard)
#   package=""       -> key "Name"        (what the .keras bundle stores)
# The original code only registered MBConvBlock under the bare key; the
# "custom" registration was missing, so bundles serialized with the
# "custom>MBConvBlock" key could not be deserialized. Each call is wrapped
# in try/except because some Keras versions raise when a name is already
# registered (e.g. on module re-import).
for _pkg in ("custom", ""):
    for _cls in (MBConvBlock, _SEBlock):
        try:
            keras.saving.register_keras_serializable(package=_pkg)(_cls)
        except Exception:
            pass
# custom_objects mapping handed to every Keras loader strategy for the
# skin model; keys must match the class names stored in the .keras config.
_SKIN_CUSTOM_OBJECTS: dict[str, Any] = {
    "MBConvBlock": MBConvBlock,
    "_SEBlock": _SEBlock,
}
| # --------------------------------------------------------------------------- | |
| # TFSMLayer shim | |
| # Wraps keras.layers.TFSMLayer so it exposes a .predict() interface. | |
| # --------------------------------------------------------------------------- | |
class _TFSMShim:
    """Adapter that gives a ``TFSMLayer`` a Keras-model-like ``predict``.

    Lets callers treat a SavedModel endpoint exactly like a loaded model.
    """

    def __init__(self, layer: Any):
        self._layer = layer

    def predict(self, x, verbose=0):
        import tensorflow as tf

        outputs = self._layer(tf.constant(x, dtype=tf.float32), training=False)
        # serving_default signatures return {output_name: tensor}; take the
        # first (and in practice only) entry.
        if isinstance(outputs, dict):
            outputs = next(iter(outputs.values()))
        return outputs.numpy()
| # --------------------------------------------------------------------------- | |
| # Model registry | |
| # --------------------------------------------------------------------------- | |
# Registry of every diagnostic model: where to download it from the HF Hub,
# which loader to use ("framework" is dispatched on in _load_model), the
# expected input size, and the class labels in model-output index order.
MODEL_REGISTRY: dict[str, dict[str, Any]] = {
    "cataract": {
        # Architecture JSON + separate weights file ("keras_json_weights").
        "repo_id": "Arko007/Cataract-Detection-CNN",
        "arch_file": "model_architecture.json",
        "weights_file": "model_weights.weights.h5",
        "framework": "keras_json_weights",
        "input_size": (224, 224),
        "classes": ["Cataract", "Normal"],
    },
    "diabetic_retinopathy": {
        # Single legacy HDF5 model loaded via tf.keras ("tf").
        "repo_id": "Arko007/diabetic-retinopathy-v1",
        "filename": "best_model.h5",
        "framework": "tf",
        "input_size": (384, 384),
        "classes": [
            "Grade 0 - No DR",
            "Grade 1 - Mild DR",
            "Grade 2 - Moderate DR",
            "Grade 3 - Severe DR",
            "Grade 4 - Proliferative DR",
        ],
    },
    "kidney": {
        # EfficientNet-B0 PyTorch checkpoint.
        "repo_id": "Arko007/kidney-ct-classifier-efficientnet",
        "filename": "best_model.pth",
        "framework": "pytorch_efficientnet",
        "input_size": (224, 224),
        "classes": ["Cyst", "Normal", "Stone", "Tumor"],
    },
    "skin": {
        # Keras 3 .keras bundle; loaded via the four-strategy fallback chain.
        "repo_id": "Arko007/skin-disease-detector-ai",
        "filename": "model.keras",
        "framework": "keras3",
        "input_size": (512, 512),
        "classes": [
            "Actinic Keratosis",
            "Basal Cell Carcinoma",
            "Dermatofibroma",
            "Nevus",
            "Pigmented Benign Keratosis",
            "Seborrheic Keratosis",
            "Squamous Cell Carcinoma",
            "Vascular Lesion",
        ],
    },
    "cardiac": {
        # DenseNet-169 PyTorch checkpoint with a replaced classifier head.
        "repo_id": "Arko007/cardiac-mri-cnn",
        "filename": "best_model_epoch20_auc0.8129.pt",
        "framework": "pytorch_cardiac",
        # Input size matches original app: 896×896
        "input_size": (896, 896),
        # Index 0 = Normal, Index 1 = Sick (matches original model_service.py)
        "classes": ["Normal", "Sick"],
    },
}
# Process-wide cache of loaded models, keyed by registry name.
_loaded_models: dict[str, Any] = {}
# One lock per model so loading one model never blocks loading another.
_load_locks: dict[str, threading.Lock] = {k: threading.Lock() for k in MODEL_REGISTRY}
| # --------------------------------------------------------------------------- | |
| # Image preprocessing | |
| # --------------------------------------------------------------------------- | |
def _preprocess_image_tf(image_bytes: bytes, target_size: tuple[int, int]) -> np.ndarray:
    """Decode an image, resize with LANCZOS, scale to [0, 1], add batch dim.

    Returns a float32 array of shape (1, H, W, 3).
    """
    rgb = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    resized = rgb.resize(target_size, Image.LANCZOS)
    scaled = np.asarray(resized, dtype=np.float32) / 255.0
    return scaled[np.newaxis, ...]
def _preprocess_dr(
    image_bytes: bytes, target_size: tuple[int, int] = (384, 384)
) -> np.ndarray:
    """Preprocess a fundus image for the diabetic-retinopathy model.

    BILINEAR resize (kept distinct from the LANCZOS generic path to match
    this model's training pipeline), scale to [0, 1], prepend a batch dim.

    The previously hard-coded (384, 384) is now a defaulted parameter so
    the function stays in sync with MODEL_REGISTRY["diabetic_retinopathy"]
    ["input_size"] and remains backward compatible for existing callers.

    Returns a float32 array of shape (1, H, W, 3).
    """
    img = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    img = img.resize(target_size, Image.BILINEAR)
    arr = np.array(img, dtype=np.float32) / 255.0
    return np.expand_dims(arr, axis=0)
def _preprocess_skin(
    image_bytes: bytes, target_size: tuple[int, int] = (512, 512)
) -> np.ndarray:
    """Preprocess a dermoscopy image for the skin model.

    Resizes with PIL's default resample filter (deliberately unspecified,
    matching the original pipeline), scales to [0, 1], prepends a batch dim.

    The previously hard-coded (512, 512) is now a defaulted parameter so
    the function stays in sync with MODEL_REGISTRY["skin"]["input_size"]
    and remains backward compatible for existing callers.

    Returns a float32 array of shape (1, H, W, 3).
    """
    img = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    img = img.resize(target_size)
    arr = np.array(img, dtype=np.float32) / 255.0
    return np.expand_dims(arr, axis=0)
def _preprocess_image_torch(image_bytes: bytes, target_size: tuple[int, int]):
    """ImageNet-style preprocessing for the generic PyTorch models.

    Resize -> CenterCrop -> ToTensor -> Normalize(ImageNet mean/std);
    returns a (1, 3, H, W) float tensor.
    """
    import torch
    from torchvision import transforms

    pipeline = transforms.Compose([
        transforms.Resize(target_size),
        transforms.CenterCrop(target_size),
        transforms.ToTensor(),
        transforms.Normalize(mean=[0.485, 0.456, 0.406],
                             std=[0.229, 0.224, 0.225]),
    ])
    image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
    return pipeline(image).unsqueeze(0)
def _preprocess_cardiac(image_bytes: bytes, target_size: tuple[int, int]):
    """Cardiac-specific preprocessing: Grayscale → 3ch, normalize with 0.5/0.5.

    Matches the original ModelService transform exactly:
    Resize → Grayscale(num_output_channels=3) → ToTensor → Normalize(0.5, 0.5)

    Returns a (1, 3, H, W) float tensor.
    """
    import torch
    from torchvision import transforms

    image = Image.open(io.BytesIO(image_bytes))
    # The model was trained on grayscale MRI, so collapse color first;
    # the transform then replicates the single channel three times.
    if image.mode != "L":
        image = image.convert("L")

    pipeline = transforms.Compose([
        transforms.Resize(target_size),
        transforms.Grayscale(num_output_channels=3),
        transforms.ToTensor(),
        transforms.Normalize(mean=[0.5, 0.5, 0.5], std=[0.5, 0.5, 0.5]),
    ])
    return pipeline(image).unsqueeze(0)
| # --------------------------------------------------------------------------- | |
| # Cardiac model: DenseNet-169 (matches original training architecture) | |
| # --------------------------------------------------------------------------- | |
def _build_cardiac_model(num_classes: int = 2):
    """Build DenseNet-169 with its classifier replaced by a fresh Linear head.

    The checkpoint was trained with torchvision's DenseNet-169 where only
    the final Linear layer was swapped — identical to the original app's
    ModelService._load_model().
    """
    import torch.nn as nn
    from torchvision import models

    net = models.densenet169(weights=None)
    in_features = net.classifier.in_features
    net.classifier = nn.Linear(in_features, num_classes)
    return net
| # --------------------------------------------------------------------------- | |
| # h5py path-based weight helpers | |
| # --------------------------------------------------------------------------- | |
| # Keras auto-naming: class_name → snake_case base used as HDF5 key. | |
| _CLASS_TO_H5_BASE: dict[str, str] = { | |
| "InputLayer": "input_layer", | |
| "Conv2D": "conv2d", | |
| "BatchNormalization": "batch_normalization", | |
| "Activation": "activation", | |
| "MBConvBlock": "mb_conv_block", | |
| "GlobalAveragePooling2D": "global_average_pooling2d", | |
| "Dropout": "dropout", | |
| "Dense": "dense", | |
| } | |
| # Variable name → positional index inside an HDF5 ``vars/`` group. | |
| _VAR_NAME_TO_INDEX: dict[str, int] = { | |
| "kernel": 0, | |
| "bias": 1, | |
| "gamma": 0, | |
| "beta": 1, | |
| "moving_mean": 2, | |
| "moving_variance": 3, | |
| } | |
| def _build_outer_name_map(config: dict) -> dict[str, str]: | |
| """Map config layer names → HDF5 layer keys. | |
| The .keras bundle may store HDF5 layer keys using Keras auto-generated | |
| names (e.g. ``conv2d``, ``mb_conv_block_1``) while config.json uses | |
| user-specified names (e.g. ``stem_conv``, ``block_1a``). This function | |
| re-derives the auto-name by counting class occurrences in config order. | |
| """ | |
| class_counter: dict[str, int] = {} | |
| outer_map: dict[str, str] = {} | |
| for layer_cfg in config["config"]["layers"]: | |
| class_name = layer_cfg["class_name"] | |
| layer_name = layer_cfg["name"] | |
| base = _CLASS_TO_H5_BASE.get(class_name, class_name.lower()) | |
| count = class_counter.get(base, 0) | |
| h5_key = base if count == 0 else f"{base}_{count}" | |
| outer_map[layer_name] = h5_key | |
| class_counter[base] = count + 1 | |
| return outer_map | |
| # --------------------------------------------------------------------------- | |
| # Model loading | |
| # --------------------------------------------------------------------------- | |
def _download(repo_id: str, filename: str) -> str:
    """Fetch one file from the Hugging Face Hub and return its local path.

    hf_hub_download caches downloads, so repeat calls are cheap.
    """
    from huggingface_hub import hf_hub_download

    return hf_hub_download(repo_id=repo_id, filename=filename)
def _load_skin_model(repo_id: str, filename: str) -> Any:
    """Four-strategy loader for the skin model.keras file.

    Strategy 1: keras.saving.load_model with safe_mode=False.
    Strategy 2: TFSMLayer on the HF snapshot (SavedModel path).
    Strategy 3: tf.keras.models.load_model with safe_mode=False.
    Strategy 4: Manual unzip + h5py index-based weight assignment.
                Reads model.weights.h5 from inside the .keras ZIP and
                assigns each tensor to model.weights[i] by DFS index
                order — bypasses ALL name/shape matching so every BN
                gamma/beta/moving_mean/moving_variance is loaded correctly.

    Returns either a Keras model or a _TFSMShim (Strategy 2); both expose
    ``predict``. Raises RuntimeError chaining the last error when all four
    strategies fail.
    """
    import tensorflow as tf
    path = _download(repo_id, filename)
    # -----------------------------------------------------------------------
    # Strategy 1 — keras.saving.load_model with safe_mode=False
    # -----------------------------------------------------------------------
    try:
        model = keras.saving.load_model(
            path,
            custom_objects=_SKIN_CUSTOM_OBJECTS,
            compile=False,
            safe_mode=False,
        )
        logger.info("Skin model loaded via keras.saving.load_model (safe_mode=False).")
        return model
    except Exception as e1:
        logger.warning("keras.saving.load_model failed for skin: %s", e1)
    # -----------------------------------------------------------------------
    # Strategy 2 — TFSMLayer on the HF snapshot directory
    # -----------------------------------------------------------------------
    try:
        from huggingface_hub import snapshot_download
        snapshot_dir = snapshot_download(repo_id=repo_id)
        layer = keras.layers.TFSMLayer(
            snapshot_dir,
            call_endpoint="serving_default",
        )
        logger.info("Skin model loaded via TFSMLayer (SavedModel snapshot).")
        # Wrapped so callers can use .predict() like a regular model.
        return _TFSMShim(layer)
    except Exception as e2:
        logger.warning("TFSMLayer failed for skin: %s", e2)
    # -----------------------------------------------------------------------
    # Strategy 3 — tf.keras legacy loader with safe_mode=False
    # -----------------------------------------------------------------------
    try:
        import inspect
        load_kwargs: dict[str, Any] = {"compile": False}
        # Older tf.keras versions do not accept safe_mode; pass it only
        # when the signature advertises it.
        if "safe_mode" in inspect.signature(tf.keras.models.load_model).parameters:
            load_kwargs["safe_mode"] = False
        model = tf.keras.models.load_model(
            path,
            custom_objects=_SKIN_CUSTOM_OBJECTS,
            **load_kwargs,
        )
        logger.info("Skin model loaded via tf.keras.models.load_model.")
        return model
    except Exception as e3:
        logger.warning("tf.keras.models.load_model failed for skin: %s", e3)
    # -----------------------------------------------------------------------
    # Strategy 4 — manual unzip + h5py path-based weight assignment
    #
    # The .keras bundle contains config.json (architecture) and
    # model.weights.h5 (weights keyed by auto-generated layer names).
    # The config uses user-specified names (e.g. "block_1a") while the
    # HDF5 uses Keras auto-names (e.g. "mb_conv_block"). We bridge
    # the two by building an explicit outer-name mapping and then
    # translating each model variable path to its HDF5 dataset path.
    # -----------------------------------------------------------------------
    import zipfile, tempfile, os, json, h5py
    try:
        with tempfile.TemporaryDirectory() as tmpdir:
            with zipfile.ZipFile(path, "r") as zf:
                zf.extractall(tmpdir)
            config_path = os.path.join(tmpdir, "config.json")
            # Keras has used both filenames for the weights archive.
            weights_candidates = [
                os.path.join(tmpdir, "model.weights.h5"),
                os.path.join(tmpdir, "weights.h5"),
            ]
            weights_path = next(
                (p for p in weights_candidates if os.path.exists(p)), None
            )
            if not os.path.exists(config_path):
                raise FileNotFoundError("config.json not found inside .keras bundle")
            with open(config_path, "r") as f:
                config_data = json.load(f)
            # Rebuild architecture from config
            model = keras.models.model_from_json(
                json.dumps(config_data),
                custom_objects=_SKIN_CUSTOM_OBJECTS,
            )
            # Force all layers to create their variables
            model.build((None, 512, 512, 3))
            # Run one dummy forward pass so all sub-layers build
            dummy = np.zeros((1, 512, 512, 3), dtype=np.float32)
            try:
                model(dummy, training=False)
            except Exception:
                # Best-effort only: some graphs still build enough variables
                # even when the eager call itself fails.
                pass
            if not weights_path:
                logger.warning(
                    "Skin model architecture rebuilt but no weights file found "
                    "— predictions will be random."
                )
                return model
            # Build flat dict of all HDF5 layer datasets
            h5_data: dict[str, np.ndarray] = {}
            with h5py.File(weights_path, "r") as hf:
                def _visit(name, obj):
                    # Only leaf datasets under "layers/" hold weight tensors.
                    if isinstance(obj, h5py.Dataset) and name.startswith("layers/"):
                        h5_data[name] = np.array(obj)
                hf.visititems(_visit)
            # Build outer-name mapping (config name → HDF5 key)
            outer_map = _build_outer_name_map(config_data)
            # Debug: log first 5 H5 keys and first 5 model var paths
            h5_keys_sample = sorted(h5_data.keys())[:5]
            var_paths_sample = [v.path for v in model.weights[:5]]
            logger.info(
                "H5 keys sample: %s | var paths sample: %s",
                h5_keys_sample, var_paths_sample,
            )
            # Assign weights by translating each model var path → HDF5 path
            assigned = 0
            skipped = 0
            for var in model.weights:
                # var.path looks like "outer[/inner[/sub_inner]]/var_name".
                parts = var.path.split("/")
                outer_name = parts[0]
                var_name = parts[-1]
                h5_outer = outer_map.get(outer_name)
                if h5_outer is None:
                    logger.debug("No outer mapping for %s", var.path)
                    skipped += 1
                    continue
                # Position of this variable inside the layer's "vars/" group.
                var_idx = _VAR_NAME_TO_INDEX.get(var_name, 0)
                if len(parts) == 2:
                    # Simple layer: outer/var_name
                    h5_path = f"layers/{h5_outer}/vars/{var_idx}"
                elif len(parts) == 3:
                    # Sub-layer: outer/inner/var_name
                    h5_path = f"layers/{h5_outer}/{parts[1]}/vars/{var_idx}"
                elif len(parts) == 4:
                    # Nested sub-layer: outer/inner/sub_inner/var_name
                    h5_path = f"layers/{h5_outer}/{parts[1]}/{parts[2]}/vars/{var_idx}"
                else:
                    logger.debug("Unexpected path depth for %s", var.path)
                    skipped += 1
                    continue
                arr = h5_data.get(h5_path)
                # Only assign on an exact shape match; a wrong-shaped assign
                # would raise and abort the whole strategy.
                if arr is not None and arr.shape == tuple(var.shape):
                    target_dtype = (
                        var.dtype.as_numpy_dtype
                        if hasattr(var.dtype, "as_numpy_dtype")
                        else np.float32
                    )
                    var.assign(arr.astype(target_dtype))
                    assigned += 1
                else:
                    if arr is not None:
                        logger.debug(
                            "Shape mismatch for %s: model=%s h5=%s (h5_path=%s)",
                            var.path, var.shape, arr.shape, h5_path,
                        )
                    else:
                        logger.debug(
                            "H5 path not found for %s → %s", var.path, h5_path,
                        )
                    skipped += 1
            logger.info(
                "Skin model loaded via h5py path-based assignment: "
                "%d assigned, %d skipped.",
                assigned, skipped,
            )
            if skipped > 0:
                logger.warning(
                    "%d weights could not be assigned. "
                    "Predictions may be partially degraded.",
                    skipped,
                )
            # ---- Self-test at load time ----
            # Min confidence for any single class on the expected test image.
            # A correctly-loaded 8-class model should exceed random chance
            # (1/8 = 12.5%) by a wide margin; 35% is a conservative floor.
            _SELFTEST_MIN_CONFIDENCE = 0.35
            test_image_path = os.environ.get("SKIN_TEST_IMAGE", "")
            if test_image_path and os.path.exists(test_image_path):
                try:
                    with open(test_image_path, "rb") as f:
                        test_bytes = f.read()
                    test_input = _preprocess_skin(test_bytes)
                    test_raw = model.predict(test_input, verbose=0)
                    test_probs = test_raw[0].tolist()
                    max_conf = max(test_probs)
                    max_class = test_probs.index(max_conf)
                    logger.info(
                        "Skin model self-test: max_confidence=%.4f class_index=%d",
                        max_conf, max_class,
                    )
                    if max_conf < _SELFTEST_MIN_CONFIDENCE:
                        # Deliberately log-and-continue rather than raise:
                        # a degraded model is still returned to the caller.
                        logger.error(
                            "SKIN MODEL WEIGHT LOADING FAILURE: max confidence "
                            "%.4f < %.2f. Weights are not loaded correctly. "
                            "All predictions will be unreliable.",
                            max_conf, _SELFTEST_MIN_CONFIDENCE,
                        )
                except Exception as selftest_err:
                    logger.warning(
                        "Skin model self-test failed: %s", selftest_err
                    )
            return model
    except Exception as e4:
        logger.error("All skin model loading strategies failed. Last error: %s", e4)
        raise RuntimeError(
            "Could not load skin model after 4 strategies. "
            f"[S1] {e1} | [S2] {e2} | [S3] {e3} | [S4] {e4}"
        ) from e4
def _load_model(name: str) -> Any:
    """Download and construct the model registered under *name*.

    Dispatches on the registry entry's ``framework`` field; raises
    ValueError for an unknown framework string.
    """
    cfg = MODEL_REGISTRY[name]
    fw = cfg["framework"]
    if fw == "keras_json_weights":
        import json
        # Architecture JSON + separate weights file (cataract model).
        arch_path = _download(cfg["repo_id"], cfg["arch_file"])
        weights_path = _download(cfg["repo_id"], cfg["weights_file"])
        with open(arch_path, "r") as f:
            arch_json = json.load(f)
        # model_from_json expects a JSON *string*; the file may contain
        # either a string or an already-parsed dict.
        model = keras.models.model_from_json(
            arch_json if isinstance(arch_json, str) else json.dumps(arch_json)
        )
        model.load_weights(weights_path)
        return model
    if fw == "keras3":
        return _load_skin_model(cfg["repo_id"], cfg["filename"])
    if fw == "tf":
        import tensorflow as tf
        path = _download(cfg["repo_id"], cfg["filename"])
        return tf.keras.models.load_model(path, compile=False)
    if fw == "pytorch_efficientnet":
        import torch
        from efficientnet_pytorch import EfficientNet
        path = _download(cfg["repo_id"], cfg["filename"])
        model = EfficientNet.from_name("efficientnet-b0", num_classes=len(cfg["classes"]))
        # SECURITY NOTE: weights_only=False unpickles arbitrary objects from
        # the downloaded checkpoint; acceptable only because the HF repo is
        # controlled by the project.
        state = torch.load(path, map_location="cpu", weights_only=False)
        # Checkpoints may wrap the weights in a training-state dict.
        if isinstance(state, dict) and "model_state_dict" in state:
            state = state["model_state_dict"]
        # strict=False: tolerate extra/missing head keys from training.
        model.load_state_dict(state, strict=False)
        model.eval()
        return model
    if fw == "pytorch_cardiac":
        import torch
        path = _download(cfg["repo_id"], cfg["filename"])
        # SECURITY NOTE: same trusted-repo caveat for weights_only=False.
        checkpoint = torch.load(path, map_location="cpu", weights_only=False)
        state_dict = checkpoint.get("model_state_dict", checkpoint) if isinstance(checkpoint, dict) else checkpoint
        model = _build_cardiac_model(len(cfg["classes"]))
        model.load_state_dict(state_dict, strict=False)
        model.eval()
        return model
    raise ValueError(f"Unknown framework: {fw}")
def get_model(name: str) -> Any:
    """Return the cached model for *name*, loading it on first use.

    Thread-safe via per-model double-checked locking: the unlocked first
    check keeps the cached fast path lock-free, and the re-check inside
    the lock prevents two threads from loading the same model twice.

    Raises KeyError for a name not present in MODEL_REGISTRY.
    """
    if name not in MODEL_REGISTRY:
        raise KeyError(f"Unknown model: {name}")
    if name not in _loaded_models:
        with _load_locks[name]:
            # Re-check: another thread may have finished loading while we
            # waited on the lock.
            if name not in _loaded_models:
                logger.info("Loading model %s \u2026", name)
                _loaded_models[name] = _load_model(name)
                logger.info("Model %s loaded and cached.", name)
    return _loaded_models[name]
| # --------------------------------------------------------------------------- | |
| # Prediction | |
| # --------------------------------------------------------------------------- | |
def predict(name: str, image_bytes: bytes) -> dict[str, float]:
    """Run inference for model *name* on raw image bytes.

    Returns a mapping of class label -> probability (rounded to 6 dp),
    always containing exactly the labels from MODEL_REGISTRY[name]
    ["classes"], in that order.
    """
    cfg = MODEL_REGISTRY[name]
    model = get_model(name)
    fw = cfg["framework"]
    classes = cfg["classes"]
    size = cfg["input_size"]
    if fw in ("tf", "keras3", "keras_json_weights"):
        # Model-specific preprocessing for DR and skin; generic otherwise.
        if name == "diabetic_retinopathy":
            inp = _preprocess_dr(image_bytes)
        elif name == "skin":
            inp = _preprocess_skin(image_bytes)
        else:
            inp = _preprocess_image_tf(image_bytes, size)
        raw = model.predict(inp, verbose=0)
        probs = raw[0]
        if probs.shape[-1] == 1:
            # Single-sigmoid output -> expand to [negative, positive].
            p = float(probs[0])
            probs_list = [1.0 - p, p]
        else:
            probs_list = probs.tolist()
        # Re-normalize so reported values sum to 1 even when the head does
        # not emit a strict softmax (e.g. after partial weight loading).
        total = sum(probs_list)
        if total > 0:
            probs_list = [x / total for x in probs_list]
        # Truncate/pad so the zip below covers every registered class.
        probs_list = probs_list[: len(classes)]
        while len(probs_list) < len(classes):
            probs_list.append(0.0)
        return {c: round(p, 6) for c, p in zip(classes, probs_list)}
    # PyTorch path
    import torch
    # Use cardiac-specific preprocessing for the cardiac model
    if name == "cardiac":
        inp = _preprocess_cardiac(image_bytes, size)
    else:
        inp = _preprocess_image_torch(image_bytes, size)
    with torch.no_grad():
        logits = model(inp)
    if logits.shape[-1] == 1:
        # Single-logit binary head -> [negative, positive].
        p = torch.sigmoid(logits).item()
        probs_list = [1.0 - p, p]
    else:
        probs_list = torch.softmax(logits, dim=-1).squeeze().tolist()
    # squeeze().tolist() on a one-element tensor yields a bare float.
    if isinstance(probs_list, float):
        probs_list = [probs_list]
    # Truncate/pad so the zip below covers every registered class.
    probs_list = probs_list[: len(classes)]
    while len(probs_list) < len(classes):
        probs_list.append(0.0)
    return {c: round(p, 6) for c, p in zip(classes, probs_list)}