import logging
import os
import time

import librosa
import numpy as np
import pandas as pd
import streamlit as st
from prometheus_client import Counter, Histogram, start_http_server
from scipy.signal import butter, sosfilt
from sklearn.preprocessing import normalize
from tensorflow.keras.models import load_model

# Set up logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger("audio_classifier_dep")

# Paths and constants
MODEL_PATH = "./models"
MODELS = {
    "binary": {
        "augmented": "final_model_binary_augmented.h5",
        "log_mel": "final_model_binary_log_mel.h5",
        "mfcc": "final_model_binary_mfcc.h5",
    },
    "multi": {
        "augmented": "final_model_multi_augmented.h5",
        "log_mel": "final_model_multi_log_mel.h5",
        "mfcc": "final_model_multi_mfcc.h5",
    },
}
CLASS_NAMES = {
    "binary": ["Abnormal", "Normal"],
    "multi": ["Chronic Respiratory Diseases", "Normal", "Respiratory Infections"],
}

# Define Prometheus metrics (Counter and Histogram values start at zero,
# so no manual reset is needed)
REQUEST_COUNT = Counter('audio_classifier_requests_total', 'Total number of requests to the classifier')
RESPONSE_TIME = Histogram('audio_classifier_response_time_seconds', 'Time taken to process requests')
ERROR_COUNT = Counter('audio_classifier_errors_total', 'Total number of errors during classification')

# Start the Prometheus HTTP server; guard against a double start if this
# module is re-executed (e.g. on a Streamlit rerun) while port 9100 is
# still bound by the first server instance.
try:
    start_http_server(9100, addr="0.0.0.0")
except OSError:
    pass
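
# start_http_server serves the metrics in the standard Prometheus text format
# on port 9100, so they can be inspected with, for example:
#   curl http://localhost:9100/metrics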

# Per-request latencies recorded in-process for the dashboard tab
individual_response_times = []

def filtering(audio, sr):
    """
    Apply a bandpass filter to audio data.

    Args:
        audio: The input audio signal.
        sr: The sampling rate of the audio.

    Returns:
        Filtered audio signal.
    """
    # Define cutoff frequencies
    low_cutoff = 50  # 50 Hz
    high_cutoff = min(5000, sr / 2 - 1)  # Ensure it is below the Nyquist frequency
    if low_cutoff >= high_cutoff:
        raise ValueError(
            f"Invalid filter range: low_cutoff={low_cutoff}, high_cutoff={high_cutoff} for sampling rate {sr}"
        )
    # Design a 10th-order Butterworth bandpass filter in second-order sections
    sos = butter(N=10, Wn=[low_cutoff, high_cutoff], btype='band', fs=sr, output='sos')
    # Apply the filter
    filtered_audio = sosfilt(sos, audio)
    return filtered_audio
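
# Usage sketch (hypothetical file name): suppress sub-50 Hz drift and
# high-frequency noise before feature extraction.
#   y, sr = librosa.load("clip.wav", sr=16000)
#   y = filtering(y, sr)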

def save_uploaded_file(uploaded_file):
    """Save the uploaded file temporarily."""
    temp_file_path = os.path.join("temp_audio", uploaded_file.name)
    os.makedirs("temp_audio", exist_ok=True)
    with open(temp_file_path, "wb") as f:
        f.write(uploaded_file.getbuffer())
    return temp_file_path

def display_results(predicted_class, probabilities, model_type):
    """Display the classification results."""
    class_label = CLASS_NAMES[model_type][predicted_class]
    st.success(f"Classification Complete! Predicted Class: **{class_label}**")
    st.write("### Prediction Probabilities")
    class_probabilities = {
        CLASS_NAMES[model_type][i]: prob for i, prob in enumerate(probabilities)
    }
    st.bar_chart(class_probabilities)

# Augmentation functions
def add_noise(data, noise_factor=0.001):
    """Add scaled Gaussian noise to the signal."""
    noise = np.random.randn(len(data))
    return data + noise_factor * noise

def shift(data, shift_factor=1600):
    """Circularly shift the signal by shift_factor samples."""
    return np.roll(data, shift_factor)

def stretch(data, rate=1.2):
    """Time-stretch the signal without changing pitch (rate > 1 shortens it)."""
    return librosa.effects.time_stretch(data, rate=rate)

def pitch_shift(data, sr, n_steps=3):
    """Shift the pitch by n_steps semitones without changing duration."""
    return librosa.effects.pitch_shift(data, sr=sr, n_steps=n_steps)
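
# Note: each helper above perturbs the same clip in one way. preprocess_audio
# (below) averages the MFCC vectors of the original clip and all four variants
# into a single 52-dimensional feature, which is what the "augmented" models expect.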

def preprocess_audio(audio_file, mode="augmented", input_shape=None):
    """
    Preprocess an audio file for classification by resampling, padding/truncating,
    and extracting features (e.g., MFCC, Log-Mel spectrogram, or Augmented features).

    Args:
        audio_file: Path to the audio file.
        mode: Feature extraction mode ('mfcc', 'log_mel', or 'augmented').
        input_shape: Expected input shape of the model for feature alignment.

    Returns:
        Extracted features as per the mode.
    """
    try:
        sr_new = 16000  # Resample audio to 16 kHz
        x, sr = librosa.load(audio_file, sr=sr_new)
        x = filtering(x, sr)
        logger.info(f"Loaded audio file '{audio_file}' with shape {x.shape} and sampling rate {sr}.")
        # Pad or truncate to a fixed 5-second window (80,000 samples at 16 kHz)
        max_len = 5 * sr_new
        if x.shape[0] < max_len:
            x = np.pad(x, (0, max_len - x.shape[0]))
            logger.info(f"Audio padded to {max_len} samples.")
        else:
            x = x[:max_len]
            logger.info(f"Audio truncated to {max_len} samples.")
        # Handle each mode separately
        if mode == 'mfcc':
            feature = librosa.feature.mfcc(y=x, sr=sr_new, n_mfcc=20)  # Extract MFCCs
            feature = normalize(feature, axis=1)
        elif mode == 'log_mel':
            mel_spec = librosa.feature.melspectrogram(y=x, sr=sr_new, n_mels=20, fmax=8000)
            feature = librosa.power_to_db(mel_spec, ref=np.max)  # Extract Log-Mel spectrogram
            feature = normalize(feature, axis=1)
        elif mode == 'augmented':
            features = []
            # Base MFCC
            base_mfcc = np.mean(librosa.feature.mfcc(y=x, sr=sr_new, n_mfcc=52).T, axis=0)
            features.append(base_mfcc)
            # Augmented features
            for augmentation in [
                lambda d: add_noise(d, 0.001),
                lambda d: shift(d, 1600),
                lambda d: stretch(d, 1.2),
                lambda d: pitch_shift(d, sr_new, 3),
            ]:
                augmented_data = augmentation(x)
                aug_mfcc = np.mean(librosa.feature.mfcc(y=augmented_data, sr=sr_new, n_mfcc=52).T, axis=0)
                features.append(aug_mfcc)
            # Average the base and augmented features
            feature = np.mean(features, axis=0)
            feature = normalize(feature.reshape(1, -1), axis=1).flatten()  # Normalize
        else:
            raise ValueError(f"Unknown mode: {mode}")
        # Reshape for model input if required
        if input_shape:
            feature = _reshape_feature(feature, input_shape)
        logger.info(f"Feature extracted with shape {feature.shape}.")
        return np.expand_dims(feature, axis=-1)  # Add channel dimension
    except Exception as e:
        logger.error(f"Error in preprocessing audio: {e}")
        raise

def _reshape_feature(feature, input_shape):
    """
    Reshape the feature to match the expected input shape of the model.

    Args:
        feature: The extracted feature.
        input_shape: The expected input shape of the model.

    Returns:
        Reshaped feature.
    """
    expected_time_frames = input_shape[1]
    if len(feature) > expected_time_frames:
        feature = feature[:expected_time_frames]
    elif len(feature) < expected_time_frames:
        feature = np.pad(feature, (0, expected_time_frames - len(feature)))
    return feature
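
# Example: with a model whose input_shape is (None, 52, 1), the expected length
# is 52, so a 60-element feature is truncated to its first 52 values and a
# 40-element feature is right-padded with zeros to length 52.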

def classify_audio(model_type, feature_type, file_path):
    """
    Classify an audio file using the specified model.

    Args:
        model_type: Type of model ('binary' or 'multi').
        feature_type: Type of feature extraction ('mfcc', 'log_mel', or 'augmented').
        file_path: Path to the audio file.

    Returns:
        Predicted class and prediction probabilities.
    """
    if model_type not in MODELS or feature_type not in MODELS[model_type]:
        raise ValueError(f"Invalid combination of model type and feature type: {model_type}, {feature_type}")
    # Load the correct model based on the type and feature
    model_file = os.path.join(MODEL_PATH, MODELS[model_type][feature_type])
    if not os.path.exists(model_file):
        raise FileNotFoundError(f"Model file not found: {model_file}")
    logger.info(f"Loading model from {model_file} for feature type '{feature_type}' and model type '{model_type}'...")
    model = load_model(model_file)
    # Get the expected input shape from the model
    input_shape = model.input_shape
    # Preprocess audio
    processed_audio = preprocess_audio(file_path, mode=feature_type, input_shape=input_shape)
    # Add batch dimension
    processed_audio = np.expand_dims(processed_audio, axis=0)
    # Predict
    predictions = model.predict(processed_audio)
    predicted_class = np.argmax(predictions, axis=1)[0]
    probabilities = predictions[0].tolist()
    logger.info(f"Prediction complete. Predicted class: {predicted_class}, Probabilities: {probabilities}")
    return predicted_class, probabilities
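
# Usage sketch (assumes ./models/final_model_multi_augmented.h5 exists and
# example.wav is a local recording):
#   predicted_class, probabilities = classify_audio("multi", "augmented", "example.wav")
#   print(CLASS_NAMES["multi"][predicted_class], probabilities)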

def classify_audio_with_metrics(model_type, feature_type, file_path):
    """Wrap classify_audio with request, error, and latency metrics."""
    logger.info("Audio classification request received.")
    REQUEST_COUNT.inc()
    start_time = time.time()
    try:
        result = classify_audio(model_type, feature_type, file_path)
        return result
    except Exception as e:
        ERROR_COUNT.inc()
        logger.error("Error during classification: %s", e)
        raise
    finally:
        response_time = time.time() - start_time
        RESPONSE_TIME.observe(response_time)
        individual_response_times.append(response_time)
        logger.info("Request processed. Response time: %.3f seconds", response_time)

def run():
    st.title("Respiratory Sound Classifier: Inference and Deployment")
    st.markdown("""
Welcome to the **Inference and Deployment** page! This tool classifies respiratory sounds
into various categories using pre-trained models. Choose one of the two classification
modes below, or open the dashboard to monitor the app:

- **Quick Multiclass Mode:** a fast and straightforward way to classify audio files using a multiclass model with augmented features.
- **Flexible Mode:** customize the classification process by selecting your preferred model type (binary/multi) and feature type (MFCC, Log-Mel, or Augmented).
- **Metrics Dashboard:** monitor live metrics, including request counts, response times, and error rates.
""")
    # Tabs for the three modes
    tab1, tab2, tab3 = st.tabs(["Quick Multiclass Mode", "Flexible Mode", "Metrics Dashboard"])

    # Tab 1: Quick Multiclass (Augmented) Mode
    with tab1:
        st.subheader("Quick Multiclass (Augmented) Mode")
        st.markdown("""
This mode is optimized for quick classification of respiratory sounds into multiple
categories (e.g., Chronic Respiratory Diseases, Normal, Respiratory Infections). It
automatically uses the multiclass model with augmented features for robust and accurate results.
""")
        uploaded_file = st.file_uploader(
            "Upload an Audio File for Multiclass Classification",
            type=["wav", "mp3"],
            help="Supported formats: WAV, MP3",
        )
        if uploaded_file is not None:
            temp_file_path = save_uploaded_file(uploaded_file)
            st.audio(temp_file_path, format="audio/wav", start_time=0)
            try:
                with st.spinner("Classifying the audio file, please wait..."):
                    predicted_class, probabilities = classify_audio_with_metrics(
                        model_type="multi", feature_type="augmented", file_path=temp_file_path
                    )
                # Display results
                display_results(predicted_class, probabilities, "multi")
            except Exception as e:
                st.error(f"Error: {e}")
            finally:
                os.remove(temp_file_path)

    # Tab 2: Flexible Mode
    with tab2:
        st.subheader("Flexible Mode")
        st.markdown("""
The Flexible Mode gives you control over the classification process. Select the model type
(binary or multiclass) and the feature type (MFCC, Log-Mel, or Augmented) to suit your
specific requirements.
""")
        model_type = st.selectbox(
            "Select Model Type",
            ["binary", "multi"],
            help="Choose between binary or multi-class classification.",
        )
        feature_type = st.selectbox(
            "Select Feature Type",
            ["mfcc", "log_mel", "augmented"],
            help="Choose the feature extraction type.",
        )
        uploaded_file = st.file_uploader(
            "Upload an Audio File",
            type=["wav", "mp3"],
            help="Supported formats: WAV, MP3",
        )
        if uploaded_file is not None:
            temp_file_path = save_uploaded_file(uploaded_file)
            st.audio(temp_file_path, format="audio/wav", start_time=0)
            try:
                with st.spinner("Classifying the audio file, please wait..."):
                    predicted_class, probabilities = classify_audio_with_metrics(
                        model_type, feature_type, temp_file_path
                    )
                # Display results
                display_results(predicted_class, probabilities, model_type)
            except Exception as e:
                st.error(f"Error: {e}")
            finally:
                os.remove(temp_file_path)

    # Tab 3: Metrics Dashboard
    with tab3:
        st.subheader("Metrics Dashboard")
        st.markdown("""
This dashboard shows live metrics for the application, including request counts,
response times, and error counts. The metrics are tracked in-process and refresh
each time the page reruns.
""")
        col1, col2, col3 = st.columns(3)
        # prometheus_client exposes metric values only via collect(), so the
        # dashboard reads the private _value attribute directly as a shortcut.
        col1.metric("Total Requests", REQUEST_COUNT._value.get())
        col2.metric("Total Errors", ERROR_COUNT._value.get())
        if individual_response_times:
            avg_response_time = sum(individual_response_times) / len(individual_response_times)
        else:
            avg_response_time = 0
        col3.metric("Avg Response Time (s)", f"{avg_response_time:.3f}")
        st.markdown("### Individual Response Times")
        if individual_response_times:
            df = pd.DataFrame({
                "Request Index": range(1, len(individual_response_times) + 1),
                "Response Time (s)": individual_response_times,
            })
            st.dataframe(df)
        else:
            st.warning("No response time data available.")

if __name__ == "__main__":
    run()