Spaces:

Ahmedhassan54
/

Defect-Detection

Sleeping

App Files Files Community

Defect-Detection / model.py

Ahmedhassan54

Update model.py

0df65bd verified 12 months ago

raw

history blame contribute delete

15.2 kB


	import tensorflow as tf
	from tensorflow.keras import layers, models, optimizers
	import numpy as np
	import cv2
	import os
	import matplotlib.pyplot as plt
	from sklearn.model_selection import train_test_split
	from tensorflow.keras.preprocessing.image import ImageDataGenerator
	from google.colab import files
	import zipfile
	import io
	import shutil
	from tqdm import tqdm
	import time



	class ProgressFileUpload:
	    """Print a single-line, carriage-return-refreshed progress readout for a file.

	    The caller reports how many bytes were handled via :meth:`update`; the
	    class accumulates them and prints percentage, megabytes done / total and
	    the average throughput since construction.
	    """

	    # Divisor used to express byte counts in megabytes (MiB).
	    _BYTES_PER_MB = 1024 * 1024

	    def __init__(self, filename, total_size):
	        """Start tracking *filename*, whose full size is *total_size* bytes."""
	        self.filename = filename
	        self.total_size = total_size
	        self.uploaded = 0
	        self.start_time = time.time()

	    def update(self, chunk_size):
	        """Record *chunk_size* more bytes and refresh the progress line.

	        A trailing newline is printed once the percentage reaches 100 so that
	        later output starts on a fresh line.
	        """
	        self.uploaded += chunk_size

	        # A zero-byte file has nothing left to transfer: report it as complete
	        # rather than dividing by zero.
	        if self.total_size > 0:
	            percent = (self.uploaded / self.total_size) * 100
	        else:
	            percent = 100.0

	        elapsed = time.time() - self.start_time
	        speed = self.uploaded / (self._BYTES_PER_MB * elapsed) if elapsed > 0 else 0

	        done_mb = self.uploaded / self._BYTES_PER_MB
	        total_mb = self.total_size / self._BYTES_PER_MB
	        print(
	            f"\rUploading {self.filename}: {percent:.1f}% "
	            f"({done_mb:.1f}MB/{total_mb:.1f}MB) {speed:.1f}MB/s",
	            end='',
	        )
	        if percent >= 100:
	            print()

	class DefectDetectorTF:
	    """Keras CNN classifier for six steel-surface defect classes.

	    The network built by :meth:`build_model` starts with a
	    ``Rescaling(1./255)`` layer and ends with a softmax layer, so every
	    method in this class feeds it *raw* 0-255 RGB pixels and treats its output
	    as probabilities.
	    """

	    def __init__(self, input_shape=(256, 256, 3)):
	        """Create the detector and compile a fresh model.

	        Args:
	            input_shape: ``(height, width, channels)`` of the model input.
	        """
	        self.input_shape = input_shape
	        # Sorted so that the class index is independent of the order the
	        # names are written in.
	        self.class_names = sorted(['Patches', 'Pitted', 'Scratches', 'Rolled', 'Crazing', 'Inclusion'])
	        self.num_classes = len(self.class_names)
	        self.model = self.build_model()

	    def _target_size(self):
	        """Return the model input size as the ``(width, height)`` pair ``cv2.resize`` expects."""
	        height, width = self.input_shape[:2]
	        return (width, height)

	    def build_model(self):
	        """Build and compile the CNN.

	        Layout: input rescaling, three convolutional stages (64, 128 and 256
	        filters) each followed by batch normalization, 2x2 max pooling and
	        dropout, then a 512-unit dense layer and a softmax output with one
	        unit per class.

	        Returns:
	            The compiled ``Sequential`` model (Adam, lr=0.001, sparse
	            categorical cross-entropy, accuracy metric).
	        """
	        model = models.Sequential([
	            # Pixel normalization lives inside the model; callers pass 0-255 values.
	            layers.Rescaling(1./255, input_shape=self.input_shape),

	            layers.Conv2D(64, (3, 3), activation='relu', padding='same'),
	            layers.BatchNormalization(),
	            layers.Conv2D(64, (3, 3), activation='relu', padding='same'),
	            layers.BatchNormalization(),
	            layers.MaxPooling2D((2, 2)),
	            layers.Dropout(0.25),

	            layers.Conv2D(128, (3, 3), activation='relu', padding='same'),
	            layers.BatchNormalization(),
	            layers.Conv2D(128, (3, 3), activation='relu', padding='same'),
	            layers.BatchNormalization(),
	            layers.MaxPooling2D((2, 2)),
	            layers.Dropout(0.25),

	            layers.Conv2D(256, (3, 3), activation='relu', padding='same'),
	            layers.BatchNormalization(),
	            layers.MaxPooling2D((2, 2)),
	            layers.Dropout(0.25),

	            layers.Flatten(),
	            layers.Dense(512, activation='relu'),
	            layers.BatchNormalization(),
	            layers.Dropout(0.5),
	            layers.Dense(self.num_classes, activation='softmax'),
	        ])

	        model.compile(
	            optimizer=optimizers.Adam(learning_rate=0.001),
	            loss='sparse_categorical_crossentropy',
	            metrics=['accuracy'],
	        )
	        return model

	    def load_dataset(self, dataset_dir):
	        """Load every supported image under ``dataset_dir/<class_name>/``.

	        Images are converted to RGB and resized to the model input size.
	        Unreadable files are skipped; files that raise while being processed
	        are reported and skipped.

	        Args:
	            dataset_dir: Directory containing one sub-folder per class name.

	        Returns:
	            ``(images, labels)`` as NumPy arrays; ``labels`` holds the index of
	            each image's class in ``self.class_names``.

	        Raises:
	            ValueError: If a class folder is missing or no image could be loaded.
	        """
	        images = []
	        labels = []
	        supported_formats = ('.jpg', '.jpeg', '.png', '.bmp')
	        target_size = self._target_size()

	        for class_idx, class_name in enumerate(self.class_names):
	            class_dir = os.path.join(dataset_dir, class_name)
	            if not os.path.isdir(class_dir):
	                raise ValueError(f"Missing folder for class: {class_name}")

	            # Sorted so the sample order (and therefore the seeded split in
	            # train()) does not depend on filesystem listing order.
	            for img_file in sorted(os.listdir(class_dir)):
	                if not img_file.lower().endswith(supported_formats):
	                    continue
	                img_path = os.path.join(class_dir, img_file)
	                try:
	                    img = cv2.imread(img_path)
	                    if img is None:
	                        continue
	                    img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
	                    img = cv2.resize(img, target_size)
	                except Exception as e:
	                    # Best effort: one bad file must not abort the whole load.
	                    print(f"Error processing {img_path}: {str(e)}")
	                    continue
	                images.append(img)
	                labels.append(class_idx)

	        if not images:
	            raise ValueError("No valid images found in dataset directory")

	        return np.array(images), np.array(labels)

	    def save_model_with_progress(self, filepath):
	        """Save ``self.model`` to *filepath*, printing a size estimate first.

	        The previous implementation declared a Keras ``Callback`` to print
	        progress, but it was never attached to anything (``model.save`` is
	        called without it) and its format string did not parse. It has been
	        removed; only the start/finish messages remain.

	        Args:
	            filepath: Destination path handed to ``model.save``.
	        """
	        # Estimate assumes 4 bytes per parameter (as the original code did).
	        model_size = self.model.count_params() * 4

	        # model.save does not create missing parent folders on every backend.
	        parent_dir = os.path.dirname(filepath)
	        if parent_dir:
	            os.makedirs(parent_dir, exist_ok=True)

	        print(f"\nStarting model save (estimated size: {model_size/(1024*1024):.1f}MB)")
	        self.model.save(filepath)
	        print("\nModel saved successfully!")

	    def train(self, dataset_dir, epochs=30, batch_size=32):
	        """Train the model on the images under *dataset_dir* and plot the curves.

	        The data is split 80/20 (stratified, ``random_state=42``); the training
	        part is augmented on the fly. The best model by validation accuracy is
	        checkpointed to ``best_defect_model.h5`` and training stops early after
	        5 epochs without improvement, restoring the best weights.

	        Args:
	            dataset_dir: Directory accepted by :meth:`load_dataset`.
	            epochs: Maximum number of epochs.
	            batch_size: Batch size of the augmenting generator.

	        Returns:
	            The Keras ``History`` object returned by ``model.fit``.
	        """
	        X, y = self.load_dataset(dataset_dir)
	        X_train, X_val, y_train, y_val = train_test_split(
	            X, y, test_size=0.2, random_state=42, stratify=y
	        )

	        train_datagen = ImageDataGenerator(
	            rotation_range=15,
	            width_shift_range=0.1,
	            height_shift_range=0.1,
	            shear_range=0.1,
	            zoom_range=0.1,
	            horizontal_flip=True,
	            fill_mode='nearest',
	        )
	        train_generator = train_datagen.flow(X_train, y_train, batch_size=batch_size)

	        callbacks = [
	            tf.keras.callbacks.ModelCheckpoint(
	                'best_defect_model.h5',
	                monitor='val_accuracy',
	                save_best_only=True,
	                mode='max',
	            ),
	            tf.keras.callbacks.EarlyStopping(
	                monitor='val_accuracy',
	                patience=5,
	                restore_best_weights=True,
	            ),
	        ]

	        print("\nTraining Summary:")
	        print(f"Classes: {self.class_names}")
	        print(f"Training samples: {len(X_train)}")
	        print(f"Validation samples: {len(X_val)}\n")

	        # Ceiling division: floor division yields 0 steps when there are fewer
	        # samples than one batch and otherwise skips the last partial batch.
	        steps_per_epoch = max(1, -(-len(X_train) // batch_size))

	        history = self.model.fit(
	            train_generator,
	            steps_per_epoch=steps_per_epoch,
	            validation_data=(X_val, y_val),
	            epochs=epochs,
	            callbacks=callbacks,
	            verbose=1,
	        )

	        plt.figure(figsize=(12, 5))
	        plt.subplot(1, 2, 1)
	        plt.plot(history.history['accuracy'], label='Train Accuracy')
	        plt.plot(history.history['val_accuracy'], label='Validation Accuracy')
	        plt.legend()

	        plt.subplot(1, 2, 2)
	        plt.plot(history.history['loss'], label='Train Loss')
	        plt.plot(history.history['val_loss'], label='Validation Loss')
	        plt.legend()

	        plt.show()
	        return history

	    def predict(self, image_path):
	        """Classify one image file and annotate it with the predicted label.

	        Args:
	            image_path: Path of the image to classify.

	        Returns:
	            ``(display_img, debug_text)``: the full-size RGB image with the
	            label drawn on it, and one ``name: probability`` line per class.
	            If the image cannot be read, ``(None, "Failed to load image")``.
	        """
	        img = cv2.imread(image_path)
	        if img is None:
	            return None, "Failed to load image"

	        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
	        display_img = img.copy()
	        img = cv2.resize(img, self._target_size())

	        # Feed raw 0-255 values: the model's own Rescaling layer normalizes
	        # them. Dividing by 255 here as well would scale the input twice and
	        # no longer match what the network saw during training.
	        # NOTE(review): assumes self.model was produced by build_model(); a
	        # replacement model without a Rescaling layer needs its own scaling.
	        img_array = np.expand_dims(img.astype(np.float32), axis=0)

	        predictions = self.model.predict(img_array)
	        # The output layer is already a softmax; applying softmax again would
	        # flatten the distribution and understate the confidence.
	        score = predictions[0]
	        class_id = int(np.argmax(score))
	        confidence = float(score[class_id])

	        cv2.putText(
	            display_img,
	            f"{self.class_names[class_id]}: {confidence:.2f}",
	            (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 0), 2
	        )

	        debug_text = "\n".join([
	            f"{name}: {prob:.4f}"
	            for name, prob in zip(self.class_names, score)
	        ])

	        return display_img, debug_text



	# ---------------------------------------------------------------------------
	# Training workflow (interactive, Google Colab):
	#   1. upload + extract a dataset zip, 2. optionally upload an existing .h5
	#   model, 3. train and save, 4. classify one uploaded sample image.
	# NOTE(review): the original indentation of this script was lost; the nesting
	# below is reconstructed from the statements' data dependencies.
	# ---------------------------------------------------------------------------
	print("#" * 60)
	print("### Steel Surface Defect Detection - Training ###")
	print("#" * 60)

	# Every artifact lives under this folder. Create it up front: previously it
	# only came into existence as a side effect of extracting the dataset zip, so
	# moving an uploaded model into it failed when no dataset had been uploaded.
	project_dir = '/content/project_files'
	os.makedirs(project_dir, exist_ok=True)


	def _replay_upload_progress(path):
	    """Read *path* from disk in 1 MiB chunks, reporting each chunk to ProgressFileUpload.

	    The file is already fully uploaded at this point; this only produces the
	    progress read-out.
	    """
	    progress = ProgressFileUpload(path, os.path.getsize(path))
	    with open(path, 'rb') as f:
	        for chunk in iter(lambda: f.read(1024 * 1024), b''):
	            progress.update(len(chunk))


	print("\nPlease upload your dataset as a zip file:")
	uploaded = files.upload()
	dataset_path = None

	for filename in uploaded.keys():
	    # Case-insensitive so "DATA.ZIP" is accepted as well.
	    if filename.lower().endswith('.zip'):
	        print(f"\nExtracting {filename}...")
	        extract_dir = os.path.join(project_dir, 'dataset')
	        with zipfile.ZipFile(io.BytesIO(uploaded[filename]), 'r') as zip_ref:
	            # Member-by-member extraction so tqdm can show progress.
	            for member in tqdm(zip_ref.infolist(), desc="Extracting", unit="file"):
	                zip_ref.extract(member, extract_dir)
	        dataset_path = extract_dir
	        print("\nDataset extracted successfully!")
	        break  # only the first zip is used

	if not dataset_path:
	    print("Warning: No dataset zip file uploaded. Training will fail without a dataset.")


	print("\nOptionally upload an existing model (h5 file) to continue training:")
	model_uploaded = files.upload()
	model_path = None

	for filename in model_uploaded.keys():
	    if filename.lower().endswith('.h5'):
	        _replay_upload_progress(filename)

	        model_path = os.path.join(project_dir, filename)
	        shutil.move(filename, model_path)
	        print(f"\nModel uploaded to: {model_path}")
	        break  # only the first model file is used


	detector = DefectDetectorTF()

	if model_path:
	    print(f"\nLoading existing model from {model_path}")
	    detector.model = tf.keras.models.load_model(model_path)

	if dataset_path:
	    print("\nStarting training...")
	    detector.train(dataset_path, epochs=10)

	    # Persist the trained model where the testing section below looks for it.
	    # NOTE(review): placed inside the training branch so that an untrained
	    # model is never written out - confirm against the original layout.
	    model_save_path = '/content/project_files/defect_detection_model.h5'
	    detector.save_model_with_progress(model_save_path)


	print("\nUpload an image for testing:")
	test_uploaded = files.upload()
	if test_uploaded:
	    test_image = next(iter(test_uploaded))
	    _replay_upload_progress(test_image)

	    result, debug = detector.predict(test_image)

	    # predict() returns (None, message) when the image cannot be read;
	    # handing None to imshow would raise.
	    if result is None:
	        print(debug)
	    else:
	        plt.imshow(result)
	        plt.axis('off')
	        plt.show()
	        print(debug)

	print("\nTraining process completed!")
	print("You can find your trained model in the 'project_files' folder.")
	print("To download the model manually:")
	print("1. Click on the folder icon on the left")
	print("2. Navigate to 'project_files' folder")
	print("3. Right-click on 'defect_detection_model.h5' and select 'Download'")



	print("\n\n" + "#" * 60)
	print("### Steel Surface Defect Detection - Testing ###")
	print("#" * 60)

	def test_model_with_zip(test_zip_path, model_path, detector):
	    """Evaluate a saved model on a zipped test set and print the accuracies.

	    The zip is extracted into ``/content/project_files/test_dataset`` and is
	    expected to contain one folder per class name. Every supported image is
	    classified; overall and per-class accuracy are printed.

	    Args:
	        test_zip_path: Path of the zip archive holding the test images.
	        model_path: Path of the saved Keras model to load.
	        detector: Object providing ``class_names`` and ``input_shape``; its
	            ``model`` attribute is replaced by the loaded model.
	    """
	    test_dir = '/content/project_files/test_dataset'
	    # Start from an empty folder so images left over from an earlier run are
	    # not counted as part of this test set.
	    shutil.rmtree(test_dir, ignore_errors=True)
	    os.makedirs(test_dir, exist_ok=True)

	    print(f"\nExtracting test dataset from {test_zip_path}...")
	    with zipfile.ZipFile(test_zip_path, 'r') as zip_ref:
	        zip_ref.extractall(test_dir)
	    print("Test dataset extracted successfully!")

	    print(f"\nLoading model from {model_path}")
	    detector.model = tf.keras.models.load_model(model_path)
	    print("Model loaded successfully!")

	    class_correct = {class_name: 0 for class_name in detector.class_names}
	    class_total = {class_name: 0 for class_name in detector.class_names}
	    supported_formats = ('.jpg', '.jpeg', '.png', '.bmp')

	    # input_shape is (height, width, channels) but cv2.resize takes (width, height).
	    height, width = detector.input_shape[:2]
	    target_size = (width, height)

	    print("\nStarting evaluation on test set...")
	    for class_name in detector.class_names:
	        class_dir = os.path.join(test_dir, class_name)
	        if not os.path.exists(class_dir):
	            print(f"Warning: No test images found for class {class_name}")
	            continue

	        for img_file in tqdm(os.listdir(class_dir), desc=f"Testing {class_name}", unit="image"):
	            if not img_file.lower().endswith(supported_formats):
	                continue
	            img_path = os.path.join(class_dir, img_file)
	            try:
	                img = cv2.imread(img_path)
	                if img is None:
	                    print(f"Could not read image: {img_path}")
	                    continue

	                img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
	                img = cv2.resize(img, target_size)
	                # Raw 0-255 pixels, no division by 255 here.
	                # NOTE(review): assumes the loaded model normalizes its own
	                # input (the training code in this file builds it with a
	                # Rescaling(1./255) first layer); dividing again would scale
	                # the input twice.
	                img_array = np.expand_dims(img.astype(np.float32), axis=0)

	                predictions = detector.model.predict(img_array, verbose=0)
	                predicted_class = int(np.argmax(predictions[0]))
	            except Exception as e:
	                # Best effort: report the file and keep evaluating the rest.
	                print(f"\nError processing {img_path}: {str(e)}")
	                continue

	            class_total[class_name] += 1
	            if detector.class_names[predicted_class] == class_name:
	                class_correct[class_name] += 1

	    total = sum(class_total.values())
	    correct = sum(class_correct.values())

	    if total > 0:
	        print("\n\n=== Test Results ===")
	        print(f"Overall Accuracy: {correct/total:.2%} ({correct}/{total})")

	        print("\nClass-wise Accuracy:")
	        for class_name in detector.class_names:
	            if class_total[class_name] > 0:
	                acc = class_correct[class_name]/class_total[class_name]
	                print(f"{class_name}: {acc:.2%} ({class_correct[class_name]}/{class_total[class_name]})")
	            else:
	                print(f"{class_name}: No test images found")
	    else:
	        print("\nNo valid test images found in the provided zip file")


	# ---------------------------------------------------------------------------
	# Testing workflow: upload a zipped test set and evaluate the saved model.
	# Relies on `detector` created by the training section of this script.
	# ---------------------------------------------------------------------------
	print("\n\n=== Model Testing ===")
	print("Please upload your test dataset as a zip file (with same folder structure as training):")
	uploaded = files.upload()
	test_zip_path = None

	for filename in uploaded.keys():
	    # Case-insensitive so "TEST.ZIP" is accepted as well.
	    if filename.lower().endswith('.zip'):
	        # Resolve against the current working directory instead of assuming
	        # '/content': the rest of this script opens uploaded files by their
	        # bare (cwd-relative) name, so the two must agree.
	        test_zip_path = os.path.abspath(filename)
	        print(f"\nTest dataset {filename} uploaded successfully!")
	        break  # only the first zip is used

	if test_zip_path:
	    model_path = '/content/project_files/defect_detection_model.h5'

	    if not os.path.exists(model_path):
	        print(f"\nError: Model not found at {model_path}")
	        print("Please ensure the model was saved correctly during training.")
	    else:
	        test_model_with_zip(test_zip_path, model_path, detector)
	else:
	    print("\nNo test zip file provided. Skipping evaluation.")

	print("\nTesting process completed!")