Spaces:

Lucifer9907
/

SDK-Docker

Sleeping

App Files Files Community

SDK-Docker / train.py

Lucifer9907

Prepare Hugging Face Docker Space

ff0c419 25 days ago

raw

history blame contribute delete

9.02 kB

	from __future__ import annotations

	import json
	import os
	from pathlib import Path

	import matplotlib.pyplot as plt
	import numpy as np
	import tensorflow as tf
	from sklearn.metrics import accuracy_score, classification_report, confusion_matrix, f1_score
	from sklearn.model_selection import train_test_split
	from tensorflow.keras.callbacks import EarlyStopping, ModelCheckpoint, ReduceLROnPlateau

	from src.ai_image_detector.config import (
	ARTIFACTS_DIR,
	METRICS_PATH,
	MODEL_PATH,
	PROCESSED_DATA_DIR,
	SEED,
	THRESHOLD_PATH,
	TRAINING_PLOT_PATH,
	)
	from src.ai_image_detector.data import load_dataset
	from src.ai_image_detector.model import build_model, unfreeze_for_fine_tuning


	def get_env_int(name: str, default: int) -> int:
	    """Read a strictly positive integer from environment variable ``name``.

	    Args:
	        name: Name of the environment variable to look up.
	        default: Value returned whenever the variable cannot be used.

	    Returns:
	        The parsed integer when the variable is set, parses with ``int()``
	        and is greater than zero; otherwise ``default``.
	    """
	    try:
	        number = int(os.environ[name])
	    except (KeyError, ValueError):
	        # Unset variable or non-numeric text: fall back silently.
	        return default
	    if number <= 0:
	        return default
	    return number


	def make_datasets(
	    x: np.ndarray,
	    y: np.ndarray,
	    batch_size: int,
	) -> tuple[tf.data.Dataset, tf.data.Dataset, np.ndarray, np.ndarray, np.ndarray, np.ndarray]:
	    """Split the data and build the training / validation input pipelines.

	    The samples are split with stratification in two steps: 30 % is held
	    out first, and that hold-out is then halved into validation and test
	    parts. Both splits use ``SEED`` as their random state.

	    Args:
	        x: Sample array, sliced along its first axis.
	        y: Labels aligned with ``x``; also used as the stratification key.
	        batch_size: Batch size for both returned datasets.

	    Returns:
	        ``(train_ds, val_ds, x_val, y_val, x_test, y_test)``. ``train_ds`` is
	        shuffled, batched and augmented; ``val_ds`` is only batched. The
	        raw validation and test arrays are returned alongside.
	    """
	    x_train, x_holdout, y_train, y_holdout = train_test_split(
	        x, y, test_size=0.3, random_state=SEED, stratify=y
	    )
	    x_val, x_test, y_val, y_test = train_test_split(
	        x_holdout, y_holdout, test_size=0.5, random_state=SEED, stratify=y_holdout
	    )

	    augmentation_layers = [
	        tf.keras.layers.RandomFlip("horizontal"),
	        tf.keras.layers.RandomRotation(0.05),
	        tf.keras.layers.RandomZoom(0.1),
	        tf.keras.layers.RandomContrast(0.1),
	    ]
	    augmenter = tf.keras.Sequential(augmentation_layers)

	    def augment_batch(images, labels):
	        # training=True keeps the random layers active inside the pipeline.
	        return augmenter(images, training=True), labels

	    # Augmentation is mapped after batching, so it runs once per batch.
	    train_ds = (
	        tf.data.Dataset.from_tensor_slices((x_train, y_train))
	        .shuffle(len(x_train), seed=SEED)
	        .batch(batch_size)
	        .map(augment_batch, num_parallel_calls=tf.data.AUTOTUNE)
	        .prefetch(tf.data.AUTOTUNE)
	    )

	    val_ds = (
	        tf.data.Dataset.from_tensor_slices((x_val, y_val))
	        .batch(batch_size)
	        .prefetch(tf.data.AUTOTUNE)
	    )

	    return train_ds, val_ds, x_val, y_val, x_test, y_test


	def combine_histories(
	    first_history: tf.keras.callbacks.History,
	    second_history: tf.keras.callbacks.History,
	) -> dict[str, list[float]]:
	    """Concatenate the per-metric series of two training histories.

	    Args:
	        first_history: History whose values come first in each series.
	        second_history: History whose values are appended afterwards.

	    Returns:
	        A new dict mapping every metric name found in either ``.history``
	        mapping to a fresh list of its values, first run then second run.
	        A metric present in only one history keeps just that run's values.
	    """
	    merged: dict[str, list[float]] = {}
	    for phase in (first_history, second_history):
	        for metric, series in phase.history.items():
	            if metric not in merged:
	                merged[metric] = []
	            merged[metric] += series
	    return merged


	def save_training_plot(history_data: dict[str, list[float]]) -> None:
	    """Draw accuracy and loss curves side by side and save the figure.

	    Args:
	        history_data: Must contain the keys ``accuracy``, ``val_accuracy``,
	            ``loss`` and ``val_loss``; each series is plotted against its
	            index, labelled as the epoch.

	    The figure is written to ``TRAINING_PLOT_PATH`` at 150 dpi and then
	    closed.
	    """
	    figure, (accuracy_ax, loss_ax) = plt.subplots(1, 2, figsize=(12, 4))

	    # (axis, training key, validation key, title / y-axis label)
	    panels = (
	        (accuracy_ax, "accuracy", "val_accuracy", "Accuracy"),
	        (loss_ax, "loss", "val_loss", "Loss"),
	    )
	    for axis, train_key, val_key, caption in panels:
	        axis.plot(history_data[train_key], label="Train")
	        axis.plot(history_data[val_key], label="Validation")
	        axis.set_title(caption)
	        axis.set_xlabel("Epoch")
	        axis.set_ylabel(caption)
	        axis.legend()

	    figure.tight_layout()
	    figure.savefig(TRAINING_PLOT_PATH, dpi=150)
	    plt.close(figure)


	def predict_probabilities(
	    model: tf.keras.Model,
	    x: np.ndarray,
	    batch_size: int = 32,
	) -> np.ndarray:
	    """Run ``model.predict`` over ``x`` in batches and flatten the output.

	    Args:
	        model: Model used for inference.
	        x: Input samples, sliced along the first axis.
	        batch_size: Number of samples per prediction batch.

	    Returns:
	        The model output flattened to one dimension with ``ravel()``.
	    """
	    batches = tf.data.Dataset.from_tensor_slices(x).batch(batch_size)
	    batches = batches.prefetch(tf.data.AUTOTUNE)
	    raw_output = model.predict(batches, verbose=0)
	    return raw_output.ravel()


	def evaluate_and_save_metrics(
	    model: tf.keras.Model,
	    x_test: np.ndarray,
	    y_test: np.ndarray,
	    threshold_info: dict[str, float],
	) -> None:
	    """Evaluate ``model`` on the test split and write a JSON metrics report.

	    Args:
	        model: Trained model to evaluate.
	        x_test: Test inputs.
	        y_test: Test labels. The report assumes binary labels with
	            0 = "real" and 1 = "fake", matching ``target_names`` below.
	        threshold_info: Mapping that must contain the key ``"threshold"``,
	            the decision threshold applied to the predicted probabilities.

	    The report is written to ``METRICS_PATH`` and contains the output of
	    ``model.evaluate``, accuracy at the default 0.5 threshold and at the
	    calibrated threshold, the F1 score of the "fake" class, the confusion
	    matrix and the full classification report.
	    """
	    threshold = float(threshold_info["threshold"])
	    results = model.evaluate(x_test, y_test, verbose=0, return_dict=True)
	    predictions = predict_probabilities(model, x_test, batch_size=32)
	    predicted_classes = (predictions >= threshold).astype(int)
	    predicted_classes_default = (predictions >= 0.5).astype(int)

	    # Pin the label set explicitly. Without it scikit-learn infers the
	    # classes from the data, so a split with a single observed class would
	    # make classification_report reject the two target_names and would
	    # shrink the confusion matrix to 1x1.
	    class_labels = [0, 1]

	    report = classification_report(
	        y_test,
	        predicted_classes,
	        labels=class_labels,
	        target_names=["real", "fake"],
	        output_dict=True,
	        zero_division=0,
	    )
	    matrix = confusion_matrix(y_test, predicted_classes, labels=class_labels).tolist()

	    metrics = {
	        "evaluation": {key: float(value) for key, value in results.items()},
	        "thresholding": {
	            "default_threshold": 0.5,
	            "calibrated_threshold": threshold,
	            "test_accuracy_default": float(accuracy_score(y_test, predicted_classes_default)),
	            "test_accuracy_calibrated": float(accuracy_score(y_test, predicted_classes)),
	            # zero_division=0 matches calibrate_threshold and avoids a
	            # warning when no sample is predicted as "fake".
	            "test_f1_fake_calibrated": float(
	                f1_score(y_test, predicted_classes, pos_label=1, zero_division=0)
	            ),
	        },
	        "confusion_matrix": matrix,
	        "classification_report": report,
	    }

	    METRICS_PATH.write_text(json.dumps(metrics, indent=2), encoding="utf-8")


	def calibrate_threshold(y_val: np.ndarray, val_probs: np.ndarray) -> dict[str, float]:
	    """Pick a decision threshold from validation predictions.

	    241 evenly spaced candidates between 0.2 and 0.8 are scanned. The
	    winner is the first candidate with the highest accuracy, ties being
	    broken by the higher F1 score of class 1. If the winner does not beat
	    the accuracy at 0.5 by at least 0.02, the threshold stays at 0.5. The
	    result is finally clipped to the range [0.35, 0.65].

	    Args:
	        y_val: Validation labels.
	        val_probs: Predicted probabilities aligned with ``y_val``.

	    Returns:
	        A dict with the chosen ``threshold``, an uncertainty band
	        (``uncertain_low`` / ``uncertain_high``, the threshold -/+ 0.10
	        clipped to [0, 1]), the validation accuracy at 0.5, and the
	        validation accuracy and class-1 F1 at the chosen threshold.
	    """

	    def classify(cutoff: float) -> np.ndarray:
	        return (val_probs >= cutoff).astype(int)

	    default_acc = float(accuracy_score(y_val, classify(0.5)))

	    # Scores are (accuracy, f1) pairs; tuple ordering compares accuracy
	    # first and falls back to F1 only on an exact accuracy tie.
	    best_score = (-1.0, -1.0)
	    best_threshold = 0.5
	    for candidate in np.linspace(0.2, 0.8, 241):
	        labels = classify(candidate)
	        score = (
	            accuracy_score(y_val, labels),
	            f1_score(y_val, labels, pos_label=1, zero_division=0),
	        )
	        if score > best_score:
	            best_score = score
	            best_threshold = float(candidate)

	    # Only move away from 0.5 for a gain of at least two accuracy points.
	    if best_score[0] < default_acc + 0.02:
	        best_threshold = 0.5

	    best_threshold = float(np.clip(best_threshold, 0.35, 0.65))
	    margin = 0.10
	    lower_bound = float(np.clip(best_threshold - margin, 0.0, 1.0))
	    upper_bound = float(np.clip(best_threshold + margin, 0.0, 1.0))

	    # Metrics are reported for the final (possibly reset or clipped) value.
	    final_labels = classify(best_threshold)
	    final_acc = float(accuracy_score(y_val, final_labels))
	    final_f1 = float(f1_score(y_val, final_labels, pos_label=1, zero_division=0))

	    return {
	        "threshold": best_threshold,
	        "uncertain_low": lower_bound,
	        "uncertain_high": upper_bound,
	        "validation_accuracy_default_0_5": default_acc,
	        "validation_accuracy": final_acc,
	        "validation_f1_fake": final_f1,
	    }


	def main() -> None:
	    """Train the detector in two phases and write all artifacts.

	    Steps, in order:
	      1. Create ``ARTIFACTS_DIR`` and check that ``PROCESSED_DATA_DIR`` exists.
	      2. Read ``BATCH_SIZE``, ``FROZEN_EPOCHS`` and ``FINETUNE_EPOCHS`` from
	         the environment (defaults 32, 10 and 18).
	      3. Load the dataset, build the splits and the model.
	      4. Fit once, reload the checkpoint from ``MODEL_PATH``, call
	         ``unfreeze_for_fine_tuning`` and fit again.
	      5. Reload the checkpoint, calibrate the decision threshold on the
	         validation split, then save the threshold config, the training
	         plot and the test metrics.

	    Raises:
	        FileNotFoundError: If ``PROCESSED_DATA_DIR`` does not exist.
	    """
	    ARTIFACTS_DIR.mkdir(parents=True, exist_ok=True)
	    if not PROCESSED_DATA_DIR.exists():
	        raise FileNotFoundError(
	            f"Dataset folder not found at {PROCESSED_DATA_DIR}. "
	            "Create data/processed/real and data/processed/fake and put images there."
	        )

	    def phase_callbacks(patience: int) -> list:
	        # Both phases use the same callbacks; only the early-stopping
	        # patience differs. Fresh instances are built for every fit call.
	        early_stop = EarlyStopping(
	            monitor="val_auc",
	            mode="max",
	            patience=patience,
	            restore_best_weights=True,
	        )
	        lr_schedule = ReduceLROnPlateau(monitor="val_loss", factor=0.5, patience=2)
	        checkpoint = ModelCheckpoint(
	            MODEL_PATH,
	            monitor="val_auc",
	            mode="max",
	            save_best_only=True,
	        )
	        return [early_stop, lr_schedule, checkpoint]

	    batch_size = get_env_int("BATCH_SIZE", 32)
	    frozen_epochs = get_env_int("FROZEN_EPOCHS", 10)
	    finetune_epochs = get_env_int("FINETUNE_EPOCHS", 18)

	    x, y, _ = load_dataset(PROCESSED_DATA_DIR)
	    splits = make_datasets(x, y, batch_size=batch_size)
	    train_ds, val_ds, x_val, y_val, x_test, y_test = splits
	    model = build_model()

	    # Phase 1: first fit on the freshly built model.
	    frozen_history = model.fit(
	        train_ds,
	        validation_data=val_ds,
	        epochs=frozen_epochs,
	        callbacks=phase_callbacks(4),
	        verbose=1,
	    )

	    # Phase 2: continue from the checkpoint written during phase 1.
	    # NOTE(review): presumably unfreeze_for_fine_tuning makes the last 45
	    # layers trainable; confirm against its implementation.
	    model = tf.keras.models.load_model(MODEL_PATH)
	    unfreeze_for_fine_tuning(model, trainable_layers=45)

	    finetune_history = model.fit(
	        train_ds,
	        validation_data=val_ds,
	        epochs=finetune_epochs,
	        callbacks=phase_callbacks(5),
	        verbose=1,
	    )

	    # Calibrate and evaluate the checkpointed model, not the in-memory one.
	    model = tf.keras.models.load_model(MODEL_PATH)
	    val_predictions = predict_probabilities(model, x_val, batch_size=32)
	    threshold_info = calibrate_threshold(y_val, val_predictions)
	    threshold_json = json.dumps(threshold_info, indent=2)
	    THRESHOLD_PATH.write_text(threshold_json, encoding="utf-8")

	    full_history = combine_histories(frozen_history, finetune_history)
	    save_training_plot(full_history)
	    evaluate_and_save_metrics(model, x_test, y_test, threshold_info)

	    print(f"Training complete. Model saved to: {MODEL_PATH}")
	    print(f"Threshold config saved to: {THRESHOLD_PATH}")
	    print(f"Metrics saved to: {METRICS_PATH}")
	    print(f"Training plot saved to: {TRAINING_PLOT_PATH}")


	# Run the training pipeline only when this file is executed as a script,
	# not when it is imported as a module.
	if __name__ == "__main__":
	    main()