Spaces:

kautilya286
/

deepscanAPI

Configuration error

deepscanAPI / scripts /augment_data.py

first commit

b5b2f19 9 months ago

1.62 kB

	import os
	import cv2
	import numpy as np
	import albumentations as A
	from glob import glob

	# Define the augmentation pipeline
	AUG = A.Compose([
	A.HorizontalFlip(p=0.5),
	A.RandomBrightnessContrast(p=0.5),
	A.GaussianBlur(blur_limit=3, p=0.3),
	A.Rotate(limit=15, p=0.3),
	A.RandomResizedCrop(160, 160, scale=(0.9, 1.0), p=0.3),
	A.ElasticTransform(alpha=1.0, sigma=50, alpha_affine=50, p=0.3), # Elastic transformation
	A.CoarseDropout(max_holes=1, max_height=8, max_width=8, p=0.3), # Random Erasing
	A.PerspectiveTransform(scale=(0.01, 0.1), p=0.5) # Random perspective shift
	])

	# Directory with input images
	INPUT_DIR = "data"
	CATEGORIES = ["real", "deepfake", "ai_gen"]
	valid_extensions = ['.jpg', '.jpeg', '.png']

	for cat in CATEGORIES:
	os.makedirs(os.path.join(INPUT_DIR, cat, 'augmented'), exist_ok=True) # Create an 'augmented' folder inside each category
	files = glob(f"{INPUT_DIR}/{cat}/*")

	for i, file in enumerate(files):
	# Skip non-image files
	if not any(file.lower().endswith(ext) for ext in valid_extensions):
	continue

	img = cv2.imread(file)
	if img is None:
	continue
	img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)

	# Generate 3 augmented images
	for j in range(3):
	aug = AUG(image=img)["image"]
	save_path = os.path.join(INPUT_DIR, cat, 'augmented', f"aug_{i}_{j}.jpg")
	cv2.imwrite(save_path, cv2.cvtColor(aug, cv2.COLOR_RGB2BGR))

	print("✅ Augmentation complete. You can now re-run feature extraction and model training.")