NavigationDetectionAI / other /NavigationDetectionAI-Train.py

Glas42

Upload NavigationDetectionAI-Train.py

dac17cf verified almost 2 years ago

6.76 kB

	# Printed before the imports so the banner is shown while the libraries load.
	print("\n------------------------------------\n\nImporting libraries...")

	# Dependencies of the training script: torch/torchvision for the model and
	# data pipeline, PIL/numpy/cv2 for image loading, the rest is standard library.
	from torchvision.transforms.functional import to_pil_image
	from torch.utils.data import Dataset, DataLoader
	from torchvision import transforms
	import torch.optim as optim
	import multiprocessing
	import torch.nn as nn
	from PIL import Image
	import numpy as np
	import datetime
	import torch
	import time
	import cv2
	import os

	# Constants
	# Directory containing this script; MODEL_PATH (where weights are saved) points here.
	SCRIPT_PATH = os.path.dirname(os.path.realpath(__file__))
	# Folder that is scanned for ".png" training images.
	DATA_PATH = "C:/Users/olefr/Downloads/AIDATA"
	MODEL_PATH = SCRIPT_PATH
	# Resolution (in pixels) every image is resized to.
	IMG_HEIGHT = 220
	IMG_WIDTH = 420
	NUM_EPOCHS = 50
	BATCH_SIZE = 64
	# Number of values the network outputs per image.
	OUTPUTS = 8

	print("\n------------------------------------\n")

	# Query CUDA once and reuse the answer for both the report and the device choice.
	cuda_available = torch.cuda.is_available()
	print(f"CUDA available: {cuda_available}")

	# Check for CUDA availability
	device = torch.device('cuda' if cuda_available else 'cpu')
	print(f"Using {device} for training")

	# Determine the number of CPU cores
	num_cpu_cores = multiprocessing.cpu_count()
	print('Number of CPU cores:', num_cpu_cores)

	# Count the PNG files in the data folder (reported below for information only).
	image_count = sum(1 for file in os.listdir(DATA_PATH) if file.endswith(".png"))

	print("\nTraining settings:")
	print("> Epochs:", NUM_EPOCHS)
	print("> Batch size:", BATCH_SIZE)
	print("> Image width:", IMG_WIDTH)
	print("> Image height:", IMG_HEIGHT)
	print("> Images:", image_count)

	print("\n------------------------------------\n")

	print("Loading...")

	# Define custom dataset
	class CustomDataset(Dataset):
	    """In-memory dataset of resized images paired with their recorded user inputs.

	    Every ``<name>.png`` in ``data_path`` that has a sibling ``<name>.txt`` is
	    loaded eagerly in ``__init__``; images without a label file are skipped.

	    Args:
	        data_path: Directory containing the ``.png`` / ``.txt`` pairs.
	        transform: Optional callable applied to an image each time it is
	            fetched through ``__getitem__``.
	    """

	    def __init__(self, data_path, transform=None):
	        self.data_path = data_path
	        self.transform = transform
	        self.images, self.user_inputs = self.load_data(data_path)

	    @staticmethod
	    def _parse_user_input(text):
	        """Convert the comma-separated content of a label file to a list of floats.

	        ``"True"`` maps to 1.0 and ``"False"`` to 0.0; any other token is parsed
	        as a number. Tokens that are neither (including an empty token) fall
	        back to 0.0, which is what the previous implementation produced for them.
	        """
	        values = []
	        for token in text.strip().split(','):
	            token = token.strip()
	            if token == "True":
	                values.append(1.0)
	            elif token == "False":
	                values.append(0.0)
	            else:
	                # Tokens read from a file are always strings, so numeric values
	                # must be parsed explicitly instead of being zeroed.
	                try:
	                    values.append(float(token))
	                except ValueError:
	                    values.append(0.0)
	        return values

	    def load_data(self, data_path):
	        """Load all labelled images from ``data_path``.

	        Returns:
	            A tuple ``(images, user_inputs)`` of numpy arrays: the resized
	            images divided by 255.0 and the parsed label values, in the same order.
	        """
	        images = []
	        user_inputs = []
	        for file in os.listdir(data_path):
	            if not file.endswith(".png"):
	                continue

	            # Swap only the trailing extension so a ".png" elsewhere in the
	            # name is left alone.
	            user_inputs_file = os.path.join(data_path, file[:-len(".png")] + ".txt")
	            # Check for the label first: unlabeled images are skipped without
	            # paying for decoding and resizing.
	            if not os.path.exists(user_inputs_file):
	                continue

	            # Load image; the context manager releases the file handle promptly.
	            with Image.open(os.path.join(data_path, file)) as img:
	                pixels = np.array(img)
	            pixels = cv2.resize(pixels, (IMG_WIDTH, IMG_HEIGHT))
	            # NOTE(review): for 8-bit images this yields float64 values in
	            # [0, 1]; confirm the transform used with this dataset expects that.
	            img_array = pixels / 255.0

	            with open(user_inputs_file, 'r') as f:
	                user_input = self._parse_user_input(f.read())

	            images.append(img_array)
	            user_inputs.append(user_input)

	        return np.array(images), np.array(user_inputs)

	    def __len__(self):
	        """Return the number of loaded image/label pairs."""
	        return len(self.images)

	    def __getitem__(self, idx):
	        """Return ``(image, user_input)`` for ``idx``, applying ``transform`` if set."""
	        image = self.images[idx]
	        user_input = self.user_inputs[idx]
	        if self.transform:
	            image = self.transform(image)
	        return image, user_input

	# Preprocessing applied to each image when it is fetched from the dataset:
	# PIL conversion -> resize -> grayscale -> black/white threshold -> tensor.
	transform = transforms.Compose([
	    transforms.Lambda(to_pil_image),  # Convert to PIL Image
	    transforms.Resize((IMG_HEIGHT, IMG_WIDTH)),
	    transforms.Lambda(lambda frame: frame.convert("L")),  # Convert to grayscale
	    # Convert to binary: values above 128 become 255, everything else 0
	    transforms.Lambda(lambda frame: frame.point(lambda value: 255 if value > 128 else 0)),
	    transforms.ToTensor(),
	])

	# Build the dataset (loads everything from DATA_PATH) and a shuffling batch loader
	dataset = CustomDataset(DATA_PATH, transform=transform)
	dataloader = DataLoader(dataset, shuffle=True, batch_size=BATCH_SIZE)

	# Define model
	class Net(nn.Module):
	    """Small CNN mapping a single-channel image to a vector of output values.

	    Three 3x3 convolutions (16, 32, 64 channels), each followed by ReLU and
	    2x2 max pooling, feed a 64-unit hidden layer and a linear output layer.

	    Args:
	        img_height: Input image height; defaults to the module-level IMG_HEIGHT.
	        img_width: Input image width; defaults to the module-level IMG_WIDTH.
	        outputs: Number of output values; defaults to the module-level OUTPUTS.
	    """

	    def __init__(self, img_height=None, img_width=None, outputs=None):
	        super().__init__()
	        # Resolve defaults at call time so ``Net()`` keeps using the script settings.
	        self.img_height = IMG_HEIGHT if img_height is None else img_height
	        self.img_width = IMG_WIDTH if img_width is None else img_width
	        num_outputs = OUTPUTS if outputs is None else outputs

	        self.conv1 = nn.Conv2d(1, 16, kernel_size=3, stride=1, padding=1) # Adjust input channels to 1
	        self.pool = nn.MaxPool2d(kernel_size=2, stride=2, padding=0)
	        self.conv2 = nn.Conv2d(16, 32, kernel_size=3, stride=1, padding=1)
	        self.conv3 = nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1)
	        self.fc_input_size = self._get_fc_input_size()
	        self.fc1 = nn.Linear(self.fc_input_size, 64)
	        self.fc2 = nn.Linear(64, num_outputs)

	    def _extract_features(self, x):
	        """Run the conv -> ReLU -> pool stack shared by sizing and ``forward``."""
	        for conv in (self.conv1, self.conv2, self.conv3):
	            x = self.pool(torch.relu(conv(x)))
	        return x

	    def _get_fc_input_size(self):
	        """Return the flattened feature count for one image of the configured size."""
	        # Create a sample tensor and propagate it through the network to get the output shape
	        with torch.no_grad():
	            sample_tensor = torch.zeros(1, 1, self.img_height, self.img_width)
	            return self._extract_features(sample_tensor).view(1, -1).shape[1]

	    def forward(self, x):
	        """Compute the outputs for a batch ``x`` of single-channel images."""
	        x = self._extract_features(x)
	        # Flatten per sample so the batch dimension is always preserved; an
	        # input of the wrong resolution then fails in fc1 instead of being
	        # silently reshaped into a different batch size.
	        x = torch.flatten(x, 1)
	        x = torch.relu(self.fc1(x))
	        return self.fc2(x)

	model = Net().to(device) # Move model to GPU if available

	# Define loss function and optimizer
	criterion = nn.MSELoss()
	optimizer = optim.Adam(model.parameters())

	print("Starting training...")
	print("\n--------------------------------------------------------------\n")
	start_time = time.time()
	update_time = start_time

	# Train model
	for epoch in range(NUM_EPOCHS):
	    running_loss = 0.0
	    for inputs, labels in dataloader:
	        # Move the batch to the training device and make sure it is float32
	        inputs = inputs.to(device).float()
	        labels = labels.to(device).float()
	        optimizer.zero_grad()
	        outputs = model(inputs)
	        loss = criterion(outputs, labels)
	        loss.backward()
	        optimizer.step()
	        running_loss += loss.item()

	    # Take a single clock reading so the duration, its unit and the ETA
	    # printed below are all derived from the same instant.
	    now = time.time()
	    epoch_seconds = now - update_time
	    elapsed = now - start_time
	    if epoch_seconds > 1:
	        epoch_time = f"{round(epoch_seconds, 2)}s"
	    else:
	        epoch_time = f"{round(epoch_seconds * 1000, 2)}ms"
	    # ETA = projected total duration (average epoch time * epochs) minus elapsed time
	    remaining = round(elapsed / (epoch + 1) * NUM_EPOCHS - elapsed, 2)
	    eta = time.strftime('%H:%M:%S', time.gmtime(remaining))
	    # "\r" rewrites the separator line left by the previous report
	    print(f"\rEpoch {epoch+1}, Loss: {running_loss / len(dataloader)}, {epoch_time}/Epoch, ETA: {eta} " + "\n\n--------------------------------------------------------------", end='', flush=True)
	    update_time = time.time()

	# Measure the total once so the log line and the file name agree
	training_seconds = time.time() - start_time
	print("\n\nTraining completed in " + time.strftime("%H:%M:%S", time.gmtime(training_seconds)))

	# Save model
	print("Saving model...")
	model_file = f"EPOCHS-{NUM_EPOCHS}_BATCH-{BATCH_SIZE}_RES-{IMG_WIDTH}x{IMG_HEIGHT}_IMAGES-{len(dataset)}_TRAININGTIME-{time.strftime('%H-%M-%S', time.gmtime(training_seconds))}_DATE-{datetime.datetime.now().strftime('%Y-%m-%d-%H-%M-%S')}.pt"
	torch.save(model.state_dict(), os.path.join(MODEL_PATH, model_file))
	print("Model saved successfully.")

	print("\n------------------------------------\n")