File size: 4,680 Bytes
3e16037
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
"""
Training Pipeline for CIFAR-10 Image Classification.

This module provides functions to compile and train Keras models
with appropriate callbacks for preventing overfitting.
"""

import os
from keras.api.optimizers import Adam
from keras.api.callbacks import EarlyStopping, ModelCheckpoint, ReduceLROnPlateau


# Default training configuration
DEFAULT_CONFIG = {
    'learning_rate': 0.001,
    'batch_size': 64,
    'epochs': 100,          # max epochs (early stopping will cut short)
    'early_stopping_patience': 10,
    'reduce_lr_patience': 5,
    'reduce_lr_factor': 0.5,
    'min_lr': 1e-6,
}


def compile_model(model, learning_rate=DEFAULT_CONFIG['learning_rate']):
    """
    Compile a Keras model with Adam optimizer and categorical crossentropy loss.

    Args:
        model: Keras model to compile.
        learning_rate (float): Initial learning rate for Adam optimizer.

    Returns:
        Compiled Keras model.
    """
    model.compile(
        optimizer=Adam(learning_rate=learning_rate),
        loss='categorical_crossentropy',
        metrics=['accuracy']
    )
    return model


def get_callbacks(model_save_path, patience=DEFAULT_CONFIG['early_stopping_patience']):
    """
    Create a list of training callbacks for robust training.

    Callbacks:
    - EarlyStopping: Stops training if val_loss doesn't improve for `patience` epochs.
                     Restores the best weights.
    - ModelCheckpoint: Saves the best model based on val_loss.
    - ReduceLROnPlateau: Reduces learning rate by half if val_loss plateaus for 5 epochs.

    Args:
        model_save_path (str): File path to save the best model.
        patience (int): Number of epochs to wait before early stopping.

    Returns:
        list: List of Keras callback instances.
    """
    # Ensure the directory exists
    os.makedirs(os.path.dirname(model_save_path), exist_ok=True)

    callbacks = [
        EarlyStopping(
            monitor='val_loss',
            patience=patience,
            restore_best_weights=True,
            verbose=1
        ),
        ModelCheckpoint(
            filepath=model_save_path,
            monitor='val_loss',
            save_best_only=True,
            verbose=1
        ),
        ReduceLROnPlateau(
            monitor='val_loss',
            factor=DEFAULT_CONFIG['reduce_lr_factor'],
            patience=DEFAULT_CONFIG['reduce_lr_patience'],
            min_lr=DEFAULT_CONFIG['min_lr'],
            verbose=1
        )
    ]
    return callbacks


def train_model(model, x_train, y_train, datagen=None,
                validation_split=0.1, x_val=None, y_val=None,
                batch_size=DEFAULT_CONFIG['batch_size'],
                epochs=DEFAULT_CONFIG['epochs'],
                callbacks=None):
    """
    Train a Keras model with optional data augmentation.

    If `datagen` is provided, training uses the augmentation generator.
    Otherwise, trains directly on the raw data.

    Args:
        model: Compiled Keras model.
        x_train: Training images array.
        y_train: Training labels array (one-hot).
        datagen: Optional ImageDataGenerator for data augmentation.
        validation_split: Fraction of training data for validation (used if x_val is None).
        x_val: Optional separate validation images.
        y_val: Optional separate validation labels.
        batch_size (int): Training batch size.
        epochs (int): Maximum number of training epochs.
        callbacks (list): List of Keras callbacks.

    Returns:
        keras.callbacks.History: Training history object.
    """
    # Determine validation data
    if x_val is not None and y_val is not None:
        validation_data = (x_val, y_val)
    else:
        # Split training data for validation
        split_idx = int(len(x_train) * (1 - validation_split))
        x_val = x_train[split_idx:]
        y_val = y_train[split_idx:]
        x_train = x_train[:split_idx]
        y_train = y_train[:split_idx]
        validation_data = (x_val, y_val)

    if datagen is not None:
        # Train with data augmentation
        history = model.fit(
            datagen.flow(x_train, y_train, batch_size=batch_size),
            epochs=epochs,
            validation_data=validation_data,
            callbacks=callbacks or [],
            steps_per_epoch=len(x_train) // batch_size,
            verbose=1
        )
    else:
        # Train without augmentation
        history = model.fit(
            x_train, y_train,
            batch_size=batch_size,
            epochs=epochs,
            validation_data=validation_data,
            callbacks=callbacks or [],
            verbose=1
        )

    return history