Spaces:

kalhar
/

Texture_Classification_of_Stone_Brick_and_Wood

Build error

App Files Files Community

Kalhar.Pandya committed on Feb 21, 2025

Commit

600cada

1 Parent(s): 61bb710

final

Browse files

Files changed (4) hide show

__pycache__/feature_extractor.cpython-312.pyc +0 -0
app.py +30 -35
svm_model_color.pkl → svm_rf_combined.pkl +2 -2
train.py +224 -0

__pycache__/feature_extractor.cpython-312.pyc ADDED Viewed

Binary file (6.93 kB). View file

app.py CHANGED Viewed

@@ -7,8 +7,8 @@ import gradio as gr
 # Import the feature extraction function from feature_extractor.py
 from feature_extractor import extract_features_from_image
-# Global variables for the classifier, class names, and training log
-classifier = None
 class_names = []
 training_log = ""
@@ -16,26 +16,34 @@ training_log = ""
 # Model Loading
 # ---------------------------------------------------------------------
 def load_model(model_filename):
-    global classifier, class_names, training_log
     if os.path.exists(model_filename):
-        print("Found existing SVM model. Loading...")
         with open(model_filename, "rb") as f:
             model_data = pickle.load(f)
-        classifier = model_data['classifier']
         class_names = model_data['class_names']
         training_log += "Loaded model from disk.\n"
-        print("Loaded SVM model from disk.")
     else:
         print(f"Model file {model_filename} not found. Please train the model first.")
-def classify_new_image(input_image_path):
     """
-    Expects input_image_path as a file path. Loads the image,
-    processes it, and returns the final prediction and probabilities.
     """
-    global classifier, training_log, class_names
     progress_log = training_log + "\nStarting classification...\n"
     # Load image using OpenCV from file path
     image = cv2.imread(input_image_path)
     if image is None:
@@ -114,43 +122,30 @@ def classify_new_image(input_image_path):
     print(prob_dict)
     return final_prediction, prob_dict
-# Gradio Interface Setup using file paths
-if __name__ == "__main__":
-    model_filename = "svm_model_color.pkl"
-    load_model(model_filename)
-    iface = gr.Interface(
-        fn=classify_new_image,
-        inputs=gr.Image(type="filepath"),
-        outputs=[
-            gr.Label(label="Predicted Class"),
-            gr.Label(label="Probabilities")
-        ],
-        title="Stone, Wood, Brick Classifier",
-        description=("Upload an image of stone, wood, or brick to classify it.\n\n"
-                     "The image is processed by subdividing it into patches and aggregating the predictions. "
-                     "Progress logs are printed to the terminal.")
-    )
-    iface.launch(share=True)
 # ---------------------------------------------------------------------
-# Gradio Interface Setup
 # ---------------------------------------------------------------------
 if __name__ == "__main__":
-    model_filename = "svm_model2.pkl"
     load_model(model_filename)
     iface = gr.Interface(
         fn=classify_new_image,
-        inputs=gr.Image(type="filepath"),
         outputs=[
             gr.Label(label="Predicted Class"),
             gr.Label(label="Probabilities")
         ],
         title="Stone, Wood, Brick Classifier",
-        description=("Upload an image of stone, wood, or brick to classify it.\n\n"
                      "The image is processed by subdividing it into patches and aggregating the predictions. "
                      "Progress logs are printed to the terminal.")
     )
-    iface.launch()

 # Import the feature extraction function from feature_extractor.py
 from feature_extractor import extract_features_from_image
+# Global variables for the models, class names, and training log
+models = {}  # This will be a dictionary with keys: 'svm', 'rf', 'combined'
 class_names = []
 training_log = ""
 # Model Loading
 # ---------------------------------------------------------------------
 def load_model(model_filename):
+    """
+    Populate the module-level `models` and `class_names` from a pickle file.
+    The file is expected to hold a dict with the keys 'models' and
+    'class_names'. When the file does not exist, a message is printed and
+    the globals are left untouched. On success a line is appended to the
+    global `training_log`.
+    """
+    global models, class_names, training_log
+    if not os.path.exists(model_filename):
+        print(f"Model file {model_filename} not found. Please train the model first.")
+        return
+    print("Found existing model file. Loading...")
+    # NOTE: pickle.load can execute arbitrary code; only load model files you trust.
+    with open(model_filename, "rb") as fh:
+        payload = pickle.load(fh)
+    # Expecting payload['models'] to be a dict: {'svm': ..., 'rf': ..., 'combined': ...}
+    models = payload['models']
+    class_names = payload['class_names']
+    training_log += "Loaded model from disk.\n"
+    print("Loaded models from disk.")
+# ---------------------------------------------------------------------
+# Gradio Classification Function with Model Selection
+# ---------------------------------------------------------------------
+def classify_new_image(input_image_path, model_choice):
     """
+    Expects input_image_path as a file path and model_choice as one of the keys in models.
+    Loads the image, processes it by extracting patches and computing predictions on each patch,
+    aggregates patch predictions, and returns the final predicted class and probabilities.
     """
+    global models, training_log, class_names
     progress_log = training_log + "\nStarting classification...\n"
+    if model_choice not in models:
+        raise ValueError(f"Model choice '{model_choice}' not found. Available choices: {list(models.keys())}")
+    classifier = models[model_choice]
     # Load image using OpenCV from file path
     image = cv2.imread(input_image_path)
     if image is None:
     print(prob_dict)
     return final_prediction, prob_dict
 # ---------------------------------------------------------------------
+# Gradio Interface Setup using file paths and model selection
 # ---------------------------------------------------------------------
 if __name__ == "__main__":
+    model_filename = "./svm_rf_combined.pkl"  # Adjust filename as needed
     load_model(model_filename)
+    # Offer the loaded model keys in the dropdown; when nothing was loaded,
+    # fall back to the key names the training script is expected to produce.
+    if models:
+        model_choices = list(models.keys())
+    else:
+        model_choices = ['svm', 'rf', 'combined']
+    # Inputs: the image is passed to the callback as a file path, plus the model key.
+    image_input = gr.Image(type="filepath", label="Input Image")
+    model_input = gr.Dropdown(choices=model_choices, label="Select Model", value=model_choices[0])
+    # Outputs: final predicted class and the probabilities returned by the callback.
+    result_outputs = [
+        gr.Label(label="Predicted Class"),
+        gr.Label(label="Probabilities")
+    ]
+    app_description = ("Upload an image and select a classifier model (svm, rf, combined) to classify it.\n\n"
+                       "The image is processed by subdividing it into patches and aggregating the predictions. "
+                       "Progress logs are printed to the terminal.")
     iface = gr.Interface(
         fn=classify_new_image,
+        inputs=[image_input, model_input],
+        outputs=result_outputs,
         title="Stone, Wood, Brick Classifier",
+        description=app_description
     )
+    iface.launch(share=True)

svm_model_color.pkl → svm_rf_combined.pkl RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:421f593486e03e780e4376677331aa39bc65dc7d128152e19f9f6178ad9e4a69
-size 23294

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b503cc65a0f39fb172da810a87a81b2bdc62c578f5fed681a16b472116d7733
+size 11463562

train.py ADDED Viewed

	@@ -0,0 +1,224 @@

+import os
+import cv2
+import numpy as np
+import pickle
+import sys
+import threading
+import concurrent.futures
+from sklearn.model_selection import train_test_split
+from sklearn.svm import SVC
+from sklearn.metrics import classification_report, confusion_matrix
+# Import the feature extraction function (from feature_extractor.py)
+from feature_extractor import extract_features_from_image
+training_log = ""
+# Helper function for parallel processing
+def process_image(file_path, class_name):
+    """
+    Load one image file and convert it into a labelled feature vector.
+    The file is read with cv2.imread using cv2.IMREAD_COLOR and passed to
+    extract_features_from_image; only the 'combined_features' entry of the
+    result is kept.
+    Returns:
+        (features, class_name) on success, or (None, None) when the image
+        could not be read (a warning is printed in that case).
+    """
+    img = cv2.imread(file_path, cv2.IMREAD_COLOR)
+    if img is not None:
+        extracted = extract_features_from_image(img)
+        return extracted['combined_features'], class_name
+    # cv2.imread reports an unreadable file by returning None, not by raising.
+    print(f"Warning: Could not read {file_path}")
+    return None, None
+# ---------------------------------------------------------------------
+# 1. Data Loading with Parallel Feature Extraction
+# ---------------------------------------------------------------------
+def load_dataset(dataset_folder, max_workers=4):
+    """
+    Build the feature matrix and label vector for a folder-per-class dataset.
+    Expects dataset_folder to contain one subfolder per class, each holding
+    the images of that class. For every class the images are processed in
+    parallel by process_image on a thread pool.
+    Class folders and image files are visited in sorted order and results are
+    collected in submission order, so the returned arrays and the class list
+    are identical from run to run (os.listdir alone returns entries in
+    arbitrary order). A stable sample order is what makes a seeded
+    train/test split reproducible.
+    Args:
+        dataset_folder: Path to the dataset root.
+        max_workers: Number of threads used for feature extraction.
+    Returns:
+        X: float32 numpy array of feature vectors, one row per readable image.
+        y: numpy array of class-name labels aligned with X.
+        classes: Alphabetically sorted list of class (subfolder) names.
+            NOTE(review): presumably consumers index classifier outputs with
+            this list; sorted order matches scikit-learn's `classes_`
+            ordering for string labels - confirm against app.py.
+    """
+    X = []
+    y = []
+    classes = []  # list of class names, in sorted order
+    print(f"Scanning dataset folder: {dataset_folder}")
+    for class_name in sorted(os.listdir(dataset_folder)):
+        class_path = os.path.join(dataset_folder, class_name)
+        if not os.path.isdir(class_path):
+            continue
+        classes.append(class_name)
+        print(f"\nProcessing class: {class_name}")
+        image_files = sorted(
+            f for f in os.listdir(class_path)
+            if f.lower().endswith(('.jpg', '.jpeg', '.png', '.bmp', '.tiff'))
+        )
+        total_images = len(image_files)
+        image_count = 0
+        # Use ThreadPoolExecutor for parallel extraction
+        with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
+            futures = [
+                executor.submit(process_image, os.path.join(class_path, filename), class_name)
+                for filename in image_files
+            ]
+            # Read results in submission order rather than completion order:
+            # the work still runs in parallel, but X/y come out deterministic.
+            for future in futures:
+                features, label = future.result()
+                if features is None:
+                    # Unreadable image; process_image already printed a warning.
+                    continue
+                X.append(features)
+                y.append(label)
+                image_count += 1
+                print(
+                    f"\rProcessed {image_count}/{total_images} images in '{class_name}'",
+                    end="", flush=True
+                )
+        print(f"\nCompleted class: {class_name} with {image_count} images.")
+    X = np.array(X, dtype=np.float32)
+    y = np.array(y)
+    print(f"Finished loading dataset. Total classes: {len(classes)}. Total images: {len(X)}.")
+    return X, y, classes
+from sklearn.svm import LinearSVC
+from sklearn.ensemble import BaggingClassifier
+from sklearn.metrics import classification_report, confusion_matrix
+from sklearn.model_selection import train_test_split
+from sklearn.preprocessing import StandardScaler
+from sklearn.pipeline import make_pipeline
+from sklearn.ensemble import VotingClassifier, BaggingClassifier, RandomForestClassifier
+from sklearn.pipeline import make_pipeline
+from sklearn.svm import LinearSVC
+from sklearn.preprocessing import StandardScaler
+from sklearn.model_selection import train_test_split
+from sklearn.metrics import classification_report, confusion_matrix
+def _print_evaluation(title, model, X_test, y_test):
+    """Print `title`, then the classification report and confusion matrix of `model` on the test split."""
+    print(title)
+    y_pred = model.predict(X_test)
+    print(classification_report(y_test, y_pred))
+    print("Confusion Matrix:")
+    print(confusion_matrix(y_test, y_pred))
+def train_classifiers(X, y):
+    """
+    Splits data into training/test sets, trains:
+      - A Bagging ensemble of LinearSVC classifiers (with scaling)
+      - A RandomForestClassifier
+      - A VotingClassifier that combines both
+    and prints a classification report and confusion matrix for each.
+    Every stochastic component is seeded with 31 so that repeated runs on the
+    same (identically ordered) data give the same models and metrics.
+    Args:
+        X: Feature matrix, one row per sample.
+        y: Labels aligned with X.
+    Returns:
+        models (dict): A dictionary with keys 'svm', 'rf', 'combined'
+        test_data (tuple): (X_test, y_test)
+    """
+    # Split dataset: 80% train, 20% test
+    X_train, X_test, y_train, y_test = train_test_split(
+        X, y, test_size=0.2, random_state=31, shuffle=True
+    )
+    # --- Train SVM Ensemble ---
+    svm_pipeline = make_pipeline(StandardScaler(),
+                                 LinearSVC(random_state=31))
+    svm_ensemble = BaggingClassifier(
+        estimator=svm_pipeline,
+        n_estimators=10,  # Adjust for speed/accuracy trade-off
+        n_jobs=-1,
+        random_state=31,  # seed the bootstrap sampling like the other components
+        verbose=1
+    )
+    print("Training SVM ensemble classifier...")
+    svm_ensemble.fit(X_train, y_train)
+    _print_evaluation("\nSVM Ensemble Classification Report:", svm_ensemble, X_test, y_test)
+    # --- Train RandomForest ---
+    rf = RandomForestClassifier(
+        n_estimators=100,  # Adjust as needed
+        random_state=31,
+        n_jobs=-1
+    )
+    print("\nTraining RandomForest classifier...")
+    rf.fit(X_train, y_train)
+    _print_evaluation("\nRandomForest Classification Report:", rf, X_test, y_test)
+    # --- Train Combined Voting Classifier ---
+    # NOTE(review): soft voting needs predict_proba from every member. LinearSVC
+    # has none, so this presumably relies on BaggingClassifier.predict_proba
+    # falling back to vote fractions - confirm against the scikit-learn docs.
+    combined_clf = VotingClassifier(
+        estimators=[('svm', svm_ensemble), ('rf', rf)],
+        voting='soft'
+    )
+    print("\nTraining Combined Voting classifier...")
+    combined_clf.fit(X_train, y_train)
+    _print_evaluation("\nCombined Voting Classifier Report:", combined_clf, X_test, y_test)
+    models = {
+        'svm': svm_ensemble,
+        'rf': rf,
+        'combined': combined_clf
+    }
+    return models, (X_test, y_test)
+# ---------------------------------------------------------------------
+# 3. Training Thread
+# ---------------------------------------------------------------------
+def train_model_thread(dataset_folder, model_filename, max_workers=4):
+    """
+    Run the full training pipeline and write the result to disk.
+    Steps: load the dataset with load_dataset, fit the classifiers with
+    train_classifiers, then pickle a dict with the keys 'models' and
+    'class_names' to model_filename. Progress is printed and also appended
+    to the global `training_log`.
+    Args:
+        dataset_folder: Dataset root passed to load_dataset.
+        model_filename: Path of the pickle file to write.
+        max_workers: Thread count forwarded to load_dataset.
+    """
+    global training_log
+    training_log += "Starting training...\n"
+    print("Starting training...")
+    # (A) Extract features for the whole dataset (in parallel)
+    features, labels, class_list = load_dataset(dataset_folder, max_workers=max_workers)
+    # (B) Fit the classifiers and print their metrics; the returned test split is unused here
+    trained_models, _held_out = train_classifiers(features, labels)
+    print("Training complete.")
+    training_log += "Training complete.\n"
+    # (C) Persist the models together with the class names
+    with open(model_filename, "wb") as out_file:
+        pickle.dump({'models': trained_models, 'class_names': class_list}, out_file)
+    training_log += f"Model saved to {model_filename}\n"
+    print(f"Model saved to {model_filename}")
+# ---------------------------------------------------------------------
+# Main
+# ---------------------------------------------------------------------
+if __name__ == "__main__":
+    dataset_folder = "./../images_dataset"   # Adjust path as needed
+    model_filename = "svm_rf_combined.pkl"
+    # Thread count used for feature extraction; tune as desired.
+    max_workers = 32
+    # Training runs on its own thread; the main thread starts it and then
+    # simply blocks until it has finished.
+    training_thread = threading.Thread(
+        target=train_model_thread,
+        kwargs={
+            'dataset_folder': dataset_folder,
+            'model_filename': model_filename,
+            'max_workers': max_workers,
+        }
+    )
+    training_thread.start()
+    training_thread.join()