-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtestModelEvaluation.py
More file actions
168 lines (141 loc) · 6.42 KB
/
testModelEvaluation.py
File metadata and controls
168 lines (141 loc) · 6.42 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
import os
import cv2
import numpy as np
from skimage.feature import hog
from sklearn.metrics import accuracy_score, classification_report
import joblib
from tabulate import tabulate
import time
from memory_profiler import memory_usage
# HOG parameters
# These must match the settings used when the models were trained,
# otherwise the feature vectors fed to predict() will not line up.
IMG_SIZE = (150, 150)  # every image is resized to this before feature extraction
orientations = 9  # number of gradient-orientation histogram bins
pixels_per_cell = (8, 8)  # HOG cell size in pixels
cells_per_block = (2, 2)  # cells grouped per normalization block
block_norm = 'L2-Hys'  # block normalization scheme (L2 norm with clipping)
# Function to preprocess image using HOG parameters
def preprocess_image(image_path):
    """Read an image as grayscale, resize it, and return its HOG feature vector.

    Args:
        image_path: Path to the image file on disk.

    Returns:
        1-D numpy array of HOG features for the resized grayscale image.

    Raises:
        ValueError: If the file cannot be read as an image.
    """
    grayscale = cv2.imread(image_path, cv2.IMREAD_GRAYSCALE)
    if grayscale is None:
        # cv2.imread returns None (rather than raising) on unreadable files.
        raise ValueError(f"Error loading image: {image_path}")
    resized = cv2.resize(grayscale, IMG_SIZE)
    return hog(
        resized,
        orientations=orientations,
        pixels_per_cell=pixels_per_cell,
        cells_per_block=cells_per_block,
        block_norm=block_norm,
    )
# Function to load unseen data
def load_unseen_data(genuine_folder, forged_folder):
    """Build the feature matrix and label vector from two image folders.

    Genuine signatures are labelled 1, forged signatures 0. Files that
    fail to load are skipped after printing the error, so one bad image
    does not abort the whole run.

    Args:
        genuine_folder: Directory of genuine signature images.
        forged_folder: Directory of forged signature images.

    Returns:
        Tuple (X, y) of numpy arrays: HOG feature rows and integer labels.
    """
    X_unseen = []
    y_unseen = []

    def _load_folder(folder, label):
        # Append features/label for every readable image file in `folder`.
        for filename in os.listdir(folder):
            file_path = os.path.join(folder, filename)
            if os.path.isfile(file_path):
                try:
                    X_unseen.append(preprocess_image(file_path))
                    y_unseen.append(label)
                except Exception as e:
                    # Best-effort load: report the failure and keep going.
                    print(e)

    _load_folder(genuine_folder, 1)  # Genuine images (label = 1)
    _load_folder(forged_folder, 0)   # Forged images (label = 0)
    return np.array(X_unseen), np.array(y_unseen)
# Function to evaluate the machine learning model (file size, inference time, memory overhead, performance metrics [F1, Precision, Recall, Accuracy])
def evaluate_model(model_file, model_name, X_data, y_true):
    """Load one pickled model and measure its footprint and accuracy.

    Args:
        model_file: Path to the joblib-pickled model.
        model_name: Display name for the results table.
        X_data: Feature matrix of the evaluation samples.
        y_true: Ground-truth labels (1 = genuine, 0 = forged).

    Returns:
        List row: [name, file size KB, inference s, memory MiB,
        accuracy, precision, recall, f1] — precision/recall/f1 are for
        the positive (genuine, label 1) class.
    """
    # File size in KB
    file_size = os.path.getsize(model_file) / 1024  # in KB
    # Load the model
    model = joblib.load(model_file)
    print(f"{model_name} model loaded.")
    # Measure inference time with a monotonic clock: time.time() is wall-clock
    # and can jump if the system clock adjusts; perf_counter() cannot.
    start_time = time.perf_counter()
    predictions = model.predict(X_data)
    inference_time = time.perf_counter() - start_time
    # Measure memory overhead of a second predict() call (peak minus baseline, MiB)
    mem_usage = memory_usage((model.predict, (X_data,)), interval=0.01)
    memory_overhead = max(mem_usage) - min(mem_usage)
    # Compute performance metrics; classification_report keys labels by str(),
    # so '1' selects the genuine class.
    accuracy = accuracy_score(y_true, predictions)
    report = classification_report(y_true, predictions, output_dict=True)
    positive = report['1']
    return [model_name, round(file_size, 2), round(inference_time, 4),
            round(memory_overhead, 4), round(accuracy, 6),
            round(positive['precision'], 6), round(positive['recall'], 6),
            round(positive['f1-score'], 6)]
# Function to evaluate the ensemble model
def evaluate_ensemble(ensemble_model_paths, ensemble_models, X_data, y_true):
    """Evaluate the majority-vote ensemble of the already-loaded models.

    Args:
        ensemble_model_paths: Pickle file paths (used only for total size).
        ensemble_models: The corresponding loaded model objects.
        X_data: Feature matrix of the evaluation samples.
        y_true: Ground-truth labels (1 = genuine, 0 = forged).

    Returns:
        List row in the same format as evaluate_model(), labelled "Ensemble".
    """
    # Ensemble file size = sum of the member model file sizes, in KB
    ensemble_model_size = sum(os.path.getsize(p) for p in ensemble_model_paths) / 1024
    # Inference time: total time for every member to predict (monotonic clock)
    start_time = time.perf_counter()
    member_predictions = [model.predict(X_data) for model in ensemble_models]
    inference_time = time.perf_counter() - start_time
    # Memory overhead: sum over members of (peak - baseline) during predict(), MiB
    member_overheads = []
    for model in ensemble_models:
        mem_usage = memory_usage((model.predict, (X_data,)), interval=0.01)
        member_overheads.append(max(mem_usage) - min(mem_usage))
    ensemble_memory_overhead = sum(member_overheads)
    # Majority vote: average the members' 0/1 predictions and threshold at 0.5
    ensemble_predictions = np.mean(member_predictions, axis=0)
    ensemble_predictions = np.where(ensemble_predictions >= 0.5, 1, 0)  # Binary classification
    accuracy = accuracy_score(y_true, ensemble_predictions)
    report = classification_report(y_true, ensemble_predictions, output_dict=True)
    positive = report['1']  # metrics for the genuine (label 1) class
    # Round once per value (the original rounded twice, which was redundant);
    # precision matches the per-model rows from evaluate_model().
    return [
        "Ensemble", round(ensemble_model_size, 2), round(inference_time, 4),
        round(ensemble_memory_overhead, 4), round(accuracy, 6),
        round(positive['precision'], 6), round(positive['recall'], 6),
        round(positive['f1-score'], 6)
    ]
# Path to the unseen data folders
# NOTE(review): machine-specific absolute paths — update before running
# on another machine, or replace with command-line arguments.
genuine_unseen_folder = r"C:\Users\Vyse\Documents\GitHub\INF2008ML\signatures_cedar\unseen_data_for_testing\unseen_org" # Update this path
forged_unseen_folder = r"C:\Users\Vyse\Documents\GitHub\INF2008ML\signatures_cedar\unseen_data_for_testing\unseen_forg" # Update this path
if __name__ == '__main__':
    # Load unseen data and extract features
    X_unseen, y_unseen = load_unseen_data(genuine_unseen_folder, forged_unseen_folder)
    print("Unseen data samples:", X_unseen.shape)
    # Load the individual models
    # (pickle filename, display name) pairs; files are expected in the
    # current working directory.
    models_info = [
        ("adaboost_model.pkl", "AdaBoost"),
        ("random_forest_model.pkl", "Random Forest"),
        ("knn_model.pkl", "KNN"),
        ("svm_model.pkl", "SVM"),
        ("writer_independent_logreg_model.pkl", "LogReg")
    ]
    # The same five models form the voting ensemble (order does not
    # affect the averaged vote).
    ensemble_model_paths = [
        "knn_model.pkl", "random_forest_model.pkl", "svm_model.pkl",
        "writer_independent_logreg_model.pkl", "adaboost_model.pkl"
    ]
    ensemble_models = [joblib.load(model_path) for model_path in ensemble_model_paths]
    # Evaluate ensemble model
    ensemble_metrics = evaluate_ensemble(ensemble_model_paths, ensemble_models, X_unseen, y_unseen)
    # Evaluate each individual model, then append the ensemble row last.
    results = []
    for model_file, model_name in models_info:
        metrics = evaluate_model(model_file, model_name, X_unseen, y_unseen)
        results.append(metrics)
    results.append(ensemble_metrics)
    # Display results in a table
    headers = ["Model","File Size (KB)","Inference Time (s)", "Memory Overhead (MiB)", "Accuracy", "Precision", "Recall", "F1-Score"]
    print("\nModel Performance Comparison:")
    print(tabulate(results, headers=headers, tablefmt="pretty"))