Source code for library.models.evaluate

"""
Module for evaluating the performance of trained models
using both Sklearn and FHE implementations.

This module includes functionality to compare the accuracy and
execution times of models trained with Scikit-learn and
Fully Homomorphic Encryption (FHE). Results are saved as a CSV file.
"""

import time
import pandas as pd
from sklearn.metrics import accuracy_score
import joblib



[docs]
def evaluate_models(models, datasets, training_times):
    """
    Evaluate trained models and compare performance.

    This function computes accuracy and execution time metrics
    for Scikit-learn and FHE models and calculates their ratios.

    Args:
        models (dict):
            Dictionary where keys are model names and values are tuples
            containing Scikit-learn and FHE models:
            {
                "model_name": (sklearn_model, fhe_model)
            }.
        datasets (dict):
            Dictionary containing training and validation datasets:
            {
                "x_train": np.ndarray, "x_val": np.ndarray,
                "y_train": np.ndarray, "y_val": np.ndarray
            }.
        training_times (dict):
            Dictionary containing training times for Scikit-learn models:
            {
                "model_name": float
            }.

    Returns:
        list: A list of dictionaries, where each dictionary contains
        evaluation metrics for a model:
        [
            {
                "Model": str,
                "Sklearn Accuracy": float,
                "FHE Accuracy": float,
                "Sklearn Time": float,
                "FHE Time": float,
                "Time Ratio (FHE/Sklearn)": float,
                "Accuracy Ratio (FHE/Sklearn)": float
            },
            ...
        ].
    """
    x_train, y_train = datasets["x_train"], datasets["y_train"].astype(int)
    x_val, y_val = datasets["x_val"], datasets["y_val"].astype(int)

    results = []
    for model_name, (sk_model, fhe_model) in models.items():
        obj = {"Model": model_name}
        # Predict with Sklearn model
        sk_y_pred = sk_model.predict(x_val)
        obj["Sklearn Accuracy"] = accuracy_score(y_val, sk_y_pred)

        # Train FHE model
        start_time = time.time()
        fhe_model.fit(x_train, y_train)
        obj["FHE Time"] = time.time() - start_time
        # Predict with FHE model
        fhe_y_pred = fhe_model.predict(x_val)
        obj["FHE Accuracy"] = accuracy_score(y_val, fhe_y_pred)

        # Calculate ratios
        obj["Sklearn Time"] = training_times[model_name]
        obj["Time Ratio (FHE/Sklearn)"] = obj["FHE Time"] / obj["Sklearn Time"]
        obj["Accuracy Ratio (FHE/Sklearn)"] = (
            obj["FHE Accuracy"] / obj["Sklearn Accuracy"]
        )

        # Store results
        results.append(obj)

    return results




[docs]
def main():
    """
    Main function to load data, evaluate models, and save results.

    This function loads processed data and pre-trained models,
    evaluates their performance using `evaluate_models`, and saves
    the results to a CSV file.

    Steps:
    1. Load the processed datasets and models from serialized files.
    2. Evaluate the models on accuracy and execution time metrics.
    3. Save the evaluation results in a CSV file for further analysis.

    Outputs:
        results.csv: A CSV file containing model evaluation metrics.
    """
    # Load data and models
    x_train, x_val, _, y_train, y_val, _ = joblib.load(
        "library/data/processed_data.pkl"
    )

    datasets = {"x_train": x_train, "x_val": x_val, "y_train": y_train, "y_val": y_val}

    trained_models, training_times = joblib.load("trained_and_times_models.pkl")

    # Evaluate models
    results = evaluate_models(trained_models, datasets, training_times)

    # Save results to a CSV file
    df = pd.DataFrame(results)
    df.to_csv("results.csv", index=False)



if __name__ == "__main__":
    main()