import pandas as pd
from typing import Callable
from moco.profiling import profile_method_real_time
from sklearn.neural_network import MLPClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import precision_recall_fscore_support
import time
from moco.binary_logit_classifier import BinaryLogitClassifier
import matplotlib.pyplot as plt
import numpy as np

def load_dataset(path: str):
    df = pd.read_csv(path)
    X = df[[col for col in df.columns if col.startswith('V')]].to_numpy()
    y = df['Class'].to_numpy()
    return X, y

# Load Dataset
X, y = load_dataset('/Users/samrandall/Downloads/creditcard.csv')

# Split the data
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size = 0.2, random_state = 2)
X_train, X_val, y_train, y_val = train_test_split(X_train, y_train, test_size = 0.2, random_state = 2)

X.shape, pd.Series(y).value_counts().to_dict()

# Train initial model
mlp = MLPClassifier(random_state = 4)
mlp.fit(X_train, y_train)

from sklearn.metrics import PrecisionRecallDisplay

display = PrecisionRecallDisplay.from_estimator(
    mlp, X_val, y_val, name="MLP", plot_chance_level=True, despine=True
)
_ = display.ax_.set_title("2-class Precision-Recall curve")

threshold = 0.9
blc = BinaryLogitClassifier(mlp, threshold)
y_hat_t_train = blc.predict(X_train)
y_hat_t_train.shape

y_hat_t_test = blc.predict(X_test)
p, r, _, _ = precision_recall_fscore_support(y_hat_t_test, y_test, average = 'binary')
p, r

original_timings = profile_method_real_time(mlp.predict, X_test)

np.mean(original_timings)

for i, (W, b) in enumerate(zip(mlp.coefs_, mlp.intercepts_)):
    print(f"Layer {i}: {W.shape} {b.shape}")

from moco.partition import Partition, RoutedModel

p_train = blc.predict(X_train)
partition = Partition()
C = 2
partition.find_sufficient_groups(X_train, y_train, min_group_size = X_train.shape[0] / (C * 10))
partition.summary_table

mask = partition.subset_predictors[0].predict(X_train)
pd.Series(y_train[mask]).value_counts()

# Problem is Need to Pass in MLP 
rm = RoutedModel.from_partition(partition, blc.predict)

p_train_new = rm.predict(X_train)
mlp_train_new = mlp.predict_proba(X_train)[:, 1] > threshold
print("train")
p, r, _, _ = precision_recall_fscore_support(mlp_train_new, y_train, average = 'binary')
print("MLP", p, r)
p, r, _, _ = precision_recall_fscore_support(p_train_new, y_train, average = 'binary')
print("Routed Model", p, r)

p_test_new = rm.predict(X_test)
mlp_test = (mlp.predict_proba(X_test)[:, 1] > threshold).astype(np.int64)

print("test")
print(mlp_test.dtype, y_test.dtype)
print(mlp_test.shape, y_test.shape)
p, r, _, _ = precision_recall_fscore_support(mlp_test, y_test, average = 'binary')
print("MLP", p, r)

mlp_precision = p
mlp_recall = r
p, r, _, _ = precision_recall_fscore_support(p_test_new, y_test, average = 'binary')
print("Routed Model", p, r)

routed_precision = p
routed_recall = r

np.isnan(partition.transform(X_train)).mean()

indices = np.flatnonzero(~np.isnan(partition.transform(X_test)))
vcs_test = pd.Series(y_test[indices]).value_counts()

indices = np.flatnonzero(~np.isnan(partition.transform(X_train)))
vcs_train = pd.Series(y_train[indices]).value_counts()

print(vcs_train, vcs_test)

blc = BinaryLogitClassifier(mlp, threshold)
rm = RoutedModel.from_partition(partition, blc.predict)

rm_times_raced = profile_method_real_time(rm.predict_race, X_test)
rm_seq_times = profile_method_real_time(rm.predict, X_test)
df = pd.DataFrame({"original": original_timings, "optimized_best_of": rm_times_raced, "optimized_sequential": rm_seq_times})

df.mean(axis = 0).to_dict()

speedup = df.mean(axis = 0).to_dict()
ratio = speedup['optimized_best_of'] / speedup['original']
ratio

benchmark_analysis = {
    "experiment": ["baseline", "optimized"],
    "Latency per transaction, raced (ms)": [speedup['original'], speedup['optimized_best_of']],
    "Number of FLOPs per transaction (ms)": [3104, 1627.6],
    "Precision": [mlp_precision, routed_precision],
    "Recall" : [mlp_recall, routed_recall]
}

benchmark_df = pd.DataFrame(benchmark_analysis)
s = benchmark_df.to_markdown()

# Put this above as summary!
s

benchmark_df

Credit Card Transaction Demo¶

Imports¶

Step 1: Audio initial model¶

Choose a threshold based on precision-recall curve on validation set.¶

Benchmark its latency and accuracy.¶

FLOPs (Baseline)¶

Accelerating the model with `moco`¶

Evaluation of the `RoutedModel`¶

FLOPs in the New Model¶

Real Time Latency Analysis¶

Latency Result¶

experiment	Latency per transaction, raced (ms)	Number of FLOPs per transaction (ms)	Precision	Recall
baseline	5.20875e-05	3104	0.630952	1
optimized	2.30249e-05	1627.6	0.630952	1

Credit Card Transaction Demo¶

Imports¶

Step 1: Audio initial model¶

Choose a threshold based on precision-recall curve on validation set.¶

Benchmark its latency and accuracy.¶

FLOPs (Baseline)¶

Accelerating the model with moco¶

Evaluation of the RoutedModel¶

FLOPs in the New Model¶

Real Time Latency Analysis¶

Latency Result¶

Accelerating the model with `moco`¶

Evaluation of the `RoutedModel`¶