Logistic Regression¶
Assume we have a binary classification problem. We aim to fit a hypothesis $h$ to a data set $S=\{(x_i,y_i) \mid i \in [m]\}$ that consists of $(x,y)$ pairs with $y \in \{0,1\}$.
As in the previous lecture, we choose the hypothesis to be a linear function of the input:
$\mathcal{H} := \{h: h(x) = w^\top x, w \in \mathbb{R}^k \}$.
For notational convenience, let us ignore the bias term as one can always append a constant one to the input vector $x$ to account for the bias.
The difference from the previous setting is that the output space is now discrete. Let us interpret the output of our hypothesis $h_i := w^\top x_i$ as follows:
- Its sign indicates the class label. If $h_i > 0$, then the hypothesis predicts that $x_i$ belongs to class $1$. If $h_i < 0$, then the hypothesis predicts that $x_i$ belongs to class $0$.
- Its magnitude $|h_i|$ indicates the confidence of the hypothesis about the class assignment.
When interpreted this way, the hypothesis $h_i$ is called a discriminant function. While readily usable in its current form, such a model is not easy to train: we desire a loss function that is differentiable with respect to the parameters $w$, and the sign function is not differentiable. We can achieve differentiability by converting the discriminant function to a probability. Let $p_i$ denote the probability that $x_i$ belongs to class $1$, which we let grow with the value of the discriminant function. That is:
$\log p_i \propto w^\top x_i$.
Considering also that the probability that $x_i$ is a member of class $0$ is $1-p_i$, we can model the logarithm of the ratio of the two class probabilities (the log odds) with our linear function:
$\log \dfrac{p_i}{1-p_i} = w^\top x_i$.
Let us solve for $p_i$ stepwise:
\begin{align*} &\dfrac{p_i}{1-p_i} = e^{w^\top x_i}\\ &\Rightarrow p_i = e^{w^\top x_i} - p_i e^{w^\top x_i}\\ &\Rightarrow p_i + p_i e^{w^\top x_i} = e^{w^\top x_i}\\ &\Rightarrow p_i (1 + e^{w^\top x_i}) = e^{w^\top x_i}\\ &\Rightarrow p_i = \dfrac{e^{w^\top x_i}}{1 + e^{w^\top x_i}}\\ &\Rightarrow p_i = \dfrac{e^{w^\top x_i} e^{-w^\top x_i}}{(1 + e^{w^\top x_i})e^{-w^\top x_i}}\\ &\Rightarrow p_i = \dfrac{1}{1 + e^{-w^\top x_i}}. \end{align*}
The result $\sigma(u) = \dfrac{1}{1 + e^{-u}}$ has the form of a function known as the sigmoid function. The expression $\log (p_i/(1-p_i))$ is sometimes called the log odds or the logit function. It is the inverse of the sigmoid function: $\sigma^{-1}(p) = \log (p/(1-p))$ for a probability $p$. With $u := w^\top x_i$, that is $p_i = \sigma(w^\top x_i)$, the resulting model is called logistic regression.
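As a quick numerical sanity check, the following minimal sketch (using NumPy; the helper names `sigmoid` and `logit` are ours, not from any library) verifies that the logit indeed inverts the sigmoid:

import numpy as np

def sigmoid(u):
    # sigma(u) = 1 / (1 + e^{-u})
    return 1.0 / (1.0 + np.exp(-u))

def logit(p):
    # log odds: sigma^{-1}(p) = log(p / (1 - p))
    return np.log(p / (1.0 - p))

u = np.linspace(-5, 5, 11)
p = sigmoid(u)                   # probabilities in (0, 1)
print(np.allclose(logit(p), u))  # True: the logit inverts the sigmoid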
We would like our hypothesis to assign a high probability to the true class of every data point in the data set. Since we assume the data points to be independent, the probability of the whole data set factorizes into a product of per-data-point probabilities. Hence, we can maximize the probability of the data set by maximizing
$\prod_{i=1}^m p_i^{y_i} (1-p_i)^{1-y_i}$.
Since the logarithm is monotonic, this is equivalent to maximizing the sum of the logarithms of these probabilities, or, equivalently, minimizing their negative sum. Hence, we can define the loss function (the negative log-likelihood, also known as the binary cross-entropy) as follows:
$\mathcal{L}_{01}(w) = -\sum_{i=1}^m \log \Big( \sigma(w^\top x_i)^{y_i} \, (1-\sigma(w^\top x_i))^{1-y_i} \Big) = -\sum_{i=1}^m \Big[ y_i \log \sigma(w^\top x_i) + (1-y_i) \log \big(1-\sigma(w^\top x_i)\big) \Big]$.
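This is, up to averaging over the data points instead of summing, exactly what PyTorch computes with `F.binary_cross_entropy_with_logits`. A minimal sketch with made-up numbers (the weight vector and inputs below are arbitrary, for illustration only):

import torch as th
import torch.nn.functional as F

w = th.tensor([0.5, -1.0])                             # made-up weight vector
X = th.tensor([[1.0, 2.0], [3.0, -1.0], [0.5, 0.5]])   # made-up inputs
y = th.tensor([1.0, 0.0, 1.0])                         # binary labels

u = X @ w                # discriminant values w^T x_i
p = th.sigmoid(u)        # p_i = sigma(w^T x_i)

# Negative log-likelihood written as in the formula above (averaged, not summed)
manual = -(y * th.log(p) + (1 - y) * th.log(1 - p)).mean()
builtin = F.binary_cross_entropy_with_logits(u, y)   # same quantity
print(manual.item(), builtin.item())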
Extension to multi-class classification¶
Let us quickly extend the above formulation to multi-class classification. Assume we have $C$ classes, that is, we aim to fit a hypothesis $h$ to a data set $S=\{(x_i,y_i) \mid i \in [m]\}$ that consists of $(x,y)$ pairs with $y \in \{0,1,\ldots,C-1\}$. We then need to model the class probabilities of the $C$ different classes, $p_1, p_2, \ldots, p_C$:
$\log p_c \propto w_c^\top x_i$.
Solving for $p_c$ and ensuring that the class probabilities sum up to one yields:
$p_c = \sigma(z)_c = \dfrac{e^{z_c}}{\sum_{j=1}^C e^{z_j}}, \quad \text{with } z_c := w_c^\top x_i$,
which is called the softmax function. The related loss function is then:
$\mathcal{L}_{CE}(W) = -\sum_{i=1}^m \log \dfrac{e^{w_{y_i}^\top x_i}}{\sum_{c=1}^C e^{w_c^\top x_i}} = \sum_{i=1}^m \Big \{ -w_{y_i}^\top x_i + \log \Big ( \sum_{c=1}^C e^{w_c^\top x_i} \Big ) \Big \},$
where $W = [w_1 \ldots w_C]$ is a matrix of the weight vectors for each class. This loss function is called the cross entropy loss. We will revisit this loss and understand better why it is given this particular name.
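To see the correspondence between this formula and the implementation we will use below, here is a minimal sketch with made-up numbers; `F.cross_entropy` applies the softmax internally and averages over the data points, whereas the formula above sums:

import torch as th
import torch.nn.functional as F

W = th.randn(4, 3)                # one weight vector per class (C = 3, 4 features)
X = th.randn(5, 4)                # five made-up data points
y = th.tensor([0, 2, 1, 1, 0])    # class labels in {0, 1, 2}

logits = X @ W                    # w_c^T x_i for every pair (i, c)
p = th.softmax(logits, dim=1)     # class probabilities per data point

# Cross entropy written as in the formula (averaged instead of summed)
manual = -th.log(p[th.arange(5), y]).mean()
builtin = F.cross_entropy(logits, y)   # identical up to floating point error
print(manual.item(), builtin.item())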
Let us take the well-known Iris data set as an example. Our task is to classify the iris flowers into three species. The data set is available in the sklearn library. The data set consists of 150 data points. Each data point has four features: sepal length, sepal width, petal length, and petal width. The data points are labeled as one of the three species: i) setosa, ii) versicolor, and iii) virginica. The data set is balanced. There are 50 data points for each species.
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt
import numpy as np
import torch as th
import torch.nn as nn
import torch.nn.functional as F
import torch.optim
X, y = load_iris(return_X_y=True)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.5)
Let us put together what we have learned thus far to build as general an algorithm as possible. Specifically, let us use the cross-entropy loss for empirical risk minimization and an $L_p$ regularizer with tunable $p$ to control the complexity of the model. The resulting optimization problem is:
$L(W) := \mathcal{L}_{CE}(W) + \lambda \sum_{c=1}^C \|w_c\|_p^p$,
where, as is common, we penalize the $p$-th power of the $L_p$ norm, which avoids the $p$-th root and keeps the gradient simple.
class GeneralizedLinearClassifier(nn.Module):
    def __init__(self, n_dims, lambda_coef=1, p=2, n_classes=3):
        super(GeneralizedLinearClassifier, self).__init__()
        self.lambda_coef = lambda_coef
        self.weight = nn.Parameter(th.randn((n_dims, n_classes)))
        self.bias = nn.Parameter(th.randn(n_classes))
        self.p = p

    def predict(self, input):
        # Linear discriminant: one score (logit) per class
        return input @ self.weight + self.bias

    def learn(self, inputs, labels, num_steps=1):
        optimizer = th.optim.SGD(self.parameters(), lr=0.001)
        for ii in range(num_steps):
            predictions = self.predict(inputs)
            # Cross-entropy loss plus the L_p penalty on the weights
            loss = F.cross_entropy(predictions, labels) \
                + (self.weight.abs()**self.p).sum()*self.lambda_coef
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()
Let us train our model next and plot its learning curve, i.e. how its error changes across iterations.
# Convert data into the Torch format
X_train = th.tensor(X_train).float()
X_test = th.tensor(X_test).float()
y_train = th.tensor(y_train).long()
y_test = th.tensor(y_test).long()
# z-score normalization
m = th.mean(X_train, axis=0)
std = th.std(X_train, axis=0)
X_train = (X_train-m)/std
X_test = (X_test-m)/std
# Train our model
model_glc = GeneralizedLinearClassifier(n_dims=X_train.shape[1],
lambda_coef=1, p=2)
# Number of gradient descent iterations
num_iterations = 1000
# Collect the train and test errors here.
train_errors = np.zeros(num_iterations)
test_errors = np.zeros(num_iterations)
for ii in range(num_iterations):
    model_glc.learn(X_train, y_train)
    predictions = model_glc.predict(X_train)
    pred_class = th.argmax(predictions, dim=1)
    train_errors[ii] = (pred_class != y_train.reshape(-1)).float().mean()
    # Test our model
    predictions = model_glc.predict(X_test)
    pred_class = th.argmax(predictions, dim=1)
    test_errors[ii] = (pred_class != y_test.reshape(-1)).float().mean()
# Plot the learning curve
plt.plot(np.arange(num_iterations),train_errors,'b-', label="Train Error")
plt.plot(np.arange(num_iterations),test_errors,'r-', label="Test Error")
plt.xlabel("Iteration")
plt.ylabel("Error")
plt.legend(loc="upper right")
plt.show()
Performance Metrics for Classification¶
The goal of classification is to recognize a pattern, e.g. an object. From the viewpoint of a single object type, there can be four different outcomes of a classification task:
- True Positive (TP): The object is correctly classified as the object type.
- False Positive (FP): The object is incorrectly classified as the object type.
- True Negative (TN): The object is correctly classified as not the object type.
- False Negative (FN): The object is incorrectly classified as not the object type.
Let us organize these possible outcomes in a table:

|                 | Predicted Positive | Predicted Negative |
|-----------------|--------------------|--------------------|
| Actual Positive | TP                 | FN                 |
| Actual Negative | FP                 | TN                 |
The version of this table where its entries are filled with the number of data points that fall into each category is called a confusion matrix. We can compute many performance metrics from the confusion matrix:
- Accuracy: (TP + TN) / (TP + FP + TN + FN), the ratio of the number of correctly classified objects to the total number of objects.
- Precision: TP / (TP + FP), the ratio of the number of correctly classified objects to the number of objects classified as the object type.
- Recall: TP / (TP + FN), the ratio of the number of correctly classified objects to the number of objects that are actually of the object type.
- F1 score: 2 $\times$ Precision $\times$ Recall / (Precision + Recall), the harmonic mean of the precision and the recall.
- False Positive Rate: FP / (FP + TN), the ratio of the number of objects that are not of the object type but classified as the object type to the total number of objects that are not of the object type.
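To make these definitions concrete, here is a minimal sketch that computes all five metrics from made-up counts (the numbers are arbitrary, chosen only for illustration):

# Made-up counts for a single class of interest
TP, FP, TN, FN = 40, 10, 45, 5

accuracy  = (TP + TN) / (TP + FP + TN + FN)
precision = TP / (TP + FP)
recall    = TP / (TP + FN)
f1        = 2 * precision * recall / (precision + recall)
fpr       = FP / (FP + TN)

print(f"Accuracy={accuracy:.2f}, Precision={precision:.2f}, "
      f"Recall={recall:.2f}, F1={f1:.2f}, FPR={fpr:.2f}")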
One can also calculate the confusion matrix for more than two classes. Let us see what it looks like for the Iris data set.
from sklearn.metrics import confusion_matrix, ConfusionMatrixDisplay
cm= confusion_matrix(y_test.detach().numpy(), pred_class.detach().numpy())
disp = ConfusionMatrixDisplay(confusion_matrix=cm,
display_labels=['setosa','versicolor','virginica'])
disp.plot()
plt.show()
Except for accuracy, the other four performance metrics need to be calculated separately for each class. For instance, let us calculate them for setosa.
precision_setosa = cm[0,0]/(cm[0,0]+cm[1,0]+cm[2,0]) # column sum: all points predicted as setosa
recall_setosa = cm[0,0]/(cm[0,0]+cm[0,1]+cm[0,2]) # row sum: all points that are actually setosa
print("Precision: ", precision_setosa)
print("Recall: ", recall_setosa)
print("F1: ", 2*precision_setosa*recall_setosa/(precision_setosa+recall_setosa))
Precision: 0.9
Recall: 1.0
F1: 0.9473684210526316
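sklearn can also produce these per-class metrics for us. As a cross-check, a short sketch assuming the same `y_test` and `pred_class` tensors as above:

from sklearn.metrics import classification_report

print(classification_report(y_test.detach().numpy(),
                            pred_class.detach().numpy(),
                            target_names=['setosa', 'versicolor', 'virginica']))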
Another important performance metric is the Receiver Operating Characteristic (ROC) curve. It is a plot of the true positive rate (TPR) against the false positive rate (FPR) for all possible thresholds applied to the discriminant function. The Area Under the ROC Curve (AUC) is a summary measure of the performance of the classifier: the higher the AUC, the better the classifier. A perfect classifier has an AUC of 1, while a classifier that performs no better than random guessing has an AUC of 0.5.
Let us plot the ROC curve for the versicolor class of the Iris data set. Since the ROC curve is defined for binary problems, we treat the task as versicolor versus the rest and use the model's discriminant value for versicolor as the score to be thresholded.
from sklearn.metrics import roc_curve, auc, RocCurveDisplay
# ROC needs a continuous score: use the discriminant value of the versicolor class
scores_versicolor = model_glc.predict(X_test)[:, 1].detach().numpy()
fpr, tpr, thresholds = roc_curve((y_test == 1).long().numpy(), scores_versicolor)
disp = RocCurveDisplay(fpr=fpr, tpr=tpr, roc_auc=auc(fpr, tpr),
                       estimator_name='versicolor vs. rest')
disp.plot()
plt.show()
REMARK: Accuracy is a meaningful performance metric only when the classes are evenly distributed. The cases when the classes are not evenly distributed are called imbalanced classification problems. In such cases, we need to use other metrics such as precision, recall, and F1 score.
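A minimal sketch of why this matters, with made-up labels: a classifier that always predicts the majority class reaches a high accuracy while never detecting the minority class.

import numpy as np

# Made-up imbalanced labels: 95 negatives, 5 positives
y_true = np.array([0] * 95 + [1] * 5)
y_pred = np.zeros_like(y_true)                  # always predict the majority class

accuracy = (y_pred == y_true).mean()            # 0.95, looks impressive
recall_pos = (y_pred[y_true == 1] == 1).mean()  # 0.0, every positive is missed
print(accuracy, recall_pos)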
K-Fold Cross Validation¶
As the above example suggests, the observed performance may depend greatly on the particular train-test split. To mitigate this problem, we can use K-fold cross validation. The idea is to split the data set into $K$ folds. Then, we train the model on $K-1$ folds and test it on the remaining fold. We repeat this process $K$ times, each time using a different fold as the test set. The final performance metric is the average of the performance metrics obtained in each iteration.
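A minimal sketch of 5-fold cross validation with our `GeneralizedLinearClassifier`, assuming the `X`, `y` arrays and the imports defined earlier in this notebook (the fold loop below is one possible way to wire this up, not code from the lecture):

from sklearn.model_selection import KFold

kf = KFold(n_splits=5, shuffle=True, random_state=0)
fold_errors = []
X_all = th.tensor(X).float()
y_all = th.tensor(y).long()
for train_idx, test_idx in kf.split(X):
    # z-score normalization computed on the training fold only
    m, std = X_all[train_idx].mean(dim=0), X_all[train_idx].std(dim=0)
    X_tr, X_te = (X_all[train_idx] - m) / std, (X_all[test_idx] - m) / std
    model = GeneralizedLinearClassifier(n_dims=X_all.shape[1], lambda_coef=1, p=2)
    model.learn(X_tr, y_all[train_idx], num_steps=1000)
    pred = th.argmax(model.predict(X_te), dim=1)
    fold_errors.append((pred != y_all[test_idx]).float().mean().item())
print("Mean test error over folds:", np.mean(fold_errors))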
K-Nearest Neighbors (kNN) Classifier¶
The k-nearest neighbors classifier assigns a query point to the class of the majority of its $k$ nearest neighbors. It is a non-parametric classifier, that is, it does not represent the model with a fixed number of parameters. Instead, it memorizes the whole training data set and uses it to make predictions. The number of neighbors $k$ is a hyperparameter of the model. While often a strong classifier, its prediction-time complexity can be prohibitive: $O(m)$ per query, where $m$ is the number of training data points.
One can implement a kNN classifier in various ways. Given a query point $x$, one can find its $k$ nearest neighbors $Ne(x;k) = \{ (x_i, y_i) : i \in [k] \}$ in the training data set (re-indexing the training points so that $x_1, \ldots, x_k$ are the $k$ closest to $x$) and assign $x$ to the class of the majority of these neighbors:
$\hat{y} = \arg \max_{c \in [C]} \sum_{i=1}^k \mathbb{1}(y_i = c)$.
One can also assign a weight to each neighbor inversely proportional to its distance to the query point and assign $x$ to the class with the largest total weight:
$\hat{y} = \arg \max_{c \in [C]} \sum_{i=1}^k \mathbb{1}(y_i = c) \dfrac{1}{d(x,x_i)}$
for some distance function $d$.
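A from-scratch sketch of both variants (the helper `knn_predict` and its arguments are our own, written with NumPy and the Euclidean distance as an assumed choice of $d$):

import numpy as np

def knn_predict(x, X_tr, y_tr, k=3, weighted=False, eps=1e-12):
    # Euclidean distances from the query point to every training point
    dists = np.linalg.norm(X_tr - x, axis=1)
    nn_idx = np.argsort(dists)[:k]        # indices of the k nearest neighbors
    votes = np.zeros(int(y_tr.max()) + 1)
    for i in nn_idx:
        # weight 1 for the plain majority vote, 1/d for the distance-weighted variant
        votes[y_tr[i]] += 1.0 / (dists[i] + eps) if weighted else 1.0
    return np.argmax(votes)

# Tiny made-up example with two classes
X_toy = np.array([[0.0, 0.0], [0.1, 0.2], [1.0, 1.0], [1.1, 0.9]])
y_toy = np.array([0, 0, 1, 1])
print(knn_predict(np.array([0.9, 1.0]), X_toy, y_toy, k=3, weighted=True))  # -> 1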
The Voronoi cell of a training point $x_i$ is the set of points whose nearest training point is $x_i$. The Voronoi cells of the training data points form a partition of the input space. The decision boundary of a 1-nearest neighbor classifier follows the Voronoi cell boundaries that separate training points of different classes, i.e. the points that are equidistant to two (or more) training points with different labels. For a k-nearest neighbor classifier, the decision boundary consists of the points where the majority vote among the $k$ nearest neighbors switches from one class to another. See an illustration from the Iris data set below.
import matplotlib.pyplot as plt
import seaborn as sns
from matplotlib.colors import ListedColormap
from sklearn import datasets, neighbors
from sklearn.inspection import DecisionBoundaryDisplay
n_neighbors = 1
iris = datasets.load_iris()
idx = np.random.permutation(iris.data.shape[0])
X = iris.data[idx[:10], :2]
y = iris.target[idx[:10]]
# Create color maps
cmap_light = ListedColormap(["orange", "cyan", "cornflowerblue"])
cmap_bold = ["darkorange", "c", "darkblue"]
for weights in ["uniform", "distance"]:
    # weights="uniform": all points in each neighborhood are weighted equally
    # weights="distance": weight points by the inverse of their distance
    clf = neighbors.KNeighborsClassifier(n_neighbors, weights=weights)
    clf.fit(X, y)

    _, ax = plt.subplots()
    DecisionBoundaryDisplay.from_estimator(
        clf,
        X,
        cmap=cmap_light,
        ax=ax,
        response_method="predict",
        plot_method="pcolormesh",
        xlabel=iris.feature_names[0],
        ylabel=iris.feature_names[1],
        shading="auto",
    )
    # Plot also the training points
    sns.scatterplot(
        x=X[:, 0],
        y=X[:, 1],
        hue=iris.target_names[y],
        palette=cmap_bold,
        alpha=1.0,
        edgecolor="black",
    )
    plt.title(
        "3-Class classification (k = %i, weights = '%s')" % (n_neighbors, weights)
    )
plt.show()