What is machine learning?
Definition: "A computer program is said to learn from experience E with respect to some class of tasks T and performance measure P, if its performance at tasks in T, as measured by P, improves with experience E." [Mitchell, 1997]
Purpose: Designing algorithms to solve T with maximum P and minimum:
- time complexity (same as in any application)
- space complexity (same as in any application)
- sample complexity (new!)
Formal definitions
Experience (E)
Our computer program observes the environment by means of a data set, a set of tuples called data points:
$S := \{ (x_1, y_1), \ldots, (x_m, y_m) \}$.
Each tuple comprises an input observation $x_i \in X$, also called a feature vector, and a corresponding output observation $y_i \in Y$.
The set $X$ is called the feature space and the set $Y$ a label space. In some contexts, $S$ is called a sample.
We assume that there exists a labeling function $f: X \rightarrow Y$ such that $y_i = f(x_i)$, which is unknown to us.
We further assume that the observations in the data set are independent and identically distributed (i.i.d.) samples from an unknown data distribution $D$. An i.i.d. data set is denoted as $S:=\{(x_i, y_i) \sim^{i.i.d.} D\}$.
Imagine playing backgammon. Each roll of the dice is a sample. The rolls are independent samples if consecutive rolls do not influence each other. They are identically distributed if we use the same dice throughout the game. The i.i.d. assumption is at the heart of machine learning: the same process needs to be repeated for an agent to be able to learn it, just as it is for us humans.
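As a minimal sketch of this setup (the labeling function and the input distribution below are assumptions made only for illustration), an i.i.d. data set can be simulated as follows:
import numpy as np

def f(x):
    # An assumed labeling function; in a real problem this is unknown to us.
    return np.sign(x)

m = 10                          # number of data points
x = np.random.randn(m)          # x_1, ..., x_m drawn i.i.d. from a data distribution D
y = f(x)                        # y_i = f(x_i)
S = list(zip(x, y))             # the sample S = {(x_1, y_1), ..., (x_m, y_m)}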
Task (T)
Our task is to predict the outputs $y_i$ from the input observations $x_i$ as accurately as possible. In mathematical terms, we look for a hypothesis $h: X \rightarrow Y$ that approximates the unknown labeling function, i.e. one that satisfies $f(x) \approx h(x), \forall x \in X$.
- If $Y$ is a set with discrete elements, then our task is called classification, because it boils down to assigning an input $x_i$ to an appropriate class. Imagine $x_i$ is a picture expressed as an array of pixel intensity values; $y_i$ is then the type of the object in the foreground.
- If $Y$ is a continuous set such as $\mathbb{R}$, then our task is called regression. Imagine $x_i$ contains the properties of a house (size, age, coordinates); $y_i$ can then be its price.
Performance Measure (P)
We define what we mean by an accurate prediction via a loss (risk) function $\ell: Y \times Y \rightarrow \mathbb{R}^+$. Common-sense design choices for supervised learning problems are the following (both are sketched in code right after this list):
- the zero-one loss, defined as $\ell(y,y') := \mathbb{I}(y \neq y')$, for classification, and
- the squared error, defined as $\ell(y,y') := (y-y')^2$, for regression.
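As a sketch, the two losses can be written directly in code (the function names are ours, chosen for illustration):
def zero_one_loss(y, y_prediction):
    # 1 if the prediction disagrees with the true label, 0 otherwise.
    return float(y != y_prediction)

def squared_error(y, y_prediction):
    # Squared distance between the true label and the prediction.
    return (y - y_prediction) ** 2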
Put together, we are interested in a learning algorithm $A(\cdot)$ that takes a data set $S$ as input and returns a hypothesis. Let us denote this hypothesis as $h_S$, where the subscript $S$ highlights its dependence on the data set. Then we can express the learning process as $h_S = A(S)$. We expect this algorithm to minimize the generalization error (true risk), which is defined for the zero-one loss as:
$L_{(D,f)}(h) := \mathbb{P}_{x \sim D}[f(x) \neq h(x)]$.
In words, this is the probability that our hypothesis will make a different prediction than the true labeling function.
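We can never compute this probability in practice, but in a simulation where $D$ and $f$ are known it can be approximated by sampling. A minimal sketch (the distribution, labeling function, and hypothesis below are all illustrative assumptions):
import numpy as np

def f(x):
    return np.sign(x)          # assumed labeling function (unknown in practice)

def h(x):
    return np.sign(x - 0.1)    # an assumed hypothesis to evaluate

# Draw a large fresh sample from D and count how often h disagrees with f.
x = np.random.randn(100_000)
print(np.mean(f(x) != h(x)))   # Monte Carlo estimate of the true risk L_(D,f)(h)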
The Empirical Risk Minimization (ERM) Paradigm
The goal of a learning algorithm $A$ is to find the hypothesis that minimizes the generalization error:
$h_* := \arg \min_h L_{(D,f)}(h)$.
We cannot solve this optimization problem because we do not know $D$ and $f$. We only have an idea about these unknowns via the data set $S$. Let us then use the data set to construct a quantity that approximates the generalization error:
$L_S(h) := \dfrac{|\{i \in [m] | h(x_i) \neq f(x_i)\}|}{m}$
where $[m] := \{1, \ldots, m\}$ and $|\cdot|$ counts the number of elements a set contains, e.g. $|\{1,2\}|=2$. The quantity $L_S(h)$ is called the training error or empirical risk. We can then find a suitable hypothesis by minimizing the empirical risk:
$h_S := \arg \min_h L_S(h)$.
This paradigm, called Empirical Risk Minimization (ERM), is at the center of machine learning. Yet, it has certain weaknesses. For instance, consider the following solution:
$h_S(x) := \begin{cases} y_i, & \text{if } \exists i \in [m]~~\text{s.t.}~~x_i = x\\ 0, & \text{otherwise} \end{cases}$
This solution attains zero $L_S$, because it simply memorizes the training labels and outputs $0$ everywhere else. It may look like the problem is solved, but this is actually where the problems start.
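To see the issue concretely, here is a sketch of that memorizing hypothesis on a toy sample (the helper names and the sample values are ours, chosen for illustration). It attains zero empirical risk by construction, yet it outputs $0$ for every unseen input, so there is no reason to expect a low true risk:
import numpy as np

def empirical_risk(h, S):
    # Fraction of data points in S on which the hypothesis errs (zero-one loss).
    return np.mean([h(x_i) != y_i for (x_i, y_i) in S])

def memorizer(S):
    # The ERM "solution" above: replay memorized labels, output 0 everywhere else.
    lookup = {x_i: y_i for (x_i, y_i) in S}
    return lambda x: lookup.get(x, 0)

S_toy = [(0.2, 1), (0.5, -1), (0.9, 1)]   # an assumed toy sample
h_S = memorizer(S_toy)
print(empirical_risk(h_S, S_toy))          # 0.0: perfect on the training sample
print(h_S(0.3))                            # 0 for any input it has not memorized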
Example: Polynomial curve fitting
We observe the data shown below: 50 input observations $x$ and their corresponding outputs $y$. We aim to find a function $y=f(x)$ that maps inputs to outputs.
import matplotlib.pyplot as plt
import numpy as np
import torch as th
import torch.nn as nn
# This is the true data generating process.
# We do not have access to this information in a typical machine learning problem
inputs = np.linspace(0, 1, 50)
outputs = np.sin(2*np.pi*inputs)
labels = outputs + np.random.randn(inputs.shape[0])*0.25
plt.plot(inputs,labels,'bo')
plt.xlabel("inputs (x)")
plt.ylabel("labels (y)")
plt.show()
Let us express our observations as a set of input-output tuples: $S = \{ (x_1, y_1), \cdots, (x_{50}, y_{50}) \}$. We would like to use them for two purposes:
- to learn the unknown function $f$,
- to evaluate the success of the learning process (i.e. how well we expect the learned hypothesis to predict future observations).
Let us then split our data into two equal partitions randomly, one per purpose: $S = S_{train} \cup S_{test}$.
$S_{train}$ is called the training set. Our learning algorithm will use it to find a hypothesis that minimizes the empirical risk.
$S_{test}$ is called the test set. We will use it to check how well the empirical risk represents the true risk. In formal terms, we aim to approximate $L_{(D,f)}(h_S)$.
num_samples = inputs.shape[0]
num_train_samples = num_samples // 2
# draw a random permutation of indices
idx = np.random.permutation(num_samples)
inputs_train = inputs[idx[:num_train_samples]]
labels_train = labels[idx[:num_train_samples]]
inputs_test = inputs[idx[num_train_samples:]]
labels_test = labels[idx[num_train_samples:]]
By visual inspection we find that the input and the output have a nonlinear, periodic relationship. Let us then choose a hypothesis space suitable for this approximation, for instance the $M$-th order polynomials:
$y(x) := \sum_{m=0}^M w_m x^m$.
If $M=0$, then our model learns to fit a constant: $y(x) = w_0$.
If $M=1$, then it fits a line: $y(x) = w_0 + w_1 x$.
If $M=2$, it fits a parabola: $y(x)=w_0 + w_1 x + w_2 x^2$, and so on.
class PolynomialModel:
    def __init__(self, num_polynomial_degrees=1, regularizer=0):
        self.M = num_polynomial_degrees
        self.regularization_factor = regularizer

    def extract_features(self, inputs):
        # Map each scalar input x to the feature vector (1, x, x^2, ..., x^M).
        input_features = np.zeros([inputs.shape[0], self.M + 1])
        for m in range(self.M + 1):
            input_features[:, m] = inputs ** m
        return input_features

    def learn(self, inputs, labels):
        # Fit the weights by regularized least squares.
        input_features = self.extract_features(inputs)
        XtX_inv = np.linalg.inv(input_features.T.dot(input_features)
                                + self.regularization_factor * np.eye(input_features.shape[1]))
        self.weights = XtX_inv.dot(input_features.T).dot(labels)

    def predict(self, inputs):
        # Evaluate the fitted polynomial on new inputs.
        input_features = self.extract_features(inputs)
        predictions = input_features.dot(self.weights)
        return predictions
The extract_features function converts each one-dimensional observation into an $(M+1)$-dimensional feature vector $(1, x, x^2, \ldots, x^M)$. This operation is called feature extraction.
The learn function takes a set of inputs and their corresponding labels in its arguments and fits the unknown model parameters $w_0, \cdots, w_M$ to data. We will cover later how exactly it does that.
The predict function takes only inputs in its arguments and predicts the corresponding labels, hence the name. The source code of the advanced machine learning models we will see later follows the same template.
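For instance, we can check what extract_features returns for a few inputs; the values below are chosen only to illustrate the shape of the feature matrix:
demo_model = PolynomialModel(num_polynomial_degrees=3)
demo_features = demo_model.extract_features(np.array([0.0, 0.5, 1.0]))
print(demo_features.shape)   # (3, 4): one row per input, one column per power x^0 ... x^3
print(demo_features)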
model = PolynomialModel(num_polynomial_degrees=3) # Create the model instance
# Training
model.learn(inputs_train, labels_train)
# Testing
predictions_test = model.predict(inputs_test)
root_mean_squared_error = np.sqrt(((labels_test - predictions_test) ** 2).mean())
print(root_mean_squared_error)
0.3107401395935377
Let us visualize all we have. In the plot below, the training set is shown as blue circles, the test set as green circles, and the test predictions as red circles. The black curve is the labeling function we are trying to find out. Note that we can only observe noisy evaluations of it, just as in real life. Data collection processes are affected by unintended factors, which we call noise.
plt.plot(inputs,outputs,'k-', label="True function")
plt.plot(inputs_train,labels_train,'bo', label="Training data")
plt.plot(inputs_test, labels_test,'go', label="Test data")
plt.plot(inputs_test,predictions_test,'ro', label="Test predictions")
plt.legend(loc="upper right")
plt.show()
The properties of the model that we have to choose before running the learning algorithm are called hyperparameters. For instance, the polynomial degree $M$ is a hyperparameter. Let us simply try all options from $M=0$ to $M=9$ and see how it affects the model behavior.
Since we have a regression problem, we follow common sense and choose the squared error loss function. We take the square root of its mean to bring it to the same scale as the label space:
$L_S := \sqrt{\dfrac{1}{m}\sum_{i \in [m]} (h(x_i) - y_i)^2}$.
This loss function is called the Root Mean Squared Error (RMSE).
# The performance score
def root_mean_squared_error(labels_true, predictions):
    return np.sqrt(((labels_true - predictions) ** 2).mean())
Mmax = 10
train_errors = np.zeros(Mmax)
test_errors = np.zeros(Mmax)
for M in range(Mmax):
    model = PolynomialModel(num_polynomial_degrees=M)  # Create the model instance
    # Training
    model.learn(inputs_train, labels_train)  # Fit parameters to data on the training split.
    predictions_train = model.predict(inputs_train)
    train_err = root_mean_squared_error(labels_train, predictions_train)
    # Testing
    predictions_test = model.predict(inputs_test)  # Make predictions on the test split.
    test_err = root_mean_squared_error(labels_test, predictions_test)  # Evaluate performance.
    train_errors[M] = train_err
    test_errors[M] = test_err
plt.plot(np.arange(Mmax),train_errors,"bo-", label="Training")
plt.plot(np.arange(Mmax),test_errors,"ro-", label="Test")
plt.xlabel("Polynomial degree")
plt.ylabel("Error")
plt.legend(loc="upper right")
plt.show()
Expected: As $M$ increases, the training error $L_{S_{train}}(h_S)$ monotonically decreases.
Surprise: However, the test error $L_{S_{test}}(h_S)$ decreases up to $M=7$, and then sharply increases.
What may have gone wrong? Let us dissect the failure cases.
model0 = PolynomialModel(num_polynomial_degrees=0)
model0.learn(inputs_train, labels_train)
pred_0 = model0.predict(inputs)
model1 = PolynomialModel(num_polynomial_degrees=1)
model1.learn(inputs_train, labels_train)
pred_1 = model1.predict(inputs)
model4 = PolynomialModel(num_polynomial_degrees=4)
model4.learn(inputs_train, labels_train)
pred_4 = model4.predict(inputs)
model9 = PolynomialModel(num_polynomial_degrees=9)
model9.learn(inputs_train, labels_train)
pred_9 = model9.predict(inputs)
fig, axs = plt.subplots(2, 2)
for ax in axs.flat:
    ax.plot(inputs, outputs, 'k-', label="True f")
    ax.plot(inputs_train, labels_train, 'ro', label="Tr data")
axs[0, 0].plot(inputs, pred_0, 'b-', label="M=0")
axs[0, 1].plot(inputs, pred_1, 'g-', label="M=1")
axs[1, 0].plot(inputs, pred_4, 'c-', label="M=4")
axs[1, 1].plot(inputs, pred_9, 'm-', label="M=9")
for ax in axs.flat:
    ax.legend(loc="upper right")
    ax.label_outer()
The model had poor performance because it could not express a periodic relationship with a constant ($M=0$) or a line ($M=1$). Poor model fit due to limited model capacity is called underfitting. An underfitted model performs poorly on both training and test data, i.e. it has high $L_{S_{train}}(h_S)$ and high $L_{S_{test}}(h_S)$.
What goes on for $M=9$ is interesting. A polynomial of such a high degree is flexible enough to make sharp turns. The model used this flexibility to fit even the left-most and right-most data points, but in doing so it failed to capture the overall trend and diverged from the true labeling function. A model is said to overfit when it fits the training data extremely well (i.e. low $L_{S_{train}}(h_S)$) but delivers poor performance on test data (i.e. high $L_{S_{test}}(h_S)$).
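We can quantify both behaviors with the helpers defined above; the exact numbers depend on the random noise and the random train/test split, so treat this only as a sketch:
for degree in [1, 9]:
    model = PolynomialModel(num_polynomial_degrees=degree)
    model.learn(inputs_train, labels_train)
    train_rmse = root_mean_squared_error(labels_train, model.predict(inputs_train))
    test_rmse = root_mean_squared_error(labels_test, model.predict(inputs_test))
    print(f"M={degree}: train RMSE = {train_rmse:.3f}, test RMSE = {test_rmse:.3f}")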
REMARK: Designing highly expressive models while keeping them immune to overfitting is one of the fundamental problems of machine learning.
To mitigate overfitting, we need to devise an algorithm that encourages minimum empirical risk while penalizing the increase of model capacity. One choice could be the following:
$h_S := \arg \min_h L_S(h) + \lambda \sum_{m=0}^{M} w_m^2$.
Here the term $\lambda \sum_{m=0}^{M} w_m^2$ is called a regularizer and $\lambda$ a regularization coefficient. Let us see what happens then.
for M in range(Mmax):
    model = PolynomialModel(num_polynomial_degrees=M, regularizer=0.01)  # Create the model instance
    # Training
    model.learn(inputs_train, labels_train)  # Fit parameters to data on the training split.
    predictions_train = model.predict(inputs_train)
    train_err = root_mean_squared_error(labels_train, predictions_train)
    # Testing
    predictions_test = model.predict(inputs_test)  # Make predictions on the test split.
    test_err = root_mean_squared_error(labels_test, predictions_test)  # Evaluate performance.
    train_errors[M] = train_err
    test_errors[M] = test_err
plt.plot(np.arange(Mmax),train_errors,"bo-", label="Training")
plt.plot(np.arange(Mmax),test_errors,"ro-", label="Test")
plt.xlabel("Polynomial degree")
plt.ylabel("Error")
plt.legend(loc="upper right")
plt.show()
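One way to see what the regularizer does is to compare the fitted weights with and without it; a brief sketch (the exact values depend on the random data):
unregularized = PolynomialModel(num_polynomial_degrees=9, regularizer=0)
unregularized.learn(inputs_train, labels_train)

regularized = PolynomialModel(num_polynomial_degrees=9, regularizer=0.01)
regularized.learn(inputs_train, labels_train)

# The penalty discourages large weights, which tames the sharp turns of the M=9 fit.
print("largest |w| without regularization:", np.abs(unregularized.weights).max())
print("largest |w| with regularization:   ", np.abs(regularized.weights).max())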