import numpy as np
np.set_printoptions(precision=3)
import ipywidgets as widgets
import matplotlib.pyplot as plt
import pandas as pd
%matplotlib inline

# Which dataset to fit: 'toy' (nearly linear), 'toy2' (same inputs, but the
# last target is 25 instead of ~3.5), or 'temps' (downloaded from NASA GISS).
DATASET = 'toy'

# Use a single if/elif/else chain so exactly one branch runs and an
# unrecognized name fails loudly instead of leaving `x` / `y_true` undefined
# (or, in a notebook, silently reusing values from an earlier run).
if DATASET == 'toy':
    x = np.array([0, 1, 2, 3])
    y_true = np.array([-1.01, .56, 2.02, 3.51])
elif DATASET == 'toy2':
    x = np.array([0, 1, 2, 3])
    y_true = np.array([-1, .5, 2.0, 25])
elif DATASET == "temps":
    data = pd.read_csv("https://data.giss.nasa.gov/gistemp/graphs_v4/graph_data/Global_Mean_Estimates_based_on_Land_and_Ocean_Data/graph.csv", skiprows=1)
    # First column is the input (presumably the year -- confirm against the CSV header).
    x = data.iloc[:, 0].values.astype(np.float32)
    # Scale x to a reasonable range: offset by 1880, then divide by 100.
    x -= 1880.0
    x /= 100.
    # Second column is the target value.
    y_true = data.iloc[:, 1].values.astype(np.float32)
else:
    raise ValueError(
        f"Unknown DATASET {DATASET!r}; expected 'toy', 'toy2', or 'temps'."
    )

# Visualize the raw data: individual points for small datasets (fewer than
# 50 items), a connected line otherwise.
(plt.scatter if len(x) < 50 else plt.plot)(x, y_true)

# Report the array shapes as a sanity check.
print("x.shape", x.shape)
print("y_true.shape", y_true.shape)

x.shape (4,)
y_true.shape (4,)

# Seed the RNG so the randomly initialized parameters are reproducible.
np.random.seed(0)
params = np.random.randn(2)

x_i = x[0] # pick an example data point
weight = params[0]
bias = params[1]

# Linear model for a single input: scale by the weight, then shift by the bias.
y_pred_i = weight * x_i + bias
print("predicted value:", y_pred_i)

predicted value: 0.4001572083672233

def linreg_forward(params, x):
    """Compute linear-regression predictions ``weight * x + bias``.

    Args:
        params: Indexable pair; ``params[0]`` is the weight (slope) and
            ``params[1]`` is the bias (intercept).
        x: Input value(s). A NumPy array yields one prediction per element
            via broadcasting; a scalar yields a single prediction.

    Returns:
        The prediction(s), with the same shape as ``x``.
    """
    weight = params[0]
    bias = params[1]
    return weight * x + bias

# Run the forward pass over the whole input array to get predictions for
# all data points at once.
y_pred = linreg_forward(params=params, x=x)
print("predicted values:", y_pred)

predicted values: [0.4   2.164 3.928 5.692]

def plot_predictions(x, y_true, y_pred):
    """Overlay predictions on the data using the current matplotlib figure.

    ``y_true`` is drawn against ``x`` as scatter points labeled "true";
    ``y_pred`` is drawn against ``x`` as a line labeled "predicted".
    """
    plt.scatter(x, y_true, label="true")
    plt.plot(x, y_pred, label="predicted")
    plt.xlabel("x value")
    plt.legend()


# Show how the current predictions compare with the data.
plot_predictions(x, y_true, y_pred)

def compute_mse_loss(y_true, y_pred):
    """Return the mean squared error between targets and predictions.

    Args:
        y_true: Target values (array-like).
        y_pred: Predicted values (array-like), broadcastable against
            ``y_true``.

    Returns:
        The mean of the squared residuals ``(y_pred - y_true) ** 2``.
    """
    residuals = np.asarray(y_pred) - np.asarray(y_true)
    return np.mean(residuals ** 2)

def compute_mae_loss(y_true, y_pred):
    """Return the mean absolute error between targets and predictions.

    Args:
        y_true: Target values (array-like).
        y_pred: Predicted values (array-like), broadcastable against
            ``y_true``.

    Returns:
        The mean of the absolute residuals ``|y_pred - y_true|``.
    """
    residuals = np.asarray(y_pred) - np.asarray(y_true)
    return np.mean(np.abs(residuals))

# Evaluate both loss functions on the current predictions.
mse_loss = compute_mse_loss(y_true, y_pred)
print("MSE loss:", mse_loss)

mae_loss = compute_mae_loss(y_true, y_pred)
print("MAE loss:", mae_loss)

MSE loss: 3.241497649037405
MAE loss: 1.7762357273187195

def loss_given_params(params, x, y_true):
    """Return the MSE loss of the linear model with ``params`` on the data.

    The parameters come first in the signature so the function can be used
    directly as an objective whose first argument is the vector being
    optimized.

    Args:
        params: Indexable pair ``(weight, bias)``.
        x: Input values.
        y_true: Target values corresponding to ``x``.

    Returns:
        The mean squared error between ``linreg_forward(params, x)`` and
        ``y_true``.
    """
    y_pred = linreg_forward(params, x)
    return compute_mse_loss(y_true, y_pred)

# Loss at the initial (random) parameters.
loss = loss_given_params(params, x, y_true)
print("loss:", loss)

loss: 3.241497649037405

from scipy.optimize import minimize

# Ask SciPy to search for the parameters that minimize the loss, starting
# from the initial guess `params`; `x` and `y_true` are forwarded to the
# objective as extra positional arguments.
optimization_result = minimize(fun=loss_given_params, x0=params, args=(x, y_true))
fitted_params = optimization_result.x
print("fitted params:", fitted_params)

fitted params: [ 1.502 -0.983]

# Visualize the fitted model against the data.
plot_predictions(x, y_true, linreg_forward(fitted_params, x))

# Recompute predictions with the fitted parameters and report both losses.
y_pred = linreg_forward(fitted_params, x)
print("MSE loss:", compute_mse_loss(y_true, y_pred))
print("MAE loss:", compute_mae_loss(y_true, y_pred))

MSE loss: 0.0006450000093661442
MAE loss: 0.020500116851778938

Linear Regression the Hard Way

Objectives

Setup

Task

Step 0: Initialize the model

Step 1: Single prediction

Step 2: Prediction for all inputs

Visualizing the predictions

Step 3: Compute loss

Step 4: Compute loss given parameters

Check in

Guided Extension