Softmax, part 1

Task: practice using the softmax function.

Why: The softmax is a building block used throughout machine learning, statistics, data modeling, and even statistical physics. This activity is designed to help you get comfortable with how it works at both a high and a low level.

Note: Although "softmax" is the conventional name in machine learning, you may also see it called "soft arg max". The Wikipedia article has a good explanation.
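For reference, the softmax of a vector $x$ exponentiates each entry and then divides by the sum of all the exponentials, so every output is positive and the outputs sum to 1:

$$\mathrm{softmax}(x)_i = \frac{e^{x_i}}{\sum_j e^{x_j}}$$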

Setup

In [ ]:
import torch
from torch import tensor
import ipywidgets as widgets
import matplotlib.pyplot as plt
%matplotlib inline

Task

The following function defines softmax using PyTorch's built-in functionality.

In [ ]:
def softmax_torch(x):
    '''Compute the softmax along the last axis, using PyTorch'''
    # dim=-1 means the last dimension (the last axis).
    # This won't matter in this exercise, but it will matter when we get to batches of data.
    return torch.softmax(x, dim=-1)
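As a quick, optional illustration of what "the last axis" means, here is a small sketch with a two-row batch; each row gets its own softmax and sums to 1.

In [ ]:
# Illustration: softmax applied along the last axis of a 2-row batch.
batch = tensor([[1., 2., 3.],
                [1., 1., 1.]])
probs = softmax_torch(batch)
probs, probs.sum(dim=-1)  # each row of probs sums to 1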

Let's try the PyTorch softmax on an example tensor.

In [ ]:
x = tensor([1., 2., 3.])
softmax_torch(x)
Out[ ]:
tensor([0.0900, 0.2447, 0.6652])
  1. Fill in the following function to implement softmax yourself:
In [ ]:
def softmax(xx):
    '''Compute the softmax along the last axis (your own implementation)'''
    # Exponentiate xx so all numbers are positive.
    expos = xx.exp()
    assert expos.min() >= 0
    # Normalize (divide by the sum).
    return ...
  2. Evaluate softmax(x) and verify (visually) that it is close to the softmax_torch(x) you evaluated above.
In [ ]:
softmax(x)
Out[ ]:
tensor([0.0900, 0.2447, 0.6652])
  3. Evaluate each of the following expressions (to make sure you understand what the input is), then evaluate softmax_torch(__) on each one. Observe how each output relates to softmax_torch(x). (Is it the same? Is it different? Why?)
  • x + 1
  • x - 100
  • x - x.max()
  • x * 0.5
  • x * 3.0
In [ ]:
x + 1
Out[ ]:
tensor([2., 3., 4.])
In [ ]:
softmax_torch(x + 1)
Out[ ]:
tensor([0.0900, 0.2447, 0.6652])

Same as or different from softmax_torch(x)? Why?

(repeat for the other expressions)
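If you'd rather not compare results by eye, one optional approach is torch.allclose, which checks whether two tensors match within floating-point tolerance. Here is a sketch of that comparison for the first expression:

In [ ]:
# Optional: compare two results programmatically instead of visually.
torch.allclose(softmax_torch(x + 1), softmax_torch(x))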

Analysis

  1. A valid probability distribution has no negative numbers and sums to 1. Is softmax(x) a valid probability distribution? Why or why not?

your answer here

Consider the following situation:

In [ ]:
y2 = tensor([1., 0.])
y3 = y2 - 1
y3
Out[ ]:
tensor([ 0., -1.])
In [ ]:
y4 = y2 * 2
y4
Out[ ]:
tensor([2., 0.])
  2. Are softmax(y2) and softmax(y3) the same or different? How could you tell without having to evaluate them?

your answer here

  3. Are softmax(y2) and softmax(y4) the same or different? How could you tell without having to evaluate them?

your answer here

Optional Extension: Numerical Issues

Task for Numerical Issues

  1. Numerical issues. Assign x2 = 50 * x. Try softmax(x2) and observe that the result includes the dreaded nan -- "not a number". Something went wrong. Evaluate the first mathematical operation in softmax for this particularly problematic input. You should see another kind of abnormal value.
In [ ]:
x2 = 50 * x
softmax(x2)
Out[ ]:
tensor([0., nan, nan])
In [ ]:
# your code here (the first mathematical operation in `softmax`)
Out[ ]:
tensor([5.1847e+21,        inf,        inf])
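If you'd like a hint about where that abnormal value comes from, one optional thing to check is the largest value a 32-bit float can represent:

In [ ]:
# Hint (optional): the largest finite float32 value. exp() of a large enough
# input exceeds this, so the result overflows to inf.
torch.finfo(torch.float32).max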
  2. Fixing numerical issues. Now try softmax(x2 - 150.0). Observe that you now get valid numbers. Also observe how the constant we subtracted relates to the values in x2.
In [ ]:
# your code here
Out[ ]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
  3. Copy your softmax implementation to a new function, softmax_stable, and change it so that it subtracts xx.max() from xx before exponentiating. (Don't use any in-place operations; just use xx - xx.max().) Verify that softmax_stable(x2) now works and gives the same result as softmax_torch(x2).
In [ ]:
# your code here
Out[ ]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
In [ ]:
softmax_torch(x2)
Out[ ]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
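If you get stuck, here is one way softmax_stable could look, assuming the same structure as the softmax function above (treat this as a sketch, not the only correct answer):

In [ ]:
def softmax_stable(xx):
    '''Softmax that subtracts the max before exponentiating (one possible sketch)'''
    # Subtracting the max doesn't change the result (see the Analysis questions),
    # but it keeps exp() from overflowing to inf.
    shifted = xx - xx.max()
    expos = shifted.exp()
    return expos / expos.sum()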

Analysis of Numerical Issues

  1. Explain why softmax(x2) failed.

your answer here

  2. Use your observations in #1-2 above to explain why softmax_stable still gives the correct answer for x even though we changed the input.

your answer here

  3. Explain why softmax_stable no longer gives us infinity or nan for x2.

your answer here

Extension (optional)

Try to prove your observation that adding a constant to the input doesn't change the result: symbolically simplify the expression softmax(logits + c) and see if you can get softmax(logits). Remember that softmax(x) = exp(x) / exp(x).sum() and exp(a + b) = exp(a)exp(b).
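If you want a nudge on where to start, expanding one component with the exp(a + b) rule gives

$$\mathrm{softmax}(\mathrm{logits} + c)_i = \frac{e^{\mathrm{logits}_i + c}}{\sum_j e^{\mathrm{logits}_j + c}} = \frac{e^{c}\, e^{\mathrm{logits}_i}}{\sum_j e^{c}\, e^{\mathrm{logits}_j}},$$

and from there look for a common factor that cancels.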