Softmax, part 1¶

Task: practice using the softmax function.

Why: The softmax is a building block used throughout machine learning, statistics, data modeling, and even statistical physics. This activity is designed to help you get comfortable with how it works, at both a high level and a low level.

Note: Although "softmax" is the conventional name in machine learning, you may also see it called "soft arg max". The Wikipedia article has a good explanation.
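
For reference, the standard definition (and the one torch.softmax computes) is

$$\operatorname{softmax}(x)_i = \frac{e^{x_i}}{\sum_j e^{x_j}},$$

so every output is positive and the outputs always sum to 1.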

Setup¶

In [1]:
import torch
from torch import tensor
import ipywidgets as widgets
import matplotlib.pyplot as plt
%matplotlib inline

Task¶

The following function defines softmax by using PyTorch built-in functionality.

In [2]:
def softmax_torch(x):
    '''Compute the softmax along the last dimension, using PyTorch'''
    # dim=-1 means the last dimension (the last axis).
    # This won't matter in this exercise, but it will matter when we get to batches of data.
    return torch.softmax(x, dim=-1)
  1. Start by playing with the interactive widget below. Describe the outputs when:

    1. All of the inputs are the same value. (Does it matter what the value is?)
    2. One input is much bigger than the others.
    3. One input is much smaller than the others.

Finally, describe the input that gives the largest possible value for output 1.

Note: if you run the cell and no interactive widget appears, try this notebook in Colab.

In [4]:
r = 2.0 # specify the range of the sliders
@widgets.interact(x0=(-r, r), x1=(-r, r), x2=(-r, r))
def show_softmax(x0, x1, x2):
    x = tensor([x0, x1, x2])
    xs = softmax_torch(x)
    plt.barh([2, 1, 0], xs)
    plt.xlim(0, 1)
    plt.yticks([2, 1, 0], ['output 0', 'output 1', 'output 2'])
    plt.xlabel("softmax(x)")
    return xs

Let's try the PyTorch softmax on an example tensor.

In [ ]:
x = tensor([1., 2., 3.])
softmax_torch(x)
tensor([0.0900, 0.2447, 0.6652])
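
Quick sanity check: whatever the input, the softmax outputs are all positive and sum to 1 (up to floating-point rounding). For example:

In [ ]:
probs = softmax_torch(x)
print(probs.sum())        # should be (approximately) 1
print((probs > 0).all())  # should be True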
  2. Fill in the following function to implement softmax yourself:
In [5]:
def softmax(xx):
    # Exponentiate xx so all numbers are positive.
    expos = xx.exp()
    assert expos.min() >= 0
    # Normalize (divide by the sum).
    return ...
  3. Evaluate softmax(x) and verify (visually) that it is close to the softmax_torch(x) you evaluated above.
In [6]:
softmax(x)
Out[6]:
tensor([0.0900, 0.2447, 0.6652])
  4. Evaluate each of the following expressions (to make sure you understand what the output is), then evaluate softmax_torch(__) for each of them. Observe how each output relates to softmax_torch(x). (Is it the same? Is it different? Why?) One way to set up the comparison is sketched just below the list.
  • x + 1
  • x - 100
  • x - x.max()
  • x * 0.5
  • x * 3.0
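
If a starting point helps, here is one possible way to organize that comparison (just a sketch; the observations are still yours to make):

In [ ]:
# A sketch: apply softmax_torch to each transformed input and compare with softmax_torch(x).
for name, xt in [('x + 1', x + 1),
                 ('x - 100', x - 100),
                 ('x - x.max()', x - x.max()),
                 ('x * 0.5', x * 0.5),
                 ('x * 3.0', x * 3.0)]:
    print(name, softmax_torch(xt))
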
In [ ]:
 

Analysis¶

Consider the following situation:

In [7]:
y2 = tensor([1., 0.,])
y3 = y2 - 1
y3
Out[7]:
tensor([ 0., -1.])
In [8]:
y4 = y2 * 2
y4
Out[8]:
tensor([2., 0.])
  1. Are softmax(y2) and softmax(y3) the same or different? How could you tell without having to evaluate them?

your answer here

  2. Are softmax(y2) and softmax(y4) the same or different? How could you tell without having to evaluate them?

your answer here

Optional Extension: Numerical Issues¶

Task for Numerical Issues¶

  1. Numerical issues. Assign x2 = 50 * x. Try softmax(x2) and observe that the result includes the dreaded nan -- "not a number". Something went wrong. Evaluate the first mathematical operation in softmax for this particularly problematic input. You should see another kind of abnormal value.
In [9]:
x2 = 50 * x
softmax(x2)
Out[9]:
tensor([0., nan, nan])
In [10]:
# your code here (the first mathematical operation in `softmax`)
Out[10]:
tensor([5.1847e+21,        inf,        inf])
  2. Fixing numerical issues. Now try softmax(x2 - 150.0). Observe that you now get valid numbers. Also observe how the constant we subtracted relates to the values in x2.
In [11]:
# your code here
Out[11]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
  3. Copy your softmax implementation to a new function, softmax_stable, and change it so that it subtracts xx.max() from xx before exponentiating. (Don't use any in-place operations; just use xx - xx.max().) Verify that softmax_stable(x2) now works and gives the same result as softmax_torch(x2). A reference sketch appears after the verification cell below, if you want to check your version.
In [12]:
# your code here
Out[12]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
In [13]:
softmax_torch(x2)
Out[13]:
tensor([3.7835e-44, 1.9287e-22, 1.0000e+00])
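
For reference, here is one possible softmax_stable along the lines described above; treat it as a sketch to compare against your own version rather than the only way to write it.

In [ ]:
def softmax_stable(xx):
    # Subtract the max (no in-place operations) so the largest value fed to exp() is 0.
    # This avoids overflow, and (as explored above) subtracting a constant doesn't change the softmax.
    expos = (xx - xx.max()).exp()
    # Normalize (divide by the sum).
    return expos / expos.sum()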

Analysis of Numerical Issues¶

  1. Explain why softmax(x2) failed.

your answer here

  2. Use your observations in #1-2 above to explain why softmax_stable still gives the correct answer for x even though we changed the input.

your answer here

  3. Explain why softmax_stable no longer gives infinity or NaN for x2.

your answer here

Optional Extension¶

Try to prove your observation in Analysis #1 by symbolically simplifying the expression softmax(logits + c) and seeing if you can get back softmax(logits). Remember that softmax(x) = exp(x) / exp(x).sum() and that exp(a + b) = exp(a) * exp(b).
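
One possible route, if you want to check your algebra afterwards (writing $x$ for the logits and $c$ for the constant):

$$\operatorname{softmax}(x + c)_i = \frac{e^{x_i + c}}{\sum_j e^{x_j + c}} = \frac{e^{c}\, e^{x_i}}{e^{c} \sum_j e^{x_j}} = \frac{e^{x_i}}{\sum_j e^{x_j}} = \operatorname{softmax}(x)_i$$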