Demo of Logits and Embeddings from a Language Model¶
# If the import fails, uncomment the following line:
#!pip install transformers
import torch
from torch import tensor
import numpy as np
from transformers import AutoTokenizer, AutoModelForCausalLM
import pandas as pd
import matplotlib.pyplot as plt
# Avoid a warning message
import os; os.environ["TOKENIZERS_PARALLELISM"] = "false"
model_name = 'openai-community/gpt2'
tokenizer = AutoTokenizer.from_pretrained(model_name, add_prefix_space=True)
tokenizer.pad_token = tokenizer.eos_token
tokenizer.padding_side = 'left'
model = AutoModelForCausalLM.from_pretrained(model_name)
print(f"The tokenizer has {len(tokenizer.get_vocab())} strings in its vocabulary.")
print(f"The model has {model.num_parameters():,d} parameters.")
The tokenizer has 50257 strings in its vocabulary.
The model has 124,439,808 parameters.
Tokenization¶
phrase = "Alice is my aunt, so my mother is her"
input_ids = tokenizer(phrase, return_tensors='pt')['input_ids']; input_ids
tensor([[14862, 318, 616, 25949, 11, 523, 616, 2802, 318, 607]])
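To see which vocabulary string each id corresponds to, we can map them back with the tokenizer we already loaded (GPT-2's byte-level BPE marks a leading space with Ġ):
# Map each id back to its vocabulary string.
tokenizer.convert_ids_to_tokens(input_ids[0])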
Embeddings¶
The model includes two modules that are very important: one at the very beginning, one at the very end.
token_embedding_module = model.transformer.wte
token_embedding_module
Embedding(50257, 768)
lm_head_module = model.lm_head
lm_head_module
Linear(in_features=768, out_features=50257, bias=False)
lm_head_module.weight.shape
torch.Size([50257, 768])
Notice that the shapes are exactly symmetrical: token_embedding maps each token id to one of the ~50k token embeddings (each one 768-dimensional); lm_head maps a 768-dimensional embedding to a logit for each of the ~50k vocabulary entries.
It turns out that for this model, the token embeddings are identical on the input and output side. This is called "weight tying" and is now quite common as a way to save parameters. It is easy to see and implement in PyTorch because Linear layers already store their weight matrices transposed (out_features × in_features), which matches the Embedding table's shape exactly.
(token_embedding_module.weight.data == lm_head_module.weight.data).all()
tensor(True)
token_embedding_table = token_embedding_module.weight.data
Example of mapping¶
The last token id is:
last_token_id = input_ids[0, -1]
print(last_token_id,
      "which corresponds to",
      repr(tokenizer.decode(last_token_id)))
tensor(607) which corresponds to ' her'
It has vector:
with torch.no_grad():
    last_token_embedding = token_embedding_module(last_token_id)
last_token_embedding.shape
torch.Size([768])
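Under the hood, this lookup is just row indexing into the embedding table we saved above; a quick check (which should print True):
# The Embedding module simply selects the corresponding row of its weight matrix.
torch.equal(last_token_embedding, token_embedding_table[last_token_id])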
plt.figure(figsize=(10, .5))
plt.pcolormesh(last_token_embedding[None, :])
plt.axis('off');
(The specific numbers in there are illegible at this scale, so we hide the axes.)
Passing a vector through a linear layer with no bias (note bias=False above) is equivalent to taking its dot product with every row of the layer's weight matrix, so here we get the dot product of our vector with every token embedding.
with torch.no_grad():
    last_token_dot_products = lm_head_module(last_token_embedding)
last_token_dot_products.shape
torch.Size([50257])
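As a sanity check, the same numbers come out of an explicit matrix-vector product with the (tied) embedding table; this should print True:
# lm_head has no bias, so its output is exactly W @ x, with W the tied embedding table.
torch.allclose(token_embedding_table @ last_token_embedding, last_token_dot_products)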
print([tokenizer.decode(x) for x in last_token_dot_products.topk(k=10).indices])
[' her', ' hers', ' herself', 'Her', ' she', 'She', 'she', ' HER', ' Her', ' She']
Astute observers will notice that some of the vocabulary is spent on minor variants of the same word (capitalization and leading spaces). More recent work has improved on this slightly by letting these related tokens share information, but it doesn't make a big difference.
If we do this for all of the input tokens at once, we get the most similar tokens to each input token. That will almost always be the token itself, but note that the token embeddings are not explicitly normalized, so the dot product with a different token's embedding can occasionally come out largest simply because that embedding has a larger norm.
logits = lm_head_module(token_embedding_module(input_ids))
for y in logits.topk(k=10, dim=-1).indices[0]:
    print([tokenizer.decode(x).replace(' ', '_') for x in y])
['_Alice', 'Alice', '_Wonderland', '_Ellen', '田', '_Eleanor', '_Sakuya', '_Louise', '_Ellie', '_Alic']
['_is', '_has', '_was', '_does', '_are', '_will', "'s", '_isn', '_can', '_may']
['_my', 'My', '_myself', 'my', '_MY', '_My', '_me', '_our', '_mine', '_I']
['_aunt', '_Aunt', '_niece', '_grandmother', '_uncle', '_grandma', 'uncle', '_granddaughter', '_nephew', '_grandparents']
[',', '.', '-', "'s", ':', '/', ';', ')', '"', '?']
['_so', 'so', '_So', 'So', '_SO', '_thus', '_mathemat', '_such', '_too', '_rul']
['_my', 'My', '_myself', 'my', '_MY', '_My', '_me', '_our', '_mine', '_I']
['_mother', 'Mother', 'mother', '_mothers', '_mom', '_father', '_grandmother', '_moms', '_Mother', '_maternal']
['_is', '_has', '_was', '_does', '_are', '_will', "'s", '_isn', '_can', '_may']
['_her', '_hers', '_herself', 'Her', '_she', 'She', 'she', '_HER', '_Her', '_She']
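If we wanted to control for those magnitude differences, one option (a sketch, not part of the original pipeline) is to rank by cosine similarity instead of raw dot product:
import torch.nn.functional as F

# Normalize both sides so that only the angle between vectors matters, not their norms.
with torch.no_grad():
    input_embeddings = token_embedding_module(input_ids)[0]  # (seq_len, 768)
cosine_sims = F.normalize(input_embeddings, dim=-1) @ F.normalize(token_embedding_table, dim=-1).T
for y in cosine_sims.topk(k=10, dim=-1).indices:
    print([tokenizer.decode(x).replace(' ', '_') for x in y])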
Vector Analogies¶
# get the vectors for the tokens "he", "she", and "his"
@torch.no_grad()
def get_vector(token):
    token_id = tokenizer.encode(token)
    return token_embedding_table[token_id[0]]
he = get_vector("he")
she = get_vector("she")
his = get_vector("his")
he.shape, she.shape, his.shape
(torch.Size([768]), torch.Size([768]), torch.Size([768]))
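Note that because the tokenizer was loaded with add_prefix_space=True, encode("he") should return the id of the space-prefixed token ' he'; we can check which vocabulary strings get_vector actually looked up:
# Show the token strings the words above were mapped to.
[tokenizer.convert_ids_to_tokens(tokenizer.encode(w)) for w in ["he", "she", "his"]]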
direction = she - he
query_vector = his + direction
query_vector.shape
torch.Size([768])
# find the token with the highest dot product with the query vector
dot_products = token_embedding_table @ query_vector
closest_token = dot_products.argmax()
tokenizer.decode([closest_token])
' her'
small = get_vector("small")
big = get_vector("big")
biggest = get_vector("biggest")
tokenizer.decode([
(token_embedding_table @ (small + (biggest - big))).argmax(),
])
' smallest'
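The same pattern can be wrapped in a small helper (a sketch reusing only objects defined above), which should reproduce the ' her' and ' smallest' results:
def analogy(a, b, c):
    """Nearest token (by dot product) to the embedding of c, shifted by the (a -> b) direction."""
    query = get_vector(c) + (get_vector(b) - get_vector(a))
    return tokenizer.decode([(token_embedding_table @ query).argmax()])

analogy("he", "she", "his"), analogy("big", "biggest", "small")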
vecs = torch.stack([small, big, biggest, she, he, his, query_vector])
embedding_dim_order = np.argsort(vecs.std(axis=0))
plt.figure(figsize=(10, 5))
plt.pcolormesh(vecs[:, embedding_dim_order])
plt.yticks(np.arange(len(vecs)) + .5, ["small", "big", "biggest", "she", "he", "his", "query_vector"]);
What the model does¶
(The "Logit Lens")
When the model processes its input, it first looks up the embedding for each input token to produce its initial "hidden states". It then applies each layer of the model in turn (here, a self-attention "mixing" sublayer followed by a position-wise, one-token-at-a-time feed-forward "mapping" sublayer), producing incrementally more refined hidden states that approach the context vector used to predict the next token.
with torch.no_grad():
    model_output = model(input_ids, output_hidden_states=True, output_attentions=True)
hidden_states = model_output.hidden_states
len(hidden_states) # this is model.config.n_layer + 1, to include the input embeddings.
13
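In current versions of transformers, the final entry of hidden_states is recorded after the model's final layer norm, so projecting it through lm_head should reproduce the logits the model itself returns (a quick check):
# The last hidden state already includes the final layer norm (ln_f),
# so lm_head on top of it gives the model's actual next-token logits.
with torch.no_grad():
    print(torch.allclose(lm_head_module(hidden_states[-1]), model_output.logits))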
layer = 0
if layer < 0: layer += len(hidden_states)
logits = lm_head_module(hidden_states[layer])
for seq_idx, y in enumerate(logits.topk(k=10).indices[0]):
    token_in_input = tokenizer.decode(input_ids[0, seq_idx])
    print(f"Most similar to hidden state before layer {layer} at token {seq_idx} ({token_in_input}):")
    print([tokenizer.decode(x) for x in y])
    print()
Most similar to hidden state before layer 0 at token 0 ( Alice): [' Alice', 'Alice', '���', 'ּ', 'ignty', 'wcsstore', '▬', '��', '田', 'bil']
Most similar to hidden state before layer 0 at token 1 ( is): [' is', ' has', ' was', ' will', "'s", ' can', ' does', ' isn', ' may', ' are']
Most similar to hidden state before layer 0 at token 2 ( my): [' my', 'my', ' myself', 'My', ' My', ' MY', ' me', ' our', ' mine', ' mathemat']
Most similar to hidden state before layer 0 at token 3 ( aunt): [' aunt', ' niece', ' Aunt', ' grandmother', ' uncle', 'uncle', ' cousin', ' grandma', 'unts', ' grandparents']
Most similar to hidden state before layer 0 at token 4 (,): [',', '.', '-', ':', "'s", '/', ';', '"', ')', ' and']
Most similar to hidden state before layer 0 at token 5 ( so): [' so', 'so', 'So', ' So', ' mathemat', ' thus', 'theless', ' arrang', ' destro', ' SO']
Most similar to hidden state before layer 0 at token 6 ( my): [' my', 'my', ' myself', 'My', ' MY', ' My', ' me', ' mathemat', ' our', ' mine']
Most similar to hidden state before layer 0 at token 7 ( mother): [' mother', 'mother', 'Mother', ' mothers', ' mom', ' father', ' grandmother', ' moms', ' maternal', ' Mothers']
Most similar to hidden state before layer 0 at token 8 ( is): [' is', ' has', ' was', ' does', ' will', ' can', ' are', ' isn', "'s", ' may']
Most similar to hidden state before layer 0 at token 9 ( her): [' her', ' herself', ' hers', 'Her', ' she', 'She', ' Her', ' She', ' HER', 'she']
Astute readers will notice that the most similar tokens to the input embeddings (the first hidden state) aren't exactly the same as the most similar tokens to the token embeddings. That's because the Transformer model constructs its input embeddings by adding the token embeddings and position embeddings. The position embeddings enable the model to distinguish between different positions in the input sequence.
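We can verify that directly; a minimal check (assuming the model is in eval mode, which from_pretrained gives us by default, so dropout is inactive), which should print True:
with torch.no_grad():
    position_ids = torch.arange(input_ids.shape[1])
    # wpe is GPT-2's learned position-embedding table.
    expected_input_state = token_embedding_module(input_ids) + model.transformer.wpe(position_ids)
print(torch.allclose(expected_input_state, hidden_states[0]))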
Note: the predictions at the earliest positions aren't great because the LM has very little context to work with; as it gets more context, the predictions get better.
layer = 1
plt.pcolormesh(model_output.attentions[layer][0].mean(dim=0).cpu().numpy())
plt.title(f"Decoder Self-Attention Weights for layer {layer} (avg over all {model.config.num_attention_heads} heads)")
plt.xticks(torch.arange(len(input_ids[0]))+.5, tokenizer.convert_ids_to_tokens(input_ids[0]))
plt.yticks(torch.arange(len(input_ids[0]))+.5, tokenizer.convert_ids_to_tokens(input_ids[0]))
plt.colorbar();
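Two properties are worth checking in this plot (a quick sanity check using the attentions we already computed): each row should be a probability distribution over positions, and the causal mask should zero out everything above the diagonal, since a token cannot attend to later tokens.
attn = model_output.attentions[layer][0]  # (n_heads, seq_len, seq_len)
row_sums = attn.sum(dim=-1)
print(torch.allclose(row_sums, torch.ones_like(row_sums)))           # each row sums to 1
print(torch.allclose(attn.triu(diagonal=1), torch.zeros_like(attn)))  # no attention to future tokens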