# !pip install torch transformers accelerate matplotlib

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
import numpy as np
import matplotlib.pyplot as plt

# Seed torch's global RNG so that sampled continuations can be reproduced.
torch.manual_seed(42)
device = 'cuda' if torch.cuda.is_available() else 'cpu'

# Load the tokenizer and the causal LM once; eval() switches the model to
# inference mode (e.g. dropout disabled).
MODEL = 'EleutherAI/pythia-1b'
tokenizer = AutoTokenizer.from_pretrained(MODEL)
model = AutoModelForCausalLM.from_pretrained(MODEL).to(device).eval()
print('parameters:', sum(p.numel() for p in model.parameters()) / 1e9, 'B')

PROMPT = 'The capital of Cameroon is'

# Decoding settings, one entry per strategy; presumably unpacked as keyword
# arguments into model.generate() by the exercises below.
#
# NOTE: transformers' GenerationConfig defaults to top_k=50, and generate()
# falls back to that default for any option not passed explicitly. Without an
# explicit 'top_k': 0 the temperature and nucleus strategies would silently be
# truncated to the 50 most likely tokens, making 'temp_1.0' identical to
# 'top_k_50'. Setting top_k to 0 disables top-k filtering so each entry
# isolates the one knob its name advertises.
STRATEGIES = {
    'greedy':    {'do_sample': False},
    'temp_0.5':  {'do_sample': True, 'temperature': 0.5, 'top_k': 0},
    'temp_1.0':  {'do_sample': True, 'temperature': 1.0, 'top_k': 0},
    'top_k_50':  {'do_sample': True, 'top_k': 50},
    'top_p_0.9': {'do_sample': True, 'top_p': 0.9, 'top_k': 0},
}

# YOUR TURN — generate 10 continuations per strategy at max_new_tokens=80.

# YOUR TURN
# For each strategy, compute distinct-2 (fraction of unique bigrams across samples).

# YOUR TURN
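# Coherence: perplexity of each sample under the same model, i.e. exp of the
# mean per-token negative log-likelihood of the generated tokens; report the
# average over the samples of each strategy.
# Factuality: did the sample correctly say 'Yaoundé'? Check manually or with a
# string match (also accept the unaccented spelling 'Yaounde').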

# Lab 2 — Sampling-strategy analysis

# Setup

# Load a small open model

# Exercise 1 — Generate under each sampling strategy

# Exercise 2 — Quantify diversity

# Exercise 3 — Quantify coherence and factuality

# Done?