# !pip install torch transformers peft accelerate bitsandbytes datasets trl

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments
from peft import LoraConfig, get_peft_model, TaskType
from datasets import load_dataset
from trl import SFTTrainer

# Seed torch's global RNG before any model or training code runs.
torch.manual_seed(42)

# Hugging Face Hub identifiers for the dataset and the base model.
DATASET = 'medalpaca/medical_meadow_medqa'
BASE_MODEL = 'mistralai/Mistral-7B-Instruct-v0.2'

# Load the train split once and carve both subsets out of it, instead of
# calling load_dataset a second time for the same split.
full_train = load_dataset(DATASET, split='train')
# Training subset: rows 0-999.
ds = full_train.select(range(1000))
# Evaluation subset: rows 1000-1049, taken from the same split but disjoint
# from the training rows above.
test = full_train.select(range(1000, 1050))
print('train:', len(ds), 'test:', len(test))

# YOUR TURN
# Load BASE_MODEL in 4-bit. Run zero-shot on the 50-example test set.
# Record exact-match accuracy.

# YOUR TURN
# Configure LoraConfig(r=16, lora_alpha=32, target_modules=['q_proj','v_proj']).
# Train with SFTTrainer for 200-500 steps on the 1000-example train set.

# YOUR TURN
# Re-run on the same 50-example test set with the fine-tuned model.
# Print a table: base accuracy vs fine-tuned accuracy.

# Lab 3 — LoRA fine-tune of a small open model

# Setup

# Pick a domain dataset

# Exercise 1 — Zero-shot baseline

# Exercise 2 — LoRA fine-tune

# Exercise 3 — Side-by-side eval

# Done?