Disclaimer: This Jupyter Notebook contains content generated with the assistance of AI. While every effort has been made to review and validate the outputs, users should independently verify critical information before relying on it. The SELENE notebook repository is constantly evolving. We recommend downloading or pulling the latest version of this notebook from Github.
LoRA Fine-Tuning — A Basic Example¶
Fine-tuning large language models (LLMs) has become a key technique for adapting powerful pretrained models to specific tasks and domains. While models like GPT, LLaMA, and TinyLlama are trained on massive amounts of general-purpose data, they may not always produce the most accurate or contextually relevant outputs for specialized use cases. Fine-tuning allows us to take advantage of the vast knowledge encoded in these pretrained models while tailoring them to the language style, constraints, and requirements of our own dataset. This balance between leveraging pretrained knowledge and adding task-specific adaptation makes fine-tuning both efficient and effective.
Another major benefit of fine-tuning is resource efficiency. Training an LLM from scratch requires enormous amounts of compute, data, and time — something that is often impractical outside large research labs. Fine-tuning, however, allows practitioners to update only a fraction of the model’s parameters (sometimes using techniques like LoRA or other parameter-efficient fine-tuning (PEFT) methods), making it possible to adapt billion-parameter models on consumer hardware or cloud GPUs at a fraction of the cost. This democratizes the ability to customize state-of-the-art models for industry, research, and individual projects.
In this notebook, we will walk step by step through the process of fine-tuning a pretrained LLM using Hugging Face’s transformers, datasets, and peft libraries. We will start by preparing our dataset, formatting it into a role-based chat style suitable for dialogue models, and applying tokenization. From there, we will explore how to set up data collators to handle variable-length sequences, ensuring our batches are efficiently padded for training.
We will then move on to configuring parameter-efficient fine-tuning with LoRA, explaining why adapting just a small subset of the model's weights can achieve strong performance improvements while dramatically reducing compute requirements. Finally, we will set up Hugging Face's Trainer with the appropriate training arguments, launch the training process, and discuss how to monitor progress and evaluate results. By the end of the notebook, you will have a clear, reproducible workflow for adapting any Hugging Face-compatible LLM to your own task or dataset.
This hands-on approach is designed to not only provide working code but also to deepen your understanding of the key concepts and tools involved in fine-tuning. Whether your goal is to build a chatbot, perform domain-specific text generation, or experiment with custom data, this notebook will give you the foundation you need to effectively harness the power of modern LLMs.
Setting up the Notebook¶
Make Required Imports¶
This notebook requires the import of different Python packages as well as additional Python modules that are part of the repository. If a package is missing, use your preferred package manager (e.g., conda or pip) to install it. If the code cell below runs without any errors, all required packages and modules have been successfully imported.
import pandas as pd
from transformers import (
AutoModelForCausalLM,
AutoTokenizer,
DataCollatorForSeq2Seq,
TrainingArguments,
Trainer
)
from peft import (
PeftModel,
LoraConfig,
TaskType,
get_peft_model
)
from datasets import Dataset
from src.utils.data.files import *
Download Required Data¶
Some code examples in this notebook use data that first needs to be downloaded by running the code cell below. If this code cell throws an error, please check in the configuration file config.yaml whether the URL for downloading datasets is up to date and matches the one on Github. If not, simply download or pull the latest version from Github.
kids_qa, _ = download_dataset("text/llm/finetuning/llm-finetuning-kids-qa.csv")
File 'data/datasets/text/llm/finetuning/llm-finetuning-kids-qa.csv' already exists (use 'overwrite=True' to overwrite it).
We also set a target path where we will save any checkpoints and fine-tuned models. You can change this path as needed.
TARGET_PATH = "data/generated/finetuning/lora-hf-kidsqa/"
Preliminaries¶
Before checking out this notebook, please consider the following:
The focus of this notebook is to go through the basic steps to fine-tune a model using existing Hugging Face libraries. We also use a small pretrained model to keep the memory requirements low. Thus, there is no expectation to achieve any state-of-the-art results.
Despite using a small pretrained model and using LoRA, there are still memory considerations. This notebook supports the use of a GPU. If you have a GPU, you need about 9-10 GB VRAM to run all the code snippets for fine-tuning the model. You can reduce this requirement a bit by reducing the default batch size of $10$ to a batch size of $1$.
Overview & Use Case¶
Fine-tuning pretrained models is very popular because it saves a lot of time and resources. Training a large language model (LLM) or a vision model from scratch requires huge amounts of data, computing power, and money. Instead of starting from zero, you can take a model that has already been trained on massive datasets and adjust it for your own specific needs. This way, you benefit from the model's general knowledge while making it more useful for your task. There are many reasons for fine-tuning models. One common reason is to make the model better at a particular task, such as answering questions in a specific domain (like medicine or law). Another reason is to improve performance on a target dataset, which may have a slightly different distribution than the data the original model was trained on.
An especially popular use case is fine-tuning a model's style. For example, a chatbot may be fine-tuned to sound more friendly, professional, or casual depending on the target audience. This kind of style adaptation is usually easier than teaching the model completely new facts. The reason is that style adjustments mostly involve changing how the model expresses itself, not what it knows. Since the base model already has strong language skills, fine-tuning just shifts its tone or phrasing. In contrast, incorporating new facts into a pretrained model is much harder. If you want the model to "learn" updated knowledge — such as new scientific discoveries or the latest sports results — fine-tuning is often not enough, because the model's training is not designed to handle small factual updates. This is why methods like retrieval-augmented generation (RAG) or external knowledge bases are often better for keeping models factually up to date.
In this notebook, we therefore fine-tune a pretrained model to adapt its style. More specifically, our goal is to build a chatbot for kids that answers their questions. While typical pretrained LLMs answer such questions correctly, their replies are written in a very neutral style. For our chatbot, however, we want answers that use simple language but are also motivating and encouraging, so that kids have more fun and are more eager to ask further questions.
With this goal in mind, let's get started!
Load Pretrained LLM¶
Fine-tuning begins with a pretrained model. In this notebook we will be using TinyLlama-1.1B-Chat-v1.0, a lightweight, open-source large language model trained with about 1.1 billion parameters. It is part of the TinyLlama project, which aims to provide compact models that maintain strong performance while being much more efficient than larger LLMs like LLaMA-7B or GPT-style models. TinyLlama was pretrained on a large-scale corpus following the LLaMA training recipe, giving it a solid foundation in general language understanding and generation.
The Chat-v1.0 version is specifically fine-tuned for dialogue, making it better suited for conversational tasks like answering questions, providing explanations, or role-based interactions — thus, matching our goal of building a child-friendly chatbot. Because of its small size, it is much easier to run on consumer hardware (such as a single GPU or even high-end laptops) while still delivering reasonable accuracy and coherence in responses. It is especially useful in scenarios where resource efficiency, faster inference, or deployment on edge devices matters.
In the code cell below, we define the full model identifier of the TinyLlama-1.1B-Chat-v1.0 model on Hugging Face, where you can also find additional information about the model (e.g., how it was trained).
model_id="TinyLlama/TinyLlama-1.1B-Chat-v1.0"
If you want to use a different pretrained model, you can change the model identifier. However, keep in mind that this might significantly affect the memory requirements and comes with some considerations when it comes to actually using the model — as we will discuss in a bit.
Load Pretrained Model¶
Since we are using a pretrained model available on Hugging Face, we can use the AutoModelForCausalLM class of the transformers library to load the model with a single line of code; see the code cell below. This class is a high-level, flexible API that automatically loads the correct model architecture for causal language modeling (CLM) tasks. This is highly convenient in practice because it abstracts away model-specific details and lets you write generic code that works with a wide variety of architectures. It saves you from boilerplate imports, reduces errors, and makes it easy to swap models while reusing the same pipeline.
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", dtype="auto")
Notice that — apart from the model_id — we also set the device_map parameter. This parameter controls how and where the model's weights are placed across available hardware devices, such as CPUs, GPUs, or multiple GPUs. Instead of manually moving model layers or tensors with .to("cuda"), you can pass a device_map to automate this process. For convenience, we set the parameter to "auto" so that the library automatically spreads the model across available devices to fit memory (which includes checking whether a GPU is available or not).
Load Pretrained Tokenizer¶
Apart from the pretrained model itself, we also need to load the "matching" tokenizer. Each pretrained model typically comes with its own tokenizer because the tokenizer defines how raw text is split into tokens that map to the model's vocabulary. During pretraining, the model learns statistical patterns over a very specific tokenization scheme — whether that is byte pair encoding (BPE), SentencePiece, WordPiece, or another method. The model's embeddings and internal representations are tied directly to the vocabulary produced by that tokenizer. If you were to use a different tokenizer, the token IDs would not match the learned embeddings, and the model's outputs would become meaningless. Bundling the tokenizer with the pretrained model ensures consistency and compatibility.
Loading the tokenizer is equally straightforward as the model. The AutoTokenizer class in the transformers library is the high-level API for loading the right tokenizer associated with a given pretrained model. Just like AutoModelForCausalLM, it automatically selects the correct tokenizer implementation based on the model name/id or path. With a single line like AutoTokenizer.from_pretrained("model_name") — see the code cell below — you get a tokenizer that knows exactly how to process text for that model, including tokenization rules, special tokens, and vocabulary.
tokenizer = AutoTokenizer.from_pretrained(model_id)
tokenizer.pad_token = tokenizer.eos_token
In the previous code cell, we also set the padding token (pad_token) of the tokenizer to be the same as the end-of-sequence (EOS) token (eos_token). This is needed for most CLMs that were trained without a dedicated padding token (incl. our TinyLlama model), since they typically process continuous text streams rather than batches of variable length. However, when you want to fine-tune or batch inputs together for efficiency, you often need a padding token so that shorter sequences can be padded to match the longest one in the batch. If the tokenizer has no pad_token defined, code that expects one — and we will see an example of that later — will raise an error.
Using the EOS token as the padding token is a practical workaround: the model already knows how to handle EOS during training, and reusing it for padding avoids introducing an unknown token that the model was not trained on. This way, padding will not disrupt training or inference, though it is not always semantically perfect. Of course, if a model was trained with a dedicated padding token as part of its vocabulary, then this same token should be used instead.
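As a quick check (a minimal sketch; the exact token strings and IDs depend on the tokenizer), we can print the padding and EOS tokens to confirm that they are now identical:
# Quick check: after the assignment above, the padding token equals the EOS token
print("Padding token:", tokenizer.pad_token, tokenizer.pad_token_id)
print("EOS token:", tokenizer.eos_token, tokenizer.eos_token_id)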
Test Model¶
With the model and the tokenizer loaded, we are now ready to submit prompts for the model to generate and return a response. However, we have to ensure that we submit the prompt in the right format. Many models, including chat versions of LLaMA or TinyLlama, were fine-tuned on instruction-response datasets where each prompt is wrapped in a consistent template, often including system instructions, user messages, and assistant response markers. A chat template takes your raw input and inserts it into this structure so that the model receives text in the exact format it was trained on.
This is important because pretrained chat models are highly sensitive to prompt structure. If you feed the model raw text without the template, it may fail to recognize where the user's input ends and where the model should start generating a response, leading to incomplete, irrelevant, or garbled outputs. Luckily, the AutoTokenizer class provides the auxiliary method apply_chat_template() to convert a raw input into the correct template. Of course, this template may differ between models and tokenizers. So let's see how it works for TinyLlama-1.1B-Chat-v1.0 and related models.
Like most chat-oriented pretrained LLMs, TinyLlama-1.1B-Chat-v1.0 follows the commonly used role-based message format. Here, each message is represented as a dictionary with two keys: the role and the content. Loosely speaking, the role indicates who is "speaking". Typical roles include:
"system": sets the behavior, personality, or context for the assistant."user": the user’s input or question."assistant": the model's previous response (used in multi-turn conversations).
The content is the actual text of the message. Thus, the overall input for the model is a list of dictionaries where each dictionary contains the role and the content. The code cell below shows a simple example, containing a system role to tell the model how to behave and a user role with the actual user prompt.
messages = [
{"role": "system", "content": "You are a helpful tutor that helps kids answering their questions."},
{"role": "user", "content": "What is the capital of France?"},
]
The list of dictionaries provides a systematic way to organize and structure more complex inputs (e.g., full conversations). However, the model itself only accepts text, not structured data, as input. This means that for training, fine-tuning, and inference, messages needs to be converted into a text-only representation. As there is no single way to accomplish this, different models may use different strategies.
Since this conversion of the input is tied to the model and thus the tokenizer, AutoTokenizer comes with the auxiliary method apply_chat_template() to ensure that the model interprets your input correctly, maintains consistency with training, and produces coherent responses in a conversational setting. This method of a tokenizer is used to format a user's input into the special prompt structure expected by a chat-optimized pretrained model — again, which can differ between models/tokenizers. Let's see which input format our model is using:
text = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(text)
<|system|>
You are a helpful tutor that helps kids answering their questions.</s>
<|user|>
What is the capital of France?</s>
<|assistant|>
As you can see, this template introduces special markers (<|system|>, <|user|>, <|assistant|>) to represent the different roles. Each role marker and its content appear on their own lines, and an end-of-sequence (EOS) token (</s>) is appended to the end of each content.
In this example, we set tokenize=False to get output as a human-readable string. By default, i.e., tokenize=True, the tokenizer automatically tokenizes the text and converts each token to its corresponding index. In short, by default, the method apply_chat_template() returns a list of token indices which serves as direct model input. We also set add_generation_prompt=True to add the <|assistant|> role at the end of the output. This signals the model to start generating its response.
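To illustrate the default behavior (a small sketch using the messages list defined above), calling apply_chat_template() without tokenize=False returns the token indices directly, which we can decode back into text:
# With the defaults (tokenize=True), apply_chat_template() returns token indices
prompt_ids = tokenizer.apply_chat_template(messages, add_generation_prompt=True)
print(prompt_ids[:10])                     # first few token indices
print(tokenizer.decode(prompt_ids[:10]))   # the text these indices correspond to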
We now have everything in place to define an auxiliary method generate_output() that (a) takes in a user prompt, (b) applies the template and tokenizes the final prompt, (c) passes it to the model, and (d) decodes the returned response into the final output. Keep in mind that the model returns the initial input together with the generated response as the final output. Since we are only interested in the generated response, we return only the content after the last occurrence of the <|assistant|> marker; this is done in the return clause.
def generate_output(model, tokenizer, messages, max_length=100):
# Apply prompt template and convert to token ids (important: add "<|assistant|>" as generation prompt)
prompt_ids = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt").to(model.device)
# Use model to generate output
outputs = model.generate(
prompt_ids,
max_new_tokens=max_length, # Limit the number of tokens in the response
do_sample=True, # Enable sampling for diversity
temperature=0.75, # Sampling temperature; lower = more deterministic
)
# Decode the generated token IDs back into text
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
# Extract and return only the assistant's reply (remove the prompt)
return response.split("<|assistant|>\n")[-1].strip()
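As a quick sanity check, we can call generate_output() with the example messages from above; the exact response will vary because sampling is enabled:
# Generate a single response for the example prompt defined earlier
print(generate_output(model, tokenizer, messages))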
To show how well the pretrained model works, let's formulate a bunch of simple questions kids might ask. Feel free to extend the list in the code cell below by adding your own questions. We will use this list of questions multiple times throughout the notebook to see how the output changes after fine-tuning the model.
example_questions = [
"What is the capital of France?",
"How tall is the Mount Everest?",
"Why do we have seasons?",
"When do we have a leap year?",
"Who built the pyramids of Giza?",
]
Since we want to check more than once how the model behaves, let's also define an auxiliary method that takes in a list of questions, uses the method generate_output() to get the answer from the model, and simply prints both questions and answers; see the method run_questions() in the code cell below.
def run_questions(questions):
for question in questions:
# Define prompt
messages = [
{"role": "system", "content": "You are a helpful tutor that helps kids answering their questions. Keep it short and simple."},
{"role": "user", "content": question},
]
# Use model to generate answer
answer = generate_output(model, tokenizer, messages)
# Simply print both the question and the answer
print(f"Question: {question}")
print(f"Answer: {answer}\n")
We can now use the method run_questions() to get all of our example questions answered, just run the code cell below.
run_questions(example_questions)
Question: What is the capital of France?
Answer: The capital of France is Paris.

Question: How tall is the Mount Everest?
Answer: Mount Everest is the highest mountain on Earth, standing at a height of 29,029 feet (8,848 meters). It is located in the Nepal-China border region and is shared equally by both countries by the 1953 Treaty of Amity, Economic Relations, Science and Technological Cooperation, and Cultural Provisions.

Question: Why do we have seasons?
Answer: The seasons are a natural phenomenon that occur on Earth. They are caused by the Earth's rotation around the sun, which causes the Earth's poles to change. The Earth's poles are located at its northern and southern poles, and as a result, the Earth rotates. The four seasons, Fall, Winter, Spring, and Summer, are caused by the Earth's tilt on its axis. The seasons vary from year to year, with the

Question: When do we have a leap year?
Answer: A leap year occurs every four years, with the exception of years divisible by 400 (e.g. 1900, 2000, 2012, 2020). The next leap year is scheduled to occur in 2024.

Question: Who built the pyramids of Giza?
Answer: The pyramids of Giza were built by the ancient Egyptians around 2500 BC. The construction of the pyramids was done by pharaohs (emperors) who ruled Egypt during that time. The pyramids were built using a combination of skills and labor, including carving, building, and assembling the stones. Archaeological evidence indicates that the entire construction process took decades to complete.
As you can see, TinyLlama-1.1B-Chat-v1.0 provides good answers for each of our example questions. The style of the answers is very neutral and appropriate for a general-purpose chatbot. However, we are aiming for a chatbot that encourages and motivates kids to ask questions and expand their knowledge. So let's see how we can do that using fine-tuning.
Prepare Fine-Tuning Dataset¶
Any form of supervised training such as fine-tuning a pretrained model requires a dataset with examples showing the expected output for a given input. In our case, we need a dataset containing different questions together with their answers in the style and form we are aiming for: child-friendly, motivating, encouraging. To this end, we have generated a small dataset with suitable question-answer pairs. The set of questions is taken from a publicly available dataset. However, we only kept proper Wh-questions (what, when, where, who, whom, which, whose, why...and how); for example, this means we removed True/False questions from the list. This left us with 550 questions.
To generate the answers, we used the OpenAI API and the gpt-3.5-turbo model to answer each question using the following system role: "You are a helpful online tutor for kids. Be encouraging and motivating. Reply using simple language that is easy to understand for kids. The response should not end with a follow-up question.". While convenient, this LLM-driven approach to generating datasets risks the phenomenon of data inbreeding, where models are trained repeatedly on outputs generated by other models rather than on fresh, high-quality human-created data. Over time, this feedback loop causes the training data to become less diverse, less accurate, and more biased — similar to genetic inbreeding in biology. However, this notebook focuses on the basic steps required to fine-tune a model; the goal is not a production-ready model to be used for a chatbot.
Load Dataset from File¶
We provide the final dataset as a simple CSV file. We can therefore easily load the content of the file into a Pandas DataFrame:
df_qa = pd.read_csv(kids_qa)
df_qa.head()
|   | QUESTION | ANSWER |
|---|---|---|
| 0 | How many days do we have in a week? | We have 7 days in a week! Each day is special ... |
| 1 | How many days are there in a normal year? | There are 365 days in a normal year. That's a ... |
| 2 | How many colors are there in a rainbow? | There are seven colors in a rainbow: red, oran... |
| 3 | How many letters are there in the English alph... | There are 26 letters in the English alphabet! |
| 4 | How many consonants are there in the English a... | There are 21 consonants in the English alphabe... |
We already saw that we need to bring each question-answer pair into the correct format expected by the model. This means we first have to convert the pairs into common role-based message format; see the code cell below. Here, each question becomes the content of a user role, and the corresponding answer becomes the content for an assistant role.
qa_pairs = []
for idx, row in df_qa.iterrows():
question, answer = row["QUESTION"], row["ANSWER"]
qa_pairs.append({
"messages": [
{"role": "system", "content": "You are a helpful tutor that helps kids answering their questions. Keep it short and simple."},
{"role": "user", "content": question.strip()},
{"role": "assistant", "content": answer.strip()}
]
})
For further steps, we first convert our list of formatted inputs into a Dataset instance. The Dataset class of Hugging Face's datasets library is the fundamental data structure that represents a table-like collection of examples, similar to a lightweight, columnar database. Each column corresponds to a feature (like text, labels, or IDs), and each row corresponds to a single data example. The class is optimized for efficient storage, fast slicing, and integration with machine learning frameworks like PyTorch and TensorFlow, making it ideal for preparing and serving large-scale training and evaluation datasets. The from_list() method is a convenience constructor that allows you to quickly build a Dataset object directly from a Python list of dictionaries or objects. Each item in the list represents a row (or example), and the method infers the schema of the dataset from the keys and types of the provided data. This is particularly useful when you have in-memory data (e.g., after preprocessing or generating synthetic examples) and want to convert it into a Dataset that supports the library’s powerful features like mapping, shuffling, and batching.
dataset = Dataset.from_list(qa_pairs)
print(dataset)
Dataset({
features: ['messages'],
num_rows: 550
})
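If you want to inspect an individual example, you can index the Dataset like a list; each row is a dictionary with a messages key holding the role-based prompt:
# Look at the first training example (a list of role/content dictionaries)
print(dataset[0]["messages"])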
Transform Dataset into Required Format¶
So far, the dataset is not yet ready to serve as valid input for fine-tuning our model. When fine-tuning a Hugging Face model, we need to provide three main types of inputs — the input_ids, attention_mask, and labels — which serve the following purposes:
input_ids: These are the tokenized representations of your text, i.e., the numerical IDs corresponding to words or subwords in the tokenizer’s vocabulary. They are always required, since the model cannot process raw text.
attention_mask: This tells the model which tokens are actual input and which are just padding (0 = ignore, 1 = attend). While not strictly required, it becomes important when your inputs are padded to a uniform length; without it, the model may mistakenly treat padding as meaningful input.
labels: These are the ground-truth targets for supervised fine-tuning. If provided, many Hugging Face models (incl. AutoModelForCausalLM) will automatically compute a loss during training. If omitted, the model just outputs logits or predictions, and you would need to handle loss computation manually.
Since we will rely on padding (see later) and want to automatically compute the loss during the fine-tuning of the model, we need all three pieces of information for a role-based message prompt. Luckily, the AutoTokenizer instance does this all for us. In the code below, we define the auxiliary method preprocess() that iterates through all prompts. For each prompt, the method tokenizes the input and extracts all required data — input_ids, attention_mask, and the labels.
def preprocess(batch):
input_ids_list, labels_list, attn_masks_list = [], [], []
# Iterate through all messages (i.e., prompts in role-based message format)
for msgs in batch["messages"]:
# Apply TinyLlama chat template
text = tokenizer.apply_chat_template(msgs, tokenize=False, add_generation_prompt=False)
# Tokenize + convert to token indices
tokenized = tokenizer(text)
# Extract input ids
input_ids = tokenized["input_ids"]
attention_mask = tokenized["attention_mask"]
# The labels are just a copy of the input ids
labels = input_ids.copy()
# Add information for current prompt to respective lists
input_ids_list.append(input_ids)
labels_list.append(labels)
attn_masks_list.append(attention_mask)
# Return dictionary of all input_ids, attention_masks, and labels
return {"input_ids": input_ids_list, "labels": labels_list, "attention_mask": attn_masks_list}
We can now apply this method to each of the entries in our dataset instance. The output is again an instance of the class Dataset but each row contains the input_ids, the attention_mask, and the labels extracted from the respective role-based message prompt.
dataset_processed = dataset.map(preprocess, batched=True)
print(dataset_processed)
Dataset({
features: ['messages', 'input_ids', 'labels', 'attention_mask'],
num_rows: 550
})
Support Padding for Batch Processing¶
In principle, our fine-tuning dataset is now in the appropriate format to serve as valid input to the model. However, we would only be able to fine-tune the model with a batch size of $1$, since our inputs are likely to have different lengths. To enable batch processing with batch sizes larger than $1$ for improved efficiency, we have to ensure that all inputs within the same batch have the same length. The default method to do this is padding — extending all shorter inputs in the batch by adding padding tokens. While we could perform padding manually, there is a much easier way to do this.
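To see that the tokenized examples indeed vary in length, here is a quick illustrative check over the processed dataset:
# The tokenized inputs have different lengths, which is why padding is needed for batching
lengths = [len(ids) for ids in dataset_processed["input_ids"]]
print(f"Shortest input: {min(lengths)} tokens, longest input: {max(lengths)} tokens")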
The DataCollatorForSeq2Seq class in Hugging Face’s transformers library is a data collator specifically designed for sequence-to-sequence tasks (like translation, summarization, or text generation). A data collator is responsible for batching together individual samples into tensors that can be fed to the model. Since text sequences often have different lengths, DataCollatorForSeq2Seq dynamically pads each batch to the length of the longest sequence within that batch rather than padding all sequences to a fixed maximum length. This makes training more memory-efficient and faster, as the model does not waste computation on unnecessary padding. The collator will handle padding both the inputs and labels correctly, ensuring that padding tokens in the labels are ignored during loss computation.
data_collator = DataCollatorForSeq2Seq(
tokenizer=tokenizer,
padding=True,
return_tensors="pt"
)
Notice that we need to pass the tokenizer to the data collator since the collator needs to know the correct padding token. We also set return_tensors="pt". This argument in the DataCollatorForSeq2Seq class (and more generally in Hugging Face tokenizers/collators) controls the format in which the collated batch is returned. By default, the collator produces batches as PyTorch tensors ("pt"), but you can also specify "tf" for TensorFlow tensors, "np" for NumPy arrays, or "jax" for JAX/Flax arrays. This argument is important because the Trainer class (see below) expects the inputs to be in the correct tensor format for the underlying deep learning framework you are using. For example, if you are training with PyTorch, you would typically set return_tensors="pt". This ensures seamless integration between the dataset pipeline and the model training loop.
Side note: The transformers library also provides a DataCollatorForLanguageModeling class which seems the intuitive choice for our use case. However, when fine-tuning a pretrained model for chat-style conversations, DataCollatorForSeq2Seq offers advantages over DataCollatorForLanguageModeling primarily in how it handles padding and labels. DataCollatorForSeq2Seq automatically sets padded positions in the labels to -100, so the model ignores them during loss computation. This is particularly beneficial for chat-style fine-tuning because sequences often vary greatly in length across turns, and dynamic padding ensures efficient batching without introducing spurious gradients from padding tokens. In contrast, DataCollatorForLanguageModeling pads only the input and treats all tokens equally in the loss, which can dilute learning on the assistant's responses. Overall, DataCollatorForSeq2Seq provides more precise control over what the model learns and how sequences are padded, improving training efficiency and chat-response quality.
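To see the collator in action, here is a small illustrative check (not needed for training): we collate the first two processed examples, passing only the token-related columns rather than the raw messages, and inspect the resulting padded batch.
# Collate two examples of (likely) different lengths into one padded batch
features = [
    {k: dataset_processed[i][k] for k in ("input_ids", "attention_mask", "labels")}
    for i in range(2)
]
batch = data_collator(features)
print(batch["input_ids"].shape)   # both sequences are padded to the same length
print(batch["labels"][:, -5:])    # padded label positions (if any) appear as -100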
Fine-Tuning with LoRA¶
Instead of fine-tuning the whole model — and therefore changing its original weights — we use Low-Rank Adaptation (LoRA) in this notebook. LoRA is a parameter-efficient fine-tuning (PEFT) technique which — instead of updating all of a model's parameters — inserts small trainable matrices (low-rank decompositions) into certain weight layers, typically the attention or feedforward layers. During training, only these low-rank matrices are updated, while the original model weights remain frozen. This drastically reduces the number of trainable parameters, making fine-tuning faster, less memory-intensive, and more storage-efficient.
In more detail: instead of updating a layer's full weight matrix $\mathbf{W} \in \mathbb{R}^{m\times n}$ (which can be very large), LoRA learns two much smaller matrices $\mathbf{A} \in \mathbb{R}^{m\times r}$ and $\mathbf{B} \in \mathbb{R}^{r\times n}$ whose product approximates the necessary update $\Delta \mathbf{W} = \mathbf{A}\mathbf{B}$. For an input $\mathbf{x}$, the adapted layer then computes $\mathbf{h} = (\mathbf{W} + \Delta\mathbf{W})\,\mathbf{x} = \mathbf{W}\mathbf{x} + \mathbf{A}\mathbf{B}\mathbf{x}$. The dimensions of $\mathbf{A}$ and $\mathbf{B}$ are chosen so that the rank $r$ is much smaller than $m$ and $n$, drastically reducing the number of trainable parameters. The figure below illustrates the idea of LoRA.
This reduction of trainable parameters naturally also reduces the memory required to fine-tune a model. Another advantage of LoRA is that we do not change the weights of the original model, which has two benefits. Firstly, we can always remove the low-rank matrices to recover the original model. And secondly, we can fine-tune the same model for different tasks using a different set of low-rank matrices for each task.
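To make the idea concrete, here is a minimal, self-contained sketch of the LoRA update using plain PyTorch tensors. This is purely illustrative; it is not how the peft library implements LoRA internally, and the dimensions are made up:
import torch

# Frozen pretrained weight matrix W of shape (m, n) and a low-rank update of rank r
m, n, r = 512, 512, 8
W = torch.randn(m, n)          # frozen during fine-tuning
A = torch.randn(m, r) * 0.01   # trainable low-rank factor
B = torch.zeros(r, n)          # trainable low-rank factor (starts at zero, so the update starts at zero)

x = torch.randn(n)             # some input vector

# Forward pass with the LoRA update: h = (W + A B) x = W x + A (B x)
h = W @ x + A @ (B @ x)
print(h.shape)

# Compare the number of parameters of the full matrix vs. the two LoRA factors
print(f"Full weight matrix: {W.numel():,} parameters")
print(f"LoRA factors A and B: {A.numel() + B.numel():,} parameters")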
Create LoRA Model¶
Implementing fine-tuning using LoRA is rather straightforward using existing libraries such as Hugging Face's peft library. For example, within peft, the LoraConfig class is a configuration object that defines how LoRA should be applied to a model. It specifies key hyperparameters such as the rank (r, the size of the low-rank matrices), the scaling factor (alpha), which modules of the model should be adapted (e.g., attention layers), whether dropout is applied, and the task type (e.g., causal LM, seq2seq LM, classification). The code cell below shows the basic configuration we are using to fine-tune our pretrained model.
lora_config = LoraConfig(
r=8, # low-rank adaptation dimension
lora_alpha=16, # scaling factor
target_modules=["q_proj", "v_proj"], # module to which LoRA is applied
lora_dropout=0.1, # dropout probability
task_type=TaskType.CAUSAL_LM # task type
)
In many transformer architectures, especially LLaMA, GPT-style, and related models, setting target_modules=["q_proj", "v_proj"] in LoRA fine-tuning is common because the query (q_proj) and value (v_proj) projection matrices inside the attention mechanism are the most influential for controlling how tokens attend to each other. By adapting only these two, LoRA can significantly alter a model's reasoning and generation patterns while touching far fewer parameters than adapting all projections (query, key, value, output). Empirically, researchers found that modifying q_proj and v_proj often captures most of the benefit of full fine-tuning, offering a sweet spot between efficiency and effectiveness. That said, this is not a strict rule — sometimes k_proj, o_proj, or even feedforward layers are targeted too, depending on the model and task. But q_proj + v_proj has become the default choice because it consistently gives strong results with minimal extra overhead.
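If you are unsure which module names exist in a given model (they differ between architectures), you can inspect the loaded model's submodules. A quick sketch:
# Collect the distinct projection-layer names inside the loaded model
proj_names = {name.split(".")[-1] for name, _ in model.named_modules() if name.endswith("proj")}
print(proj_names)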
The get_peft_model method from the peft library takes a pretrained model and modifies it so that only a small number of additional parameters are trainable, while the rest of the model remains frozen. When you pass a model and a configuration such as LoraConfig, get_peft_model() injects lightweight adapter layers (like LoRA matrices) into specific target modules of the model (e.g., q_proj and v_proj). The method wraps your model with PEFT logic: it freezes the original weights, replaces the chosen layers with parameter-efficient alternatives, and keeps track of which parameters should be updated during training. The resulting object is an instance of the PeftModel class and behaves just like the original Hugging Face model, and it is therefore compatible with the Trainer class (discussed later).
ADAPTER_NAME = "lora-kids-qa"
model = get_peft_model(model, lora_config, adapter_name=ADAPTER_NAME)
Notice that we also give the adapter a unique name. This allows us to fine-tune the same model using different adapters and to switch between them on the fly during inference. However, the most pragmatic reason to use PEFT techniques such as LoRA is to reduce the memory requirements for fine-tuning models. The PeftModel class has the built-in method print_trainable_parameters() that shows the number of trainable parameters, the total number of parameters, and the resulting percentage of trainable parameters. Let's see the result for our model:
model.print_trainable_parameters()
trainable params: 1,126,400 || all params: 1,101,174,784 || trainable%: 0.1023
While $1.1$ million trainable parameters might sound like a lot, this represents only about 0.1% of the total number of parameters.
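As a back-of-the-envelope check, we can reproduce this number by counting the LoRA factors added to q_proj and v_proj in each layer. This assumes (not verified here) TinyLlama's architecture details: 22 decoder layers, hidden size 2048, and grouped-query attention with 4 key/value heads of dimension 64, so v_proj maps 2048 to 256:
# Count LoRA parameters: for a layer mapping d_in -> d_out, LoRA adds d_in*r + r*d_out weights
r = 8
n_layers, hidden, kv_dim = 22, 2048, 256           # assumed TinyLlama dimensions
q_proj_lora = hidden * r + r * hidden               # q_proj: 2048 -> 2048
v_proj_lora = hidden * r + r * kv_dim                # v_proj: 2048 -> 256
print(n_layers * (q_proj_lora + v_proj_lora))        # should match the trainable params above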
Perform LoRA Training¶
Under the hood, fine-tuning a model simply means (further) training the model — here in line with the LoRA setup and configuration. Thus, we can utilize different classes of the transformers library to implement the training. The TrainingArguments class is a configuration container that defines all the key settings for training, evaluation, and saving models when using the Trainer class. Instead of manually managing things like learning rate schedules, batch sizes, gradient accumulation, checkpointing, or logging, you specify them once in TrainingArguments. These arguments control not just the training loop, but also aspects like evaluation strategy, mixed-precision training, distributed training, and output directory management. By separating configuration from code, TrainingArguments makes experiments easier to reproduce and tune. The table below lists the most relevant configuration parameters.
| Parameter | Description |
|---|---|
| output_dir | Directory where model checkpoints and training logs will be stored. |
| evaluation_strategy | Specifies when evaluation is performed. Common values: "steps" (after a set number of steps) or "epoch" (after each epoch). |
| eval_steps | Number of steps between each evaluation run when evaluation_strategy="steps". |
| per_device_train_batch_size | Batch size per device (GPU or CPU) used during training. Larger batch sizes speed up training but use more memory. |
| per_device_eval_batch_size | Batch size per device used during evaluation. Larger batches speed up evaluation but use more memory. |
| num_train_epochs | Total number of passes (epochs) over the entire training dataset. |
| save_steps | Number of steps between model checkpoint saves during training. |
| logging_steps | Number of steps between logging entries (loss, metrics, etc.). |
| learning_rate | Starting value of the learning rate for the optimizer (controls how fast the model learns). |
| save_total_limit | Maximum number of checkpoints to keep. Older checkpoints beyond this limit will be deleted. |
| fp16 | Whether to use 16-bit (mixed precision) training instead of 32-bit. Saves GPU memory and can make training faster. |
| report_to | List of integrations for logging (e.g., "none", "tensorboard"). "none" disables integration logging. |
The code cell below creates the TrainingArguments instance we will be using for fine-tuning our model. You can try different values for arguments such as per_device_train_batch_size to see how they affect the required memory as well as the required training time. Notice that we do not specify all arguments but rely on the default values for the rest.
training_args = TrainingArguments(
output_dir=TARGET_PATH,
per_device_train_batch_size=10,
num_train_epochs=10,
logging_steps=50,
save_steps=10000, # A very high number to avoid saving checkpoints for our toy example
fp16=True
)
Finally, the Trainer class in transformers library is a high-level training API that abstracts away much of the boilerplate code needed for fine-tuning or training transformer models. It ties together a model, dataset, tokenizer, data collator, and training configuration (via TrainingArguments) to handle the full training and evaluation loop. This includes batching, padding, gradient updates, checkpointing, logging, and even distributed or mixed-precision training without requiring you to write custom loops. With Trainer, you can quickly set up experiments by specifying just the model, datasets, and arguments, while still having the flexibility to customize behaviors like the loss function, evaluation metrics, or data handling through callbacks and overrides.
The code cell below creates our Trainer instance. As a side note, in this example we only use a training dataset but no validation dataset. We could split our initial dataset into separate training and validation datasets; the Trainer class supports both inputs and would then report both the training and the validation loss. However, for our simple use case — and given our (very) small dataset of just $550$ samples — we do not split the dataset but use all of it for training.
trainer = Trainer(
model=model,
args=training_args,
train_dataset=dataset_processed,
data_collator=data_collator
)
All that is left now is to perform the actual training. The train() method of the Trainer class is the core function that launches the training loop for your model. When called, it takes the model, datasets, and training configuration (from TrainingArguments) and handles the entire optimization process: iterating over the training dataset in batches, computing the loss, performing backpropagation, updating the model parameters, and applying techniques like gradient accumulation, mixed-precision training, or distributed training if enabled. Beyond just training, train() also manages logging, evaluation (if configured), saving checkpoints, and resuming from previous runs. This means you can run trainer.train() without manually coding loops over epochs and batches, while still benefiting from a robust, scalable training pipeline. In short, it automates the heavy lifting of training transformer models, letting you focus on the model and data rather than the mechanics of optimization.
So without further ado, let's start the training!
trainer.train()
| Step | Training Loss |
|---|---|
| 50 | 1.640500 |
| 100 | 0.873500 |
| 150 | 0.676400 |
| 200 | 0.637700 |
| 250 | 0.626800 |
| 300 | 0.612200 |
| 350 | 0.612200 |
| 400 | 0.598300 |
| 450 | 0.596900 |
| 500 | 0.593300 |
| 550 | 0.596100 |
TrainOutput(global_step=550, training_loss=0.7330795808271928, metrics={'train_runtime': 133.6531, 'train_samples_per_second': 41.151, 'train_steps_per_second': 4.115, 'total_flos': 3977847143792640.0, 'train_loss': 0.7330795808271928, 'epoch': 10.0})
Now that we have fine-tuned our model, let's see how the model performs for our example questions — keep in mind that the example questions are not part of the training dataset. To do so, we can simply run our run_questions() method again as before and inspect the generated answers.
run_questions(example_questions)
Question: What is the capital of France?
Answer: The capital of France is Paris! You can visit it and learn all about its history and culture. It's a cool idea to learn about different places and cultures.

Question: How tall is the Mount Everest?
Answer: Mount Everest is the highest peak in the world! It's so tall that it almost touches the clouds. It's really tall and impressive!

Question: Why do we have seasons?
Answer: Seasons are a natural phenomenon that happen every year. They change the weather and help plants and animals prepare for the new season. It's cool to learn about how nature works!

Question: When do we have a leap year?
Answer: A leap year occurs every four years. It's a nice surprise to see extra days in February!

Question: Who built the pyramids of Giza?
Answer: The ancient Egyptians built the pyramids of Giza to honor their pharaohs. It's amazing how they were able to make such big structures with just stone tools!
While the answers are in essence still correct, their form and style are arguably no longer as neutral as before. The answers now contain more motivating and encouraging statements, and the overall language is more suitable for kids. So at least based on this very brief qualitative evaluation, we seem to have achieved our goal of fine-tuning a pretrained model to build a child-friendly chatbot.
Post-Training Steps¶
Once we have fine-tuned our model, we might also want to save it for later use. LoRA and other adapter-based fine-tuning methods have the advantage that we only need to save the newly trained adapter weights, as we did not update the pretrained model. For this, we can use the save_pretrained() method of the PeftModel class. It saves only the adapter components and configuration used for parameter-efficient fine-tuning, not the full base model. It writes a small set of files, typically including an adapter_config.json (with details such as the PEFT method, ranks, and scaling factors) and the adapter weights.
model.save_pretrained(TARGET_PATH + "final-lora-adapters", safe_serialization=True)
Loading the fine-tuned model is now a 2-step action. First, we load the pretrained model as we have seen before. Then we can use the from_pretrained() method of the PeftModel class to also load the LoRA weights and "attach" them to the pretrained model to get the complete fine-tuned model.
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto", dtype="auto")
model = PeftModel.from_pretrained(model, TARGET_PATH + "final-lora-adapters/" + ADAPTER_NAME, adapter_name=ADAPTER_NAME)
Notice that we also need to specify the adapter name. Recall that we could train different LoRA adapters for different tasks. During saving, we actually save all the adapters, with each adapter saved to its own folder named after the adapter. Thus, when loading an adapter, we have to specify the correct path accordingly. Important: we also need to explicitly specify the adapter name again, at least if we want to attach the adapter under the same name.
We can see which adapters are attached to the pretrained model using the code cell below. Of course, here we only trained a single LoRA adapter.
print(f"Available adapters: {list(model.peft_config.keys())}")
Available adapters: ['lora-kids-qa']
The fact that we can have multiple adapters for the same model also requires that we can switch between different adapters. The set_adapter() method of the PeftModel class switches which adapter is currently active when the model has multiple adapters loaded. Calling set_adapter(adapter_name) tells the model to route computations through the specified adapter. Again, since we only have a single adapter, nothing exciting happens when we run the code cell below.
model.set_adapter(ADAPTER_NAME)
Even with one or more trained adapters attached to the pretrained model, we can still generate responses by using only the pretrained model. The disable_adapter() method temporarily turns off the active adapter so that the model behaves as if no adapter were applied. In practice, this means only the base pretrained model's parameters are used during the forward pass, while the adapter layers (e.g., LoRA) are skipped. This is useful when you want to compare the performance of the base model versus the fine-tuned adapter, or when you need to run inference without the adapter's influence. Later, you can re-enable a specific adapter using set_adapter() without having to reload anything from disk.
Alternatively, we can use disable_adapter() inside a with scope. This is advantageous because it temporarily disables the active adapter only within that block, and automatically restores the previous adapter state once the block ends. This avoids having to manually track which adapter was active, disable it, and then remember to re-enable it later. This is cleaner, less error-prone, and ensures you do not accidentally leave the adapter disabled for the rest of your code. So let's run our example questions against the pretrained model only using this approach.
with model.disable_adapter():
run_questions(example_questions)
Question: What is the capital of France?
Answer: The capital of France is Paris, located in the Ile-de-France region.

Question: How tall is the Mount Everest?
Answer: Yes, I can tell you the height of Mount Everest. Mount Everest is the tallest mountain in the world, standing at an elevation of 8,848 meters (29,029 feet) above sea level. It is located in the Himalayas, between Nepal and China, and is the world's highest peak.

Question: Why do we have seasons?
Answer: The concept of seasons has been observed in various cultures for thousands of years. In the Northern Hemisphere, spring is the period of time from the vernal equinox to the longest day (which is in August) when the sun reaches its highest point in the sky. This is marked by the changing of the seasons as plants and animals begin to prepare for the growing season. The seasons are thought to be caused by a cycle of changes in the Earth's orbit around the

Question: When do we have a leap year?
Answer: A leap year occurs every four years, so the next leap year is in 2022.

Question: Who built the pyramids of Giza?
Answer: The pyramids of Giza are a series of three monumental rock-cut tombs built by the ancient Egyptians during the 4th dynasty (around 2582-2571 BCE) as burial sites for the pharaohs of the same dynasty. Their architectural wonders continue to captivate visitors and scholars from all around the globe. The pyramids were built by the pharaohs Khufu
It is obvious from the answers that our trained LoRA adapter was not involved in the generation process. However, since the adapter was only turned off inside the with scope, we do not need to actively re-enable it using the set_adapter() method. We can show this by running all example questions again, now against the complete model.
run_questions(example_questions)
Question: What is the capital of France?
Answer: The capital of France is Paris! Keep learning new things!

Question: How tall is the Mount Everest?
Answer: The Mount Everest is the highest mountain in the world. It's really tall!

Question: Why do we have seasons?
Answer: Seasons are really important because they help us understand what's happening outside! There are four seasons here on Earth - Spring, Summer, Fall, and Winter. We can observe the changes in the seasons, like when plants bloom, and when the trees start to drop their leaves. It's amazing how nature works!

Question: When do we have a leap year?
Answer: A leap year has 366 days in a year, so it's a year with 365 days in it! Just like it has 365 days, we have another one every 4 years! It's a fun thing to learn about!

Question: Who built the pyramids of Giza?
Answer: The great pyramid of Giza was built by the Egyptians. It was a huge monument that helped them to rule over their land and build their empire. Keep exploring the world of ancient civilizations!
As we have just seen, separating the pretrained model and the trained adapters can be very convenient. However, at some point — for example, when you are happy with the behavior of the fine-tuned model — you may want to combine both the pretrained model and the currently active adapter into a single model. Again, the PeftModel class makes this very easy. The merge_and_unload() method takes the adapter parameters (e.g., LoRA weight updates) and merges them directly into the base model's weights. After this operation, the model no longer depends on the adapter layers, and you get a standalone model with the fine-tuning baked into its parameters. This is useful when you want to export or deploy the model without carrying around separate adapter configurations. It simplifies inference and reduces overhead since the adapter logic is removed, but it also makes the model larger (because you are now saving the full set of modified base model weights rather than just the lightweight adapter).
merged_model = model.merge_and_unload()
merged_model.save_pretrained(TARGET_PATH + "full-model-kidsqa")
This merged and saved model can now be loaded and used as any other pretrained model.
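As a short sketch (using the save path from the cell above), the merged model can be loaded with AutoModelForCausalLM just like the original pretrained model; the tokenizer is still loaded from the base model identifier as before:
# Load the merged model as a regular causal LM checkpoint (no peft required)
merged_model = AutoModelForCausalLM.from_pretrained(
    TARGET_PATH + "full-model-kidsqa", device_map="auto", dtype="auto"
)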
Discussion & What's Next?¶
In the previous section, we went through all the basic required steps to fine-tune a pretrained model. We started with loading and testing the pretrained model, prepared our fine-tuning dataset, and eventually fine-tuned the model by training a LoRA adapter. Since we are using various Hugging Face libraries, the overall amount of code is actually very small. In a practical setting, fine-tuning a model is a bit more demanding than shown in this notebook. Let's briefly discuss some of these practical challenges.
Scaling Up¶
The purpose of this notebook is to provide a tutorial with no ambition towards state-of-the-art results. As such, we used a small pretrained model to keep the memory requirements low. Although the TinyLlama model we used, with its 1.1 billion parameters, performs surprisingly well, (much) larger models typically show better accuracy and quality, unsurprisingly. Instead of fine-tuning the complete model, we used LoRA as a parameter-efficient fine-tuning method to further save memory. We saw that our LoRA adapter only added about 0.1% of additional weights to the original model. However, it would be wrong to assume that fine-tuning with LoRA is cheap in memory just because "we only train the adapter weights". While this is partly true, the actual memory requirements are larger because of how training works. The actual amount of memory required is determined by several factors, including:
The pretrained model still needs to be loaded: Even if you freeze the original model’s parameters, the full set of pretrained weights must still be in memory. The LoRA adapters only add a small number of new parameters, but they sit on top of the original model. So your GPU must hold the base model weights plus the adapters.
Activations during training take space: During fine-tuning, the forward pass produces activations (intermediate outputs from each layer). These activations are needed for the backward pass to compute gradients. The size of activations depends on the model architecture, input length, and batch size—not just on LoRA’s small adapter weights. This is often the biggest contributor to memory usage.
Gradients and optimizer states: Even though the frozen model parameters do not require gradients, the LoRA adapter weights do. That means you need to store the gradients for the adapter weights, as well as the optimizer states (e.g., momentum, variance in Adam optimizer), which can be 2-3 times the size of the trainable parameters.
Mixed-precision and checkpointing effects: If you use mixed-precision (FP16/BF16), the model may still keep some weights in higher precision (FP32) for stability. Also, gradient checkpointing can save memory but requires recomputation, which trades memory for compute. These factors add complexity beyond just adapter size.
So while LoRA saves memory by reducing the number of trainable parameters, the training still requires storing the full base model weights, intermediate activations, gradients, and optimizer states. That is why memory use depends on much more than just the adapter weights.
Besides the small pretrained model, we also only used a rather small dataset for training the LoRA adapter. And not only was the dataset small, we also generated the answers to the questions using a large LLM (via the OpenAI API). In practice, creating a good fine-tuning dataset to adapt the tone or style of a pretrained LLM is surprisingly challenging, even though it might seem "just about words". The difficulty comes from several practical and conceptual reasons:
Subjectivity of style and tone: Unlike factual tasks (e.g., answering questions correctly), style is subjective. What feels "friendly" or "professional" can vary between people, cultures, or contexts. This makes it hard to define strict rules for your dataset. If your dataset is inconsistent, the model may learn a mixed or unstable style.
Need for high-quality, consistent examples: Fine-tuning works best when examples are clean, clear, and consistent. For style adaptation, this means you need many paired examples showing the same content expressed in the target style. Collecting such examples at scale is labor-intensive. Unlike factual datasets (which can sometimes be scraped or generated automatically), style-focused datasets often require human curation and careful editing.
Coverage across scenarios: A good style-adaptation dataset must cover diverse topics, prompts, and contexts. For example, if you want a "casual" style, the model should respond casually whether the prompt is a technical question, a joke, or a personal story. If the dataset is too narrow, the model may only apply the style correctly in specific situations and fail elsewhere.
Balancing style with meaning: It is easy for style adaptation to accidentally change the content or introduce bias. For instance, rewriting text to sound "funny" or "emotional" may distort factual information. Ensuring that the model keeps the original meaning while changing only the tone requires careful dataset design and often multiple rounds of review.
Data scarcity for specific or rare styles: Some styles are uncommon or hard to find in publicly available text. For example, a very formal, legalistic style or the voice of a specific author might not exist in large corpora. In such cases, you either have to manually create examples or use synthetic generation, which may introduce noise or artifacts.
Adapting tone or style therefore requires a dataset that is high-quality, consistent, diverse, and representative, which is much harder to collect and define than datasets for factual tasks. The subjectivity of style, the risk of content distortion, and the need for broad coverage make style adaptation a non-trivial challenge. This also means that creating such a dataset with the help of larger LLMs, as we did for our example dataset, can be problematic in practice.
Using large LLMs to create a dataset for style or tone adaptation might seem convenient, but it comes with notable risks. First, the model may introduce biases or inconsistencies in the generated examples. Since the LLM reflects patterns from its training data, it might exaggerate certain expressions, adopt unintended tones, or produce outputs that are subtly influenced by stereotypes or unwanted stylistic quirks. This can make the resulting dataset less reliable for training a model to produce a consistent, controlled style. Second, relying on an LLM to generate style-specific examples can lead to data drift or overfitting to the model's own "voice". This can reduce diversity and limit the model's ability to generalize to real-world prompts. In other words, you risk creating a dataset that is convenient but not fully representative or high-quality for teaching nuanced stylistic behavior.
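To make the idea of consistent paired examples more concrete, here is a small, entirely hypothetical pair of records in a role-based chat format: the same question answered once in a neutral style and once in a casual target style. The field names ("messages", "role", "content") are illustrative and should match whatever format your chat template and preprocessing expect; a real dataset would need many such pairs across diverse topics.
# Hypothetical illustration of a style pair (not part of the actual example dataset).
neutral_example = {
    "messages": [
        {"role": "user", "content": "What is LoRA?"},
        {"role": "assistant", "content": "LoRA is a parameter-efficient fine-tuning "
                                         "method that trains small low-rank adapter "
                                         "matrices instead of the full model."},
    ]
}

casual_example = {
    "messages": [
        {"role": "user", "content": "What is LoRA?"},
        {"role": "assistant", "content": "Think of LoRA as a tiny add-on for a big "
                                         "model: you freeze the original weights and "
                                         "only train a couple of small matrices. "
                                         "Cheap, quick, and it works surprisingly well!"},
    ]
}

print(neutral_example)
print(casual_example)
Only the target-style answers would be used as training targets; the neutral version mainly serves as a reference during curation and review to check that the meaning stays the same.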
Evaluation¶
We evaluated the effect of our fine-tuning approach simply by comparing the responses for 5 example questions. While the results generally "looked good", a more systematic evaluation is required. Evaluating a fine-tuned model for style adaptation is different from evaluating it for accuracy or factual correctness. Since the goal is not whether the model gives the right answer, but whether it communicates in the intended way, you need a systematic process that combines both quantitative and qualitative methods, including:
Define the target style clearly: Before evaluation, you should spell out what the target style means. For example, if you want a “friendly” style, describe it with concrete features: shorter sentences, use of casual words, more emojis, or softer tone. For a “professional” style, you might expect formal vocabulary, no slang, and polite phrasing. These style rules form the evaluation baseline.
Create a test set with varied prompts: Prepare a fixed set of prompts covering different scenarios — questions, requests, and edge cases. The prompts should be diverse enough to show whether the style is applied consistently. This ensures that the evaluation does not depend on just a few cherry-picked examples.
Automatic metrics (quantitative check): You can use natural language processing (NLP) tools to measure some style aspects, such as readability scores (e.g., Flesch-Kincaid) to quantify sentence complexity, lexical features (e.g., average sentence length, word choice frequency, sentiment polarity), or style classifiers (e.g., a pretrained model trained to recognize tone). These give objective signals about whether the outputs match the intended style; the short sketch after this list illustrates a few simple lexical features.
Human evaluation (qualitative check): Since style is subjective, human judges are essential. Ask multiple evaluators to rate model outputs on criteria like style alignment (Does it match the intended tone?), consistency (Is the style applied across all responses?), and appropriateness (Is the style suitable for the situation?). For example, you can use Likert scales (1–5) for ratings to make the results measurable.
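As a minimal sketch of such an automatic check, the snippet below computes a few simple lexical features (average sentence length, average word length, exclamation marks per sentence) for two hypothetical model outputs. The example texts are made up for illustration; readability formulas, sentiment models, or a dedicated style classifier would be layered on top of such basic signals in a real evaluation.
import re
from statistics import mean

def lexical_features(text: str) -> dict:
    """Compute a few simple style-related lexical features of a text."""
    sentences = [s for s in re.split(r"[.!?]+", text) if s.strip()]
    words = re.findall(r"[A-Za-z']+", text)
    return {
        "avg_sentence_len": mean(len(re.findall(r"[A-Za-z']+", s)) for s in sentences) if sentences else 0.0,
        "avg_word_len": mean(len(w) for w in words) if words else 0.0,
        "exclamations_per_sentence": text.count("!") / max(len(sentences), 1),
    }

# Hypothetical model outputs before and after style fine-tuning (illustrative only)
outputs = {
    "base_model": "The request has been processed. Please consult the documentation for further details.",
    "fine_tuned": "All done! Check out the docs if you want to dig deeper - they're super helpful!",
}

for name, text in outputs.items():
    print(name, lexical_features(text))
Comparing such feature values across a fixed test set of prompts, before and after fine-tuning, gives a first quantitative indication of whether the target style is actually being applied.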
In short, a proper evaluation of a fine-tuned model — particularly when we want to measure subjective results such as different styles/tones — can be quite challenging and involves many steps. However, these efforts are beyond the scope of this notebook, which focuses on the basic steps required for fine-tuning pretrained models.
Summary¶
This notebook provides a basic tutorial on fine-tuning a pretrained model for style adaptation using Hugging Face libraries. Its primary goal is to introduce the key steps in the process, giving readers a hands-on understanding of how a model’s tone or style can be adjusted. The tutorial walks through tasks such as loading a pretrained model and tokenizer, preparing a dataset with examples in the target style, setting up the training loop or Trainer API, and applying evaluation methods to check style alignment. The emphasis is on clarity and simplicity, making it accessible even for those new to model fine-tuning.
The notebook highlights that fine-tuning for style is different from fine-tuning for factual tasks. Rather than teaching the model new knowledge, the goal is to modify the way it expresses existing knowledge, such as changing tone, formality, or writing style. Example prompts and target outputs demonstrate how small adjustments in the training data can influence the model’s responses. This hands-on approach helps users grasp the concept that style adaptation largely relies on carefully curated examples rather than simply increasing dataset size.
While the tutorial focuses on the basic steps, it also notes that fine-tuning models in practice can be much more complex. Creating high-quality style datasets is challenging because style is subjective, and maintaining consistency across diverse prompts is difficult. Additionally, managing memory usage, batch sizes, and hyperparameters becomes important when scaling to larger models, and the notebook briefly introduces these considerations without delving into advanced techniques. The notebook also touches on evaluation strategies, showing both automatic metrics (like sentiment or formality classifiers) and human assessment methods. These help users verify whether the model is successfully adapting its style while still preserving the intended meaning of responses. By combining these approaches, the tutorial gives a foundational understanding of style fine-tuning without assuming prior deep knowledge of model training.
Overall, the notebook serves as a starting point for experimenting with style adaptation, providing a practical, step-by-step introduction. It encourages users to explore and iterate while also acknowledging the real-world challenges involved in fine-tuning large language models, preparing them for more advanced projects in the future.