Training Using Google Colab

In [None]:
# ✅ Step 1: Install dependencies
!pip install -q transformers datasets accelerate

In [None]:
# ✅ Step 2: Check GPU availability
import torch

# Pick CUDA when PyTorch reports it as available; otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

print("Using device:", device)

In [None]:
# Authenticate with the Hugging Face Hub.
import os

from huggingface_hub import login

# Do NOT paste the access token into this cell: notebooks are saved and shared
# together with their source, which would leak the credential.
# The token is read from the HF_TOKEN environment variable when it is set;
# otherwise `token=None` makes `login` prompt for it interactively.
login(token=os.environ.get("HF_TOKEN"))

In [None]:
# ✅ Step 3: Load tokenizer and model
from transformers import AutoModelForCausalLM, AutoTokenizer

model_name = "meta-llama/Llama-3.2-1B"

# Fast tokenizer for the checkpoint; the EOS token is reused as the pad token
# (original author's note: LLaMA needs a pad token).
tokenizer = AutoTokenizer.from_pretrained(model_name, use_fast=True)
tokenizer.pad_token = tokenizer.eos_token

# Half precision when a CUDA device is available, full precision otherwise.
# Relies on `torch` having been imported by an earlier cell.
if torch.cuda.is_available():
    weights_dtype = torch.float16
else:
    weights_dtype = torch.float32

model = AutoModelForCausalLM.from_pretrained(
    model_name,
    torch_dtype=weights_dtype,
    device_map="auto",
)

In [None]:
# Delete the Hugging Face datasets cache directory under the current user's home,
# recursively and without prompting (`-rf`).
# NOTE(review): presumably here to force a fresh dataset load — confirm it is still
# needed, since this cell is destructive and runs on every "Run All".
!rm -rf ~/.cache/huggingface/datasets


In [None]:
import json
from datasets import Dataset

# Settings for this step, kept together so they are easy to find and tune.
DATASET_PATH = "/content/medical_dataset_llama3_format.json"
TEST_FRACTION = 0.2
SPLIT_SEED = 42  # fixed seed so the train/test split is identical on every run

# Load JSON file manually. JSON is UTF-8 by specification, so the encoding is
# stated explicitly instead of relying on the platform default.
with open(DATASET_PATH, encoding="utf-8") as f:
    data = json.load(f)

# Convert to Hugging Face Dataset.
# Assumes the JSON root is a list of record dicts (what Dataset.from_list takes) —
# TODO confirm against the file.
full_dataset = Dataset.from_list(data)

# Train/test split; `dataset` ends up holding the "train" and "test" splits.
dataset = full_dataset.train_test_split(test_size=TEST_FRACTION, seed=SPLIT_SEED)

# View a sample
print(dataset["train"][0])
