In [24]:
from transformers import AutoModelForCausalLM, AutoTokenizer
from transformers import pipeline

import torch

# Checkpoint to load and the device the model weights are placed on.
model_id = "meta-llama/Llama-3.2-1B-Instruct"
device = "cpu"

# padding_side="left" makes the tokenizer insert padding in front of the
# shorter prompts when a batch is padded.
tokenizer = AutoTokenizer.from_pretrained(
    model_id,
    padding_side="left",
)
# Reuse the end-of-sequence token as the padding token.
tokenizer.pad_token = tokenizer.eos_token

# Load the causal language model in bfloat16 onto `device`.
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,
    device_map=device,
)

In [5]:
# Wrap the already-loaded model and tokenizer in a text-generation pipeline.
generation_pipeline = pipeline(
    "text-generation",
    model=model,
    tokenizer=tokenizer,
)

# No generation arguments are given here, so the pipeline's defaults apply.
# Kept as the bare last expression so the notebook displays the result.
generation_pipeline("Hello How are you?")

Device set to use cpu
Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


[{'generated_text': "Hello How are you? I am 20 years old. I have been working in a restaurant for a couple of years. I am an independent contractor and I don't have any direct supervision or support from the restaurant. I am responsible for managing my own schedule, ordering food, and interacting with customers.\n\nI am not sure if I am doing enough to improve my skills and grow professionally in this role. I feel like I need to step up my game to get ahead in this industry. I am interested in learning new skills and taking on more responsibility. I am not sure how to get started.\n\nWhat advice would you give to a young professional like myself who is just starting out in the food service industry? Here are some of the challenges I am facing:\n\n* Lack of direct supervision and support\n* Limited access to training and resources\n* Limited opportunities for advancement and professional development\n* High stress levels and pressure to perform\n\nWhat advice would you give to someone 

In [7]:
# A list of prompts yields one list of generations per prompt;
# max_new_tokens is the generation-length argument applied to each of them.
generation_pipeline(
    ["Hello, how are you?", "What is the capital of India?"],
    max_new_tokens=25,
)

Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


[[{'generated_text': "Hello, how are you? I'm doing great, thanks for asking!\n\nYou know what's even better than being great? Being able to ask great questions"}],
 [{'generated_text': 'What is the capital of India? New Delhi.\nNew Delhi is the capital city of India and is also the seat of the Indian government. It is located in'}]]

In [14]:
input_prompt = "Hello How are you"

# Default call: the encoding holds plain Python lists.
print(tokenizer(input_prompt))

# Same prompt, but asking for PyTorch tensors; this is the encoding kept
# in `tokenized` afterwards.
tokenized = tokenizer(input_prompt, return_tensors="pt")
print(tokenized)

# Shape of the id tensor for this single prompt.
print(tokenized["input_ids"].shape)

{'input_ids': [128000, 9906, 2650, 527, 499], 'attention_mask': [1, 1, 1, 1, 1]}
{'input_ids': tensor([[128000,   9906,   2650,    527,    499]]), 'attention_mask': tensor([[1, 1, 1, 1, 1]])}
torch.Size([1, 5])


In [19]:
# Tokenize progressively longer prefixes of one sentence and print each
# encoding on its own line, to see how the ids grow word by word.
for prefix in ("hello", "hello how", "hello how are", "hello how are you"):
    print(tokenizer(prefix))

{'input_ids': [128000, 15339], 'attention_mask': [1, 1]}
{'input_ids': [128000, 15339, 1268], 'attention_mask': [1, 1, 1]}
{'input_ids': [128000, 15339, 1268, 527], 'attention_mask': [1, 1, 1, 1]}
{'input_ids': [128000, 15339, 1268, 527, 499], 'attention_mask': [1, 1, 1, 1, 1]}


In [36]:
input_prompt = ["Hello How are you", "Something new is going on"]

# padding=True pads the batch to a common length so that both prompts can be
# returned together as PyTorch tensors.
tokenized = tokenizer(
    input_prompt,
    padding=True,
    return_tensors="pt",
)
print(tokenized)

{'input_ids': tensor([[128009, 128000,   9906,   2650,    527,    499],
        [128000,  23958,    502,    374,   2133,    389]]), 'attention_mask': tensor([[0, 1, 1, 1, 1, 1],
        [1, 1, 1, 1, 1, 1]])}


In [31]:
# Decode token ids one at a time and print the text piece for each.
for token_id in (23958, 502, 374, 2133, 389):
    print(tokenizer.decode(token_id))

Something
 new
 is
 going
 on


In [43]:
# NOTE(review): relies on `tokenized` left behind by an earlier cell —
# presumably the padded two-prompt batch; confirm on a fresh kernel run.

# Turn every row of ids back into text, special tokens included.
print(tokenizer.batch_decode(tokenized["input_ids"]))

# List the fields of the encoding, then print the mask and the ids.
print(tokenized.keys())
for field in ("attention_mask", "input_ids"):
    print(tokenized[field])

['<|eot_id|><|begin_of_text|>Hello How are you', '<|begin_of_text|>Something new is going on']
dict_keys(['input_ids', 'attention_mask'])
tensor([[0, 1, 1, 1, 1, 1],
        [1, 1, 1, 1, 1, 1]])
tensor([[128009, 128000,   9906,   2650,    527,    499],
        [128000,  23958,    502,    374,   2133,    389]])
