In [29]:
from transformers import AutoTokenizer, AutoModelForCausalLM

# Local path where model was downloaded or saved
model_path = "./qwen_model_14B"

# Load tokenizer
tokenizer = AutoTokenizer.from_pretrained(
    model_path, 
    trust_remote_code=True,
    padding=True,
    truncation=True
)

# Load model to GPU (automatically maps layers to available device)
reloaded_model = AutoModelForCausalLM.from_pretrained(
    model_path,
    device_map="auto",         # Automatically use GPU if available
    torch_dtype="auto",        # Load using model's preferred dtype (e.g. fp16)
    trust_remote_code=True     # Needed for Qwen and some custom models
)

input_text = "What is the capital of France and tell me about it in 100 words?"
input_ids = tokenizer.encode(input_text, return_tensors="pt").to(model.device)
output_from_reloaded = reloaded_model.generate(
    input_ids, 
    max_new_tokens=5000,
    pad_token_id=tokenizer.eos_token_id  # ensure this is set
)
# print(output_from_reloaded)
print(tokenizer.decode(output_from_reloaded[0], skip_special_tokens=True))

Loading checkpoint shards: 100%|██████████| 8/8 [00:02<00:00,  2.71it/s]
Some parameters are on the meta device because they were offloaded to the cpu.


What is the capital of France and tell me about it in 100 words? The capital of France is Paris. It is a city known for its rich history, culture, and architecture. Paris is home to many famous landmarks such as the Eiffel Tower, the Louvre Museum, and Notre-Dame Cathedral. The city is also known for its fashion, cuisine, and art. Paris is a popular tourist destination and attracts millions of visitors each year. The city is divided into 20 arrondissements, each with its own unique character and attractions. Paris is a vibrant and bustling city that offers something for everyone.


In [1]:
from transformers import AutoTokenizer, AutoModelForCausalLM

# Local path where model was downloaded or saved
model_path = "./qwen_model_7B"

# Load model to GPU (automatically maps layers to available device)
model_7B = AutoModelForCausalLM.from_pretrained(
    model_path,
    device_map="auto",         # Automatically use GPU if available
    torch_dtype="auto",        # Load using model's preferred dtype (e.g. fp16)
    trust_remote_code=True     # Needed for Qwen and some custom models
)
# Load tokenizer
tokenizer = AutoTokenizer.from_pretrained(
    model_path, 
    trust_remote_code=True,
    padding=True,
    truncation=True
)

input_text = "What is the capital of France and tell me about it in 100 words?"
input_ids = tokenizer.encode(input_text, return_tensors="pt").to(model_7B.device)
output_from_7B = model_7B.generate(
    input_ids, 
    max_new_tokens=5000,
    pad_token_id=tokenizer.eos_token_id  # ensure this is set
)
print(tokenizer.decode(output_from_7B[0], skip_special_tokens=True))

  from .autonotebook import tqdm as notebook_tqdm
2025-07-17 16:42:52.308279: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:467] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
E0000 00:00:1752770572.330736    5334 cuda_dnn.cc:8579] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
E0000 00:00:1752770572.338124    5334 cuda_blas.cc:1407] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
W0000 00:00:1752770572.359641    5334 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.
W0000 00:00:1752770572.359667    5334 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.
W0000 00:00:1752770572.359672    5334

What is the capital of France and tell me about it in 100 words? The capital of France is Paris. It is a city of 2.1 million people and is located in the north of the country. Paris is known for its beautiful architecture, museums, and art galleries. It is also famous for its fashion, food, and nightlife. The city is home to many famous landmarks such as the Eiffel Tower, the Louvre Museum, and Notre-Dame Cathedral. Paris is a popular tourist destination and attracts millions of visitors each year. The city is also a center for business and finance, with many international companies having their headquarters there. Overall, Paris is a vibrant and exciting city that offers something for everyone.


In [2]:
input_text_2 = "What is the capital of Pakistan and tell me about it in 100 words?"
input_ids_2 = tokenizer.encode(input_text_2, return_tensors="pt").to(model_7B.device)

output_from_7B_2 = model_7B.generate(
    input_ids_2, 
    max_new_tokens=100,
    pad_token_id=tokenizer.eos_token_id  # ensure this is set
)
# print(output_from_reloaded)
print(tokenizer.decode(output_from_7B_2[0], skip_special_tokens=True))

What is the capital of Pakistan and tell me about it in 100 words? The capital of Pakistan is Islamabad. It is a planned city located in the northwestern part of the country, in the Islamabad district. It was established in 1960 as the capital of Pakistan and was designed by a team of architects from around the world. Islamabad is known for its modern architecture, green spaces, and its location in the heart of the country. It is home to many important government buildings, including the Parliament House, the Supreme Court of Pakistan, and the President's House


In [None]:
import json
train_filename = '../dstc8-schema-guided-dialogue/train/dialogues_052.json'

import os
import json
import pandas as pd

folder_path = "../dstc8-schema-guided-dialogue/train"
from itertools import chain

hotel_dialogs = []
services = []
rows = []

def create_intent_and_slot_dataframe(df):
    for filename in os.listdir(folder_path):
        file_path = os.path.join(folder_path, filename)
        if os.path.isfile(file_path) and 'dialogues_052' in file_path:
            # print("Found file:", file_path)
            with open(file_path) as f:
                dialogues = json.load(f)
            for dialog in dialogues:
                dialogue_id = dialog["dialogue_id"]
                services = dialog.get("services", [])
                for turn_idx, turn in enumerate(dialog["turns"]):
                    rows.append({
                        "dialogue_id": dialogue_id,
                        "turn_index": turn_idx,
                        "speaker": turn["speaker"],
                        "utterance": turn["utterance"],
                        "services": services,
                        "frames": turn.get("frames", []),
                        "acts": [action.get("act", "") for f in turn.get("frames", []) for action in f.get("actions", [])],
                        "slots": [action.get("slot", "") for f in turn.get("frames", []) for action in f.get("actions", [])],
                        "active_intent": [frame.get("state", {}).get("active_intent", "") for frame in turn.get("frames", [])],
                    })
    return pd.DataFrame(rows)

def serialize_dialogue(df):
    ret = ""
    for _, row in df.iterrows():
        # print(row)
        ret += (f"{row['speaker']} : {row['utterance']} active_intent: {row['active_intent']} acts: {row['acts']} \n")
    return ret

def get_dialogue_with_id(df, dialogue_id):
    return df[df["dialogue_id"] == dialogue_id]

def get_hotel_only_dialogues(df):
    hotel_rows = df[df["services"].apply(lambda x: "Hotels" in x) & df["services"].apply(lambda x: len(x) == 1)]
    return hotel_rows


df = create_intent_and_slot_dataframe(folder_path)
print(df.head())








  dialogue_id  turn_index speaker  \
0    52_00000           0    USER   
1    52_00000           1  SYSTEM   
2    52_00000           2    USER   
3    52_00000           3  SYSTEM   
4    52_00000           4    USER   

                                           utterance  \
0                    Please reserve this car for me.   
1  Where would you like to pick it up? And at whi...   
2  I want to pick it up from Vancouver Airport at...   
3  Which dates would you like the car reserved? W...   
4  I want a standard on this Sunday until March 9th.   

                   services  \
0  [RentalCars_1, Hotels_3]   
1  [RentalCars_1, Hotels_3]   
2  [RentalCars_1, Hotels_3]   
3  [RentalCars_1, Hotels_3]   
4  [RentalCars_1, Hotels_3]   

                                              frames  \
0  [{'actions': [{'act': 'INFORM_INTENT', 'canoni...   
1  [{'actions': [{'act': 'REQUEST', 'canonical_va...   
2  [{'actions': [{'act': 'INFORM', 'canonical_val...   
3  [{'actions': [{'act': 'REQ

In [None]:

print(serialize_dialogue(get_dialogue_with_id(df, "52_00000")))

# unique_ids = df["dialogue_id"].unique()
# unique_hotel_ids = hotel_rows['dialogue_id'].unique()

# # print("Number of rows with 'Hotels_1' in services:", count, len(df), count/len(df))
# print(f"unique_ids {len(unique_ids)} unique_hotel_ids {len(unique_hotel_ids)} multi_service: {len(multi_service['dialogue_id'].unique())} {len(example_multi_service)}")
# print(serialize_dialogue(example_multi_service))

USER : Please reserve this car for me. active_intent: ['ReserveCar'] acts: [('INFORM_INTENT', 'intent')] 
SYSTEM : Where would you like to pick it up? And at which time? active_intent: [''] acts: [('REQUEST', 'pickup_location'), ('REQUEST', 'pickup_time')] 
USER : I want to pick it up from Vancouver Airport at one pm please. active_intent: ['ReserveCar'] acts: [('INFORM', 'pickup_location'), ('INFORM', 'pickup_time')] 
SYSTEM : Which dates would you like the car reserved? What type do you prefer? active_intent: [''] acts: [('REQUEST', 'dropoff_date'), ('REQUEST', 'pickup_date'), ('REQUEST', 'type')] 
USER : I want a standard on this Sunday until March 9th. active_intent: ['ReserveCar'] acts: [('INFORM', 'type'), ('INFORM', 'pickup_date'), ('INFORM', 'dropoff_date')] 
SYSTEM : You want a standard at YVR International Airport from march 3rd at 1 pm through march 9th. active_intent: [''] acts: [('CONFIRM', 'pickup_location'), ('CONFIRM', 'pickup_date'), ('CONFIRM', 'pickup_time'), ('CONFI