# In [None]:
# Import necessary libraries
from transformers import AutoModelForCausalLM, AutoTokenizer

# Filesystem locations of the local QwenCoder model and its tokenizer.
# Both values are placeholders and must be edited before running this code.
model_path = "<path_to_your_qwencoder_model>"  # Replace with your local model path
tokenizer_path = "<path_to_your_qwencoder_tokenizer>"  # Replace with your tokenizer path

# Load the tokenizer from tokenizer_path; the module-level name `tokenizer`
# is read by generate_response() below.
tokenizer = AutoTokenizer.from_pretrained(tokenizer_path)

# Load the causal language model from model_path; the module-level name
# `model` is read by generate_response() below.
model = AutoModelForCausalLM.from_pretrained(model_path)

# Define a function to generate responses from QwenCoder
def generate_response(system_prompt: str, user_prompt: str, max_length: int = 512) -> str:
    """
    Generate a response using QwenCoder.

    The two prompts are combined into a single plain-text prompt of the form
    ``System: ...\\nUser: ...\\nAssistant:`` and passed to the module-level
    ``model`` after tokenization with the module-level ``tokenizer``.

    Args:
        system_prompt (str): The system prompt providing instructions or context.
        user_prompt (str): The user input or query.
        max_length (int): Maximum number of tokens to generate for the
            response. The prompt tokens do not count against this budget.

    Returns:
        str: The generated response, with the prompt removed and surrounding
        whitespace stripped.
    """
    # Combine system prompt and user prompt.
    # NOTE(review): instruction-tuned checkpoints often ship a chat template
    # (tokenizer.apply_chat_template); the plain-text format is kept here to
    # preserve existing behavior -- confirm which format this model expects.
    full_prompt = f"System: {system_prompt}\nUser: {user_prompt}\nAssistant:"

    # Tokenize the input
    inputs = tokenizer(full_prompt, return_tensors="pt", truncation=True)
    prompt_token_count = inputs["input_ids"].shape[-1]

    # Generate response. `max_new_tokens` bounds only the generated part;
    # `max_length` would also count the prompt tokens, so a long prompt could
    # leave little or no room for the response.
    outputs = model.generate(
        **inputs,
        max_new_tokens=max_length,
        pad_token_id=tokenizer.eos_token_id,
    )

    # A causal LM returns the prompt tokens followed by the continuation.
    # Slice the prompt off by token count rather than splitting the decoded
    # text on "Assistant:", which would drop part of the response whenever
    # the generated text itself contains that marker.
    generated_tokens = outputs[0][prompt_token_count:]
    return tokenizer.decode(generated_tokens, skip_special_tokens=True).strip()

# Demo: ask the model one question and print its reply.
system_prompt = "You are a highly knowledgeable and friendly assistant."
user_prompt = "Can you explain how QwenCoder works?"
response = generate_response(
    system_prompt=system_prompt,
    user_prompt=user_prompt,
)
print("Assistant:", response)