In [None]:
# STEP 1: Install necessary libraries (if not already installed)
!pip install --upgrade bitsandbytes
!pip install --upgrade transformers accelerate

# STEP 2: Import required modules
from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
import torch

# STEP 3: Hugging Face Hub id of the checkpoint to load (DeepSeek LLM 7B, base variant)
model_name = "deepseek-ai/deepseek-llm-7b-base"

# STEP 4: Ask bitsandbytes to load the model weights in 8-bit precision
quant_config = BitsAndBytesConfig(load_in_8bit=True)

# STEP 5: Load the tokenizer, then the quantized model.
# The load options are gathered in one mapping so they are easy to tweak:
#   - quantization_config: the 8-bit settings built in STEP 4
#   - torch_dtype: float16 requested for the model's torch dtype
#   - device_map="auto": leave device placement to the library
load_kwargs = {
    "quantization_config": quant_config,
    "torch_dtype": torch.float16,
    "device_map": "auto",
}
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name, **load_kwargs)

# STEP 6: Translate using a completion-style prompt.
# The base model is not instruction-tuned, so the prompt ends with "French:"
# and the model is left to continue the text.
prompt = "Translate to French:\nEnglish: Hello, how are you?\nFrench:"

# Keep the whole tokenizer output (not just input_ids) so the attention mask
# is forwarded to generate() along with the token ids.
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
input_ids = inputs["input_ids"]

output = model.generate(
    **inputs,
    # Budget for the continuation only; max_length would also count the
    # prompt tokens and shrink the answer as the prompt grows.
    max_new_tokens=40,
    # temperature only takes effect when sampling is enabled; without
    # do_sample=True decoding is greedy and the temperature is ignored.
    do_sample=True,
    temperature=0.7,
)

# output[0] holds the prompt tokens followed by the generated continuation.
print(tokenizer.decode(output[0], skip_special_tokens=True))
