In [2]:
import tensorflow as tf

# List available GPUs
gpus = tf.config.experimental.list_physical_devices('GPU')
if gpus:
    print(f"GPUs detected: {gpus}")
    # Optionally, set memory growth to prevent TensorFlow from allocating all GPU memory
    for gpu in gpus:
        tf.config.experimental.set_memory_growth(gpu, True)
else:
    print("No GPUs detected.")


GPUs detected: [PhysicalDevice(name='/physical_device:GPU:0', device_type='GPU')]


In [6]:
# Use a pipeline as a high-level helper
from transformers import pipeline

messages = [
    {"role": "user", "content": "Who are you?"},
]
pipe = pipeline("text-generation", model="deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B")
pipe(messages)

Device set to use cuda:0


[{'generated_text': [{'role': 'user', 'content': 'Who are you?'},
   {'role': 'assistant',
    'content': "Greetings! I'm DeepSeek-R1, an artificial intelligence assistant created by DeepSeek. I'm"}]}]

In [21]:
from transformers import pipeline, AutoModelForCausalLM, PreTrainedTokenizerFast

# Load tokenizer from local file
tokenizer = PreTrainedTokenizerFast(tokenizer_file="Bitnet B1 Tokenizer.json")

# Load model from Hugging Face
model = AutoModelForCausalLM.from_pretrained("1bitLLM/bitnet_b1_58-large", trust_remote_code=True)
model.to('cuda')

# Create the text generation pipeline with both model and tokenizer
pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)

# Define input messages in plain text (since `pipeline` expects raw strings, not message objects)
user_input = "Who are you?"

inputs = tokenizer(user_input, return_tensors="pt")
inputs = {key: value.to('cuda') for key, value in inputs.items()}

# Generate a response
output = model.generate(
    inputs['input_ids'],
    max_length=50,
    temperature=0.7,
    top_k=50,
    top_p=0.9
)


# Print the result
print(output)


Device set to use cuda:0


tensor([[    1,  3575,  1881,  1426,  1244, 29889, 29889, 29889, 29889, 29889,
         29889, 29871, 29871, 29889, 29871, 29871, 29871, 29871, 29871, 29871,
         29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871,
         29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871,
         29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871, 29871]],
       device='cuda:0')
