kshama/llama-3.2.py
2025-06-29 20:49:04 +06:00

27 lines
590 B
Python

import time

# Start the clock before the third-party imports so the reported elapsed time
# covers importing torch/transformers as well as building the pipeline and
# generating. perf_counter() is a monotonic clock intended for measuring
# intervals; unlike time.time(), it is not affected by system clock changes.
begin_time = time.perf_counter()

import torch
from transformers import pipeline

model_id = "meta-llama/Llama-3.2-1B-Instruct"

# Build a text-generation pipeline for the model, passing bfloat16 as the
# torch dtype and device_map="auto".
pipe = pipeline(
    "text-generation",
    model=model_id,
    torch_dtype=torch.bfloat16,
    device_map="auto",
)

# Chat-style prompt: one system instruction followed by a single user turn.
messages = [
    {"role": "system", "content": "You are a pirate chatbot who always responds in pirate speak!"},
    {"role": "user", "content": "Who are you?"},
]

# Run generation on the conversation, capped at 256 newly generated tokens.
outputs = pipe(
    messages,
    max_new_tokens=256,
)

print(f"Time elapsed: {time.perf_counter() - begin_time:.2f} seconds")
# NOTE(review): the raw pipeline result is printed as-is. A previously
# commented-out alternative, outputs[0]["generated_text"][-1], presumably
# selects only the final message of the conversation -- confirm against the
# transformers pipeline output format before switching to it.
print(outputs)