# Web-page header captured along with the file (not part of the script):
# llama_v2_or / inference.py
# Ranjit's picture
# Create inference.py
# 5f2a34c
# raw
# history blame contribute delete
# 946 Bytes
"""Run one text-generation pass with the Ranjit/llama_v2_or checkpoint.

The script tokenizes the prompt in ``text``, generates up to 1024 new tokens
on the first CUDA device when one is available (CPU otherwise), and prints
the decoded sequence with special tokens stripped.
"""
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Hub identifier shared by the tokenizer and the model so they cannot drift.
MODEL_ID = "Ranjit/llama_v2_or"

# Specify input
text = "ଓଡ଼ିଶାରେ କେଉଁ ପ୍ରକାରର ଜଙ୍ଗଲ ରହିଛି?"

# Specify device
use_cuda = torch.cuda.is_available()
device = torch.device("cuda:0" if use_cuda else "cpu")
# float16 is only used on GPU: on CPU, half-precision kernels are slow and,
# depending on the PyTorch build, may be missing, so fall back to float32.
dtype = torch.float16 if use_cuda else torch.float32

# Load model and tokenizer
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
# NOTE(review): trust_remote_code=True lets transformers execute Python code
# shipped in the model repository. It is kept to preserve loading behaviour;
# confirm whether this checkpoint actually needs it and drop it if not.
model = AutoModelForCausalLM.from_pretrained(
    MODEL_ID,
    trust_remote_code=True,
    torch_dtype=dtype,
).to(device)

# Tokenize input
inputs = tokenizer(text, return_tensors="pt").to(device)

# Generate output; no_grad avoids building an autograd graph during inference.
with torch.no_grad():
    outputs = model.generate(
        input_ids=inputs["input_ids"],
        attention_mask=inputs["attention_mask"],
        max_new_tokens=1024,
        # The EOS id is passed as the padding id for generation.
        pad_token_id=tokenizer.eos_token_id,
    )

# Decode and print
print(tokenizer.decode(outputs[0], skip_special_tokens=True))