arabic-gov-copilot / init_model.py
HemanM's picture
Update init_model.py
b663f38 verified
raw
history blame contribute delete
323 Bytes
from transformers import AutoTokenizer, AutoModel
# AraBERT v2 checkpoint id; the tokenizer and the base model both come from it.
_ARABERT_CHECKPOINT = "aubmindlab/bert-base-arabertv2"

# Both objects are built once, at import time, and kept as module-level names.
tokenizer = AutoTokenizer.from_pretrained(_ARABERT_CHECKPOINT)
base_model = AutoModel.from_pretrained(_ARABERT_CHECKPOINT)
def get_tokenizer():
    """Return the module-level ``tokenizer`` object.

    The same object is returned on every call; nothing is loaded or
    copied here.
    """
    return tokenizer
def get_base_model():
    """Return the module-level ``base_model`` object.

    The same object is returned on every call; nothing is loaded or
    copied here.
    """
    return base_model