new_gradio_space / train.py
broadfield-dev's picture
Initial Space setup of broadfield-dev/new_gradio_space via Builder
b882201 verified
raw
history blame contribute delete
476 Bytes
# Import necessary libraries
import torch
import json
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
from model import TranslationModel
# Script body: fetch a pre-trained seq2seq checkpoint, hand it to the
# project's TranslationModel for training, then write the result to disk.

# Checkpoint identifier used for both the model and its tokenizer.
BASE_CHECKPOINT = "t5-small"
# Path handed to TranslationModel.save() once training has finished.
OUTPUT_PATH = "custom_model.pth"

# The model and tokenizer come from the same checkpoint so that they match.
model = AutoModelForSeq2SeqLM.from_pretrained(BASE_CHECKPOINT)
tokenizer = AutoTokenizer.from_pretrained(BASE_CHECKPOINT)

# TranslationModel is defined in the project's model.py (not shown here).
custom_model = TranslationModel()

# NOTE(review): presumably train() runs the training loop using the
# pre-trained model and tokenizer; its contract lives in model.py -- confirm.
custom_model.train(model, tokenizer)

# Persist the trained custom model.
custom_model.save(OUTPUT_PATH)