|
|
|
|
|
from transformers import AutoTokenizer, AutoModelForSequenceClassification |
|
import torch |
|
from typing import Optional |
|
from pathlib import Path |
|
|
|
|
|
# Hugging Face model id of the text-classification checkpoint used by this module.
_MODEL_NAME = "monsimas/ModernBERT-ecoRouter"

# Load the tokenizer and model once at import time so every predict_label()
# call reuses the same instances. Load failures are re-raised as RuntimeError
# with the original exception chained (`from e`) so the underlying cause
# (network error, missing files, version mismatch, ...) stays in the traceback.
try:
    _TOKENIZER = AutoTokenizer.from_pretrained(_MODEL_NAME)
except Exception as e:
    raise RuntimeError(f"Failed to load tokenizer from {_MODEL_NAME}: {e}") from e

try:
    _MODEL = AutoModelForSequenceClassification.from_pretrained(_MODEL_NAME)
    # Inference-only module: switch to eval mode (disables dropout etc.).
    _MODEL.eval()
except Exception as e:
    raise RuntimeError(f"Failed to load model from {_MODEL_NAME}: {e}") from e
|
|
|
|
|
def predict_label(
    text: str,
    tokenizer: "Optional[AutoTokenizer]" = None,
    model: "Optional[AutoModelForSequenceClassification]" = None,
) -> str:
    """Classify a single string and return the predicted label.

    Args:
        text: The input text to classify.
        tokenizer: Optional tokenizer instance; defaults to the module-level tokenizer.
        model: Optional model instance; defaults to the module-level model.

    Returns:
        The name of the predicted class (as per ``model.config.id2label``).

    Raises:
        ValueError: If the model's config has no ``id2label`` mapping.
    """
    # Explicit `is None` checks: the previous `tokenizer or _TOKENIZER` form
    # would silently discard any caller-supplied object that happens to be
    # falsy (truthiness of HF objects is not part of their contract).
    tok = _TOKENIZER if tokenizer is None else tokenizer
    mdl = _MODEL if model is None else model

    # Validate the label mapping *before* running inference so that a
    # misconfigured model fails fast instead of after a wasted forward pass.
    id2label = getattr(mdl.config, "id2label", None)
    if not id2label:
        raise ValueError("Model config does not contain an id2label mapping.")

    # Batch of one; padding/truncation keep the input within model limits.
    inputs = tok([text], padding=True, truncation=True, return_tensors="pt")

    # Inference only: skip autograd bookkeeping.
    with torch.no_grad():
        outputs = mdl(**inputs)

    # argmax over the class dimension of the single-row logits tensor.
    pred_id = torch.argmax(outputs.logits, dim=-1).item()
    return id2label[pred_id]
|
|
|
""" |
|
# Example usage |
|
if __name__ == "__main__": |
|
sample = "This is an example sentence to classify." |
|
label = predict_label(sample) |
|
print(f"Input: {sample}\nPredicted label: {label}") |
|
|
|
""" |