"""
SchoolSpirit AI – minimal public chatbot Space
---------------------------------------------
• Loads Meta’s Llama‑3 3 B‑Instruct (fits HF CPU Space).
• Uses Hugging Face transformers + Gradio; no external deps.
• Keeps prompt short and trims history to fit the model context.
• Gracefully handles model‑load or inference errors.
"""
import gradio as gr
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
from transformers.utils import logging as hf_logging
hf_logging.set_verbosity_error() # keep Space logs clean
MODEL_ID = "meta-llama/Llama-3.2-3B-Instruct"
MAX_TURNS = 6     # retain only the last N exchanges
MAX_TOKENS = 220  # cap on newly generated tokens per reply
SYSTEM_MSG = (
    "You are SchoolSpirit AI, the friendly digital mascot for a company that "
    "provides on-prem AI chat mascots, fine-tuning services, and turnkey GPU "
    "hardware for schools. Keep answers concise, upbeat, and age-appropriate. "
    "If you don't know, say so and suggest contacting a human. Never request "
    "personal data."
)

# ---------------- Model ------------------------------------------------------
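# Note (an assumption about the deployment, not part of the original code):
# meta-llama checkpoints are gated on the Hugging Face Hub, so loading them in
# a Space generally requires the owner to have accepted Meta's license and to
# expose a suitably permissioned HF token to the Space.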
try:
    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
    model = AutoModelForCausalLM.from_pretrained(
        MODEL_ID,
        device_map="auto",   # auto-detect CPU / GPU if available
        torch_dtype="auto",
    )
    gen = pipeline(
        "text-generation",
        model=model,
        tokenizer=tokenizer,
        max_new_tokens=MAX_TOKENS,
        do_sample=True,
        temperature=0.7,
        return_full_text=False,  # return only the new tokens, not the prompt
    )
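    # Optional warm-up (a sketch, left commented out): a one-token generation
    # at startup would surface weight-download or dtype problems immediately,
    # rather than on the first user message.
    # gen("Hello", max_new_tokens=1)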
except Exception as e:  # noqa: BLE001
    # Fatal startup failure: expose the error in the UI. Capture the message
    # now, because Python clears the exception variable when the except block
    # ends, so the callback below must not reference `e` directly.
    error_msg = f"Model load error: {e}"

    def chat(message, history):  # gr.ChatInterface signature: (message, history)
        return error_msg
else:
    # ---------------- Chat handler -------------------------------------------
    def chat(message, history):
        """Gradio ChatInterface callback: takes the new user message plus the
        (user, assistant) history and returns the assistant's reply."""
        # Trim history to the last N exchanges so the prompt stays small
        history = history[-MAX_TURNS:]
        # Build a plain-text prompt from the system message and history
        prompt = SYSTEM_MSG + "\n"
        for user, assistant in history:
            prompt += f"User: {user}\nAI: {assistant}\n"
        prompt += f"User: {message}\nAI:"
        # Generate
        try:
            reply = gen(prompt)[0]["generated_text"].strip()
            # Drop any hallucinated follow-up turns the model may append
            reply = reply.split("User:", 1)[0].strip()
        except Exception as err:  # noqa: BLE001
            hf_logging.get_logger("SchoolSpirit").error(str(err))
            reply = "Sorry, something went wrong. Please try again later."
        return reply
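
# A more idiomatic alternative (a sketch, not wired in): Llama 3.2 Instruct
# ships a chat template, so the tokenizer can render the turns itself instead
# of the hand-rolled "User:/AI:" format above, e.g.:
#
#   messages = [{"role": "system", "content": SYSTEM_MSG}]
#   for user, assistant in history:
#       messages += [{"role": "user", "content": user},
#                    {"role": "assistant", "content": assistant}]
#   messages.append({"role": "user", "content": message})
#   prompt = tokenizer.apply_chat_template(
#       messages, tokenize=False, add_generation_prompt=True
#   )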
# ---------------- UI ---------------------------------------------------------
gr.ChatInterface(
    chat,
    title="SchoolSpirit AI Chat",
    theme=gr.themes.Soft(primary_hue="blue"),  # light-blue chat UI
).launch()