princemaxp committed on
Commit
2a46434
·
verified ·
1 Parent(s): 7344869

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +36 -6
app.py CHANGED
@@ -1,21 +1,46 @@
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 
 
 
3
 
4
- # Load model & tokenizer
 
 
 
 
 
 
 
 
 
 
 
5
  model_id = "google/gemma-2b-it"
6
  tokenizer = AutoTokenizer.from_pretrained(model_id)
7
  model = AutoModelForCausalLM.from_pretrained(model_id)
8
 
9
- # Create pipeline
10
- generator = pipeline("text-generation", model=model, tokenizer=tokenizer, device=-1)
 
 
 
 
11
 
12
- # System instruction
13
  SYSTEM_PROMPT = """You are Guardian AI, a friendly cybersecurity educator.
14
  Your goal is to explain cybersecurity concepts in simple, engaging language with examples.
15
  Always keep answers clear, short, and focused on security awareness.
16
  """
17
 
18
- # Chat function
 
 
 
 
 
 
 
19
  def chat(history, user_input):
20
  prompt = SYSTEM_PROMPT + "\nUser: " + user_input + "\nGuardian AI:"
21
  result = generator(
@@ -28,13 +53,18 @@ def chat(history, user_input):
28
 
29
  response = result.split("Guardian AI:")[-1].strip()
30
  history.append((user_input, response))
 
 
 
 
31
  return history, history
32
 
33
- # Gradio UI
34
  with gr.Blocks() as demo:
35
  gr.Markdown("## 🛡️ Guardian AI – Cybersecurity Educator")
36
  chatbot = gr.Chatbot()
37
  state = gr.State([])
 
38
  with gr.Row():
39
  with gr.Column(scale=8):
40
  user_input = gr.Textbox(show_label=False, placeholder="Ask me about cybersecurity...")
 
import os

import gradio as gr
from datasets import Dataset, concatenate_datasets, load_dataset
from huggingface_hub import login
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
6
 
7
# --- Hugging Face Dataset Setup ---
# The write token is stored as a secret named "dataset_HF_TOKEN" in the Space
# settings. Only log in when it is actually present; login(token=None) would
# fail (or fall back to an interactive prompt) on a headless Space.
HF_TOKEN = os.environ.get("dataset_HF_TOKEN")
if HF_TOKEN:
    login(token=HF_TOKEN)

dataset_name = "YOUR_USERNAME/guardian-ai-qna"  # Replace YOUR_USERNAME

try:
    # Request the "train" split explicitly so `dataset` is a Dataset, matching
    # the type of the empty fallback below (plain load_dataset() would return
    # a DatasetDict and break later concatenation).
    dataset = load_dataset(dataset_name, split="train")
except Exception:
    # Dataset not created yet, empty, or unreachable: start from an empty
    # local dataset with the same schema. Narrow bare `except:` to Exception
    # so Ctrl-C / SystemExit still propagate.
    dataset = Dataset.from_dict({"question": [], "answer": []})
17
+
18
# --- Load model & tokenizer ---
# Downloads (or reads from cache) the instruction-tuned Gemma 2B checkpoint.
# NOTE(review): gated model — the Space must have accepted the Gemma license
# and hold a valid HF token, or this load will fail. TODO confirm.
model_id = "google/gemma-2b-it"
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id)

# Text-generation pipeline used by chat() below.
generator = pipeline(
    "text-generation",
    model=model,
    tokenizer=tokenizer,
    device=-1  # CPU, change to 0 if GPU available
)
29
 
30
# --- System instruction ---
# Prepended verbatim to every user turn in chat(); the model's reply is
# whatever follows the final "Guardian AI:" marker in the generated text.
SYSTEM_PROMPT = """You are Guardian AI, a friendly cybersecurity educator.
Your goal is to explain cybersecurity concepts in simple, engaging language with examples.
Always keep answers clear, short, and focused on security awareness.
"""
35
 
36
# --- Save Q&A to dataset ---
def save_qna(question, answer):
    """Append one question/answer pair to the shared dataset and push it to the Hub.

    Rebinds the module-level `dataset` to the grown Dataset. Every call performs
    a network push; acceptable for a low-traffic demo Space.
    """
    global dataset
    new_entry = Dataset.from_dict({"question": [question], "answer": [answer]})
    # If `dataset` came back from load_dataset() as a DatasetDict, unwrap the
    # "train" split so both operands of the concat are plain Datasets.
    base = dataset if isinstance(dataset, Dataset) else dataset["train"]
    # Bug fix: Dataset has no `.concat` method — the datasets API is the
    # module-level `concatenate_datasets` helper.
    dataset = concatenate_datasets([base, new_entry])
    dataset.push_to_hub(dataset_name, private=False)  # push updates
42
+
43
+ # --- Chat function ---
44
  def chat(history, user_input):
45
  prompt = SYSTEM_PROMPT + "\nUser: " + user_input + "\nGuardian AI:"
46
  result = generator(
 
53
 
54
  response = result.split("Guardian AI:")[-1].strip()
55
  history.append((user_input, response))
56
+
57
+ # Save to dataset
58
+ save_qna(user_input, response)
59
+
60
  return history, history
61
 
62
+ # --- Gradio UI ---
63
  with gr.Blocks() as demo:
64
  gr.Markdown("## 🛡️ Guardian AI – Cybersecurity Educator")
65
  chatbot = gr.Chatbot()
66
  state = gr.State([])
67
+
68
  with gr.Row():
69
  with gr.Column(scale=8):
70
  user_input = gr.Textbox(show_label=False, placeholder="Ask me about cybersecurity...")