Spaces:

sufian7755
/

NEW-Ai

Sleeping

sufian7755 committed 8 days ago

Commit

3338976

verified ·

1 Parent(s): 92eaa32

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,25 +1,27 @@
 import gradio as gr
-from transformers import AutoTokenizer, AutoModelForCausalLM
-# Load DeepSeek-R1 model
-model_name = "deepseek-ai/DeepSeek-R1"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name)
-# Chat function
 def chat_with_ai(prompt):
-    inputs = tokenizer(prompt, return_tensors="pt")
-    outputs = model.generate(**inputs, max_new_tokens=250)
-    response = tokenizer.decode(outputs[0], skip_special_tokens=True)
-    return response
-# Gradio UI
 ui = gr.Interface(
     fn=chat_with_ai,
-    inputs=gr.Textbox(label="Ask me anything..."),
     outputs="text",
-    title="💬 DeepSeek-R1 AI",
-    description="Chat with your own DeepSeek-R1 model hosted on Hugging Face Cloud!"
 )
 ui.launch()

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+# ✅ Smaller DeepSeek model that runs on CPU
+model_name = "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B"
+# Load tokenizer & model
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto")
+# Create a text generation pipeline
+chatbot = pipeline("text-generation", model=model, tokenizer=tokenizer)
 def chat_with_ai(prompt):
+    """Generate a reply to ``prompt`` with the module-level ``chatbot`` pipeline.
+
+    Args:
+        prompt: Text entered by the user in the Gradio textbox.
+
+    Returns:
+        Only the newly generated text (the prompt is not echoed back).
+        A blank or whitespace-only prompt yields an empty string without
+        invoking the model.
+    """
+    # Nothing to generate from: do not call the model for blank input.
+    if not prompt or not prompt.strip():
+        return ""
+    response = chatbot(
+        prompt,
+        max_new_tokens=200,
+        do_sample=True,
+        temperature=0.7,
+        # The pipeline returns prompt + completion by default; ask for the
+        # completion alone so the UI shows just the answer.
+        return_full_text=False,
+    )
+    return response[0]["generated_text"]
+# Gradio interface
 ui = gr.Interface(
     fn=chat_with_ai,
+    inputs=gr.Textbox(label="Ask DeepSeek something..."),
     outputs="text",
+    title="🤖 DeepSeek-R1 (Distilled Version)",
+    description="Chat with the smaller DeepSeek-R1 that runs even without a GPU!"
 )
 ui.launch()