Update app.py
app.py
CHANGED
@@ -6,23 +6,33 @@ import numpy as np
 from sentence_transformers import SentenceTransformer
 from sklearn.metrics.pairwise import cosine_similarity

-#
-
-openai.api_key = os.getenv("OPENAI_API_KEY")
+# OpenAI API key (Hugging Face Secrets)
+openai.api_key = os.getenv("OPENAI_API_KEY", "")

-#
-#
-model = SentenceTransformer(
+# =============== 0) Model / df setup ===============
+# SentenceTransformer
+model = SentenceTransformer('jhgan/ko-sroberta-multitask')

-#
-df = pd.read_csv(
+# Load the mental-health chatbot CSV
+df = pd.read_csv('https://raw.githubusercontent.com/kairess/mental-health-chatbot/master/wellness_dataset_original.csv')
 df = df.dropna()
-
+# Drop the Unnamed column
+if 'Unnamed: 3' in df.columns:
+    df = df.drop(columns=['Unnamed: 3'])

-#
-
+# Embedding column
+df['embedding'] = df['유저'].map(lambda x: model.encode(str(x)))
+
+# ============== 1) Parameters / prompts ==============
+MAX_TURN = 5  # maximum number of Socratic questions
+
+def set_openai_model():
+    """
+    'gpt-4o' instead of GPT-4 (a model name that may not actually exist)
+    => in practice, replacing it with 'gpt-3.5-turbo' or similar is recommended
+    """
+    return "gpt-4o"

-# ===== Prompts =====
 EMPATHY_PROMPT = """\
 당신은 친절한 정신의학과 전문의이며 심리상담 전문가입니다.
 사용자의 문장을 거의 그대로 요약하되, 끝에 '는군요.' 같은 공감 어미를 붙여 자연스럽게 응답하세요.
@@ -59,24 +69,10 @@ ADVICE_PROMPT = """\
 조언:
 """

-def set_openai_model():
-    """
-    Return the 'gpt-4o' model name, as the user requested
-    (quite possibly it does not actually exist)
-    """
-    return "gpt-4o"
-
-# ===== Functions =====
-
-def kb_search(user_input: str) -> str:
-    """Embed with SentenceTransformer, then fetch the most similar chatbot answer from df."""
-    emb = model.encode(user_input)
-    df["sim"] = df["embedding"].map(lambda e: cosine_similarity([emb],[e]).squeeze())
-    idx = df["sim"].idxmax()
-    return df.loc[idx, "챗봇"]
+# ============== 2) OpenAI call functions ==============

 def call_empathy(user_input: str) -> str:
-    """
+    """ Generate an empathic summary """
     prompt = EMPATHY_PROMPT.format(sentence=user_input)
     resp = openai.ChatCompletion.create(
         model=set_openai_model(),
@@ -90,7 +86,7 @@ def call_empathy(user_input: str) -> str:
     return resp.choices[0].message.content.strip()

 def call_socratic_question(context: str) -> str:
-    """
+    """ Generate a one-sentence Socratic follow-up question """
     prompt = f"{SOCRATIC_PROMPT}\n\n대화 힌트:\n{context}"
     resp = openai.ChatCompletion.create(
         model=set_openai_model(),
@@ -104,7 +100,7 @@ def call_socratic_question(context: str) -> str:
     return resp.choices[0].message.content.strip()

 def call_advice(hints: str) -> str:
-    """
+    """ Final CBT advice """
     final_prompt = ADVICE_PROMPT.format(hints=hints)
     resp = openai.ChatCompletion.create(
         model=set_openai_model(),
@@ -117,8 +113,8 @@ def call_advice(hints: str) -> str:
     )
     return resp.choices[0].message.content.strip()

+# ============== 3) predict function: EMPATHY→SQ→ADVICE ==============
 def predict(user_input: str, state: dict):
-    """Gradio callback: Socratic CBT chatbot flow (EMPATHY→SQ→ADVICE)."""
     history = state.get("history", [])
     stage = state.get("stage", "EMPATHY")
     turn = state.get("turn", 0)
@@ -127,11 +123,20 @@ def predict(user_input: str, state: dict):
     # 1) Record the user utterance
     history.append(("User", user_input))

-    # 2)
-    kb_answer = kb_search(user_input)
+    # 2) Similarity computation → df['챗봇']
+    query_emb = model.encode(user_input)
+    df["sim"] = df["embedding"].map(lambda emb: cosine_similarity([query_emb],[emb]).squeeze())
+
+    # Prevent idxmax() errors: handle an empty df or all-NaN sim values
+    if df["sim"].count() == 0:
+        # fallback: e.g. just a "the knowledge base is empty" style message
+        kb_answer = "적합한 지식베이스 응답을 찾지 못했어요."
+    else:
+        kb_answer = df.loc[df["sim"].idxmax(), "챗봇"]
+
     hints.append(f"[KB] {kb_answer}")

-    # 3)
+    # 3) Branch by stage
     if stage == "EMPATHY":
         empathic = call_empathy(user_input)
         history.append(("Chatbot", empathic))
@@ -141,7 +146,7 @@ def predict(user_input: str, state: dict):
         return history, {"history": history, "stage": stage, "turn": turn, "hints": hints}

     if stage == "SQ" and turn < MAX_TURN:
-        # Full conversation + hints
+        # Full conversation + hints → Socratic question
         context_text = "\n".join([f"{r}: {c}" for (r,c) in history]) + "\n" + "\n".join(hints)
         sq = call_socratic_question(context_text)
         history.append(("Chatbot", sq))
@@ -150,50 +155,50 @@ def predict(user_input: str, state: dict):
         return history, {"history": history, "stage": stage, "turn": turn, "hints": hints}

     # ADVICE stage
-    stage = "
+    stage = "END"
     combined_hints = "\n".join(hints)
     advice = call_advice(combined_hints)
     history.append(("Chatbot", advice))
-
+
     return history, {"history":history, "stage":stage, "turn":turn, "hints":hints}

+# ============== 4) Gradio UI ==============
 def gradio_predict(user_input, chat_state):
-    """Gradio
+    """Gradio callback"""
     new_history, new_state = predict(user_input, chat_state)
-
-    #
+
+    # Gradio Chatbot expects list of [user, bot] pairs
     display_history = []
     for (role, txt) in new_history:
         if role == "User":
-            display_history.append([txt, ""])
-        else:
-            if
+            display_history.append([txt, ""])  # user in left
+        else:
+            if len(display_history)==0:
                 display_history.append(["", txt])
-            elif display_history[-1][1] == "":
-                display_history[-1][1] = txt
             else:
-                display_history
+                display_history[-1][1] = txt  # bot in right
+
     return display_history, new_state

 def create_app():
-    """Compose the Gradio Blocks UI."""
     with gr.Blocks() as demo:
-        gr.Markdown("##
+        gr.Markdown("## 다중턴 소크라테스 CBT 챗봇")

-        chatbot = gr.Chatbot(label="
+        chatbot = gr.Chatbot(label="CBT Chatbot")
         chat_state = gr.State({
             "history": [],
             "stage":"EMPATHY",
             "turn":0,
             "hints":[]
         })
-        txt = gr.Textbox(show_label=False, placeholder="
+        txt = gr.Textbox(show_label=False, placeholder="뭐든 물어보세요")

-
+        # submit
+        txt.submit(fn=gradio_predict, inputs=[txt, chat_state], outputs=[chatbot, chat_state])
     return demo

 app = create_app()

 if __name__ == "__main__":
-    #
+    # Actual deployment / run
     app.launch(debug=True, share=True)
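
The new set_openai_model() docstring itself flags that the hard-coded "gpt-4o" name may not be available and suggests "gpt-3.5-turbo" instead. A minimal sketch of that suggestion (not part of this commit), assuming the legacy openai<1.0 ChatCompletion interface that app.py already uses; the helper name chat_with_fallback and its error handling are illustrative only:

    import openai

    def chat_with_fallback(messages, primary="gpt-4o", fallback="gpt-3.5-turbo"):
        """Try the preferred model first; retry once with the fallback if the request is rejected."""
        try:
            resp = openai.ChatCompletion.create(model=primary, messages=messages)
        except openai.error.InvalidRequestError:
            # primary model name rejected by the API; retry with a model known to exist
            resp = openai.ChatCompletion.create(model=fallback, messages=messages)
        return resp.choices[0].message.content.strip()

    # usage sketch: advice = chat_with_fallback([{"role": "user", "content": final_prompt}])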