GAIA-Agent

Sleeping

Essi committed on Jun 2

Commit

2f99f18

1 Parent(s): 315ed41

perf: enhance search functionality and update prompt guidelines for clarity

Files changed (3) hide show

app.py CHANGED Viewed

@@ -138,12 +138,14 @@ def gather_context(state: AgentState) -> AgentState:
         if matched_obj:
             url = matched_obj[0]
             state["context"] = youtube_transcript.invoke({"url": url})
-    else:  # general
-        print("[TOOL] general")
         search_json = web_multi_search.invoke({"query": question})
         wiki_text = wiki_search.invoke({"query": question})
         state["context"] = f"{search_json}\n\n{wiki_text}"
     return state

         if matched_obj:
             url = matched_obj[0]
             state["context"] = youtube_transcript.invoke({"url": url})
+    elif label == "search":
+        print("[TOOL] web search")
         search_json = web_multi_search.invoke({"query": question})
         wiki_text = wiki_search.invoke({"query": question})
         state["context"] = f"{search_json}\n\n{wiki_text}"
+    else:
+        print("[TOOL] reasoning only (no search)")
+        state["context"] = ""
     return state

prompts.yaml CHANGED Viewed

@@ -8,13 +8,19 @@ router: |
   Guidelines
   ----------
-  • **math**: the question is a pure arithmetic/numeric expression.
-  • **youtube**: the question contains a YouTube URL and asks about its content.
-  • **code**: the task references attached Python code; caller wants its output.
-  • **excel**: the task references an attached .xlsx/.xls/.csv and asks for a sum, average, etc.
-  • **audio**: the task references an attached audio file and asks for its transcript or facts in it.
-  • **image**: the task could be either generic like "what is in the picture (e.g. Which animal is shown?) or could be a puzzle like asking for a *move, count, coordinate,* or other board-game tactic that needs an exact piece layout (e.g. "What is Black's winning move?").
-  • **general**: anything else (fallback).
   ~~~
   User question:
@@ -46,8 +52,8 @@ excel_system: |
   Context
   -------
-  • A full DataFrame named `df` is already loaded.
-  • Only the preview below is shown for reference; use column names from it.
   Preview
   -------

   Guidelines
   ----------
+  - **math**: the question is a pure arithmetic/numeric expression.
+  - **youtube**: the question contains a YouTube URL and asks about its content.
+  - **code**: the task references attached Python code; caller wants its output.
+  - **excel**: the task references an attached .xlsx/.xls/.csv and asks for a sum, average, etc.
+  - **audio**: the task references an attached audio file and asks for its transcript or facts in it.
+  - **image**: the task could be either generic, like "What is in the picture?" (e.g. "Which animal is shown?"), or a puzzle asking for a *move, count, coordinate,* or other board-game tactic that needs an exact piece layout (e.g. "What is Black's winning move?").
+  - **search**: the question needs external factual information from the web.
+  - **reason**: the answer can be produced by analyzing the question text alone.
+  Examples
+  ----------
+  (search) What is the last name of the person who founded Mercedes Benz company?
+  (reason) What is the third item of the following list that is a fruit after sorting it alphabetically: ['parsley', 'orange', 'apple', 'coriander', 'lettuce', 'kiwi', 'apricot']? Answer is 'kiwi'
   ~~~
   User question:
   Context
   -------
+  - A full DataFrame named `df` is already loaded.
+  - Only the preview below is shown for reference; use column names from it.
   Preview
   -------

tools.py CHANGED Viewed

@@ -87,17 +87,22 @@ def web_multi_search(query: str, k: int = 6) -> str:
         pass
     try:
-        tavily_hits = TavilySearchResults(max_results=k).invoke(query=query)
         print(
-            f"[TOOL] TAVILY search is triggered with following response: {tavily_hits}"
         )
         formatted = [
             {
-                "title": d.metadata.get("title", "")[:500],
-                "snippet": d.page_content[:750],
-                "link": d.metadata.get("source", "")[:300],
             }
-            for d in tavily_hits
         ]
         return json.dumps(formatted, ensure_ascii=False)
     except Exception as exc:

         pass
     try:
+        tavily_results = TavilySearchResults(
+            max_results=5,
+            # include_answer=True,
+            # search_depth="advanced",
+        )
+        search_result = tavily_results.invoke({"query": query})
         print(
+            f"[TOOL] TAVILY search is triggered with following response: {search_result}"
         )
         formatted = [
             {
+                "title": d.get("title", "")[:500],
+                "snippet": d.get("content", "")[:750],
+                "link": d.get("url", "")[:300],
             }
+            for d in search_result
         ]
         return json.dumps(formatted, ensure_ascii=False)
     except Exception as exc: