Essi committed
Commit ce76bed · 1 Parent(s): 21394c0

feat: add prompt retrieval functionality and new Excel analysis prompt template

Files changed (4)
  1. .pre-commit-config.yaml +3 -2
  2. helpers.py +15 -4
  3. prompts.yaml +22 -0
  4. tools.py +34 -24
.pre-commit-config.yaml CHANGED
@@ -1,19 +1,20 @@
 repos:
   # ── FORMATTERS ─────────────────────────────────────────────────────────────
   - repo: https://github.com/astral-sh/ruff-pre-commit
-    rev: v0.11.11
+    rev: v0.11.12
     hooks:
       - id: ruff-check
       - id: ruff-format
   # ── STATIC ANALYSIS ────────────────────────────────────────────────────────
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v1.15.0
+    rev: v1.16.0
     hooks:
       - id: mypy
         additional_dependencies:
           - "pydantic==1.10.*"
           - "types-requests"
           - "mypy-extensions"
+          - "types-PyYAML"
   # ── SECRET / KEY DETECTORS ─────────────────────────────────────────────────
   - repo: https://github.com/pre-commit/pre-commit-hooks
     rev: v5.0.0
helpers.py CHANGED
@@ -1,8 +1,14 @@
 import csv
-import io
-import zipfile
+from io import BytesIO
+from pathlib import Path
+from zipfile import BadZipFile, ZipFile
 
 import requests
+from yaml import safe_load
+
+CURRENT_DIR = Path(__file__).parent
+
+_PROMPTS = safe_load(CURRENT_DIR.joinpath("prompts.yaml").read_text())
 
 
 def fetch_task_file(api_url: str, task_id: str) -> tuple[bytes, str]:
@@ -29,11 +35,11 @@ def sniff_excel_type(blob: bytes) -> str:
     # 1️⃣ XLSX / XLSM / ODS (ZIP container)
     if blob[:4] == b"PK\x03\x04":
         try:
-            with zipfile.ZipFile(io.BytesIO(blob)) as zf:
+            with ZipFile(BytesIO(blob)) as zf:
                 names = set(zf.namelist())
                 if {"xl/workbook.xml", "[Content_Types].xml"} & names:
                     return "xlsx"
-        except zipfile.BadZipFile:
+        except BadZipFile:
             pass  # fall through
 
     # 2️⃣ Legacy XLS (OLE Compound File)
@@ -52,3 +58,8 @@ def sniff_excel_type(blob: bytes) -> str:
         pass
 
     return ""
+
+
+def get_prompt(prompt_key: str, **kwargs: str) -> str:
+    """Get a prompt by key and fill in placeholders via `.format(**kwargs)`."""
+    return _PROMPTS[prompt_key].format(**kwargs)
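With this commit, prompt templates live in prompts.yaml next to helpers.py and are looked up by key: get_prompt parses the YAML once at import time and fills the {placeholders} with str.format. A minimal usage sketch, assuming the module layout above; the preview value and question text are made up for illustration:

from helpers import get_prompt

# Both placeholders of the template must be supplied, otherwise str.format raises KeyError.
prompt = get_prompt(
    "excel_analysis_one_liner",
    preview={"Item": ["Burger", "Fries"], "Sales": [12.5, 4.0]},  # hypothetical preview
    question="What is the total of the Sales column?",            # hypothetical question
)
print(prompt)  # rendered template, ready to send to the LLM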
prompts.yaml ADDED
@@ -0,0 +1,22 @@
+excel_analysis_one_liner: |
+  You are a **pandas one-liner generator**.
+
+  Context
+  -------
+  • A full DataFrame named `df` is already loaded.
+  • Only the preview below is shown for reference; use column names from it.
+
+  Preview
+  -------
+  {preview}
+
+  Formatting rules
+  ----------------
+  1. Result must be a plain Python scalar (use .item(), float(), int() …).
+  2. If the question asks for currency / 2 decimals → wrap in an f-string.
+  3. If the question asks for a count → wrap in int().
+  4. Return **one** expression, nothing else.
+
+  Question
+  --------
+  {question}
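The formatting rules steer the model toward a single expression that evaluates to a plain Python scalar. A sketch of the kind of one-liner the template is meant to elicit, against a hypothetical DataFrame with Item and Sales columns:

import pandas as pd

df = pd.DataFrame({"Item": ["Burger", "Fries", "Soda"], "Sales": [12.5, 4.0, 2.0]})  # hypothetical data

# "What were total Sales in dollars, to 2 decimals?" → rule 2: wrap in an f-string
f"${df['Sales'].sum():.2f}"   # → "$18.50"

# "How many items sold for more than 3?" → rule 3: wrap in int()
int((df["Sales"] > 3).sum())  # → 2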
tools.py CHANGED
@@ -8,15 +8,18 @@ from functools import lru_cache
 from io import BytesIO
 from tempfile import NamedTemporaryFile
 
+import numpy as np
+import pandas as pd
 from langchain_community.document_loaders import WikipediaLoader
 from langchain_community.tools.tavily_search import TavilySearchResults
 from langchain_community.utilities import DuckDuckGoSearchAPIWrapper
 from langchain_core.messages import HumanMessage, SystemMessage
 from langchain_core.tools import tool
 from langchain_openai import ChatOpenAI
-from transformers import pipeline
 from youtube_transcript_api import YouTubeTranscriptApi
 
+from helpers import get_prompt
+
 # --------------------------------------------------------------------------- #
 #                         ARITHMETIC (SAFE CALCULATOR)                         #
 # --------------------------------------------------------------------------- #
@@ -57,8 +60,6 @@ def calculator(expression: str) -> str:
 # --------------------------------------------------------------------------- #
 #                              WEB & WIKI SEARCH                               #
 # --------------------------------------------------------------------------- #
-
-
 @lru_cache(maxsize=256)
 def _ddg_search(query: str, k: int = 6) -> list[dict[str, str]]:
     """Cached DuckDuckGo JSON search."""
@@ -114,8 +115,6 @@ def wiki_search(query: str, max_pages: int = 2) -> str:
 # --------------------------------------------------------------------------- #
 #                              YOUTUBE TRANSCRIPT                              #
 # --------------------------------------------------------------------------- #
-
-
 @tool
 def youtube_transcript(url: str, chars: int = 10_000) -> str:
     """Fetch full YouTube transcript (first *chars* characters)."""
@@ -137,10 +136,9 @@ def youtube_transcript(url: str, chars: int = 10_000) -> str:
 # Instantiate a lightweight CLIP-based zero-shot image classifier (runs on CPU)
 ### The model 'openai/clip-vit-base-patch32' is a vision transformer (ViT) model trained as part of OpenAI's CLIP project.
 ### It performs zero-shot image classification by mapping images and labels into the same embedding space.
-_image_pipe = pipeline(
-    "image-classification", model="openai/clip-vit-base-patch32", device="cpu"
-)
-
+# _image_pipe = pipeline(
+#     "image-classification", model="openai/clip-vit-base-patch32", device="cpu"
+# )
 
 # @tool
 # def image_describe(img_bytes: bytes, top_k: int = 3) -> str:
@@ -200,8 +198,6 @@ def vision_task(img_bytes: bytes, question: str) -> str:
 # --------------------------------------------------------------------------- #
 #                                  FILE UTILS                                  #
 # --------------------------------------------------------------------------- #
-
-
 @tool
 def run_py(code: str) -> str:
     """Execute Python code in a sandboxed subprocess and return last stdout line."""
@@ -237,27 +233,41 @@ def transcribe_via_whisper(mp3_bytes: bytes) -> str:
 
 @tool
 def analyze_excel_file(xls_bytes: bytes, question: str) -> str:
-    """Generic Excel/CSV aggregation handler."""
-    import pandas as pd
+    "Analyze an Excel or CSV file by passing a data preview to the LLM and running the pandas one-liner it returns"
+    llm = ChatOpenAI(model="gpt-4o-mini", temperature=0, max_tokens=64)
 
-    # Try both Excel and CSV loaders
+    # 1. full dataframe
     try:
         df = pd.read_excel(BytesIO(xls_bytes))
     except Exception:
         df = pd.read_csv(BytesIO(xls_bytes))
 
-    numeric = df.select_dtypes("number")
-    if numeric.empty:
-        return "No numeric data"
+    for col in df.select_dtypes(include="number").columns:
+        df[col] = df[col].astype(float)
 
-    q = question.lower()
-    if any(term in q for term in ["total", "sum", "aggregate"]):
-        return f"{numeric.sum().sum():.2f}"
-    if any(term in q for term in ["average", "mean"]):
-        return f"{numeric.mean().mean():.2f}"
+    # 2. ask the LLM for a single expression
+    prompt = get_prompt(
+        prompt_key="excel_analysis_one_liner", preview=df.head(5).to_dict(orient="list"), question=question
+    )
+    expr = llm.invoke(prompt).content.strip()
 
-    # Fallback: return first 10 rows as csv for LLM to reason on
-    return df.head(10).to_csv(index=False)
+    # 3. run it on the FULL df
+    try:
+        result = eval(expr, {"df": df, "pd": pd, "__builtins__": {}})
+        # ── normalize scalars to string ─────────────────────────────────────
+        if isinstance(result, np.generic):
+            # keep existing LLM formatting (e.g. {:.2f}) if it's already a str
+            result = float(result)  # → plain Python float
+            return f"{result:.2f}"  # or str(result) if no decimals needed
+
+        # DataFrame / Series → single-line string
+        return (
+            result.to_string(index=False)
+            if hasattr(result, "to_string")
+            else str(result)
+        )
+    except Exception as e:
+        return f"eval_error:{e}"
 
 
 __all__ = [
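The eval in step 3 runs the model's expression against the full DataFrame with an emptied __builtins__, so only the injected df and pd names are resolvable inside the expression (builtins such as float and int are not). A self-contained sketch of that evaluation and scalar normalization, with a made-up DataFrame and a hard-coded expression standing in for the LLM output:

import numpy as np
import pandas as pd

df = pd.DataFrame({"Item": ["Burger", "Fries"], "Sales": [12.5, 4.0]})  # hypothetical data
expr = 'df["Sales"].sum()'  # stand-in for llm.invoke(prompt).content.strip()

result = eval(expr, {"df": df, "pd": pd, "__builtins__": {}})  # only df and pd are visible
if isinstance(result, np.generic):   # numpy scalar → plain float, formatted to 2 decimals
    print(f"{float(result):.2f}")    # → 16.50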