Fix Huggingface Inference

#12 opened by jponf
pyproject.toml CHANGED
@@ -13,6 +13,7 @@ requires-python = ">=3.10,<4"
 readme = "README.md"
 license = ""
 dependencies = [
+    "aiohttp>=3.12.9",
     "gradio[mcp]~=5.31",
    "huggingface-hub>=0.32.3",
    "langchain-aws>=0.2.24",
requirements-dev.txt CHANGED
@@ -1,8 +1,13 @@
 # This file was autogenerated by uv via the following command:
 # uv export --format requirements-txt --no-hashes --no-annotate --group dev --group test -o requirements-dev.txt
 aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.9
+aiosignal==1.3.2
 annotated-types==0.7.0
 anyio==4.9.0
+async-timeout==5.0.1 ; python_full_version < '3.11'
+attrs==25.3.0
 audioop-lts==0.2.1 ; python_full_version >= '3.13'
 boolean-py==5.0
 boto3==1.38.27
@@ -23,6 +28,7 @@ exceptiongroup==1.3.0 ; python_full_version < '3.11'
 fastapi==0.115.12
 ffmpy==0.6.0
 filelock==3.18.0
+frozenlist==1.6.2
 fsspec==2025.5.1
 gradio==5.32.1
 gradio-client==1.10.2
@@ -58,6 +64,7 @@ mcp==1.9.0
 mdurl==0.1.2
 mpmath==1.3.0
 msgpack==1.1.0
+multidict==6.4.4
 mypy==1.16.0
 mypy-extensions==1.1.0
 networkx==3.4.2 ; python_full_version < '3.11'
@@ -94,6 +101,7 @@ pip-requirements-parser==32.0.1
 platformdirs==4.3.8
 pluggy==1.6.0
 pre-commit==3.8.0
+propcache==0.3.1
 py-serializable==2.0.0
 pycparser==2.22 ; platform_python_implementation == 'PyPy'
 pydantic==2.11.5
@@ -150,4 +158,5 @@ virtualenv==20.31.2
 websockets==15.0.1
 xdoctest==1.2.0
 xxhash==3.5.0
+yarl==1.20.0
 zstandard==0.23.0
requirements.txt CHANGED
@@ -1,8 +1,13 @@
 # This file was autogenerated by uv via the following command:
 # uv export --format requirements-txt --no-hashes --no-annotate --no-dev -o requirements.txt
 aiofiles==24.1.0
+aiohappyeyeballs==2.6.1
+aiohttp==3.12.9
+aiosignal==1.3.2
 annotated-types==0.7.0
 anyio==4.9.0
+async-timeout==5.0.1 ; python_full_version < '3.11'
+attrs==25.3.0
 audioop-lts==0.2.1 ; python_full_version >= '3.13'
 boto3==1.38.27
 botocore==1.38.27
@@ -17,6 +22,7 @@ exceptiongroup==1.3.0 ; python_full_version < '3.11'
 fastapi==0.115.12
 ffmpy==0.6.0
 filelock==3.18.0
+frozenlist==1.6.2
 fsspec==2025.5.1
 gradio==5.32.1
 gradio-client==1.10.2
@@ -49,6 +55,7 @@ markupsafe==3.0.2
 mcp==1.9.0
 mdurl==0.1.2 ; sys_platform != 'emscripten'
 mpmath==1.3.0
+multidict==6.4.4
 networkx==3.4.2 ; python_full_version < '3.11'
 networkx==3.5 ; python_full_version >= '3.11'
 numpy==1.26.4 ; python_full_version < '3.12'
@@ -74,6 +81,7 @@ packaging==24.2
 pandas==2.2.3
 pillow==11.2.1
 pluggy==1.6.0
+propcache==0.3.1
 pycparser==2.22 ; platform_python_implementation == 'PyPy'
 pydantic==2.11.5
 pydantic-core==2.33.2
@@ -125,4 +133,5 @@ uvicorn==0.34.3 ; sys_platform != 'emscripten'
 websockets==15.0.1
 xdoctest==1.2.0
 xxhash==3.5.0
+yarl==1.20.0
 zstandard==0.23.0
tdagent/grchat.py CHANGED
@@ -1,5 +1,6 @@
 from __future__ import annotations
 
+from collections import OrderedDict
 from collections.abc import Mapping, Sequence
 from types import MappingProxyType
 from typing import TYPE_CHECKING, Any
@@ -8,9 +9,10 @@ import boto3
 import botocore
 import botocore.exceptions
 import gradio as gr
+import gradio.themes as gr_themes
 from langchain_aws import ChatBedrock
 from langchain_core.messages import AIMessage, HumanMessage, SystemMessage
-from langchain_huggingface import HuggingFaceEndpoint
+from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint
 from langchain_mcp_adapters.client import MultiServerMCPClient
 from langgraph.prebuilt import create_react_agent
 from openai import OpenAI
@@ -51,15 +53,32 @@ GRADIO_ROLE_TO_LG_MESSAGE_TYPE = MappingProxyType(
     },
 )
 
-MODEL_OPTIONS = {
-    "AWS Bedrock": {
-        "Anthropic Claude 3.5 Sonnet": "eu.anthropic.claude-3-5-sonnet-20240620-v1:0",
-        # "Anthropic Claude 3.7 Sonnet": "anthropic.claude-3-7-sonnet-20250219-v1:0",
-    },
-    "HuggingFace": {
-        "Mistral 7B Instruct": "mistralai/Mistral-7B-Instruct",
-    },
-}
+MODEL_OPTIONS = OrderedDict(  # Initialize with tuples to preserve options order
+    (
+        (
+            "HuggingFace",
+            {
+                "Mistral 7B Instruct": "mistralai/Mistral-7B-Instruct-v0.3",
+                "Llama 3.1 8B Instruct": "meta-llama/Llama-3.1-8B-Instruct",
+                # "Qwen3 235B A22B": "Qwen/Qwen3-235B-A22B",  # Slow inference
+                "Microsoft Phi-3.5-mini Instruct": "microsoft/Phi-3.5-mini-instruct",
+                # "Deepseek R1 distill-llama 70B": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",  # noqa: E501
+                # "Deepseek V3": "deepseek-ai/DeepSeek-V3",
+            },
+        ),
+        (
+            "AWS Bedrock",
+            {
+                "Anthropic Claude 3.5 Sonnet (EU)": (
+                    "eu.anthropic.claude-3-5-sonnet-20240620-v1:0"
+                ),
+                # "Anthropic Claude 3.7 Sonnet": (
+                #     "anthropic.claude-3-7-sonnet-20250219-v1:0"
+                # ),
+            },
+        ),
+    ),
+)
 
 #### Shared variables ####
 
@@ -109,18 +128,20 @@ def create_bedrock_llm(
 def create_hf_llm(
     hf_model_id: str,
     huggingfacehub_api_token: str | None = None,
-) -> tuple[HuggingFaceEndpoint | None, str]:
+) -> tuple[ChatHuggingFace | None, str]:
     """Create a LangGraph Hugging Face agent."""
     try:
         llm = HuggingFaceEndpoint(
             model=hf_model_id,
-            huggingfacehub_api_token=huggingfacehub_api_token,
             temperature=0.8,
+            task="text-generation",
+            huggingfacehub_api_token=huggingfacehub_api_token,
         )
+        chat_llm = ChatHuggingFace(llm=llm)
     except Exception as e:  # noqa: BLE001
         return None, str(e)
 
-    return llm, ""
+    return chat_llm, ""
 
 
 ## OpenAI LLM creation ##
@@ -286,14 +307,18 @@ async def gr_chat_function(  # noqa: D103
         messages.append(message_type(content=hist_msg["content"]))
 
     messages.append(HumanMessage(content=message))
-
-    llm_response = await llm_agent.ainvoke(
-        {
-            "messages": messages,
-        },
-    )
-
-    return llm_response["messages"][-1].content
+    try:
+        llm_response = await llm_agent.ainvoke(
+            {
+                "messages": messages,
+            },
+        )
+        return llm_response["messages"][-1].content
+    except Exception as err:
+        raise gr.Error(
+            f"We encountered an error while invoking the model:\n{err}",
+            print_exception=True,
+        ) from err
 
 
 ## UI components ##
@@ -314,7 +339,12 @@ def toggle_model_fields(
     # Update model choices based on the selected provider
     if provider in MODEL_OPTIONS:
         model_choices = list(MODEL_OPTIONS[provider].keys())
-        model_pretty = gr.update(choices=model_choices, visible=True, interactive=True)
+        model_pretty = gr.update(
+            choices=model_choices,
+            value=model_choices[0],
+            visible=True,
+            interactive=True,
+        )
     else:
         model_pretty = gr.update(choices=[], visible=False)
 
@@ -346,7 +376,9 @@ async def update_connection_status(  # noqa: PLR0913
     """Update the connection status based on the selected provider and model."""
     if not provider or not pretty_model:
         return "❌ Please select a provider and model."
+
     model_id = MODEL_OPTIONS.get(provider, {}).get(pretty_model)
+    connection = "❌ Invalid provider"
     if model_id:
         if provider == "AWS Bedrock":
             connection = await gr_connect_to_bedrock(
@@ -363,15 +395,21 @@ async def update_connection_status(  # noqa: PLR0913
         connection = await gr_connect_to_hf(model_id, hf_token, mcp_list_state)
     elif provider == "Nebius":
         connection = await gr_connect_to_nebius(model_id, hf_token, mcp_list_state)
-    else:
-        return "❌ Invalid provider"
-    return connection if connection else "❌ Invalid provider"
+
+    return connection
 
 
-with gr.Blocks(
-    theme=gr.themes.Origin(primary_hue="teal", spacing_size="sm", font="sans-serif"),
-    title="TDAgent",
-) as gr_app, gr.Row():
+with (
+    gr.Blocks(
+        theme=gr_themes.Origin(
+            primary_hue="teal",
+            spacing_size="sm",
+            font="sans-serif",
+        ),
+        title="TDAgent",
+    ) as gr_app,
+    gr.Row(),
+):
     with gr.Column(scale=1):
         with gr.Accordion("πŸ”Œ MCP Servers", open=False):
             mcp_list = MutableCheckBoxGroup(
@@ -382,6 +420,10 @@ with gr.Blocks(
                 ),
             ],
             label="MCP Servers",
+            new_value_label="MCP endpoint",
+            new_name_label="MCP endpoint name",
+            new_value_placeholder="https://my-cool-mcp-server.com/mcp/sse",
+            new_name_placeholder="Swiss army knife of MCPs",
            )

        with gr.Accordion("βš™οΈ Provider Configuration", open=True):
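
For context, a minimal sketch of the inference path this diff sets up: `create_hf_llm` now wraps the raw `HuggingFaceEndpoint` in `ChatHuggingFace`, so the agent receives a chat-capable model instead of a bare text-generation endpoint. This is not code from the PR; the model id, the placeholder token, and the empty tools list (which stands in for the MCP tools loaded elsewhere in `grchat.py`) are illustrative assumptions.

```python
# Sketch only: mirrors the HF wiring pattern introduced above.
from langchain_core.messages import HumanMessage
from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint
from langgraph.prebuilt import create_react_agent

llm = HuggingFaceEndpoint(
    model="mistralai/Mistral-7B-Instruct-v0.3",  # any id from MODEL_OPTIONS
    temperature=0.8,
    task="text-generation",
    huggingfacehub_api_token="hf_...",  # placeholder; grchat.py reads it from the UI
)
chat_llm = ChatHuggingFace(llm=llm)  # adds chat-message formatting over the endpoint

agent = create_react_agent(chat_llm, tools=[])  # tools=[] stands in for MCP tools
response = agent.invoke({"messages": [HumanMessage(content="Hello!")]})
print(response["messages"][-1].content)
```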
tdagent/grcomponents/mcbgroup.py CHANGED
@@ -19,7 +19,7 @@ class MutableCheckBoxGroupEntry(NamedTuple):
 class MutableCheckBoxGroup(gr.Blocks):
     """Check box group with controls to add or remove values."""
 
-    def __init__(  # noqa: PLR0913
+    def __init__(
         self,
         values: list[MutableCheckBoxGroupEntry] | None = None,
         label: str = "Extendable List",
@@ -68,16 +68,24 @@ class MutableCheckBoxGroup(gr.Blocks):
             self.input_value = gr.Textbox(
                 label=self.new_value_label,
                 placeholder=self.new_value_placeholder,
-                scale=4,
+                scale=3,
             )
             self.input_name = gr.Textbox(
                 label=self.new_name_label,
                 placeholder=self.new_name_placeholder,
                 scale=2,
             )
-            with gr.Column():
-                self.add_btn = gr.Button("Add", variant="primary", scale=1)
-                self.delete_btn = gr.Button("Delete Selected", variant="stop")
+            with gr.Row():
+                self.add_btn = gr.Button(
+                    "Add",
+                    variant="primary",
+                    scale=1,
+                )
+                self.delete_btn = gr.Button(
+                    "Delete Selected",
+                    variant="stop",
+                    scale=1,
+                )
 
             # Vertical checkbox group
             self.items_group = gr.CheckboxGroup(
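
A small usage sketch of the component after this change, using the keyword arguments that `grchat.py` now passes (the import path assumes the package layout matches the file path; the snippet itself is illustrative, not part of the PR):

```python
# Sketch only: instantiating MutableCheckBoxGroup with the new label/placeholder kwargs.
import gradio as gr

from tdagent.grcomponents.mcbgroup import MutableCheckBoxGroup

with gr.Blocks() as demo:
    mcp_list = MutableCheckBoxGroup(
        label="MCP Servers",
        new_value_label="MCP endpoint",
        new_name_label="MCP endpoint name",
        new_value_placeholder="https://my-cool-mcp-server.com/mcp/sse",
        new_name_placeholder="Swiss army knife of MCPs",
    )
```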
uv.lock CHANGED
The diff for this file is too large to render. See raw diff