Spaces:
Running
Running
sanbo
committed on
Commit
·
f118c0c
1
Parent(s):
509a621
update sth. at 2025-01-26 00:51:18
Browse files- .dockerignore +128 -0
- .gitignore +79 -0
- Dockerfile +48 -1
- base_chat_format.py +30 -0
- base_get_channel.py +39 -0
- duckai_service.py +543 -0
- more_core.py +327 -0
- requirements.txt +13 -0
.dockerignore
ADDED
@@ -0,0 +1,128 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Version Control Systems
|
2 |
+
.git/
|
3 |
+
.gitignore
|
4 |
+
.gitattributes
|
5 |
+
.svn/
|
6 |
+
.hg/
|
7 |
+
.github/
|
8 |
+
|
9 |
+
# Environment and Configuration
|
10 |
+
.env
|
11 |
+
.env.*
|
12 |
+
*.env
|
13 |
+
.venv/
|
14 |
+
venv/
|
15 |
+
env/
|
16 |
+
ENV/
|
17 |
+
.python-version
|
18 |
+
pip-selfcheck.json
|
19 |
+
requirements.txt.bak
|
20 |
+
|
21 |
+
# Python Specific
|
22 |
+
__pycache__/
|
23 |
+
*.py[cod]
|
24 |
+
*$py.class
|
25 |
+
*.so
|
26 |
+
.Python
|
27 |
+
build/
|
28 |
+
develop-eggs/
|
29 |
+
dist/
|
30 |
+
downloads/
|
31 |
+
eggs/
|
32 |
+
.eggs/
|
33 |
+
lib/
|
34 |
+
lib64/
|
35 |
+
parts/
|
36 |
+
sdist/
|
37 |
+
var/
|
38 |
+
wheels/
|
39 |
+
*.egg-info/
|
40 |
+
.installed.cfg
|
41 |
+
*.egg
|
42 |
+
MANIFEST
|
43 |
+
|
44 |
+
# IDE and Editors
|
45 |
+
.idea/
|
46 |
+
.vscode/
|
47 |
+
*.swp
|
48 |
+
*.swo
|
49 |
+
*~
|
50 |
+
.DS_Store
|
51 |
+
.settings/
|
52 |
+
.project
|
53 |
+
.pydevproject
|
54 |
+
.classpath
|
55 |
+
*.sublime-project
|
56 |
+
*.sublime-workspace
|
57 |
+
.editorconfig
|
58 |
+
|
59 |
+
# Testing and Documentation
|
60 |
+
.tox/
|
61 |
+
.coverage
|
62 |
+
.coverage.*
|
63 |
+
htmlcov/
|
64 |
+
.pytest_cache/
|
65 |
+
nosetests.xml
|
66 |
+
coverage.xml
|
67 |
+
*.cover
|
68 |
+
.hypothesis/
|
69 |
+
docs/
|
70 |
+
*.md
|
71 |
+
LICENSE*
|
72 |
+
README*
|
73 |
+
|
74 |
+
# Logs and Data
|
75 |
+
*.log
|
76 |
+
*.sql
|
77 |
+
*.sqlite
|
78 |
+
*.db
|
79 |
+
logs/
|
80 |
+
log/
|
81 |
+
data/
|
82 |
+
tmp/
|
83 |
+
|
84 |
+
# Cache and Temporary Files
|
85 |
+
.cache/
|
86 |
+
.mypy_cache/
|
87 |
+
.dmypy.json
|
88 |
+
dmypy.json
|
89 |
+
*.bak
|
90 |
+
*.tmp
|
91 |
+
*.temp
|
92 |
+
.*.swp
|
93 |
+
*.out
|
94 |
+
|
95 |
+
# Build and Deployment
|
96 |
+
.dockerignore
|
97 |
+
Dockerfile*
|
98 |
+
docker-compose*
|
99 |
+
*.yml
|
100 |
+
*.yaml
|
101 |
+
.gitlab-ci.yml
|
102 |
+
.travis.yml
|
103 |
+
.circleci/
|
104 |
+
|
105 |
+
# Dependencies and Packages
|
106 |
+
node_modules/
|
107 |
+
package-lock.json
|
108 |
+
yarn.lock
|
109 |
+
*.pyc
|
110 |
+
*.pyo
|
111 |
+
*.pyd
|
112 |
+
*.so
|
113 |
+
*.dylib
|
114 |
+
*.dll
|
115 |
+
|
116 |
+
# System Files
|
117 |
+
.DS_Store
|
118 |
+
Thumbs.db
|
119 |
+
desktop.ini
|
120 |
+
*.swp
|
121 |
+
*~
|
122 |
+
|
123 |
+
# Project Specific Backups
|
124 |
+
*_backup/
|
125 |
+
*_bak/
|
126 |
+
*.old
|
127 |
+
*.orig
|
128 |
+
*.rej
|
.gitignore
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
.externalNativeBuild
|
2 |
+
import-summary.txt
|
3 |
+
|
4 |
+
#java files
|
5 |
+
*.class
|
6 |
+
*.dex
|
7 |
+
.sync/
|
8 |
+
|
9 |
+
#for idea temp file
|
10 |
+
*.iws
|
11 |
+
*.ipr
|
12 |
+
*.iml
|
13 |
+
target/
|
14 |
+
.idea/
|
15 |
+
.idea
|
16 |
+
.gradle/
|
17 |
+
release/
|
18 |
+
build/
|
19 |
+
spoon/
|
20 |
+
releasebak/
|
21 |
+
|
22 |
+
#mac temp file
|
23 |
+
__MACOSX
|
24 |
+
.DS_Store
|
25 |
+
._.DS_Store
|
26 |
+
|
27 |
+
#for eclipse
|
28 |
+
.settings/
|
29 |
+
local.properties
|
30 |
+
*gen/
|
31 |
+
*.classpath
|
32 |
+
*/bin/
|
33 |
+
bin/
|
34 |
+
.project
|
35 |
+
|
36 |
+
#temp file
|
37 |
+
*.bak
|
38 |
+
|
39 |
+
*.pmd
|
40 |
+
sh.exe.stackdump
|
41 |
+
|
42 |
+
.vs/
|
43 |
+
.vscode/
|
44 |
+
|
45 |
+
*.log
|
46 |
+
*.ctxt
|
47 |
+
.mtj.tmp/
|
48 |
+
|
49 |
+
# virtual machine crash logs, see http://www.java.com/en/download/help/error_hotspot.xml
|
50 |
+
hs_err_pid*
|
51 |
+
|
52 |
+
# Package Files #
|
53 |
+
# *.jar
|
54 |
+
*.war
|
55 |
+
*.nar
|
56 |
+
*.ear
|
57 |
+
*.zip
|
58 |
+
*.tar.gz
|
59 |
+
*.rar
|
60 |
+
*.cxx
|
61 |
+
*.cfg
|
62 |
+
# for nodejs
|
63 |
+
node_modules/
|
64 |
+
# for python
|
65 |
+
package-lock.json
|
66 |
+
.$*
|
67 |
+
*.drawio.bkp
|
68 |
+
__pycache__
|
69 |
+
*.pyc
|
70 |
+
*.pyo
|
71 |
+
*.pyd
|
72 |
+
.Python
|
73 |
+
env
|
74 |
+
.env
|
75 |
+
.venv
|
76 |
+
pip-log.txt
|
77 |
+
dev.md
|
78 |
+
|
79 |
+
|
Dockerfile
CHANGED
@@ -1 +1,48 @@
|
|
1 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# 使用官方Python镜像
|
2 |
+
FROM python:3.11-slim
|
3 |
+
|
4 |
+
# 设置工作目录
|
5 |
+
WORKDIR /app
|
6 |
+
|
7 |
+
# 安装系统依赖和字体
|
8 |
+
RUN apt-get update && apt-get install -y \
|
9 |
+
fonts-ipafont-gothic \
|
10 |
+
fonts-wqy-zenhei \
|
11 |
+
fonts-thai-tlwg \
|
12 |
+
fonts-kacst \
|
13 |
+
fonts-freefont-ttf \
|
14 |
+
libxss1 \
|
15 |
+
libnss3 \
|
16 |
+
libnspr4 \
|
17 |
+
libatk1.0-0 \
|
18 |
+
libatk-bridge2.0-0 \
|
19 |
+
libcups2 \
|
20 |
+
libdrm2 \
|
21 |
+
libxkbcommon0 \
|
22 |
+
libxcomposite1 \
|
23 |
+
libxdamage1 \
|
24 |
+
libxfixes3 \
|
25 |
+
libxrandr2 \
|
26 |
+
libgbm1 \
|
27 |
+
libasound2 \
|
28 |
+
&& rm -rf /var/lib/apt/lists/*
|
29 |
+
|
30 |
+
# 复制项目文件
|
31 |
+
COPY . .
|
32 |
+
|
33 |
+
# 安装Python依赖
|
34 |
+
RUN pip install --no-cache-dir -r requirements.txt
|
35 |
+
|
36 |
+
# 安装Playwright及其依赖
|
37 |
+
RUN playwright install chromium --with-deps
|
38 |
+
|
39 |
+
# 环境变量配置
|
40 |
+
ENV PYTHONUNBUFFERED=1
|
41 |
+
ENV DEBUG=false
|
42 |
+
ENV PORT=7860
|
43 |
+
|
44 |
+
# 暴露端口
|
45 |
+
EXPOSE 7860
|
46 |
+
|
47 |
+
# 启动命令
|
48 |
+
CMD ["python", "more_core.py"]
|
base_chat_format.py
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import json
|
2 |
+
import random
|
3 |
+
import string
|
4 |
+
def is_chatgpt_format(data):
    """Return True when *data* looks like a ChatGPT completion payload.

    Accepts either a dict or a JSON string. Anything that cannot be
    decoded, or that lacks a non-empty ``choices`` list whose first
    element carries a ``message`` field, is rejected.
    """
    try:
        # A string input is first decoded as JSON.
        if isinstance(data, str):
            try:
                data = json.loads(data)
            except json.JSONDecodeError:
                return False

        if not isinstance(data, dict):
            return False

        choices = data.get("choices")
        return (
            isinstance(choices, list)
            and len(choices) > 0
            and "message" in choices[0]
        )
    except Exception as e:
        # Unexpected shapes (e.g. choices[0] not a mapping) fall through here.
        print(f"Error checking ChatGPT format: {e}")
        return False
24 |
+
|
25 |
+
|
26 |
+
def _generate_id(letters: int = 4, numbers: int = 6) -> str:
|
27 |
+
"""Generate unique chat completion ID"""
|
28 |
+
letters_str = ''.join(random.choices(string.ascii_lowercase, k=letters))
|
29 |
+
numbers_str = ''.join(random.choices(string.digits, k=numbers))
|
30 |
+
return f"chatcmpl-{letters_str}{numbers_str}"
|
base_get_channel.py
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import re
|
2 |
+
|
3 |
+
|
4 |
+
def get_channel_company(value: str, description: str = "") -> str:
    """Infer the vendor that owns a model.

    Lookup priority: the model id (*value*) first, then *description*;
    when neither matches a known vendor pattern, fall back to the first
    segment of the id, capitalised. Returns "unknown" when nothing
    usable is available.
    """
    # Ordered pattern table — first hit wins; extend as needed.
    vendor_rules = [
        (r"claude", "Anthropic"),
        (r"gemini|palm", "Google"),
        (r"llama2?|llama3?|meta-llama", "Meta"),
        (r"gpt-|dall·e|o1|o2|o3|o4", "OpenAI"),
        (r"deepseek", "DeepSeek"),
        (r"abab|minimax", "MiniMax"),
        (r"mistral", "Mistral"),
        (r"ernie|文心一言", "Baidu"),
        (r"chatglm|智谱", "Zhipu")
    ]

    def _lookup(text):
        # Match a vendor against lowercased text; tolerates empty input.
        if not text:
            return None
        lowered = text.lower()
        for pattern, vendor in vendor_rules:
            if re.search(pattern, lowered):
                return vendor
        return None

    # Priority: id first, then description.
    vendor = _lookup(value) or _lookup(description)
    if vendor:
        return vendor

    # Fall back to the first non-empty segment of the id.
    if value:
        segments = [seg for seg in re.split(r'[-\s/._]+', value) if seg.strip()]
        if segments:
            return segments[0].capitalize()

    return "unknown"  # nothing usable at all
|
duckai_service.py
ADDED
@@ -0,0 +1,543 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import requests
|
2 |
+
from playwright.sync_api import sync_playwright
|
3 |
+
import json
|
4 |
+
import base_get_channel as channel
|
5 |
+
from typing import Optional, Dict
|
6 |
+
import time
|
7 |
+
from datetime import datetime, timedelta
|
8 |
+
# 禁用 SSL 警告
|
9 |
+
import urllib3
|
10 |
+
|
11 |
+
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
|
12 |
+
|
13 |
+
# Toggle for verbose logging throughout this module.
debug = True
last_request_time = 0  # unix timestamp (seconds) of the last model refresh
cache_duration = 14400  # cache lifetime in seconds (4 hours)
'''Cached model catalogue served to clients.'''
cached_models = {
    "object": "list",
    "data": [],
    "version": "1.0.0",
    "provider": "DuckAI",
    "name": "DuckAI",
    "default_locale": "zh-CN",
    "status": True,
    "time": 0
}

'''Fallback base model used when no better candidate is known.'''
base_model = "gpt-4o-mini"
# Global table of per-model call statistics.
# Shape: {model_name: {"calls": call count, "fails": failure count, "last_fail": time of last failure}}
MODEL_STATS: Dict[str, Dict] = {}
33 |
+
|
34 |
+
|
35 |
+
def record_call(model_name: str, success: bool = True) -> None:
    """Record one invocation of *model_name* in the global stats table.

    Args:
        model_name: identifier of the model that was called.
        success: whether the call succeeded; a failure also stamps the
            failure time used by the cooldown logic.
    """
    global MODEL_STATS
    entry = MODEL_STATS.setdefault(
        model_name, {"calls": 0, "fails": 0, "last_fail": None}
    )
    entry["calls"] += 1
    if not success:
        entry["fails"] += 1
        entry["last_fail"] = datetime.now()
51 |
+
|
52 |
+
|
53 |
+
def get_auto_model(cooldown_seconds: int = 300) -> str:
    """Pick the model with the best success rate.

    Models whose last failure is within *cooldown_seconds* are skipped;
    when no candidate qualifies, the module's base model is returned.
    Any internal error also falls back to the base model.
    """
    try:
        if not MODEL_STATS:
            get_models()  # lazily populate the stats table

        now = datetime.now()
        cooldown = timedelta(seconds=cooldown_seconds)
        chosen = None
        top_rate = -1.0

        for candidate, info in MODEL_STATS.items():
            last_fail = info.get("last_fail")
            if last_fail and (now - last_fail) < cooldown:
                continue  # still cooling down after a recent failure

            calls = info["calls"]
            if calls <= 0:
                continue  # never invoked — no success-rate signal

            rate = (calls - info["fails"]) / calls
            if rate > top_rate:
                top_rate = rate
                chosen = candidate

        picked = chosen or base_model
        if debug:
            print(f"选择模型: {picked}")
        return picked
    except Exception as e:
        if debug:
            print(f"模型选择错误: {e}")
        return base_model
82 |
+
|
83 |
+
|
84 |
+
def get_models():
    """Return the cached model list as a JSON string.

    When the cache is older than ``cache_duration`` seconds the list is
    refreshed from the DuckDuckGo page first; refresh errors are logged
    and the stale cache is served instead.
    """
    global cached_models, last_request_time

    now = time.time()
    if (now - last_request_time) > cache_duration:
        try:
            if debug:
                print(f"will get model ")
            get_model_impl_by_playwright()
            # Stamp only after a successful refresh so a failure retries on the next call.
            last_request_time = now
            if debug:
                print(f"success get model ")
        except Exception as e:
            print(f"000000---{e}")

    return json.dumps(cached_models)
101 |
+
|
102 |
+
|
103 |
+
def get_model_impl_by_playwright():
    global cached_models
    """
    Fetch the model list from the DuckDuckGo AI chat web page.

    Drives a headless Chromium via Playwright, clicks through the
    "Get Started" screen, waits for the model picker to render, then
    delegates parsing to parser_models_info_form_page(), which mutates
    the global cached_models. Returns cached_models.
    """
    with sync_playwright() as p:
        browser = p.chromium.launch(headless=True)
        context = browser.new_context()
        page = context.new_page()

        try:
            # Open the AI chat entry page.
            page.goto("https://duckduckgo.com/?q=DuckDuckGo+AI+Chat&ia=chat&duckai=1")

            # Click the "Get Started" button.
            # NOTE(review): this absolute XPath is tied to the current page
            # layout and will break on a site redesign.
            get_started_button_xpath = '//*[@id="react-layout"]/div/div[2]/main/div/div/div[2]/div/button'
            page.wait_for_selector(get_started_button_xpath)
            page.click(get_started_button_xpath)

            # Wait until at least one model entry is rendered.
            page.wait_for_function(
                "document.querySelectorAll('ul[role=\"radiogroup\"] > li').length > 0"
            )

            # Parse model info from the rendered page.
            parser_models_info_form_page(page)

        except Exception as e:
            print(f"发生错误: {e}")
        finally:
            # Always release the browser, even on failure.
            browser.close()

    return cached_models
136 |
+
|
137 |
+
|
138 |
+
def parser_models_info_form_page(page):
    """Parse the model picker on the DuckDuckGo AI chat page and merge
    the discovered models into the global cached_models dict.

    Args:
        page: a Playwright page already showing the model radio group.

    Returns:
        str: the cache serialized as JSON (non-ASCII preserved).
    """
    global cached_models
    models = page.query_selector_all('ul[role="radiogroup"] > li')

    # Existing model ids for O(1) duplicate detection.
    existing_ids = {item["id"] for item in cached_models['data']}
    # BUGFIX: the original initialized `is_update` but later tested
    # `is_updated`, raising NameError whenever no model row was merged.
    is_updated = False
    for model in models:
        # NOTE(review): these class names look build-generated — brittle selectors.
        name_element = model.query_selector('.J58ouJfofMIxA2Ukt6lA')
        description_element = model.query_selector('.tDjqHxDUIeGL37tpvoSI')
        # The radio input's value is the real model identifier.
        value = model.query_selector('input').get_attribute('value')
        # Skip malformed entries.
        if not name_element or not value:
            continue

        name = name_element.inner_text()
        description = description_element.inner_text() if description_element else ""
        # Resolve the owning vendor from the id/description.
        owned_by = channel.get_channel_company(value, description)
        new_model = {
            "id": value,
            "object": "model",
            "_type": "text",
            "created": int(time.time() * 1000),  # discovery timestamp (ms)
            "owned_by": owned_by,
            "description": name
        }
        # Seed the stats table so the model counts as available.
        record_call(value)
        if new_model['id'] in existing_ids:
            # Replace the stale entry in place.
            for idx, item in enumerate(cached_models['data']):
                if item['id'] == new_model['id']:
                    cached_models['data'][idx] = new_model
                    break
        else:
            # First sighting — append to the cache.
            cached_models['data'].append(new_model)

        is_updated = True

    # Refresh the cache timestamp only when something actually changed.
    if is_updated:
        cached_models['time'] = int(time.time() * 1000)
    return json.dumps(cached_models, ensure_ascii=False)
190 |
+
|
191 |
+
|
192 |
+
def is_model_available(model_id: str, cooldown_seconds: int = 300) -> bool:
    """Tell whether *model_id* is known and outside its failure cooldown.

    Args:
        model_id: model identifier to check.
        cooldown_seconds: how long a model stays unavailable after a
            failure (default 300 s).

    Returns:
        bool: True when the model is tracked and either never failed or
        its last failure is older than the cooldown window.

    Note:
        When MODEL_STATS is empty, get_models() is invoked first to
        populate it.
    """
    global MODEL_STATS

    # Populate the stats table on first use.
    if not MODEL_STATS:
        get_models()

    entry = MODEL_STATS.get(model_id)
    if entry is None:
        return False  # unknown model

    # Reject models still inside their failure cooldown.
    last_fail = entry["last_fail"]
    if last_fail and datetime.now() - last_fail < timedelta(seconds=cooldown_seconds):
        return False

    return True
225 |
+
|
226 |
+
|
227 |
+
def get_model_by_autoupdate(model_id: Optional[str] = None, cooldown_seconds: int = 300) -> Optional[str]:
    """Validate *model_id*, falling back to the best-performing model.

    Args:
        model_id: requested model id; may be None.
        cooldown_seconds: failure cooldown forwarded to the
            availability check and the auto-selection.

    Returns:
        str | None: the requested model when usable, otherwise the
        model with the highest success rate.

    Note:
        When MODEL_STATS is empty, get_models() is invoked first to
        populate it.
    """
    global MODEL_STATS

    # Populate the stats table on first use.
    if not MODEL_STATS:
        get_models()

    usable = bool(model_id) and is_model_available(model_id, cooldown_seconds)
    return model_id if usable else get_auto_model(cooldown_seconds=cooldown_seconds)
255 |
+
|
256 |
+
|
257 |
+
################################################################################################
|
258 |
+
|
259 |
+
|
260 |
+
# Cached session token and its fetch time: (x-vqd-4 token, unix ms timestamp).
vqd4_time = ("", 0)
262 |
+
|
263 |
+
def extract_x_vqd_4(default_host='duckduckgo.com', max_retries=3, retry_delay=1):
    """
    Fetch an x-vqd-4 session token from the duckchat status endpoint.

    Args:
        default_host: host to query
        max_retries: maximum number of attempts
        retry_delay: delay between attempts, in seconds

    Returns:
        str: the token on success, an empty string after all retries fail
    """
    url = f"https://{default_host}/duckchat/v1/status"
    global vqd4_time
    # Headers mimic the macOS DuckDuckGo browser client; 'x-vqd-accept'
    # asks the server to issue a token in the response headers.
    headers = {
        'Accept': '*/*',
        'Accept-Encoding': 'gzip, deflate, br',
        'Accept-Language': 'zh-CN,zh-Hans;q=0.9',
        'Cache-Control': 'no-store',
        'Connection': 'keep-alive',
        'Host': default_host,
        'Pragma': 'no-cache',
        'Referer': f"https://{default_host}/",
        'Sec-Fetch-Dest': 'empty',
        'Sec-Fetch-Mode': 'cors',
        'Sec-Fetch-Site': 'same-origin',
        'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.4.1 Safari/605.1.15 Ddg/17.4.1',
        'X-DuckDuckGo-Client': 'macOS',
        'x-vqd-accept': '1'
    }

    for attempt in range(max_retries):
        try:
            response = requests.get(
                url,
                headers=headers,
                timeout=10,  # request timeout
                verify=False  # SSL verification is skipped (warnings disabled above)
            )
            response.encoding = 'utf-8'

            if response.status_code == 200:
                if 'x-vqd-4' in response.headers:
                    vqd4 = response.headers['x-vqd-4']
                    if vqd4.strip():  # ensure the token is non-empty
                        # Cache the token together with its fetch time (ms).
                        vqd4_time = (vqd4, int(time.time() * 1000))
                        if debug:
                            print(f"成功获取token: {vqd4}")
                        return vqd4

                if debug:
                    print(f"Token为空,尝试次数: {attempt + 1}/{max_retries}")
            else:
                if debug:
                    print(f"请求失败,状态码: {response.status_code},尝试次数: {attempt + 1}/{max_retries}")

            # Not the last attempt yet — wait before retrying.
            if attempt < max_retries - 1:
                time.sleep(retry_delay)

        except requests.RequestException as e:
            if debug:
                print(f"请求异常: {e},尝试次数: {attempt + 1}/{max_retries}")
            if attempt < max_retries - 1:
                time.sleep(retry_delay)
            continue

    if debug:
        print("获取token失败,已达到最大重试次数")
    return ""  # every retry failed
331 |
+
|
332 |
+
# def makesure_token():
|
333 |
+
# """
|
334 |
+
# 确保获取token:
|
335 |
+
# 1. 如内存没有,则新建
|
336 |
+
# 2. 内存键值对有,若失效,更新
|
337 |
+
# 2. 内存键值对有,且无失效,直接使用
|
338 |
+
# """
|
339 |
+
# global vqd4_time
|
340 |
+
# x_vqd_4_value = ''
|
341 |
+
# if not vqd4_time[0].strip():
|
342 |
+
# # 字符串为空或仅包含空格
|
343 |
+
# x_vqd_4_value = extract_x_vqd_4()
|
344 |
+
# else:
|
345 |
+
# # 字符串非空
|
346 |
+
# print("字符串非空")
|
347 |
+
# t = vqd4_time[1]
|
348 |
+
# # 获取当前的 UNIX 时间戳(以毫秒为单位)
|
349 |
+
# current_time = int(time.time() * 1000)
|
350 |
+
# # 计算时间差(绝对值)
|
351 |
+
# time_difference = abs(current_time - t)
|
352 |
+
|
353 |
+
# # 检查时间差是否大于 2 分钟 (120,000 毫秒)
|
354 |
+
# if time_difference > 2 * 60 * 1000:
|
355 |
+
# print("时间差大于 2 分钟")
|
356 |
+
# x_vqd_4_value = extract_x_vqd_4()
|
357 |
+
# else:
|
358 |
+
# print("时间差在 2 分钟以内")
|
359 |
+
# x_vqd_4_value = vqd4_time[0] # 直接使用缓存的 x_vqd_4
|
360 |
+
|
361 |
+
# # 确保有值
|
362 |
+
# if not x_vqd_4_value.strip():
|
363 |
+
# x_vqd_4_value = extract_x_vqd_4()
|
364 |
+
# return x_vqd_4_value
|
365 |
+
|
366 |
+
|
367 |
+
def parse_response(response_text):
    """Parse an SSE (server-sent events) response body line by line.

    Concatenates the "message" field of every ``data: {...}`` chunk,
    prints the combined text (kept for backward compatibility with the
    original behavior) and returns it.

    Args:
        response_text: raw event-stream body, one event per line.

    Returns:
        str: the concatenated message content.
    """
    result = ""
    for line in response_text.split('\n'):
        if not line.startswith("data:"):
            continue
        payload = line[len("data:"):].strip()
        # BUGFIX: the stream terminator "data: [DONE]" is not JSON and
        # previously raised json.JSONDecodeError here.
        if payload == "[DONE]":
            break
        data = json.loads(payload)
        if "message" in data:
            result += data["message"]
    print(result)
    return result
379 |
+
|
380 |
+
|
381 |
+
def chat_completion_message(user_prompt, x_vqd_4='', model=base_model,
                            system_message='You are a helpful assistant.',
                            user_id: str = None, session_id: str = None, default_host="duckduckgo.com",
                            stream=False, temperature=0.3, max_tokens=1024, top_p=0.5, frequency_penalty=0,
                            presence_penalty=0):
    """Send a single prompt to https://duckduckgo.com/duckchat/v1/chat.

    Wraps the system message and the user prompt into a two-entry
    message list (both as role "user" — the endpoint does not accept a
    "system" role) and delegates to chat_completion_messages().
    """
    # system -> user: the endpoint only understands the "user" role.
    conversation = [
        {"role": "user", "content": system_message},
        {"role": "user", "content": user_prompt},
    ]
    return chat_completion_messages(
        messages=conversation,
        x_vqd_4=x_vqd_4,
        model=model,
        default_host=default_host,
        user_id=user_id,
        session_id=session_id,
        stream=stream,
        temperature=temperature,
        max_tokens=max_tokens,
        top_p=top_p,
        frequency_penalty=frequency_penalty,
        presence_penalty=presence_penalty,
    )
405 |
+
|
406 |
+
|
407 |
+
def chat_completion_messages(
        messages,
        x_vqd_4='',
        model=base_model,
        user_id: str = None,
        session_id: str = None,
        default_host="duckduckgo.com",
        stream=False, temperature=0.3, max_tokens=1024, top_p=0.5,
        frequency_penalty=0, presence_penalty=0):
    """Send a message list to the duckchat endpoint and return the reply text.

    Resolves the model (auto-selecting or validating against the stats
    table), acquires an x-vqd-4 session token when none is supplied,
    rewrites any "system" roles to "user" (the endpoint rejects
    "system"), then delegates the HTTP call to chat_completion().
    Returns "" on any exception.

    NOTE(review): user_id, session_id, stream, temperature, max_tokens,
    top_p, frequency_penalty and presence_penalty are accepted for
    API-compatibility but are not forwarded to the endpoint here.
    """
    try:
        # Make sure the model id is valid / pick one automatically.
        if not model or model == "auto":
            model = get_auto_model()
        else:
            model = get_model_by_autoupdate(model)
        if debug:
            print(f"校准后的model: {model}")

        # Acquire a session token when none was supplied.
        if x_vqd_4 is None or not x_vqd_4.strip():
            x_vqd_4 = extract_x_vqd_4()  # fetch a fresh token from the status endpoint

        # # Token format validation (disabled):
        # if not x_vqd_4.strip() or x_vqd_4.startswith("x-vqd-4 parameter not found"):
        #     x_vqd_4 = makesure_token()  # re-fetch when the token is invalid

        print(f"send_request 获取的token: {x_vqd_4}")

        # Headers mimic the macOS DuckDuckGo browser client.
        headers = {
            'Accept': 'text/event-stream',
            'Accept-Encoding': 'gzip, deflate, br',
            'Accept-Language': 'zh-CN,zh-Hans;q=0.9',
            'Cache-Control': 'no-cache',
            'Connection': 'keep-alive',
            # 'Content-Length': '',
            'Content-Type': 'application/json',
            # 'Cookie': 'av=1; bf=1; dcm=3; dcs=1; n=1',
            'Host': default_host,
            'Origin': f"https://{default_host}",
            'Pragma': 'no-cache',
            'Referer': f"https://{default_host}/",
            'Sec-Fetch-Dest': 'empty',
            'Sec-Fetch-Mode': 'cors',
            'Sec-Fetch-Site': 'same-origin',
            'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/17.4.1 Safari/605.1.15 Ddg/17.4.1',
            'X-DuckDuckGo-Client': 'macOS'
        }
        # chat-specific request headers (reference, from the Go client):
        # header.Set("accept", "text/event-stream")
        # header.Set("x-vqd-4", token)

        # The endpoint only accepts the "user" role — downgrade "system" entries.
        for message in messages:
            if message.get("role") == "system":
                message["role"] = "user"

        if x_vqd_4:
            headers['x-vqd-4'] = x_vqd_4
        data = {
            "model": model,
            "messages": messages
        }
        return chat_completion(default_host=default_host, model=model, headers=headers, payload=data)

    except Exception as e:
        print(f"使用模型[{model}]发生了异常:", e)
        return ""
474 |
+
|
475 |
+
|
476 |
+
def chat_completion(default_host, model, headers, payload):
    """POST *payload* to the duckchat endpoint and collect the streamed reply.

    Reads the server-sent-event body line by line, concatenating every
    chunk's "message" field until the "data: [DONE]" terminator. Also
    refreshes the cached x-vqd-4 token from the response headers.
    Returns the concatenated text, or None when the request fails
    (the exception is printed, not re-raised).
    """
    global vqd4_time
    try:
        response = requests.post(f'https://{default_host}/duckchat/v1/chat', headers=headers, json=payload)
        response.encoding = 'utf-8'  # set the character encoding explicitly
        response.raise_for_status()

        # print("Status Code:", response.status_code)
        # print("Content-Type:", response.headers.get('Content-Type'))
        # print(response.text)
        # print(response.headers)

        final_content = ""
        if response.status_code == 200:
            # # Convert headers to a plain dict
            # headers_dict = dict(response.headers)
            # # Dump the dict as a JSON string
            # headers_json = json.dumps(headers_dict, ensure_ascii=False, indent=4)
            # print(headers_json)
            # Refresh the cached session token from the response headers.
            if 'x-vqd-4' in response.headers:
                vqd4 = response.headers['x-vqd-4']
                vqd4_time = (vqd4, int(time.time() * 1000))
            # Parse the event-stream body line by line.
            for line in response.iter_lines(decode_unicode=True):
                # print(line)
                # Stop at the end-of-stream marker.
                if 'data: [DONE]' in line:
                    break
                elif line.startswith('data: '):  # only process 'data: ' events
                    data_json = line[6:]  # strip the 'data: ' prefix
                    datax = json.loads(data_json)  # decode the JSON chunk
                    if 'message' in datax:
                        final_content += datax['message']
        # print( final_content)
        # Hand back the accumulated content.
        final_result = final_content
        return final_result
    except Exception as e:
        print(f"使用模型[{model}]发生了异常:", e)
517 |
+
|
518 |
+
|
519 |
+
# Manual test / demo code — exercises the model cache and one-shot chat calls.
if __name__ == "__main__":
    # First call: cold cache — performs the Playwright scrape.
    time1 = time.time() * 1000
    result_json = get_models()
    time2 = time.time() * 1000
    print(f"耗时: {time2 - time1}")
    print(result_json)
    # Second call: should be served from the cache, hence much faster.
    result_json2 = get_models()
    time3 = time.time() * 1000
    print(f"耗时2: {time3 - time2}")
    print(result_json2)

    # 'hello' is not a real model id — exercises the auto-fallback path.
    print(f"获取自动模型1:{get_model_by_autoupdate('hello')}")
    print(f"获取自动模型2:{get_auto_model()}")

    # Two one-shot chat requests with timing.
    t1 = time.time()
    res = chat_completion_message("你是谁?你使用的是什么模型?你的知识库截止到什么时间? ")
    t2 = time.time()
    print(
        f"====================================={base_model} --->测试结果【{t2 - t1}】=====================================\r\n{res}\r\n")
    res2 = chat_completion_message("你比较擅长什么技能? ")
    t3 = time.time()
    print(
        f"====================================={base_model} --->测试结果【{t3 - t2}】=====================================\r\n{res2}\r\n")
more_core.py
ADDED
@@ -0,0 +1,327 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import json
|
2 |
+
import multiprocessing
|
3 |
+
import os
|
4 |
+
import time
|
5 |
+
from typing import Dict, Any, List
|
6 |
+
|
7 |
+
import tiktoken
|
8 |
+
import uvicorn
|
9 |
+
from apscheduler.schedulers.background import BackgroundScheduler
|
10 |
+
from fastapi import FastAPI, Request, HTTPException
|
11 |
+
from fastapi.responses import JSONResponse
|
12 |
+
from starlette.responses import HTMLResponse
|
13 |
+
# 禁用 SSL 警告
|
14 |
+
import urllib3
|
15 |
+
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
|
16 |
+
|
17 |
+
import duckai_service as dg
|
18 |
+
import base_chat_format as forts
|
19 |
+
|
20 |
+
|
21 |
+
# Toggle for verbose request logging.
debug = True

# FastAPI application instance, served by uvicorn (entry point elsewhere in this file).
# NOTE(review): "delious" is a typo in user-visible text — left untouched here.
app = FastAPI(
    title="pekingduck",
    description="Pekingduck is delious~",
    version="1.0.0|2025.1.26"
)
class APIServer:
    """High-performance API server implementation"""

    def __init__(self, app: FastAPI):
        """Bind the FastAPI app, register routes, start the scheduler.

        Also primes the backend model cache so /v1/models can answer
        immediately after startup.
        """
        self.app = app
        # Tokenizer used to estimate prompt/completion token usage.
        self.encoding = tiktoken.get_encoding("cl100k_base")
        self._setup_routes()
        self._setup_scheduler()
        dg.get_models()
def _setup_scheduler(self):
    """Start background jobs: route reload (every 30 s) and model refresh (every 30 min)."""
    self.scheduler = BackgroundScheduler()
    # Job 1: re-read env configuration and re-register chat routes if changed.
    self.scheduler.add_job(self._reload_routes_if_needed, 'interval', seconds=30)
    # Job 2: refresh the cached model data (30 minutes = 1800 seconds).
    self.scheduler.add_job(self._reload_check, 'interval', seconds=1800)
    self.scheduler.start()
def _setup_routes(self) -> None:
    """Register the static pages plus the configurable chat-completion routes."""
    # NOTE(review): the original also executed
    # `self.routes = """Initialize API routes"""` — a duplicated docstring
    # assigned to an attribute, an apparent editing leftover. Nothing in the
    # file reads self.routes, so it is removed.

    # Static routes carry explicit names so _reload_routes can preserve them.
    @self.app.get("/", name="root", include_in_schema=False)
    def root():
        return HTMLResponse(content="<h1>hello. It's home page.</h1>")

    @self.app.get("/web", name="web")
    def web():
        return HTMLResponse(content="<h1>hello. It's web page.</h1>")

    @self.app.get("/health", name="health")
    def health():
        return JSONResponse(content={"status": "working"})

    @self.app.get("/v1/models", name="models")
    def models():
        # dg.get_models() returns a JSON string; validate before returning.
        if debug:
            print("Fetching models...")
        models_str = dg.get_models()
        try:
            models_json = json.loads(models_str)
            return JSONResponse(content=models_json)
        except json.JSONDecodeError as e:
            raise HTTPException(status_code=500,
                                detail=f"Invalid models data: {str(e)}")

    # Register dynamic chat completion routes from env configuration.
    routes = self._get_routes()
    if debug:
        print(f"Registering routes: {routes}")
    for path in routes:
        self._register_route(path)
    existing_routes = [route.path for route in self.app.routes if hasattr(route, 'path')]
    if debug:
        print(f"All routes now: {existing_routes}")
89 |
+
def _get_routes(self) -> List[str]:
|
90 |
+
"""Get configured API routes"""
|
91 |
+
default_path = "/api/v1/chat/completions"
|
92 |
+
replace_chat = os.getenv("REPLACE_CHAT", "")
|
93 |
+
prefix_chat = os.getenv("PREFIX_CHAT", "")
|
94 |
+
append_chat = os.getenv("APPEND_CHAT", "")
|
95 |
+
|
96 |
+
if replace_chat:
|
97 |
+
return [path.strip() for path in replace_chat.split(",") if path.strip()]
|
98 |
+
|
99 |
+
routes = []
|
100 |
+
if prefix_chat:
|
101 |
+
routes.extend(f"{prefix.rstrip('/')}{default_path}"
|
102 |
+
for prefix in prefix_chat.split(","))
|
103 |
+
return routes
|
104 |
+
|
105 |
+
if append_chat:
|
106 |
+
append_paths = [path.strip() for path in append_chat.split(",") if path.strip()]
|
107 |
+
routes = [default_path] + append_paths
|
108 |
+
return routes
|
109 |
+
|
110 |
+
return [default_path]
|
111 |
+
|
def _register_route(self, path: str) -> None:
    """Attach a POST chat-completions endpoint at ``path``."""

    async def chat_endpoint(request: Request) -> Dict[str, Any]:
        # Parse headers and JSON body, then delegate to _generate_response;
        # any failure is surfaced as a generic 500.
        try:
            if debug:
                print("Request chat_endpoint...")
            incoming_headers = dict(request.headers)
            payload = await request.json()
            if debug:
                print(f"Request received...\r\n\tHeaders: {incoming_headers},\r\n\tData: {payload}")
            return self._generate_response(incoming_headers, payload)
        except Exception as exc:
            if debug:
                print(f"Request processing error: {exc}")
            raise HTTPException(status_code=500, detail="Internal server error") from exc

    self.app.post(path)(chat_endpoint)
132 |
+
def _calculate_tokens(self, text: str) -> int:
|
133 |
+
"""Calculate token count for text"""
|
134 |
+
return len(self.encoding.encode(text))
|
135 |
+
|
136 |
+
|
def process_result(self, result, model):
    """Normalize an upstream chat result into ChatGPT-completion shape.

    Strings are parsed as JSON when possible (non-JSON strings are returned
    as-is). Dict results get fresh ``id``/``object``/``model`` fields.

    Fix: the original had no final ``return``, so a JSON string decoding to
    a non-dict (e.g. a list) silently became ``None``.
    """
    if isinstance(result, str):
        try:
            result = json.loads(result)
        except json.JSONDecodeError:
            # Plain text — hand it back untouched.
            return result

    if isinstance(result, dict):
        result['id'] = forts._generate_id()
        result['object'] = "chat.completion"
        result['model'] = model

    return result
def _generate_response(self, headers: Dict[str, str], data: Dict[str, Any]) -> Dict[str, Any]:
    """Run a chat completion and shape the reply like an OpenAI response.

    Raises HTTPException 401 on bad token, 400 on missing messages, 500 on
    backend failure (failures are also recorded via dg.record_call).
    """
    global debug
    if debug:
        print("inside _generate_response")
    # Resolve the model before the try so the except clause can reference it
    # (the original left `model` unbound if an early exception fired).
    model = data.get("model")
    try:
        # Only "auto" triggers backend model selection.
        if "auto" == model:
            model = dg.get_auto_model()

        # Optional token check. Fix: Starlette lower-cases header names, so
        # 'Authorization' was never found and `token not in None` raised a
        # TypeError instead of returning 401.
        authorization = headers.get('authorization') or headers.get('Authorization') or ""
        token = os.getenv("TOKEN", "")
        if token and token not in authorization:
            raise HTTPException(status_code=401, detail="无效的Token")

        msgs = data.get("messages")
        if not msgs:
            raise HTTPException(status_code=400, detail="消息不能为空")

        if debug:
            print(f"request model: {model}")
            if token:
                print(f"request token: {token}")
            print(f"request messages: {msgs}")

        result = dg.chat_completion_messages(
            messages=msgs,
            model=model
        )
        if debug:
            print(f"result: {result}---- {forts.is_chatgpt_format(result)}")

        if forts.is_chatgpt_format(result):
            # Already ChatGPT-shaped: just normalize id/object/model fields.
            response_data = self.process_result(result, model)
        else:
            # Wrap raw text in a ChatGPT-style envelope with token accounting.
            # NOTE(review): OpenAI's `created` is seconds since epoch;
            # milliseconds are kept here for backward compatibility — confirm.
            current_timestamp = int(time.time() * 1000)
            prompt_tokens = self._calculate_tokens(str(data))
            completion_tokens = self._calculate_tokens(result)
            total_tokens = prompt_tokens + completion_tokens

            response_data = {
                "id": forts._generate_id(),
                "object": "chat.completion",
                "created": current_timestamp,
                "model": data.get("model", "gpt-4o"),
                "usage": {
                    "prompt_tokens": prompt_tokens,
                    "completion_tokens": completion_tokens,
                    "total_tokens": total_tokens
                },
                "choices": [{
                    "message": {
                        "role": "assistant",
                        "content": result
                    },
                    "finish_reason": "stop",
                    "index": 0
                }]
            }

        if debug:
            print(f"Response Data: {response_data}")

        return response_data
    except HTTPException:
        # Fix: deliberate 401/400 errors were caught by the generic handler
        # below and re-raised as 500 — propagate them unchanged instead.
        raise
    except Exception as e:
        dg.record_call(model, False)
        if debug:
            print(f"Response generation error: {e}")
        raise HTTPException(status_code=500, detail=str(e)) from e
239 |
+
def _get_workers_count(self) -> int:
|
240 |
+
"""Calculate optimal worker count"""
|
241 |
+
try:
|
242 |
+
cpu_cores = multiprocessing.cpu_count()
|
243 |
+
recommended_workers = (2 * cpu_cores) + 1
|
244 |
+
return min(max(4, recommended_workers), 8)
|
245 |
+
except Exception as e:
|
246 |
+
if debug:
|
247 |
+
print(f"Worker count calculation failed: {e}, using default 4")
|
248 |
+
return 4
|
249 |
+
|
def get_server_config(self, host: str = "0.0.0.0", port: int = 7860) -> uvicorn.Config:
    """Build the uvicorn configuration for this app.

    NOTE(review): uvicorn ignores ``workers`` when given an app *object*
    rather than an import string ("module:app") — confirm whether multiple
    workers actually start with this configuration.
    """
    workers = self._get_workers_count()
    if debug:
        print(f"Configuring server with {workers} workers")

    return uvicorn.Config(
        app=self.app,
        host=host,
        port=port,
        workers=workers,
        loop="uvloop",  # requires the uvloop package (see requirements.txt)
        limit_concurrency=1000,
        timeout_keep_alive=30,
        access_log=True,
        log_level="info",
        http="httptools"  # requires the httptools package
    )
def run(self, host: str = "0.0.0.0", port: int = 7860) -> None:
    """Start serving with uvicorn; blocks until shutdown."""
    server_config = self.get_server_config(host, port)
    uvicorn.Server(server_config).run()
def _reload_check(self) -> None:
    """Scheduled job: ask the backend service to refresh its model data."""
    dg.reload_check()
def _reload_routes_if_needed(self) -> None:
    """Scheduled job: refresh the debug flag and re-register chat routes
    when the env-configured route list has changed.
    """
    # Reload the debug flag from the environment.
    global debug
    debug = os.getenv("DEBUG", "False").lower() in ["true", "1", "t"]

    new_routes = self._get_routes()
    # Fix: the original compared ALL registered paths (/, /web, /health,
    # /v1/models, docs, ...) against the dynamic-only list, so the two never
    # matched and routes were torn down and re-registered every 30 seconds.
    # Compare only the routes created by _register_route (its endpoint
    # function is named "chat_endpoint").
    current_dynamic = [
        route.path for route in self.app.routes
        if getattr(route, 'name', None) == "chat_endpoint"
    ]
    if current_dynamic != new_routes:
        if debug:
            print("Routes changed, reloading...")
        self._reload_routes(new_routes)
def _reload_routes(self, new_routes: List[str]) -> None:
    """Replace the dynamic chat-completion routes, preserving everything else.

    Fix: only routes registered by _register_route (named "chat_endpoint")
    are removed. The original kept an allowlist of {root, web, health,
    models} names, which also deleted FastAPI's built-in /docs,
    /openapi.json and /redoc routes on every reload. (A dead commented-out
    variant that cleared *all* routes was removed as well.)
    """
    self.app.routes[:] = [
        route for route in self.app.routes
        if getattr(route, 'name', None) != "chat_endpoint"
    ]

    # Register the new dynamic routes.
    for path in new_routes:
        self._register_route(path)
def create_server() -> APIServer:
    """Factory function to create a server instance bound to the module-level app."""
    return APIServer(app)
if __name__ == "__main__":
    # PORT is typically injected by the hosting platform (e.g. HF Spaces).
    listen_port = int(os.getenv("PORT", "7860"))
    create_server().run(port=listen_port)
requirements.txt
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
playwright
|
2 |
+
aiohttp
|
3 |
+
apscheduler
|
4 |
+
beautifulsoup4
|
5 |
+
fastapi
|
6 |
+
requests
|
7 |
+
starlette
|
8 |
+
tiktoken
|
9 |
+
urllib3
|
10 |
+
uvicorn
|
11 |
+
uvloop
|
12 |
+
httptools
|
13 |
+
|