#!/usr/bin/env python3 # -*- coding: utf-8 -*- """ Warp API 桥接路由 提供 /healthz、/api/warp/send_stream、/api/warp/send_stream_sse 等最小桥接端点与 JWT 管理。 """ import json import asyncio import httpx from typing import Any, Dict, List, Optional from datetime import datetime from fastapi import FastAPI, HTTPException from fastapi.middleware.cors import CORSMiddleware from pydantic import BaseModel from ..core.logging import logger from ..core.protobuf_utils import protobuf_to_dict, dict_to_protobuf_bytes from ..core.auth import get_jwt_token, refresh_jwt_if_needed, is_token_expired, get_valid_jwt, acquire_anonymous_access_token from ..config.settings import CLIENT_VERSION, OS_CATEGORY, OS_NAME, OS_VERSION, WARP_URL as CONFIG_WARP_URL from ..core.server_message_data import decode_server_message_data, encode_server_message_data def _encode_smd_inplace(obj: Any) -> Any: if isinstance(obj, dict): new_d = {} for k, v in obj.items(): if k in ("server_message_data", "serverMessageData") and isinstance(v, dict): try: b64 = encode_server_message_data( uuid=v.get("uuid"), seconds=v.get("seconds"), nanos=v.get("nanos"), ) new_d[k] = b64 except Exception: new_d[k] = v else: new_d[k] = _encode_smd_inplace(v) return new_d elif isinstance(obj, list): return [_encode_smd_inplace(x) for x in obj] else: return obj def _decode_smd_inplace(obj: Any) -> Any: if isinstance(obj, dict): new_d = {} for k, v in obj.items(): if k in ("server_message_data", "serverMessageData") and isinstance(v, str): try: dec = decode_server_message_data(v) new_d[k] = dec except Exception: new_d[k] = v else: new_d[k] = _decode_smd_inplace(v) return new_d elif isinstance(obj, list): return [_decode_smd_inplace(x) for x in obj] else: return obj from ..core.schema_sanitizer import sanitize_mcp_input_schema_in_packet class EncodeRequest(BaseModel): json_data: Optional[Dict[str, Any]] = None message_type: str = "warp.multi_agent.v1.Request" task_context: Optional[Dict[str, Any]] = None input: Optional[Dict[str, Any]] = None settings: Optional[Dict[str, Any]] = None metadata: Optional[Dict[str, Any]] = None mcp_context: Optional[Dict[str, Any]] = None existing_suggestions: Optional[Dict[str, Any]] = None client_version: Optional[str] = None os_category: Optional[str] = None os_name: Optional[str] = None os_version: Optional[str] = None class Config: extra = "allow" def get_data(self) -> Dict[str, Any]: if self.json_data is not None: return self.json_data else: data: Dict[str, Any] = {} if self.task_context is not None: data["task_context"] = self.task_context if self.input is not None: data["input"] = self.input if self.settings is not None: data["settings"] = self.settings if self.metadata is not None: data["metadata"] = self.metadata if self.mcp_context is not None: data["mcp_context"] = self.mcp_context if self.existing_suggestions is not None: data["existing_suggestions"] = self.existing_suggestions if self.client_version is not None: data["client_version"] = self.client_version if self.os_category is not None: data["os_category"] = self.os_category if self.os_name is not None: data["os_name"] = self.os_name if self.os_version is not None: data["os_version"] = self.os_version skip_keys = { "json_data", "message_type", "task_context", "input", "settings", "metadata", "mcp_context", "existing_suggestions", "client_version", "os_category", "os_name", "os_version" } try: for k, v in self.__dict__.items(): if v is None: continue if k in skip_keys: continue if k not in data: data[k] = v except Exception: pass return data app = FastAPI(title="Warp Protobuf编解码服务器", version="1.0.0") app.add_middleware( CORSMiddleware, allow_origins=["*"], allow_credentials=True, allow_methods=["*"], allow_headers=["*"], ) @app.get("/") async def root(): return {"message": "Warp Protobuf编解码服务器", "version": "1.0.0"} @app.get("/healthz") async def health_check(): return {"status": "ok", "timestamp": datetime.now().isoformat()} @app.post("/api/auth/refresh") async def refresh_auth_token(): try: success = await refresh_jwt_if_needed() if success: return {"success": True, "message": "JWT token刷新成功", "timestamp": datetime.now().isoformat()} else: return {"success": False, "message": "JWT token刷新失败", "suggestion": "检查网络连接或手动运行 'uv run refresh_jwt.py'"} except Exception as e: logger.error(f"❌ 刷新JWT token失败: {e}") raise HTTPException(500, f"刷新token失败: {e}") @app.post("/api/warp/send_stream") async def send_to_warp_api_parsed( request: EncodeRequest ): try: logger.info(f"收到Warp API解析发送请求,消息类型: {request.message_type}") actual_data = request.get_data() if not actual_data: raise HTTPException(400, "数据包不能为空") wrapped = {"json_data": actual_data} wrapped = sanitize_mcp_input_schema_in_packet(wrapped) actual_data = wrapped.get("json_data", actual_data) actual_data = _encode_smd_inplace(actual_data) protobuf_bytes = dict_to_protobuf_bytes(actual_data, request.message_type) logger.info(f"✅ JSON编码为protobuf成功: {len(protobuf_bytes)} 字节") from ..warp.api_client import send_protobuf_to_warp_api_parsed response_text, conversation_id, task_id, parsed_events = await send_protobuf_to_warp_api_parsed(protobuf_bytes) parsed_events = _decode_smd_inplace(parsed_events) response_data = {"response": response_text, "conversation_id": conversation_id, "task_id": task_id, "parsed_events": parsed_events} result = {"response": response_text, "conversation_id": conversation_id, "task_id": task_id, "request_size": len(protobuf_bytes), "response_size": len(response_text), "message_type": request.message_type, "parsed_events": parsed_events, "events_count": len(parsed_events), "events_summary": {}} if parsed_events: event_type_counts = {} for event in parsed_events: event_type = event.get("event_type", "UNKNOWN") event_type_counts[event_type] = event_type_counts.get(event_type, 0) + 1 result["events_summary"] = event_type_counts logger.info(f"✅ Warp API解析调用成功,响应长度: {len(response_text)} 字符,事件数量: {len(parsed_events)}") return result except Exception as e: import traceback error_details = {"error": str(e), "error_type": type(e).__name__, "traceback": traceback.format_exc(), "request_info": {"message_type": request.message_type, "json_size": len(str(actual_data)) if 'actual_data' in locals() else 0, "has_tools": "mcp_context" in (actual_data or {}), "has_history": "task_context" in (actual_data or {})}} logger.error(f"❌ Warp API解析调用失败: {e}") logger.error(f"错误详情: {error_details}") raise HTTPException(500, detail=error_details) @app.post("/api/warp/send_stream_sse") async def send_to_warp_api_stream_sse(request: EncodeRequest): from fastapi.responses import StreamingResponse import os as _os import re as _re try: actual_data = request.get_data() if not actual_data: raise HTTPException(400, "数据包不能为空") wrapped = {"json_data": actual_data} wrapped = sanitize_mcp_input_schema_in_packet(wrapped) actual_data = wrapped.get("json_data", actual_data) actual_data = _encode_smd_inplace(actual_data) protobuf_bytes = dict_to_protobuf_bytes(actual_data, request.message_type) async def _agen(): warp_url = CONFIG_WARP_URL def _parse_payload_bytes(data_str: str): s = _re.sub(r"\s+", "", data_str or "") if not s: return None if _re.fullmatch(r"[0-9a-fA-F]+", s or ""): try: return bytes.fromhex(s) except Exception: pass pad = "=" * ((4 - (len(s) % 4)) % 4) try: import base64 as _b64 return _b64.urlsafe_b64decode(s + pad) except Exception: try: return _b64.b64decode(s + pad) except Exception: return None verify_opt = True insecure_env = _os.getenv("WARP_INSECURE_TLS", "").lower() if insecure_env in ("1", "true", "yes"): verify_opt = False logger.warning("TLS verification disabled via WARP_INSECURE_TLS for Warp API stream endpoint") async with httpx.AsyncClient(http2=True, timeout=httpx.Timeout(60.0), verify=verify_opt, trust_env=True) as client: # 最多尝试两次:第一次失败且为配额429时申请匿名token并重试一次 jwt = None for attempt in range(2): if attempt == 0 or jwt is None: jwt = await get_valid_jwt() headers = { "accept": "text/event-stream", "content-type": "application/x-protobuf", "x-warp-client-version": CLIENT_VERSION, "x-warp-os-category": OS_CATEGORY, "x-warp-os-name": OS_NAME, "x-warp-os-version": OS_VERSION, "authorization": f"Bearer {jwt}", "content-length": str(len(protobuf_bytes)), } async with client.stream("POST", warp_url, headers=headers, content=protobuf_bytes) as response: if response.status_code != 200: error_text = await response.aread() error_content = error_text.decode("utf-8") if error_text else "" # 401 token无效时,尝试刷新JWT token后重试一次 if response.status_code == 401 and attempt == 0: logger.warning("Warp API 返回 401 (token无效, SSE 代理)。尝试刷新JWT token并重试一次…") try: refresh_success = await refresh_jwt_if_needed() if refresh_success: jwt = await get_valid_jwt() logger.info("JWT token刷新成功,重试API调用 (SSE 代理)") continue else: logger.warning("JWT token刷新失败,尝试申请匿名token (SSE 代理)") new_jwt = await acquire_anonymous_access_token() if new_jwt: jwt = new_jwt continue except Exception as e: logger.warning(f"JWT token刷新异常 (SSE 代理): {e}") # 429 且包含配额信息时,申请匿名token后重试一次 if response.status_code == 429 and attempt == 0 and ( ("No remaining quota" in error_content) or ("No AI requests remaining" in error_content) ): logger.warning("Warp API 返回 429 (配额用尽, SSE 代理)。尝试申请匿名token并重试一次…") try: new_jwt = await acquire_anonymous_access_token() except Exception: new_jwt = None if new_jwt: jwt = new_jwt # 重试 continue logger.error(f"Warp API HTTP error {response.status_code}: {error_content[:300]}") yield f"data: {{\"error\": \"HTTP {response.status_code}\"}}\n\n" yield "data: [DONE]\n\n" return try: logger.info(f"✅ Warp API SSE连接已建立: {warp_url}") logger.info(f"📦 请求字节数: {len(protobuf_bytes)}") except Exception: pass current_data = "" event_no = 0 async for line in response.aiter_lines(): if line.startswith("data:"): payload = line[5:].strip() if not payload: continue if payload == "[DONE]": break current_data += payload continue if (line.strip() == "") and current_data: raw_bytes = _parse_payload_bytes(current_data) current_data = "" if raw_bytes is None: continue try: event_data = protobuf_to_dict(raw_bytes, "warp.multi_agent.v1.ResponseEvent") except Exception: continue def _get(d: Dict[str, Any], *names: str) -> Any: for n in names: if isinstance(d, dict) and n in d: return d[n] return None event_type = "UNKNOWN_EVENT" if isinstance(event_data, dict): if "init" in event_data: event_type = "INITIALIZATION" else: client_actions = _get(event_data, "client_actions", "clientActions") if isinstance(client_actions, dict): actions = _get(client_actions, "actions", "Actions") or [] event_type = f"CLIENT_ACTIONS({len(actions)})" if actions else "CLIENT_ACTIONS_EMPTY" elif "finished" in event_data: event_type = "FINISHED" event_no += 1 try: logger.info(f"🔄 SSE Event #{event_no}: {event_type}") except Exception: pass out = {"event_number": event_no, "event_type": event_type, "parsed_data": event_data} try: chunk = json.dumps(out, ensure_ascii=False) except Exception: continue yield f"data: {chunk}\n\n" try: logger.info("="*60) logger.info("📊 SSE STREAM SUMMARY (代理)") logger.info("="*60) logger.info(f"📈 Total Events Forwarded: {event_no}") logger.info("="*60) except Exception: pass yield "data: [DONE]\n\n" return return StreamingResponse(_agen(), media_type="text/event-stream", headers={"Cache-Control": "no-cache", "Connection": "keep-alive"}) except HTTPException: raise except Exception as e: import traceback error_details = {"error": str(e), "error_type": type(e).__name__, "traceback": traceback.format_exc()} logger.error(f"Warp SSE转发端点错误: {e}") raise HTTPException(500, detail=error_details) if __name__ == "__main__": import uvicorn uvicorn.run(app, host="0.0.0.0", port=8000)