From 8a9aef87aa1df6549e042583b596ea7d466b746d Mon Sep 17 00:00:00 2001 From: jeremygan2021 Date: Tue, 4 Nov 2025 23:57:37 +0800 Subject: [PATCH] =?UTF-8?q?=E5=B0=81=E8=A3=85fastAPI=20openAI=E6=8E=A5?= =?UTF-8?q?=E5=8F=A3=E8=A7=84=E8=8C=83?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .DS_Store | Bin 0 -> 6148 bytes .dockerignore | 45 +++++ Dockerfile | 31 ++++ docker-compose.yml | 25 +++ fastapi_server/Dockerfile.api | 20 +++ fastapi_server/OpenAI_API_README.md | 220 ++++++++++++++++++++++++ fastapi_server/README.md | 179 +++++++++++++++++++ fastapi_server/docker-compose.api.yml | 18 ++ fastapi_server/openai_client_example.py | 129 ++++++++++++++ fastapi_server/requirements.txt | 24 +++ fastapi_server/server.py | 163 ++++++++++++++++++ fastapi_server/start_server.sh | 19 ++ lang_agent/rag/simple.py | 30 +++- lang_agent/test.py | 0 lang_agent/tool_manager.py | 8 +- 15 files changed, 904 insertions(+), 7 deletions(-) create mode 100644 .DS_Store create mode 100644 .dockerignore create mode 100644 Dockerfile create mode 100644 docker-compose.yml create mode 100644 fastapi_server/Dockerfile.api create mode 100644 fastapi_server/OpenAI_API_README.md create mode 100644 fastapi_server/README.md create mode 100644 fastapi_server/docker-compose.api.yml create mode 100644 fastapi_server/openai_client_example.py create mode 100644 fastapi_server/requirements.txt create mode 100644 fastapi_server/server.py create mode 100755 fastapi_server/start_server.sh create mode 100644 lang_agent/test.py diff --git a/.DS_Store b/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..022c56e1e44bf3bfee7e99e7a153f3eaff9daf03 GIT binary patch literal 6148 zcmeHKO)mpc6g`iIDiL90Bbh(YN&JH$wXm?^2hdKdL7ApX!fN*Zim>(9tT^|+7nwJ$ zEh6{IduQg&J@?~`_Vod9`*;0aU;{vtL$J}}G{@w*j2T-9D{Dk2F%CyX-WwG?-b+9; zQ@|AX+X~2Mw}BJ`+~7X`{4NanEd5Z^CYI2}E&m3X;x_hmFZ6h;__nIPjQ@xWjBA|t zTKr|?C|JiieTVf7*sFPOqEGJ}SFC4(wsNmA=9*NP;sMtf#Tm7u=cvj~C5Gf3VGwiN z4)azy>#R?7m~tMIajN+yxR*L&?u>#h#_zJjAz59{qWU!E;I-E0);x~Bu^}V0S%D~4 z#8I^B>bqNKtq&X%_It^^IqOe3idmIZ>1xL-IK}~2J2)byWc1@~T62}LOigm;;ya)7 zzw%V;khf;PpaA!5vF55rn@s^zz!dmWK)xRm4#6y7=~2HrIO!39*x<4nul1)tF_8sg z7O?cl6`J!@qNloW#Bkx{;5?nrv*2HP^mI7Q%s3&l3nvs84jwL1ceu=>&8C1U5G%0g zZ#QKBKluLqACv6P6fgz;l>)BOIqB@PrLecoG$(s)!g0nSCVr(yrEm({v0lhlyv?D; ZXNg=8vw)>XuF&j=0.104.0 +uvicorn>=0.24.0 +pydantic>=2.0.0,<2.12 +loguru>=0.7.0 +python-dotenv>=1.0.0 +langchain==1.0 +langchain-core>=0.1.0 +langchain-community +langchain-openai +langchain-mcp-adapters +langgraph>=0.0.40 +tyro>=0.7.0 +commentjson>=0.9.0 +matplotlib>=3.7.0 +Pillow>=10.0.0 +jax>=0.4.0 +httpx[socks] +dashscope +websockets>=11.0.3 +mcp>=1.8.1 +mcp-proxy>=0.8.2 +faiss-cpu +fastmcp +pandas diff --git a/fastapi_server/server.py b/fastapi_server/server.py new file mode 100644 index 0000000..394d404 --- /dev/null +++ b/fastapi_server/server.py @@ -0,0 +1,163 @@ +from fastapi import FastAPI, HTTPException, Depends, Security +from fastapi.middleware.cors import CORSMiddleware +from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials +from pydantic import BaseModel, Field +from typing import List, Optional, Dict, Any, Union +import os +import sys +import time +import uvicorn +from loguru import logger + +# 添加父目录到系统路径,以便导入lang_agent模块 +sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) + +from lang_agent.pipeline import Pipeline, PipelineConfig + +# 定义OpenAI格式的请求模型 +class ChatMessage(BaseModel): + role: str = Field(..., description="消息角色,可以是 'system', 'user', 'assistant'") + content: str = Field(..., description="消息内容") + +class ChatCompletionRequest(BaseModel): + model: str = Field(default="qwen-flash", description="模型名称") + messages: List[ChatMessage] = Field(..., description="对话消息列表") + temperature: Optional[float] = Field(default=0.7, description="采样温度") + max_tokens: Optional[int] = Field(default=500, description="最大生成token数") + stream: Optional[bool] = Field(default=False, description="是否流式返回") + thread_id: Optional[int] = Field(default=3, description="线程ID,用于多轮对话") + +class ChatCompletionResponseChoice(BaseModel): + index: int + message: ChatMessage + finish_reason: str + +class ChatCompletionResponseUsage(BaseModel): + prompt_tokens: int + completion_tokens: int + total_tokens: int + +class ChatCompletionResponse(BaseModel): + id: str + object: str = "chat.completion" + created: int + model: str + choices: List[ChatCompletionResponseChoice] + usage: Optional[ChatCompletionResponseUsage] = None + +# 初始化FastAPI应用 +app = FastAPI(title="Lang Agent Chat API", description="使用OpenAI格式调用pipeline.invoke的聊天API") + +# 设置API密钥 +API_KEY = "123tangledup-ai" + +# 创建安全方案 +security = HTTPBearer() + +# 验证API密钥的依赖项 +async def verify_api_key(credentials: HTTPAuthorizationCredentials = Security(security)): + if credentials.credentials != API_KEY: + raise HTTPException( + status_code=401, + detail="无效的API密钥", + headers={"WWW-Authenticate": "Bearer"}, + ) + return credentials + +# 添加CORS中间件 +app.add_middleware( + CORSMiddleware, + allow_origins=["*"], + allow_credentials=True, + allow_methods=["*"], + allow_headers=["*"], +) + +# 初始化Pipeline +pipeline_config = PipelineConfig() +pipeline_config.llm_name = "qwen-flash" +pipeline_config.llm_provider = "openai" +pipeline_config.base_url = "https://dashscope.aliyuncs.com/compatible-mode/v1" + +pipeline = Pipeline(pipeline_config) + +@app.post("/v1/chat/completions", response_model=ChatCompletionResponse) +async def chat_completions( + request: ChatCompletionRequest, + credentials: HTTPAuthorizationCredentials = Depends(verify_api_key) +): + """ + 使用OpenAI格式的聊天完成API + """ + try: + # 提取用户消息 + user_message = None + system_message = None + + for message in request.messages: + if message.role == "user": + user_message = message.content + elif message.role == "system": + system_message = message.content + + if not user_message: + raise HTTPException(status_code=400, detail="缺少用户消息") + + # 调用pipeline的chat方法 + response_content = pipeline.chat( + inp=user_message, + as_stream=request.stream, + thread_id=request.thread_id + ) + + # 构建响应 + response = ChatCompletionResponse( + id=f"chatcmpl-{os.urandom(12).hex()}", + created=int(time.time()), + model=request.model, + choices=[ + ChatCompletionResponseChoice( + index=0, + message=ChatMessage(role="assistant", content=response_content), + finish_reason="stop" + ) + ] + ) + + return response + + except Exception as e: + logger.error(f"处理聊天请求时出错: {str(e)}") + raise HTTPException(status_code=500, detail=f"内部服务器错误: {str(e)}") + +@app.get("/") +async def root(): + """ + 根路径,返回API信息 + """ + return { + "message": "Lang Agent Chat API", + "version": "1.0.0", + "description": "使用OpenAI格式调用pipeline.invoke的聊天API", + "authentication": "Bearer Token (API Key)", + "endpoints": { + "/v1/chat/completions": "POST - 聊天完成接口,兼容OpenAI格式,需要API密钥验证", + "/": "GET - API信息", + "/health": "GET - 健康检查接口" + } + } + +@app.get("/health") +async def health_check(): + """ + 健康检查接口 + """ + return {"status": "healthy"} + +if __name__ == "__main__": + uvicorn.run( + "server:app", + host="0.0.0.0", + port=8488, + reload=True + ) \ No newline at end of file diff --git a/fastapi_server/start_server.sh b/fastapi_server/start_server.sh new file mode 100755 index 0000000..852ab95 --- /dev/null +++ b/fastapi_server/start_server.sh @@ -0,0 +1,19 @@ +#!/bin/bash + +echo "启动Lang Agent Chat API服务器..." + +# 检查Python环境 +if ! command -v python &> /dev/null; then + echo "错误: 未找到Python。请确保Python已安装并添加到PATH中。" + exit 1 +fi + +# 检查环境变量 +if [ -z "$ALI_API_KEY" ]; then + echo "警告: 未设置ALI_API_KEY环境变量。请确保已设置此变量。" + echo "例如: export ALI_API_KEY='your_api_key'" +fi + +# 启动服务器 +cd "$(dirname "$0")" +python server.py \ No newline at end of file diff --git a/lang_agent/rag/simple.py b/lang_agent/rag/simple.py index bb64487..f7724cd 100644 --- a/lang_agent/rag/simple.py +++ b/lang_agent/rag/simple.py @@ -21,8 +21,21 @@ class SimpleRagConfig(ToolConfig, KeyConfig): model_name:str = "text-embedding-v4" """embedding model name""" - folder_path:str = "/home/smith/projects/work/langchain-agent/assets/xiaozhan_emb" - """path to local database""" + folder_path:str = "/Users/jeremygan/Desktop/TangledupAI/lang-agent/assets/xiaozhan_emb" + """path to docker database""" + + # @property + # def folder_path(self) -> str: + # """Dynamically determine the folder path for the vector store""" + # # Check if environment variable is set + # env_path = os.environ.get("RAG_FOLDER_PATH") + # if env_path: + # return env_path + + # # Default to relative path from current working directory + # return os.path.join(os.getcwd(), "assets", "xiaozhan_emb") + + @@ -31,8 +44,19 @@ class SimpleRag(LangToolBase): self.config = config self.emb = QwenEmbeddings(self.config.api_key, self.config.model_name) + + # Determine the folder path dynamically + # folder_path = os.environ.get("RAG_FOLDER_PATH") + # if not folder_path: + # # Default to relative path from current working directory + # folder_path = os.path.join(os.getcwd(), "assets", "xiaozhan_emb") + + # logger.info(f"Loading FAISS index from: {folder_path}") + + folder_path = "/Users/jeremygan/Desktop/TangledupAI/lang-agent/assets/xiaozhan_emb" + self.vec_store = FAISS.load_local( - folder_path=self.config.folder_path, + folder_path=folder_path, embeddings=self.emb, allow_dangerous_deserialization=True # Required for LangChain >= 0.1.1 ) diff --git a/lang_agent/test.py b/lang_agent/test.py new file mode 100644 index 0000000..e69de29 diff --git a/lang_agent/tool_manager.py b/lang_agent/tool_manager.py index c63d36b..73f0ef8 100644 --- a/lang_agent/tool_manager.py +++ b/lang_agent/tool_manager.py @@ -6,14 +6,14 @@ import inspect import asyncio import os.path as osp from loguru import logger -from fastmcp.tools.tool import FunctionTool +from fastmcp.tools.tool import Tool from lang_agent.config import InstantiateConfig, ToolConfig from lang_agent.base import LangToolBase from lang_agent.rag.simple import SimpleRagConfig from lang_agent.dummy.calculator import CalculatorConfig -from catering_end.lang_tool import CartToolConfig, CartTool +# from catering_end.lang_tool import CartToolConfig, CartTool from langchain_core.tools.structured import StructuredTool import jax @@ -26,7 +26,7 @@ class ToolManagerConfig(InstantiateConfig): # tool configs here; MUST HAVE 'config' in name and must be dataclass rag_config: SimpleRagConfig = field(default_factory=SimpleRagConfig) - cart_config: CartToolConfig = field(default_factory=CartToolConfig) + # cart_config: CartToolConfig = field(default_factory=CartToolConfig) calc_config: CalculatorConfig = field(default_factory=CalculatorConfig) @@ -78,7 +78,7 @@ class ToolManager: def _get_tool_fnc(self, tool_obj:LangToolBase)->List: fnc_list = [] for fnc in tool_obj.get_tool_fnc(): - if isinstance(fnc, FunctionTool): + if isinstance(fnc, Tool): fnc = fnc.fn fnc_list.append(fnc)