From c570e362ed163412658d1c1648e938a027529fed Mon Sep 17 00:00:00 2001 From: zhangqian <zhangqian@123.com> Date: 星期四, 17 十月 2024 21:38:19 +0800 Subject: [PATCH] 文档上传接口支持ragflow上传并解析 --- app/service/ragflow.py | 41 +++++++++++++++++++++++++++++------------ 1 files changed, 29 insertions(+), 12 deletions(-) diff --git a/app/service/ragflow.py b/app/service/ragflow.py index 4021866..65c5a27 100644 --- a/app/service/ragflow.py +++ b/app/service/ragflow.py @@ -1,5 +1,9 @@ import httpx from typing import Union, Dict, List + +from fastapi import HTTPException +from starlette import status + from app.config.config import settings from app.utils.rsa_crypto import RagflowCrypto @@ -8,12 +12,17 @@ def __init__(self, base_url: str): self.base_url = base_url - async def _handle_response(self, response: httpx.Response) -> Union[Dict, List]: + def _handle_response(self, response: httpx.Response) -> Union[Dict, List]: if response.status_code != 200: return {} data = response.json() ret_code = data.get("retcode") + if ret_code == 401: + raise HTTPException( + status_code=status.HTTP_401_UNAUTHORIZED, + detail="登录过期", + ) if ret_code != 0: return {} @@ -80,7 +89,7 @@ headers = {"Authorization": token} async with httpx.AsyncClient() as client: response = await client.get(url, headers=headers) - data = await self._handle_response(response) + data = self._handle_response(response) result = [ { "id": item["id"], @@ -91,28 +100,24 @@ ] return result - async def set_session(self, token: str, dialog_id: str, name: str, chat_id: str, is_new: bool) -> list: + async def set_session(self, token: str, dialog_id: str, message: dict, chat_id: str, is_new: bool) -> list: url = f"{self.base_url}/v1/conversation/set?dialog_id={dialog_id}" headers = {"Authorization": token} data = { "dialog_id": dialog_id, - "name": name, + "name": message["message"], "is_new": is_new, "conversation_id": chat_id, } async with httpx.AsyncClient() as client: response = await client.post(url, headers=headers, 
json=data) - data = await self._handle_response(response) + data = self._handle_response(response) return [ { "content": "你好！ 我是你的助理，有什么可以帮到你的吗？", "role": "assistant" }, - { - "content": name, - "doc_ids": [], - "role": "user" - } + message, ] if data else [] async def get_session_history(self, token: str, chat_id: str) -> list: @@ -120,5 +125,17 @@ headers = {"Authorization": token} async with httpx.AsyncClient() as client: response = await client.get(url, headers=headers) - data = await self._handle_response(response) - return data.get("message", []) \ No newline at end of file + data = self._handle_response(response) + return data.get("message", []) + + async def upload_and_parse(self, token: str, chat_id: str, filename: str, file: bytes) -> str: + url = f"{self.base_url}/v1/document/upload_and_parse" + headers = {"Authorization": token} + data = {"conversation_id": chat_id} + + # 创建表单数据，包含文件 + files = {"file": (filename, file)} + async with httpx.AsyncClient(timeout=60) as client: + response = await client.post(url, headers=headers, files=files, data=data) + data = self._handle_response(response) + return data -- Gitblit v1.8.0