From c570e362ed163412658d1c1648e938a027529fed Mon Sep 17 00:00:00 2001
From: zhangqian <zhangqian@123.com>
Date: Thu, 17 Oct 2024 21:38:19 +0800
Subject: [PATCH] 文档上传接口支持ragflow上传并解析

---
 app/service/ragflow.py |   41 +++++++++++++++++++++++++++++------------
 1 file changed, 29 insertions(+), 12 deletions(-)

diff --git a/app/service/ragflow.py b/app/service/ragflow.py
index 4021866..65c5a27 100644
--- a/app/service/ragflow.py
+++ b/app/service/ragflow.py
@@ -1,5 +1,9 @@
 import httpx
 from typing import Union, Dict, List
+
+from fastapi import HTTPException
+from starlette import status
+
 from app.config.config import settings
 from app.utils.rsa_crypto import RagflowCrypto
 
@@ -8,12 +12,17 @@
     def __init__(self, base_url: str):
         self.base_url = base_url
 
-    async def _handle_response(self, response: httpx.Response) -> Union[Dict, List]:
+    def _handle_response(self, response: httpx.Response) -> Union[Dict, List]:
         if response.status_code != 200:
             return {}
 
         data = response.json()
         ret_code = data.get("retcode")
+        if ret_code == 401:
+            raise HTTPException(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                detail="登录过期",
+            )
         if ret_code != 0:
             return {}
 
@@ -80,7 +89,7 @@
         headers = {"Authorization": token}
         async with httpx.AsyncClient() as client:
             response = await client.get(url, headers=headers)
-            data = await self._handle_response(response)
+            data = self._handle_response(response)
             result = [
                 {
                     "id": item["id"],
@@ -91,28 +100,24 @@
             ]
             return result
 
-    async def set_session(self, token: str, dialog_id: str, name: str, chat_id: str, is_new: bool) -> list:
+    async def set_session(self, token: str, dialog_id: str, message: dict, chat_id: str, is_new: bool) -> list:
         url = f"{self.base_url}/v1/conversation/set?dialog_id={dialog_id}"
         headers = {"Authorization": token}
         data = {
             "dialog_id": dialog_id,
-            "name": name,
+            "name": message["message"],
             "is_new": is_new,
             "conversation_id": chat_id,
         }
         async with httpx.AsyncClient() as client:
             response = await client.post(url, headers=headers, json=data)
-            data = await self._handle_response(response)
+            data = self._handle_response(response)
             return [
                 {
                     "content": "你好！ 我是你的助理，有什么可以帮到你的吗？",
                     "role": "assistant"
                 },
-                {
-                    "content": name,
-                    "doc_ids": [],
-                    "role": "user"
-                }
+                message,
             ] if data else []
 
     async def get_session_history(self, token: str, chat_id: str) -> list:
@@ -120,5 +125,17 @@
         headers = {"Authorization": token}
         async with httpx.AsyncClient() as client:
             response = await client.get(url, headers=headers)
-            data = await self._handle_response(response)
-            return data.get("message", [])
\ No newline at end of file
+            data = self._handle_response(response)
+            return data.get("message", [])
+
+    async def upload_and_parse(self, token: str, chat_id: str, filename: str, file: bytes) -> str:
+        url = f"{self.base_url}/v1/document/upload_and_parse"
+        headers = {"Authorization": token}
+        data = {"conversation_id": chat_id}
+
+        # Build the multipart form data, including the file
+        files = {"file": (filename, file)}
+        async with httpx.AsyncClient(timeout=60) as client:
+            response = await client.post(url, headers=headers, files=files, data=data)
+            data = self._handle_response(response)
+            return data

--
Gitblit v1.8.0