From 6202db458678153934fb4a31a041c58764a69138 Mon Sep 17 00:00:00 2001
From: zhangqian <zhangqian@123.com>
Date: 星期五, 18 十月 2024 22:59:51 +0800
Subject: [PATCH] 增加文件下载转发接口,把毕昇返回的文件地址改成我们的下载地址
---
pip_install.sh | 3 +
app/api/report.py | 3 +
app/api/__init__.py | 46 ++++++++++++++++++++++
app/api/files.py | 49 ++++++++++++++++++++++++
4 files changed, 97 insertions(+), 4 deletions(-)
diff --git a/app/api/__init__.py b/app/api/__init__.py
index 8bd4579..a96baa1 100644
--- a/app/api/__init__.py
+++ b/app/api/__init__.py
@@ -1,3 +1,6 @@
+import urllib
+from urllib.parse import urlencode
+
import jwt
from fastapi import FastAPI, Depends, HTTPException
from fastapi.security import OAuth2PasswordBearer
@@ -72,4 +75,45 @@
except jwt.PyJWTError as e:
print(e)
await websocket.close(code=1008)
- raise WebSocketDisconnect(code=status.WS_1008_POLICY_VIOLATION)
\ No newline at end of file
+ raise WebSocketDisconnect(code=status.WS_1008_POLICY_VIOLATION)
+
+
+def format_file_url(agent_id: str, file_url: str, doc_id: str = None, doc_name: str = None) -> str:  # Build a relative ./api/files/download/ link from file_url, or else from doc_id/doc_name.
+ if file_url:
+ # URL-encode file_url, leaving ':' and '/' unescaped.
+ encoded_file_url = urllib.parse.quote(file_url, safe=':/')
+ return f"./api/files/download/?url={encoded_file_url}&agent_id={agent_id}"  # agent_id is interpolated without URL-encoding
+
+ if doc_id:
+ # URL-encode doc_id and doc_name with no safe characters. NOTE(review): doc_name defaults to None, which quote() does not accept - confirm callers always pass it together with doc_id.
+ encoded_doc_id = urllib.parse.quote(doc_id, safe='')
+ encoded_doc_name = urllib.parse.quote(doc_name, safe='')
+ return f"./api/files/download/?doc_id={encoded_doc_id}&doc_name={encoded_doc_name}&agent_id={agent_id}"
+
+ return file_url  # neither file_url nor doc_id is truthy: hand back the (falsy) file_url unchanged
+
+
+def process_files(files, agent_id):
+ """
+ Process the file list: rewrite the "file_url" of each entry, in place, through format_file_url.
+
+ :param files: list of files; each file is a dict
+ :param agent_id: agent ID, forwarded to format_file_url
+ """
+ if not files:
+ return # Nothing to do when the file list is empty (or otherwise falsy); return immediately.
+
+ for file in files:
+ if "file_url" in file and file["file_url"]:
+ try:
+ file["file_url"] = format_file_url(agent_id, file["file_url"])
+ except Exception as e:
+ # Report the exception (printed to stdout) but keep processing the remaining files.
+ print(f"Error processing file URL: {e}")
+if __name__=="__main__":  # Ad-hoc manual check; runs only when this module is executed as a script.
+
+ files1 = [{"file_url": "aaa.com"}, {"file_url":"bbb.com"}]
+ print(files1)  # entries before rewriting
+
+ process_files(files1,11111)  # NOTE(review): agent_id is passed as an int here, while format_file_url annotates it as str
+ print(files1)  # same list object, printed again after process_files has run
\ No newline at end of file
diff --git a/app/api/files.py b/app/api/files.py
index 5da2cc4..12c55b0 100644
--- a/app/api/files.py
+++ b/app/api/files.py
@@ -1,5 +1,10 @@
-from fastapi import Depends, APIRouter, HTTPException, UploadFile, File, requests, Query
+from typing import Optional
+
+import requests
+from fastapi import Depends, APIRouter, HTTPException, UploadFile, File, Query
+from pydantic import BaseModel
from sqlalchemy.orm import Session
+from starlette.responses import StreamingResponse
from app.api import Response, get_current_user, ResponseList
from app.config.config import settings
@@ -9,6 +14,7 @@
from app.service.bisheng import BishengService
from app.service.ragflow import RagflowService
from app.service.token import get_ragflow_token, get_bisheng_token
+import urllib.parse
router = APIRouter()
@@ -55,3 +61,44 @@
else:
return Response(code=200, msg="Unsupported agent type")
+
+
+@router.get("/download/", response_model=Response)  # NOTE(review): response_model is Response, but the success path returns a StreamingResponse
+async def download_file(  # Look up the agent, derive the upstream URL and filename from its type, then stream the upstream body back as an attachment.
+ url: Optional[str] = Query(None, description="URL of the file to download for bisheng"),
+ agent_id: str = Query(..., description="Agent ID"),
+ doc_id: Optional[str] = Query(None, description="Optional doc id for ragflow agents"),
+ doc_name: Optional[str] = Query(None, description="Optional doc name for ragflow agents"),
+ db: Session = Depends(get_db)
+):
+ agent = db.query(AgentModel).filter(AgentModel.id == agent_id).first()
+ if not agent:
+ return Response(code=404, msg="Agent not found")
+
+ if agent.agent_type == AgentType.BISHENG:
+ url = urllib.parse.unquote(url)  # NOTE(review): url is Optional (default None) - confirm it is always supplied for bisheng agents
+ # Extract the file name from the URL (last path segment, percent-decoded).
+ parsed_url = urllib.parse.urlparse(url)
+ filename = urllib.parse.unquote(parsed_url.path.split('/')[-1])
+ url = url.replace("http://minio:9000", settings.bisheng_base_url)  # swap the hard-coded http://minio:9000 prefix for the configured bisheng base URL
+ elif agent.agent_type == AgentType.RAGFLOW:
+ if not doc_id:
+ return Response(code=400, msg="doc_id is required")
+ url = f"{settings.ragflow_base_url}/v1/document/get/{doc_id}"
+ filename = doc_name  # may be None: doc_name is an optional query parameter
+ else:
+ return Response(code=400, msg="Unsupported agent type")
+
+ try:
+ # Send a GET request to fetch the file content. NOTE(review): no timeout is passed, and this blocking call runs inside an async def.
+ response = requests.get(url, stream=True)
+ response.raise_for_status() # Check that the request succeeded.
+
+ # Return a streaming response.
+ return StreamingResponse(
+ response.iter_content(chunk_size=1024),
+ media_type="application/octet-stream",
+ headers={"Content-Disposition": f"attachment; filename*=utf-8''{urllib.parse.quote(filename)}"}
+ )
+ except Exception as e:
+ raise HTTPException(status_code=400, detail=f"Error downloading file: {e}")  # every failure inside the try block, upstream HTTP errors included, is reported as a 400
diff --git a/app/api/report.py b/app/api/report.py
index 386dcf1..516ead9 100644
--- a/app/api/report.py
+++ b/app/api/report.py
@@ -4,7 +4,7 @@
import asyncio
import websockets
from sqlalchemy.orm import Session
-from app.api import get_current_user_websocket, ResponseList, get_current_user
+from app.api import get_current_user_websocket, ResponseList, get_current_user, format_file_url, process_files
from app.config.config import settings
from app.models.agent_model import AgentModel, AgentType
from app.models.base_model import get_db
@@ -68,6 +68,7 @@
t = "close"
else:
t = "stream"
+ process_files(files, agent_id)
result = {"step_message": steps, "type": t, "files": files}
await websocket.send_json(result)
print(f"Forwarded to client, {chat_id}: {result}")
diff --git a/pip_install.sh b/pip_install.sh
index c4519b8..d25c9b7 100644
--- a/pip_install.sh
+++ b/pip_install.sh
@@ -1,4 +1,5 @@
pip install PyMySQL & pip install fastapi & pip install sqlalchemy & pip install PyJWT & pip install rsa & pip install httpx & pip install uvicorn & pip install bcrypt & pip install PyYAML & pip install pycryptodomex & pip install passlib
pip install werkzeug
pip install xlwings
-pip install python-multipart
\ No newline at end of file
+pip install python-multipart
+pip install requests
\ No newline at end of file
--
Gitblit v1.8.0