From 992d91359f4e4437ddba9843173254441c896918 Mon Sep 17 00:00:00 2001
From: zhaoqingang <zhaoqg0118@163.com>
Date: Thu, 02 Jan 2025 18:03:28 +0800
Subject: [PATCH] 报告生成文档清洗

---
 app/api/chat.py |  200 ++++++++++++++++++++++++++++++-------------------
 1 files changed, 121 insertions(+), 79 deletions(-)

diff --git a/app/api/chat.py b/app/api/chat.py
index 3c8e9c7..2993b2a 100644
--- a/app/api/chat.py
+++ b/app/api/chat.py
@@ -436,6 +436,10 @@
                         title_number = receive_message.get('title_number', 8)
                         title_style = receive_message.get('title_style', "")
                         title_query = receive_message.get('title_query', "")
+                        is_clean = receive_message.get('is_clean', 0)
+                        file_type = receive_message.get('file_type', 1)
+                        max_token = receive_message.get('max_tokens', 100000)
+                        tokens = receive_message.get('tokens', 0)
                         if upload_files:
                             title_query = "start"
                         # if not upload_files:
@@ -456,15 +460,27 @@
                         }
                         files = []
                         for file in upload_files:
-                            files.append({
-                                "type": "document",
-                                "transfer_method": "local_file",
-                                "url": "",
-                                "upload_file_id": file
-                            })
+                            if file_type == 1:
+                                files.append({
+                                    "type": "document",
+                                    "transfer_method": "local_file",
+                                    "url": "",
+                                    "upload_file_id": file
+                                })
+                            else:
+                                files.append({
+                                    "type": "document",
+                                    "transfer_method": "remote_url",
+                                    "url": file,
+                                    "upload_file_id": ""
+                                })
+                        inputs_list = []
+                        token_list = []
                         if workflow_type == 1:
                             inputs["input_files"] = files
-                        elif workflow_type == 2:
+                            inputs_list.append(inputs)
+                            token_list.append(token)
+                        elif workflow_type == 2 and is_clean == 0:
                             inputs["file_list"] = files
                             inputs["Completion_of_main_indicators"] = title
                             inputs["sub_titles"] = sub_titles
@@ -472,6 +488,8 @@
                             if not token:
                                 await websocket.send_json(
                                     {"message": "Invalid token document_to_report", "type": "error"})
+                            inputs_list.append(inputs)
+                            token_list.append(token)
                         elif workflow_type == 3:
                             inputs["file_list"] = files
                             inputs["number_of_title"] = title_number
@@ -480,89 +498,113 @@
                             if not token:
                                 await websocket.send_json(
                                     {"message": "Invalid token document_to_title", "type": "error"})
+                            # inputs_list.append(inputs)
+                            # token_list.append(token)
+                        elif workflow_type == 2 and is_clean == 1:
+                            # inputs["input_files"] = files
+                            inputs_list.append(inputs)
+                            token_list.append(token)
+                            inputs1 = {}
+                            # inputs1["file_list"] = files
+                            inputs1["Completion_of_main_indicators"] = title
+                            inputs1["sub_titles"] = sub_titles
+                            token = DfTokenDao(db).get_token_by_id(DOCUMENT_TO_REPORT_TITLE)
+                            if not token:
+                                await websocket.send_json(
+                                    {"message": "Invalid token document_to_report", "type": "error"})
+                            inputs_list.append(inputs1)
+                            token_list.append(token)
 
                         complete_response = ""
                         if workflow_type == 1 or workflow_type == 2:
-                            async for rag_response in dify_service.workflow(token, current_user.id, inputs):
-                                # print(rag_response)
-                                try:
-                                    if rag_response[:5] == "data:":
-                                        # 濡傛灉鏄紝鍒欐埅鍙栨帀鍓�5涓瓧绗︼紝骞跺幓闄ら灏剧┖鐧界
-                                        complete_response = rag_response[5:].strip()
-                                    elif "event: ping" in rag_response:
-                                        continue
-                                    else:
-                                        # 否则，保持原样
-                                        complete_response += rag_response
+                            for inputs in inputs_list:
+                                inputs["input_files"] = files
+                                async for rag_response in dify_service.workflow(token, current_user.id, inputs):
+                                    # print(rag_response)
                                     try:
-                                        data = json.loads(complete_response)
-                                        complete_response = ""
-                                        if data.get("event") == "node_started" or data.get("event") == "node_finished":  # "event": "message_end"
-                                            if "data" not in data or not data["data"]:  # 信息过滤
-                                                logger.error("闈炴硶鏁版嵁--------------------")
-                                                logger.error(data)
-                                                continue
-                                            else:  # 正常输出
+                                        if rag_response[:5] == "data:":
+                                            # 濡傛灉鏄紝鍒欐埅鍙栨帀鍓�5涓瓧绗︼紝骞跺幓闄ら灏剧┖鐧界
+                                            complete_response = rag_response[5:].strip()
+                                        elif "event: ping" in rag_response:
+                                            continue
+                                        else:
+                                            # 否则，保持原样
+                                            complete_response += rag_response
+                                        try:
+                                            data = json.loads(complete_response)
+                                            complete_response = ""
+                                            if data.get("event") == "node_started" or data.get("event") == "node_finished":  # "event": "message_end"
+                                                if "data" not in data or not data["data"]:  # 信息过滤
+                                                    logger.error("闈炴硶鏁版嵁--------------------")
+                                                    logger.error(data)
+                                                    continue
+                                                else:  # 正常输出
+                                                    answer = data.get("data", "")
+                                                    if isinstance(answer, str):
+                                                        logger.error("----------------鏈煡鏁版嵁--------------------")
+                                                        logger.error(data)
+                                                        continue
+                                                    elif isinstance(answer, dict):
+
+                                                        message = answer.get("title", "")
+
+                                                    result = {"message": message, "type": "system"}
+                                            elif data.get("event") == "workflow_finished":
                                                 answer = data.get("data", "")
                                                 if isinstance(answer, str):
                                                     logger.error("----------------鏈煡鏁版嵁--------------------")
                                                     logger.error(data)
-                                                    continue
+                                                    result = {"message": "", "type": "close", "download_url": ""}
                                                 elif isinstance(answer, dict):
-
-                                                    message = answer.get("title", "")
-
-                                                result = {"message": message, "type": "system"}
-                                        elif data.get("event") == "workflow_finished":
-                                            answer = data.get("data", "")
-                                            if isinstance(answer, str):
-                                                logger.error("----------------鏈煡鏁版嵁--------------------")
-                                                logger.error(data)
-                                                result = {"message": "", "type": "close", "download_url": ""}
-                                            elif isinstance(answer, dict):
-                                                download_url = ""
-                                                outputs = answer.get("outputs", {})
-                                                if outputs:
-                                                    message = outputs.get("output", "")
-                                                    download_url = outputs.get("download_url", "")
-                                                else:
-                                                    message = answer.get("error", "")
-
-                                                result = {"message": message, "type": "message", "download_url": download_url}
-                                                try:
-                                                    SessionService(db).update_session(chat_id,
-                                                                                      message={"role": "assistant",
-                                                                                               "content": {
-                                                                                                   "answer": message,
-                                                                                                   "download_url": download_url}},
-                                                                                      conversation_id=data.get(
-                                                                                          "conversation_id"))
-                                                except Exception as e:
-                                                    logger.error("淇濆瓨dify鐨勪細璇濆紓甯革紒")
-                                                    logger.error(e)
-                                                try:
-                                                    await websocket.send_json(result)
-                                                except Exception as e:
-                                                    logger.error(e)
-                                                    logger.error("杩斿洖瀹㈡埛绔秷鎭紓甯�!")
-                                                result = {"message": "", "type": "close", "download_url": ""}
+                                                    download_url = ""
+                                                    outputs = answer.get("outputs", {})
+                                                    if outputs:
+                                                        message = outputs.get("output", "")
+                                                        download_url = outputs.get("download_url", "")
+                                                    else:
+                                                        message = answer.get("error", "")
+                                                    if download_url:
+                                                        files = [{
+                                                            "type": "document",
+                                                            "transfer_method": "remote_url",
+                                                            "url": download_url,
+                                                            "upload_file_id": ""
+                                                        }]
+                                                    result = {"message": message, "type": "message", "download_url": download_url}
+                                                    try:
+                                                        SessionService(db).update_session(chat_id,
+                                                                                          message={"role": "assistant",
+                                                                                                   "content": {
+                                                                                                       "answer": message,
+                                                                                                       "download_url": download_url}},
+                                                                                          conversation_id=data.get(
+                                                                                              "conversation_id"))
+                                                    except Exception as e:
+                                                        logger.error("淇濆瓨dify鐨勪細璇濆紓甯革紒")
+                                                        logger.error(e)
+                                                    try:
+                                                        await websocket.send_json(result)
+                                                    except Exception as e:
+                                                        logger.error(e)
+                                                        logger.error("杩斿洖瀹㈡埛绔秷鎭紓甯�!")
+                                                    result = {"message": "", "type": "close", "download_url": ""}
 
 
-                                        else:
-                                            continue
-                                        try:
-                                            await websocket.send_json(result)
-                                        except Exception  as e:
-                                            logger.error(e)
-                                            logger.error("杩斿洖瀹㈡埛绔秷鎭紓甯�!")
-                                        complete_response = ""
-                                    except json.JSONDecodeError as e:
-                                        print(f"Error decoding JSON: {e}")
-                                        # print(f"Response text: {text}")
-                                except Exception as e2:
-                                    result = {"message": f"鍐呴儴閿欒锛� {e2}", "type": "close"}
-                                    await websocket.send_json(result)
-                                    print(f"Error process message of ragflow: {e2}")
+                                            else:
+                                                continue
+                                            try:
+                                                await websocket.send_json(result)
+                                            except Exception  as e:
+                                                logger.error(e)
+                                                logger.error("杩斿洖瀹㈡埛绔秷鎭紓甯�!")
+                                            complete_response = ""
+                                        except json.JSONDecodeError as e:
+                                            print(f"Error decoding JSON: {e}")
+                                            # print(f"Response text: {text}")
+                                    except Exception as e2:
+                                        result = {"message": f"鍐呴儴閿欒锛� {e2}", "type": "close"}
+                                        await websocket.send_json(result)
+                                        print(f"Error process message of ragflow: {e2}")
                         elif workflow_type == 3:
                             image_list = []
                             # print(inputs)

--
Gitblit v1.8.0