From 633a8ed975625851f23398f896594581c179f612 Mon Sep 17 00:00:00 2001 From: zhaoqingang <zhaoqg0118@163.com> Date: 星期一, 23 十二月 2024 09:45:50 +0800 Subject: [PATCH] mysql链接数量 --- app/task/fetch_agent.py | 263 +++++++++++++++++++++++++++++++++++++++++++++++++++- 1 files changed, 255 insertions(+), 8 deletions(-) diff --git a/app/task/fetch_agent.py b/app/task/fetch_agent.py index 80ac763..303d8f6 100644 --- a/app/task/fetch_agent.py +++ b/app/task/fetch_agent.py @@ -1,19 +1,27 @@ +from pickle import PROTO from typing import Dict, List, Tuple -from sqlalchemy import create_engine, Column, String, Integer +from sqlalchemy import create_engine, Column, String, Integer, Text from sqlalchemy.exc import IntegrityError from sqlalchemy.orm import sessionmaker from app.config.config import settings +from app.config.const import RAGFLOW, BISHENG, DIFY +from app.models import KnowledgeModel +from app.models.dialog_model import DialogModel +from app.models.user_model import UserAppModel from app.models.agent_model import AgentModel from app.models.base_model import SessionLocal, Base +from app.service.v2.app_register import AppRegisterDao # 鍒涘缓鏁版嵁搴撳紩鎿庡拰浼氳瘽宸ュ巶 engine_bisheng = create_engine(settings.sgb_db_url) engine_ragflow = create_engine(settings.fwr_db_url) +engine_dify = create_engine(settings.dify_database_url) SessionBisheng = sessionmaker(autocommit=False, autoflush=False, bind=engine_bisheng) SessionRagflow = sessionmaker(autocommit=False, autoflush=False, bind=engine_ragflow) +SessionDify = sessionmaker(autocommit=False, autoflush=False, bind=engine_dify) class Flow(Base): @@ -21,6 +29,8 @@ id = Column(String(255), primary_key=True) name = Column(String(255), nullable=False) status = Column(Integer, nullable=False) + description = Column(String(255), nullable=False) + user_id = Column(Integer, nullable=False) class Dialog(Base): @@ -28,7 +38,29 @@ id = Column(String(255), primary_key=True) name = Column(String(255), nullable=False) status = Column(String(1), nullable=False) + description = Column(String(255), nullable=False) + tenant_id = Column(String(36), nullable=False) + +class DfApps(Base): + __tablename__ = 'apps' + id = Column(String(36), primary_key=True) + name = Column(String(255), nullable=False) + status = Column(String(16), nullable=False) + description = Column(Text, nullable=False) + tenant_id = Column(String(36), nullable=False) + mode = Column(String(36), nullable=False) + + +class RgKnowledge(Base): + __tablename__ = 'knowledgebase' + id = Column(String(36), primary_key=True) # id + name = Column(String(128)) # 鍚嶇О + permission = Column(String(32), default="me") + tenant_id = Column(String(32)) # 鍒涘缓浜篿d + description = Column(Text) # 璇存槑 + status = Column(String(1)) # 鐘舵�� + doc_num = Column(Integer) # 鏂囨。 # 瑙f瀽鍚嶅瓧 def parse_names(names_str: str) -> List[str]: @@ -108,16 +140,19 @@ try: count = db.query(AgentModel).count() if count > 0: - return + result = db.query(AgentModel).delete() + db.commit() # 鎻愪氦浜嬪姟 initial_agents = [ - ('80ee430a-e396-48c4-a12c-7c7cdf5eda51', 1, '鎶ュ憡鐢熸垚', 'BISHENG', 'report'), + # ('80ee430a-e396-48c4-a12c-7c7cdf5eda51', 1, '鎶ュ憡鐢熸垚', 'DIFY', 'report'), ('basic_excel_merge', 2, '鎶ヨ〃鍚堝苟', 'BASIC', 'excelMerge'), - ('bfd090d589d811efb3630242ac190006', 4, '鏂囨。鏅鸿兘', 'BISHENG', 'report'), + ('7638f00638a24c21a68ec6c49b304a35', 4, '鏂囨。鏅鸿兘', 'DIFY', 'documentIa'), ('da3451da89d911efb9490242ac190006', 3, '鐭ヨ瘑闂瓟', 'RAGFLOW', 'knowledgeQA'), ('e96eb7a589db11ef87d20242ac190006', 5, '鏅鸿兘闂瓟', 'RAGFLOW', 'chat'), ('basic_excel_talk', 6, '鏅鸿兘鏁版嵁', 'BASIC', 'excelTalk'), - ('basic_question_talk', 7, '鏂囨。鍑哄嵎', 'BASIC', 'questionTalk'), - ('9d75142a-66eb-4e23-b7d4-03efe4584915', 8, '灏忔暟缁樺浘', 'DIFY', 'imageTalk') + ('basic_question_talk', 7, '鍑洪缁勫嵎', 'BASIC', 'questionTalk'), + ('9d75142a-66eb-4e23-b7d4-03efe4584915', 8, '灏忔暟缁樺浘', 'DIFY', 'imageTalk'), + ('basic_paper_talk', 9, '鏂囨。鍑哄嵎', 'BASIC', 'paperTalk'), + ('basic_report_clean', 10, '鏂囨。鎶ュ憡', 'DIFY', 'reportWorkflow') ] for agent in initial_agents: @@ -135,12 +170,224 @@ def sync_agents(): try: - bisheng_data = get_data_from_bisheng(BISHENG_NAMES_TO_SYNC) + # bisheng_data = get_data_from_bisheng(BISHENG_NAMES_TO_SYNC) ragflow_data = get_data_from_ragflow(RAGFLOW_NAMES_TO_SYNC) - update_ids_in_local(bisheng_data) + # update_ids_in_local(bisheng_data) update_ids_in_local(ragflow_data) print("Agents synchronized successfully") except Exception as e: print(f"Failed to sync agents: {str(e)}") + + +def update_ids_in_local(data: List[Tuple]): + db = SessionLocal() + try: + for row in data: + name = row[1] + new_id = row[0] + existing_agent = db.query(AgentModel).filter_by(name=name).first() + if existing_agent: + existing_agent.id = new_id + db.add(existing_agent) + db.commit() + except IntegrityError: + db.rollback() + raise + finally: + db.close() + +def get_rag_user_id(db, tenant_id, app_type): + + user = db.query(UserAppModel).filter(UserAppModel.app_type==app_type, UserAppModel.app_id==tenant_id).first() + if user: + return user.user_id + return tenant_id + + +def get_data_from_bisheng_v2(names: List[str]) -> List[Dict]: + db = SessionBisheng() + try: + if names: + query = db.query(Flow.id, Flow.name, Flow.description, Flow.status, Flow.user_id) \ + .filter(Flow.name.in_(names), Flow.status=="1") + else: + query = db.query(Flow.id, Flow.name, Flow.description, Flow.status, Flow.user_id).filter(Flow.status=="1") + + results = query.all() + # print(f"Executing query: {query}") + # 鏍煎紡鍖杋d涓篣UID + formatted_results = [{"id":row[0], "name": row[1], "description": row[2], "status": row[3], "user_id": str(row[4]), "mode": "agent-dialog"} for row in results] + return formatted_results + finally: + db.close() + +def get_data_from_ragflow_v2(names: List[str]) -> List[Dict]: + db = SessionRagflow() + try: + if names: + query = db.query(Dialog.id, Dialog.name, Dialog.description, Dialog.status, Dialog.tenant_id) \ + .filter( Dialog.name.in_(names)) + else: + query = db.query(Dialog.id, Dialog.name, Dialog.description, Dialog.status, Dialog.tenant_id) + + results = query.all() + formatted_results = [ + {"id": row[0], "name": row[1], "description": row[2], "status": "1" if row[3] == "1" else "2", + "user_id": str(row[4]), "mode": "agent-dialog"} for row in results] + return formatted_results + finally: + db.close() + + +def get_data_from_dify_v2(names: List[str]) -> List[Dict]: + db = SessionDify() + try: + if names: + query = db.query(DfApps.id, DfApps.name, DfApps.description, DfApps.status, DfApps.tenant_id, DfApps.mode) \ + .filter( DfApps.name.in_(names)) + else: + query = db.query(DfApps.id, DfApps.name, DfApps.description, DfApps.status, DfApps.tenant_id, DfApps.mode) + + results = query.all() + formatted_results = [ + {"id": str(row[0]), "name": row[1], "description": row[2], "status": "1", + "user_id": str(row[4]), "mode": row[5]} for row in results] + return formatted_results + finally: + db.close() + + + +def update_ids_in_local_v2(data: List[Dict], dialog_type:str): + db = SessionLocal() + agent_id_list = [] + type_dict = {"1": RAGFLOW,"2": BISHENG,"4": DIFY} + try: + for row in data: + agent_id_list.append(row["id"]) + existing_agent = db.query(DialogModel).filter_by(id=row["id"]).first() + if existing_agent: + existing_agent.name = row["name"] + existing_agent.description = row["description"] + existing_agent.status = row["status"] + existing_agent.mode = row["mode"] + # existing_agent.tenant_id = get_rag_user_id(db, row["user_id"], type_dict[dialog_type]) + else: + existing = DialogModel(id=row["id"], status=row["status"], name=row["name"], description=row["description"], tenant_id=get_rag_user_id(db, row["user_id"], type_dict[dialog_type]), dialog_type=dialog_type, mode=row["mode"]) + db.add(existing) + db.commit() + for dialog in db.query(DialogModel).filter_by(dialog_type=dialog_type).all(): + if dialog.id not in agent_id_list: + # print(dialog.id) + db.query(DialogModel).filter_by(id=dialog.id).update({"status": "2"}) + db.commit() + except IntegrityError: + db.rollback() + raise + finally: + db.close() + + + +def get_data_from_ragflow_knowledge(): + db = SessionRagflow() + try: + + results = db.query(RgKnowledge.id, RgKnowledge.name, RgKnowledge.description, RgKnowledge.status, RgKnowledge.tenant_id, RgKnowledge.doc_num, RgKnowledge.permission).all() + formatted_results = [ + {"id": row[0], "name": row[1], "description": row[2], "status": str(row[3]), + "user_id": str(row[4]), "doc_num": row[5], "permission": row[6]} for row in results] + return formatted_results + finally: + db.close() + +def sync_agents_v2(): + db = SessionLocal() + + try: + app_register = AppRegisterDao(db).get_apps() + for app in app_register: + if app["id"] == RAGFLOW: + ragflow_data = get_data_from_ragflow_v2([]) + if ragflow_data: + update_ids_in_local_v2(ragflow_data, "1") + elif app["id"] == BISHENG: + bisheng_data = get_data_from_bisheng_v2([]) + if bisheng_data: + update_ids_in_local_v2(bisheng_data, "2") + elif app["id"] == DIFY: + dify_data = get_data_from_dify_v2([]) + if dify_data: + update_ids_in_local_v2(dify_data, "4") + print("v2 Agents synchronized successfully") + except Exception as e: + print(f"v2 Failed to sync agents: {str(e)}") + +def update_ids_in_local_knowledge(data, klg_type): + type_dict = {"1": RAGFLOW, "2": BISHENG, "4": DIFY} + db = SessionLocal() + agent_id_list = [] + try: + for row in data: + agent_id_list.append(row["id"]) + existing_agent = db.query(KnowledgeModel).filter_by(id=row["id"]).first() + if existing_agent: + existing_agent.name = row["name"] + existing_agent.description = row["description"] + # existing_agent.tenant_id = get_rag_user_id(db, row["user_id"], type_dict[klg_type]) + existing_agent.permission = row["permission"] + existing_agent.documents = row["doc_num"] + existing_agent.status = row["status"] + else: + existing = KnowledgeModel(id=row["id"], name=row["name"], description=row["description"], + tenant_id=get_rag_user_id(db, row["user_id"], type_dict[klg_type]),status=row["status"], + knowledge_type=1, permission=row["permission"], documents=row["doc_num"]) + db.add(existing) + db.commit() + for dialog in db.query(KnowledgeModel).filter_by(knowledge_type=klg_type).all(): + if dialog.id not in agent_id_list: + db.query(KnowledgeModel).filter_by(id=dialog.id).delete() + db.commit() + except IntegrityError: + db.rollback() + raise + finally: + db.close() + +def get_one_from_ragflow_knowledge(klg_id): + db = SessionRagflow() + try: + + row = db.query(RgKnowledge.id, RgKnowledge.name, RgKnowledge.description, RgKnowledge.status, RgKnowledge.tenant_id, RgKnowledge.doc_num, RgKnowledge.permission).filter(RgKnowledge.id==klg_id).first() + return {"id": row[0], "name": row[1], "description": row[2], "status": str(row[3]), + "user_id": str(row[4]), "doc_num": row[5], "permission": row[6]} if row else {} + finally: + db.close() + + +def sync_knowledge(): + db = SessionLocal() + + try: + app_register = AppRegisterDao(db).get_apps() + for app in app_register: + if app["id"] == RAGFLOW: + ragflow_data = get_data_from_ragflow_knowledge() + if ragflow_data: + update_ids_in_local_knowledge(ragflow_data, "1") + # elif app["id"] == BISHENG: + # bisheng_data = get_data_from_bisheng_v2([]) + # update_ids_in_local_v2(bisheng_data, "2") + # elif app["id"] == DIFY: + # dify_data = get_data_from_dify_v2([]) + # update_ids_in_local_v2(dify_data, "4") + print("sync knowledge successfully") + except Exception as e: + print(f"Failed to sync knowledge: {str(e)}") + + +if __name__ == "__main__": + a = get_data_from_dify_v2([]) + print(a) -- Gitblit v1.8.0