diff --git a/flask_app/general/多线程提问.py b/flask_app/general/多线程提问.py index 8fdba84..5417c27 100644 --- a/flask_app/general/多线程提问.py +++ b/flask_app/general/多线程提问.py @@ -183,7 +183,7 @@ def multi_threading(queries, knowledge_name="", file_id="", llm_type=1,need_extr return [] print("多线程提问:starting multi_threading...") result_queue = queue.Queue() - with concurrent.futures.ThreadPoolExecutor(max_workers=30) as executor: + with concurrent.futures.ThreadPoolExecutor(max_workers=40) as executor: future_to_index = { executor.submit(llm_call, query, knowledge_name, file_id, result_queue, index, llm_type,need_extra): index for index, query in enumerate(queries) diff --git a/flask_app/general/投标人须知正文条款提取成json文件.py b/flask_app/general/投标人须知正文条款提取成json文件.py index f84cbde..6089498 100644 --- a/flask_app/general/投标人须知正文条款提取成json文件.py +++ b/flask_app/general/投标人须知正文条款提取成json文件.py @@ -449,7 +449,7 @@ def convert_clause_to_json(file_path,output_folder,type=1): ) if file_path.endswith('.pdf'): text = extract_text_from_pdf(file_path, end_pattern, start_pattern_1, start_pattern_2) - print(text) + # print(text) else: raise ValueError("Unsupported file format") parsed_data = parse_text_by_heading(text) diff --git a/flask_app/routes/货物标解析main.py b/flask_app/routes/货物标解析main.py index 60744d1..54bd8cc 100644 --- a/flask_app/routes/货物标解析main.py +++ b/flask_app/routes/货物标解析main.py @@ -274,17 +274,13 @@ def goods_bid_main(output_folder, file_path, file_type, unique_id): #TODO: ec7d5328-9c57-450f-baf4-2e5a6f90ed1d #TODO: -# 2.废标项这边,考虑大模型+正则并用 -# 废标项,增加对表格的提取+排除重复项,按顺序处理 # 考虑将工程标和货物标的 投标人须知那块逻辑结合 # D:\flask_project\flask_app\static\output\output1\2c4be864-bdab-405d-95cb-9d945d8627b3排查一下 clause 有问题+ # C:\Users\Administrator\Desktop\fsdownload\bbf7504f-3c75-45e5-b3e2-ab0a15ec9c14 # 解决禅道 测试的bug -# 国网湖北电力荆州供电公司2024年第四次服务授权竞争性谈判采购-采购文件(15DJ04).docx 废标项 段落和表格混杂 # 货物标和工程标的资格审查整合 ##TODO:招标文件111_tobidders_notice_part2.pdf 陕西省公安厅交通警察总队高速公路交通安全智能感知巡查系统项目(1)_tobidders_notice_part2.pdf 唐山市公安交通警察支队机动车查验机构视频存储回放系统竞争性谈判-招标文件正文(1)_tobidders_notice_part1.pdf #TODO:2024-陕西-陕西省某单位2024年执勤化妆服采购项目.pdf -# C:\Users\Administrator\Desktop\货物\test3 废标排查 if __name__ == "__main__": # 配置日志器