1.17 小bug
This commit is contained in:
parent
90940bc4a0
commit
9207aef9a2
@@ -183,7 +183,7 @@ def multi_threading(queries, knowledge_name="", file_id="", llm_type=1,need_extr
|
|||||||
return []
|
return []
|
||||||
print("多线程提问:starting multi_threading...")
|
print("多线程提问:starting multi_threading...")
|
||||||
result_queue = queue.Queue()
|
result_queue = queue.Queue()
|
||||||
with concurrent.futures.ThreadPoolExecutor(max_workers=30) as executor:
|
with concurrent.futures.ThreadPoolExecutor(max_workers=40) as executor:
|
||||||
future_to_index = {
|
future_to_index = {
|
||||||
executor.submit(llm_call, query, knowledge_name, file_id, result_queue, index, llm_type,need_extra): index
|
executor.submit(llm_call, query, knowledge_name, file_id, result_queue, index, llm_type,need_extra): index
|
||||||
for index, query in enumerate(queries)
|
for index, query in enumerate(queries)
|
||||||
|
@@ -449,7 +449,7 @@ def convert_clause_to_json(file_path,output_folder,type=1):
|
|||||||
)
|
)
|
||||||
if file_path.endswith('.pdf'):
|
if file_path.endswith('.pdf'):
|
||||||
text = extract_text_from_pdf(file_path, end_pattern, start_pattern_1, start_pattern_2)
|
text = extract_text_from_pdf(file_path, end_pattern, start_pattern_1, start_pattern_2)
|
||||||
print(text)
|
# print(text)
|
||||||
else:
|
else:
|
||||||
raise ValueError("Unsupported file format")
|
raise ValueError("Unsupported file format")
|
||||||
parsed_data = parse_text_by_heading(text)
|
parsed_data = parse_text_by_heading(text)
|
||||||
|
@@ -274,17 +274,13 @@ def goods_bid_main(output_folder, file_path, file_type, unique_id):
|
|||||||
#TODO: ec7d5328-9c57-450f-baf4-2e5a6f90ed1d
|
#TODO: ec7d5328-9c57-450f-baf4-2e5a6f90ed1d
|
||||||
|
|
||||||
#TODO:
|
#TODO:
|
||||||
# 2.废标项这边,考虑大模型+正则并用
|
|
||||||
# 废标项,增加对表格的提取+排除重复项,按顺序处理
|
|
||||||
# 考虑将工程标和货物标的 投标人须知那块逻辑结合
|
# 考虑将工程标和货物标的 投标人须知那块逻辑结合
|
||||||
# D:\flask_project\flask_app\static\output\output1\2c4be864-bdab-405d-95cb-9d945d8627b3排查一下 clause 有问题+
|
# D:\flask_project\flask_app\static\output\output1\2c4be864-bdab-405d-95cb-9d945d8627b3排查一下 clause 有问题+
|
||||||
# C:\Users\Administrator\Desktop\fsdownload\bbf7504f-3c75-45e5-b3e2-ab0a15ec9c14
|
# C:\Users\Administrator\Desktop\fsdownload\bbf7504f-3c75-45e5-b3e2-ab0a15ec9c14
|
||||||
# 解决禅道 测试的bug
|
# 解决禅道 测试的bug
|
||||||
# 国网湖北电力荆州供电公司2024年第四次服务授权竞争性谈判采购-采购文件(15DJ04).docx 废标项 段落和表格混杂
|
|
||||||
# 货物标和工程标的资格审查整合
|
# 货物标和工程标的资格审查整合
|
||||||
##TODO:招标文件111_tobidders_notice_part2.pdf 陕西省公安厅交通警察总队高速公路交通安全智能感知巡查系统项目(1)_tobidders_notice_part2.pdf 唐山市公安交通警察支队机动车查验机构视频存储回放系统竞争性谈判-招标文件正文(1)_tobidders_notice_part1.pdf
|
##TODO:招标文件111_tobidders_notice_part2.pdf 陕西省公安厅交通警察总队高速公路交通安全智能感知巡查系统项目(1)_tobidders_notice_part2.pdf 唐山市公安交通警察支队机动车查验机构视频存储回放系统竞争性谈判-招标文件正文(1)_tobidders_notice_part1.pdf
|
||||||
#TODO:2024-陕西-陕西省某单位2024年执勤化妆服采购项目.pdf
|
#TODO:2024-陕西-陕西省某单位2024年执勤化妆服采购项目.pdf
|
||||||
# C:\Users\Administrator\Desktop\货物\test3 废标排查
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
# 配置日志器
|
# 配置日志器
|
||||||
|
Loading…
x
Reference in New Issue
Block a user