10.24
This commit is contained in:
parent
7776c41ed0
commit
8f428e73da
@ -42,6 +42,7 @@ def get_filename_and_folder(file_path):
|
|||||||
def pdf2docx(local_path_in):
|
def pdf2docx(local_path_in):
|
||||||
remote_url = 'http://47.98.59.178:8000/v3/3rd/files/transfer/p2d'
|
remote_url = 'http://47.98.59.178:8000/v3/3rd/files/transfer/p2d'
|
||||||
receive_download_url = upload_file(local_path_in, remote_url) #转换完成,得到下载链接
|
receive_download_url = upload_file(local_path_in, remote_url) #转换完成,得到下载链接
|
||||||
|
print(receive_download_url)
|
||||||
filename, folder = get_filename_and_folder(local_path_in) #输入输出在同一个文件夹
|
filename, folder = get_filename_and_folder(local_path_in) #输入输出在同一个文件夹
|
||||||
local_filename=os.path.join(folder,filename) #输出文件名 C:\Users\Administrator\Desktop\货物标\zbfiles\6.2定版视频会议磋商文件 不带后缀
|
local_filename=os.path.join(folder,filename) #输出文件名 C:\Users\Administrator\Desktop\货物标\zbfiles\6.2定版视频会议磋商文件 不带后缀
|
||||||
downloaded_filepath,file_type=download_file(receive_download_url, local_filename)
|
downloaded_filepath,file_type=download_file(receive_download_url, local_filename)
|
||||||
@ -162,7 +163,8 @@ def doc2docx(file_path):
|
|||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
# 替换为你的文件路径和API URL
|
# 替换为你的文件路径和API URL
|
||||||
local_path_in="C:\\Users\\Administrator\\Desktop\\fsdownload\\1fbbb6ff-7ddc-40bb-8857-b7de37aece3f\\兴欣工程.pdf"
|
# local_path_in="C:\\Users\\Administrator\\Desktop\\fsdownload\\1fbbb6ff-7ddc-40bb-8857-b7de37aece3f\\兴欣工程.pdf"
|
||||||
|
local_path_in="C:\\Users\\Administrator\\Desktop\\fsdownload\\ztbfile.pdf"
|
||||||
# downloaded_file=doc2docx(local_path_in)
|
# downloaded_file=doc2docx(local_path_in)
|
||||||
downloaded_file=pdf2docx(local_path_in)
|
downloaded_file=pdf2docx(local_path_in)
|
||||||
print(downloaded_file)
|
print(downloaded_file)
|
||||||
|
@ -381,6 +381,7 @@ def process_and_stream(file_url, zb_type):
|
|||||||
includes = ["基础信息", "资格审查", "商务评分", "技术评分", "无效标与废标项", "投标文件要求", "开评定标流程"]
|
includes = ["基础信息", "资格审查", "商务评分", "技术评分", "无效标与废标项", "投标文件要求", "开评定标流程"]
|
||||||
final_result, extracted_info,procurement_reqs = outer_post_processing(combined_data, includes)
|
final_result, extracted_info,procurement_reqs = outer_post_processing(combined_data, includes)
|
||||||
|
|
||||||
|
logger.info(f"Procurement requirements extracted: {json.dumps(procurement_reqs, ensure_ascii=False, indent=4)}") # 添加日志记录
|
||||||
procurement_reqs_response={
|
procurement_reqs_response={
|
||||||
'message': 'procurement_reqs',
|
'message': 'procurement_reqs',
|
||||||
'filename': os.path.basename(downloaded_filepath),
|
'filename': os.path.basename(downloaded_filepath),
|
||||||
|
@ -1,24 +1,14 @@
|
|||||||
import re
|
from flask_app.general.通义千问long import upload_file,qianwen_long
|
||||||
|
file_path="C:\\Users\\Administrator\\Desktop\\招标文件\\招标test文件夹\\zbtest19\\zbtest19_214-320.pdf"
|
||||||
begin_pattern = re.compile(r'第[一二三四五六七八九十]+章\s*(招标公告|投标须知.*)|(^|\n)第一卷|招标编号:|招标编号:')
|
user_query="""该文件为投标文件格式要求,请你根据该招标文件回答:营业执照应该附在哪个地方?你可能需要查找以下章节出现的地方:'具有独立承担民事责任能力的法人','投标人基本信息表','法人或者其他组织的营业执照等证明文件,自然人的身份证明','投标人情况介绍','投标人简介','企业相关证件'。
|
||||||
|
我需要将营业执照贴在该章节的最后面,目前我需要定位到插入的位置,请你返回给我插入位置的上下文,字数限制在30字以内,以json格式返回,键名分别是'上文','下文',上下文应格式内容完全与原文保持一致,不得擅自删减总结,示例输出如下:
|
||||||
# 测试用例
|
{
|
||||||
test_cases = [
|
"上文":"投标人: (盖单位章)
|
||||||
"第一章 招标公告",
|
年 月 日",
|
||||||
"\n第一章 招标公告", # 在第二行
|
"下文":"四、投标保证金
|
||||||
"第二章 投标须知",
|
(招标人名称):"
|
||||||
"第三章 投标须知要求",
|
}
|
||||||
"第一卷 投标文件格式",
|
"""
|
||||||
"招标编号: ABC123",
|
file_id=upload_file(file_path)
|
||||||
"招标编号:DEF456",
|
res=qianwen_long(file_id,user_query)
|
||||||
"第三章 项目概述",
|
print(res)
|
||||||
"第四章 评标办法"
|
|
||||||
]
|
|
||||||
|
|
||||||
# 测试匹配
|
|
||||||
for i, case in enumerate(test_cases, 1):
|
|
||||||
match = begin_pattern.search(case)
|
|
||||||
if match:
|
|
||||||
print(f"Test case {i}: Matched - '{case}'")
|
|
||||||
else:
|
|
||||||
print(f"Test case {i}: Not matched - '{case}'")
|
|
Loading…
x
Reference in New Issue
Block a user