From 04816cdedff3588d5de09b29db0d6223707a5a2e Mon Sep 17 00:00:00 2001 From: zy123 <646228430@qq.com> Date: Mon, 6 Jan 2025 10:34:30 +0800 Subject: [PATCH] =?UTF-8?q?1.6=20insert=5Fdel=5Fpagemark.py=E4=BF=AE?= =?UTF-8?q?=E6=94=B9?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- flask_app/general/insert_del_pagemark.py | 12 +++++++----- flask_app/货物标/截取pdf货物标版.py | 4 ++-- 2 files changed, 9 insertions(+), 7 deletions(-) diff --git a/flask_app/general/insert_del_pagemark.py b/flask_app/general/insert_del_pagemark.py index 3157871..de3f645 100644 --- a/flask_app/general/insert_del_pagemark.py +++ b/flask_app/general/insert_del_pagemark.py @@ -5,7 +5,7 @@ from PyPDF2 import PdfReader, PdfWriter from docx import Document from reportlab.pdfgen import canvas from reportlab.lib.units import cm - +import copy #复制input_pdf_path的内容到invalid_added.pdf 这一步可能报错!绘制新的一页基本不会报错 def insert_mark(input_pdf_path): @@ -48,8 +48,10 @@ def insert_mark(input_pdf_path): # 将内存中的PDF读入PyPDF2 packet.seek(0) new_pdf = PdfReader(packet) - blank_page = new_pdf.pages[0] - + # blank_page = new_pdf.pages[0] + blank_page = copy.deepcopy(new_pdf.pages[0]) + packet.truncate(0) + packet.seek(0) # 将带有文本的空白页添加到写入器 pdf_writer.add_page(blank_page) @@ -92,10 +94,10 @@ def delete_mark(docx_path): return new_file_path if __name__ == '__main__': - # input=r'D:\flask_project\flask_app\static\output\output1\90b073b5-b8fb-4b11-9962-10de7c3f3854\invalid_added.docx' + # input=r'C:\Users\Administrator\Desktop\fsdownload\0bb9cf31-280c-4d96-bc21-0871ee7fd6df\tmp\ztbfile.pdf' # input=r'C:\Users\Administrator\Desktop\new招标文件\output5\广水市公安局音视频监控系统设备采购项目_procurement.pdf' # output=insert_mark(input) - doc_path = r'D:\flask_project\flask_app\static\output\output1\90b073b5-b8fb-4b11-9962-10de7c3f3854\invalid_added.docx' + doc_path = r'C:\Users\Administrator\Desktop\fsdownload\0bb9cf31-280c-4d96-bc21-0871ee7fd6df\tmp\invalid_added.docx' res=delete_mark(doc_path) if res: print(res) diff --git a/flask_app/货物标/截取pdf货物标版.py b/flask_app/货物标/截取pdf货物标版.py index a4867ac..d485944 100644 --- a/flask_app/货物标/截取pdf货物标版.py +++ b/flask_app/货物标/截取pdf货物标版.py @@ -612,10 +612,10 @@ if __name__ == "__main__": logger = get_global_logger("123") # input_path = r"C:\Users\Administrator\Desktop\new招标文件\货物标" # pdf_path = r"C:\Users\Administrator\Desktop\招标文件-采购类\2024-贵州-贵州医科大学附属医院导视系统零星制作安装项目.pdf" - pdf_path=r"D:\flask_project\flask_app\static\output\output1\a43b4a55-06c1-465d-afb3-5844695ad9d8\ztbfile.pdf" + pdf_path=r"C:\Users\Administrator\Desktop\fsdownload\0bb9cf31-280c-4d96-bc21-0871ee7fd6df\ztbfile.pdf" # input_path = r"C:\Users\Administrator\Desktop\货物标\zbfiles\2-招标文件(广水市教育局封闭管理).pdf" # pdf_path=r"C:\Users\Administrator\Desktop\文件解析问题\文件解析问题\1414cb9c-7bf4-401c-8761-2acde151b9c2\ztbfile.pdf" - output_folder = r"D:\flask_project\flask_app\static\output\output1\a43b4a55-06c1-465d-afb3-5844695ad9d8\tmp" + output_folder = r"C:\Users\Administrator\Desktop\fsdownload\0bb9cf31-280c-4d96-bc21-0871ee7fd6df\tmp" # output_folder = r"C:\Users\Administrator\Desktop\new招标文件\output2" selection = 5 # 例如:1 - 公告, 2 - 评标办法, 3 - 资格审查后缀有qualification1或qualification2(与评标办法一致) 4.投标人须知前附表part1 投标人须知正文part2 5-采购需求 generated_files = truncate_pdf_main_goods(pdf_path, output_folder, selection,logger)