From dc30de3087321f3f7cd144daf32e9ab73470951b Mon Sep 17 00:00:00 2001 From: zy123 <646228430@qq.com> Date: Thu, 12 Dec 2024 10:59:51 +0800 Subject: [PATCH] =?UTF-8?q?12.12=20=E8=B1=86=E5=8C=85=E6=B5=8B=E8=AF=95?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- flask_app/general/file2markdown.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/flask_app/general/file2markdown.py b/flask_app/general/file2markdown.py index 036f48e..48a2c22 100644 --- a/flask_app/general/file2markdown.py +++ b/flask_app/general/file2markdown.py @@ -50,12 +50,12 @@ def convert_pdf_to_markdown(file_path): resp = textin.recognize_pdf2md(image, { 'page_start': 0, 'page_count': 50, # 设置解析页数为50页 - 'table_flavor': 'md', # html 按html语法输出表格 - 'parse_mode': 'scan', # 设置解析模式为scan模式 + 'table_flavor': 'html', # html 按html语法输出表格 + 'parse_mode': 'auto', # 设置解析模式为auto模式 'page_details': 0, # 不包含页面细节 'markdown_details': 1, 'apply_document_tree': 1, - 'dpi': 144 # 分辨率设置为144 dpi + 'dpi': 216 # 分辨率设置为216 dpi（默认为144 dpi） }) print("request time: ", resp.elapsed.total_seconds()) data = json.loads(resp.text)