-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpreprocess1.py
31 lines (30 loc) · 1.26 KB
/
preprocess1.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
'''
Author: Victor-kawai [email protected]
Date: 2024-05-22 11:18:46
LastEditors: Victor-kawai [email protected]
LastEditTime: 2024-06-06 14:37:55
FilePath: \毕设\code\preprocess1.py
Description: 这是默认设置,请设置`customMade`, 打开koroFileHeader查看配置 进行设置: https://github.com/OBKoro1/koro1FileHeader/wiki/%E9%85%8D%E7%BD%AE
'''
from pdf2jpg import *
from cut_image import *
from format_change import *
'''
该脚本用于处理PDF到图片切割的自动化步骤:
1、将PDF转化为图片;
2、对图片进行切割;
3、对图片的表述格式进行转换。
最后的处理结果需要人工检查图片切分状况,需对切分不良的图片进行人工重新切分。
'''
if __name__ == "__main__":
# 1、PDF地址
pdfPath = '元丰新制/枢密院门/264-278枢密院门.pdf'
print("开始处理PDF文件:", pdfPath)
# 2、需要储存图片的目录
imagePath = pdfPath[:pdfPath.rfind('.')]
print("图片将被储存在:", imagePath)
pyMuPDF_fitz(pdfPath, imagePath)
cut_image_path = cut_image(imagePath)
print("切割后图片将存储在:", cut_image_path)
change_format(cut_image_path)
print("\n处理结束,请对切分图片进行人工检查!")