Files
work-secretfile-selfcheck/UmiOCR-data/py_src/mission/doc_preview_connector.py

115 lines
4.2 KiB
Python

# ===============================================
# =============== 文档预览 - 连接器 ===============
# ===============================================
from PySide2.QtCore import QObject, Slot, Signal
from PySide2.QtGui import QPixmap, QImage
import fitz # PyMuPDF
from umi_log import logger
from .simple_mission import SimpleMission
from ..image_controller.image_provider import PixmapProvider
from ..utils.call_func import CallFunc
from .mission_doc import MissionDOC
MinSize = 0 # 最小渲染分辨率
# 文档预览连接器
class DocPreviewConnector(QObject):
previewImg = Signal(str) # imgID
previewOcr = Signal("QVariant") # [path, page, res]
# 注:信号中含多个变量可能导致崩溃?
def __init__(self, *args):
super().__init__(*args)
self._previewMission = SimpleMission(self._previewTask) # 简单任务对象
self._previewDoc = None # 当前预览的对象
self._previewPath = ""
self._zooms = {} # 缓存页面缩放系数
# 预览PDF画面
@Slot(str, int, str)
def preview(self, path, page, password):
page -= 1
self._previewMission.addMissionList([(path, page, password)])
def _previewTask(self, msn):
path, page, password = msn
if path == self._previewPath: # 已经加载了
doc = self._previewDoc
else: # 新加载
try:
doc = fitz.open(path)
if doc.is_encrypted and not doc.authenticate(password):
msg = "[Warning] is_encrypted" # 固定指令,不能改
self.previewImg.emit(msg)
return
except Exception as e:
msg = f"[Error] 打开文档失败:{path} {e}"
self.previewImg.emit(msg)
return
self._previewDoc = doc
self._previewPath = path
self._zooms = {}
page_count = doc.page_count
if page < 0 or page > page_count:
logger.error(f"页数 {page} 超出范围 0-{page_count}")
return
# 检查页面边长,如果低于阈值,则增加放大系数,以提高渲染清晰度
rect = doc[page].rect
w, h = abs(rect[2] - rect[0]), abs(rect[3] - rect[1])
m = min(w, h)
if m < MinSize:
zoom = MinSize / max(m, 1)
matrix = fitz.Matrix(zoom, zoom)
self._zooms[page] = zoom
else:
matrix = fitz.Identity
self._zooms[page] = 1
p = doc[page].get_pixmap(matrix=matrix)
# 通过 QImage fromImage 转换
# 必须先使用变量提取出图像 https://github.com/pymupdf/PyMuPDF/issues/1210
samples = p.samples
# 必须传入 pix.stride ,否则部分格式的图像会导致崩溃
qimage = QImage(samples, p.width, p.height, p.stride, QImage.Format_RGB888)
qpixmap = QPixmap.fromImage(qimage)
imgID = PixmapProvider.addPixmap(qpixmap)
self.previewImg.emit(imgID)
# 预览一页OCR内容
@Slot(str, int, str, "QVariant")
def ocr(self, path, page, password, argd):
argd = argd.toVariant() # qml对象转python字典
# if "tbpu.ignoreArea" in argd: # 删除忽略区域参数
# del argd["tbpu.ignoreArea"]
def _onGet(msnInfo, page_, res):
# 缩放文本位置
if page_ in self._zooms and res["code"] == 100:
z = self._zooms[page_]
for r in res["data"]:
for bi in range(4):
r["box"][bi][0] = r["box"][bi][0] * z
r["box"][bi][1] = r["box"][bi][1] * z
page_ += 1
self.previewOcr.emit([path, page_, res])
def _onEnd(msnInfo, msg):
if not msg.startswith("[Success]"):
res = {"code": 103, "data": msg}
self.previewOcr.emit([path, -1, res])
msnInfo = {
"argd": argd,
"onGet": _onGet,
"onEnd": _onEnd,
}
MissionDOC.addMission(msnInfo, path, (page, page), password=password)
# 清空缓存
@Slot()
def clear(self):
self._previewDoc = None
self._previewPath = ""