docs: 添加涉密文件自检工具实施计划
This commit is contained in:
46
UmiOCR-data/py_src/ocr/output/output_md.py
Normal file
46
UmiOCR-data/py_src/ocr/output/output_md.py
Normal file
@@ -0,0 +1,46 @@
|
||||
# 输出markdown格式
|
||||
|
||||
from .output import Output
|
||||
from .tools import getDataText
|
||||
|
||||
import os
|
||||
|
||||
|
||||
class OutputMD(Output):
|
||||
def __init__(self, argd):
|
||||
self.dir = argd["outputDir"] # 输出路径(文件夹)
|
||||
self.fileName = argd["outputFileName"] # 文件名
|
||||
self.outputPath = f"{self.dir}/{self.fileName}.md" # 输出路径
|
||||
self.ignoreBlank = argd["ignoreBlank"] # 忽略空白文件
|
||||
# 创建输出文件
|
||||
try:
|
||||
with open(self.outputPath, "w", encoding="utf-8") as f: # 覆盖创建文件
|
||||
f.write(f'> {argd["startDatetime"]}\n\n')
|
||||
except Exception as e:
|
||||
raise Exception(f"Failed to create jsonl file. {e}\n创建jsonl文件失败。")
|
||||
|
||||
def print(self, res): # 输出图片结果
|
||||
if not res["code"] == 100 and self.ignoreBlank:
|
||||
return # 忽略空白图片
|
||||
name = res["fileName"]
|
||||
path = os.path.relpath( # 从md文件到图片的相对路径
|
||||
res["path"], os.path.dirname(self.outputPath)
|
||||
)
|
||||
path = path.replace(" ", "%20") # 空格转 %20
|
||||
textOut = f"""
|
||||
---
|
||||

|
||||
[{name}]({path})
|
||||
|
||||
"""
|
||||
# 正文
|
||||
if res["code"] == 100:
|
||||
texts = getDataText(res["data"]).split("\n") # 获取拼接结果列表
|
||||
for t in texts:
|
||||
textOut += f"> {t} \n"
|
||||
elif res["code"] == 101:
|
||||
pass
|
||||
else:
|
||||
textOut += f'> [Error] OCR failed. Code: {res["code"]}, Msg: {res["data"]} \n> 【异常】OCR识别失败。 \n'
|
||||
with open(self.outputPath, "a", encoding="utf-8") as f: # 追加写入本地文件
|
||||
f.write(textOut)
|
||||
Reference in New Issue
Block a user