We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 59b0b0c commit f06a321 Copy full SHA for f06a321
magic_pdf/dict2md/ocr_mkcontent.py
@@ -42,7 +42,7 @@ def ocr_mk_mm_markdown(pdf_info_dict: dict):
42
if not span.get('image_path'):
43
continue
44
else:
45
- content = f""
+ content = f""
46
47
content = ocr_escape_special_markdown_char(span['content']) # 转义特殊符号
48
if span['type'] == ContentType.InlineEquation:
@@ -53,3 +53,11 @@ def ocr_mk_mm_markdown(pdf_info_dict: dict):
53
# 在行末添加两个空格以强制换行
54
markdown.append(line_text.strip() + ' ')
55
return '\n'.join(markdown)
56
+
57
+def ocr_mk_mm_standard_format():
58
+ '''
59
+ content_list
60
+ type string image/text/table/equation(行间的单独拿出来,行内的和text合并)
61
62
63
+ pass
0 commit comments