diff --git a/tests/test_tables.py b/tests/test_tables.py index 745369c06..843de4787 100644 --- a/tests/test_tables.py +++ b/tests/test_tables.py @@ -1,9 +1,11 @@ import os import io from pprint import pprint -import pymupdf +import textwrap import pickle +import pymupdf + scriptdir = os.path.abspath(os.path.dirname(__file__)) filename = os.path.join(scriptdir, "resources", "chinese-tables.pdf") pickle_file = os.path.join(scriptdir, "resources", "chinese-tables.pickle") @@ -294,15 +296,29 @@ def test_markdown(): doc = pymupdf.open(filename) page = doc[0] tab = page.find_tables(strategy="lines_strict")[0] - text = ( - "|Header1|Header2|Header3|\n" - "|---|---|---|\n" - "|Col11
Col12|Col21
Col22|Col31
Col32
Col33|\n" - "|Col13|Col23|Col34
Col35|\n" - "|Col14|Col24|Col36|\n" - "|Col15|Col25
Col26||\n\n" - ) - assert tab.to_markdown() == text + if pymupdf.mupdf_version_tuple < (1, 27): + md_expected = textwrap.dedent(''' + |Header1|Header2|Header3| + |---|---|---| + |Col11
Col12|~~Col21~~
~~Col22~~|Col31
Col32
Col33| + |Col13|~~Col23~~|Col34
Col35| + |Col14|~~Col24~~|Col36| + |Col15|~~Col25~~
~~Col26~~|| + + ''').lstrip() + else: + md_expected = ( + "|Header1|Header2|Header3|\n" + "|---|---|---|\n" + "|Col11
Col12|Col21
Col22|Col31
Col32
Col33|\n" + "|Col13|Col23|Col34
Col35|\n" + "|Col14|Col24|Col36|\n" + "|Col15|Col25
Col26||\n\n" + ) + + + md = tab.to_markdown() + assert md == md_expected, f'Incorrect md:\n{textwrap.indent(md, " ")}' def test_paths_param():