You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
31 lines
1006 B
Python
31 lines
1006 B
Python
1 month ago
|
import pytest
|
||
|
from marker.converters.table import TableConverter
|
||
|
from marker.renderers.markdown import MarkdownOutput
|
||
|
from marker.util import classes_to_strings
|
||
|
|
||
|
def _table_converter(config, model_dict, renderer, temp_pdf):
    """Convert ``temp_pdf`` with a ``TableConverter`` and sanity-check the result.

    Shared body for the table-converter tests in this module.

    Args:
        config: Passed through unchanged as the converter's ``config``.
        model_dict: Passed through as the converter's ``artifact_dict``.
        renderer: Renderer class; it is turned into its string form via
            ``classes_to_strings`` before being handed to the converter.
        temp_pdf: Object whose ``.name`` attribute is given to the converter
            (presumably a temporary file holding the document -- confirm
            against the fixture that supplies it).

    Raises:
        AssertionError: If the produced markdown is empty or does not contain
            the substring ``"cyclic"``.
    """
    # The converter receives the renderer as a string, not as the class itself.
    renderer_name = classes_to_strings([renderer])[0]

    table_converter = TableConverter(
        artifact_dict=model_dict,
        processor_list=None,
        renderer=renderer_name,
        config=config,
    )

    result: MarkdownOutput = table_converter(temp_pdf.name)
    text = result.markdown

    # Output must be non-empty and include the expected marker word.
    assert len(text) > 0
    assert "cyclic" in text
|
||
|
|
||
|
|
||
|
@pytest.mark.output_format("markdown")
@pytest.mark.config({"page_range": [5]})
def test_table_converter(config, model_dict, renderer, temp_doc):
    """Run the shared table-converter check with the default (non-OCR) config.

    The markers request the ``"markdown"`` output format and a config of
    ``{"page_range": [5]}``; the fixtures that consume them are defined
    outside this file.
    """
    _table_converter(
        config=config,
        model_dict=model_dict,
        renderer=renderer,
        temp_pdf=temp_doc,
    )
|
||
|
|
||
|
@pytest.mark.output_format("markdown")
@pytest.mark.config({"page_range": [5], "force_ocr": True})
def test_table_converter_ocr(config, model_dict, renderer, temp_doc):
    """Run the shared table-converter check with ``force_ocr`` enabled.

    Identical to the non-OCR test except that the config marker also sets
    ``"force_ocr": True``; the fixtures that consume the markers are defined
    outside this file.
    """
    _table_converter(
        config=config,
        model_dict=model_dict,
        renderer=renderer,
        temp_pdf=temp_doc,
    )
|
||
|
|