27 lines
940 B
Python
27 lines
940 B
Python
import io
|
|
from markitdown.converters._doc_intel_converter import (
|
|
DocumentIntelligenceConverter,
|
|
DocumentIntelligenceFileType,
|
|
)
|
|
from markitdown._stream_info import StreamInfo
|
|
|
|
|
|
def _make_converter(file_types):
    """Return a DocumentIntelligenceConverter configured with *file_types*.

    The instance is allocated directly through ``__new__``, so ``__init__``
    is never run and no constructor arguments are required. Only the
    ``_file_types`` attribute is populated on the returned object.
    """
    converter_cls = DocumentIntelligenceConverter
    instance = converter_cls.__new__(converter_cls)
    instance._file_types = file_types
    return instance
|
|
|
|
|
|
def test_docintel_accepts_html_extension():
    """An HTML-enabled converter accepts a ``.html`` extension with no mimetype."""
    html_converter = _make_converter([DocumentIntelligenceFileType.HTML])
    info = StreamInfo(mimetype=None, extension=".html")
    empty_stream = io.BytesIO(b"")
    assert html_converter.accepts(empty_stream, info)
|
|
|
|
|
|
def test_docintel_accepts_html_mimetype():
    """An HTML-enabled converter accepts HTML and XHTML mimetypes with no extension."""
    html_converter = _make_converter([DocumentIntelligenceFileType.HTML])
    # Same converter instance is checked against each mimetype in turn,
    # with a fresh empty stream per check.
    for mimetype in ("text/html", "application/xhtml+xml"):
        info = StreamInfo(mimetype=mimetype, extension=None)
        assert html_converter.accepts(io.BytesIO(b""), info)
|