Cleanup and refactor, in preparation for plugin support. (#318)
* Work started moving converters to individual files. * Significant cleanup and refactor. * Moved everything to a packages subfolder. * Added sample plugin. * Added instructions to the README.md * Bumped version, and added a note about compatibility.
This commit is contained in:
BIN
packages/markitdown/tests/test_files/test.docx
Normal file
BIN
packages/markitdown/tests/test_files/test.docx
Normal file
Binary file not shown.
BIN
packages/markitdown/tests/test_files/test.jpg
Normal file
BIN
packages/markitdown/tests/test_files/test.jpg
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 463 KiB |
10
packages/markitdown/tests/test_files/test.json
Normal file
10
packages/markitdown/tests/test_files/test.json
Normal file
@@ -0,0 +1,10 @@
|
||||
{
|
||||
"key1": "string_value",
|
||||
"key2": 1234,
|
||||
"key3": [
|
||||
"list_value1",
|
||||
"list_value2"
|
||||
],
|
||||
"5b64c88c-b3c3-4510-bcb8-da0b200602d8": "uuid_key",
|
||||
"uuid_value": "9700dc99-6685-40b4-9a3a-5e406dcb37f3"
|
||||
}
|
||||
BIN
packages/markitdown/tests/test_files/test.pptx
Normal file
BIN
packages/markitdown/tests/test_files/test.pptx
Normal file
Binary file not shown.
BIN
packages/markitdown/tests/test_files/test.xls
Normal file
BIN
packages/markitdown/tests/test_files/test.xls
Normal file
Binary file not shown.
BIN
packages/markitdown/tests/test_files/test.xlsx
Normal file
BIN
packages/markitdown/tests/test_files/test.xlsx
Normal file
Binary file not shown.
69
packages/markitdown/tests/test_files/test_blog.html
Normal file
69
packages/markitdown/tests/test_files/test_blog.html
Normal file
File diff suppressed because one or more lines are too long
BIN
packages/markitdown/tests/test_files/test_files.zip
Normal file
BIN
packages/markitdown/tests/test_files/test_files.zip
Normal file
Binary file not shown.
BIN
packages/markitdown/tests/test_files/test_llm.jpg
Normal file
BIN
packages/markitdown/tests/test_files/test_llm.jpg
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 145 KiB |
4
packages/markitdown/tests/test_files/test_mskanji.csv
Normal file
4
packages/markitdown/tests/test_files/test_mskanji.csv
Normal file
@@ -0,0 +1,4 @@
|
||||
<EFBFBD><EFBFBD><EFBFBD>O,<EFBFBD>N<EFBFBD><EFBFBD>,<EFBFBD>Z<EFBFBD><EFBFBD>
|
||||
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Y,30,<EFBFBD><EFBFBD><EFBFBD><EFBFBD>
|
||||
<EFBFBD>O<EFBFBD>؉p<EFBFBD>q,25,<EFBFBD><EFBFBD><EFBFBD><EFBFBD>
|
||||
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>~,35,<EFBFBD><EFBFBD><EFBFBD>É<EFBFBD>
|
||||
|
89
packages/markitdown/tests/test_files/test_notebook.ipynb
Normal file
89
packages/markitdown/tests/test_files/test_notebook.ipynb
Normal file
@@ -0,0 +1,89 @@
|
||||
{
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "markdown",
|
||||
"id": "0f61db80",
|
||||
"metadata": {},
|
||||
"source": [
|
||||
"# Test Notebook"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 11,
|
||||
"id": "3f2a5bbd",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"markitdown\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"print('markitdown')"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "markdown",
|
||||
"id": "9b9c0468",
|
||||
"metadata": {},
|
||||
"source": [
|
||||
"## Code Cell Below"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 10,
|
||||
"id": "37d8088a",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"42\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"# comment in code\n",
|
||||
"print(42)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "markdown",
|
||||
"id": "2e3177bd",
|
||||
"metadata": {},
|
||||
"source": [
|
||||
"End\n",
|
||||
"\n",
|
||||
"---"
|
||||
]
|
||||
}
|
||||
],
|
||||
"metadata": {
|
||||
"kernelspec": {
|
||||
"display_name": "Python 3",
|
||||
"language": "python",
|
||||
"name": "python3"
|
||||
},
|
||||
"language_info": {
|
||||
"codemirror_mode": {
|
||||
"name": "ipython",
|
||||
"version": 3
|
||||
},
|
||||
"file_extension": ".py",
|
||||
"mimetype": "text/x-python",
|
||||
"name": "python",
|
||||
"nbconvert_exporter": "python",
|
||||
"pygments_lexer": "ipython3",
|
||||
"version": "3.12.8"
|
||||
},
|
||||
"title": "Test Notebook Title"
|
||||
},
|
||||
"nbformat": 4,
|
||||
"nbformat_minor": 5
|
||||
}
|
||||
BIN
packages/markitdown/tests/test_files/test_outlook_msg.msg
Normal file
BIN
packages/markitdown/tests/test_files/test_outlook_msg.msg
Normal file
Binary file not shown.
1
packages/markitdown/tests/test_files/test_rss.xml
Normal file
1
packages/markitdown/tests/test_files/test_rss.xml
Normal file
File diff suppressed because one or more lines are too long
147
packages/markitdown/tests/test_files/test_serp.html
Normal file
147
packages/markitdown/tests/test_files/test_serp.html
Normal file
File diff suppressed because one or more lines are too long
2232
packages/markitdown/tests/test_files/test_wikipedia.html
Normal file
2232
packages/markitdown/tests/test_files/test_wikipedia.html
Normal file
File diff suppressed because one or more lines are too long
BIN
packages/markitdown/tests/test_files/test_with_comment.docx
Normal file
BIN
packages/markitdown/tests/test_files/test_with_comment.docx
Normal file
Binary file not shown.
Reference in New Issue
Block a user