LICENSE
README.md
pyproject.toml
setup.py
doc2mark/__init__.py
doc2mark/__main__.py
doc2mark/cli.py
doc2mark.egg-info/PKG-INFO
doc2mark.egg-info/SOURCES.txt
doc2mark.egg-info/dependency_links.txt
doc2mark.egg-info/entry_points.txt
doc2mark.egg-info/requires.txt
doc2mark.egg-info/top_level.txt
doc2mark/core/__init__.py
doc2mark/core/base.py
doc2mark/core/loader.py
doc2mark/formats/__init__.py
doc2mark/formats/legacy.py
doc2mark/formats/markup.py
doc2mark/formats/office.py
doc2mark/formats/pdf.py
doc2mark/formats/text.py
doc2mark/formats/unified_processor.py
doc2mark/ocr/__init__.py
doc2mark/ocr/base.py
doc2mark/ocr/openai.py
doc2mark/ocr/prompts.py
doc2mark/ocr/tesseract.py
doc2mark/pipelines/__init__.py
doc2mark/pipelines/legacy_converter.py
doc2mark/pipelines/office_advanced_pipeline.py
doc2mark/pipelines/pymupdf_advanced_pipeline.py
doc2mark/utils/__init__.py
tests/test_basic.py
tests/test_ocr.py
tests/test_pipelines.py
tests/test_simple.py
tests/test_text_formats.py