https://github.com/opendataloader-project/opendataloader-pdf
uv pip install "opendataloader-pdf[hybrid]"
import opendataloader_pdf
# Keyword arguments for the conversion call, gathered in one place so that
# options can be toggled without touching the call itself.
conversion_options = {
    "input_path": "sb0818E.pdf",
    "output_dir": "output",
    "format": "markdown",
    # "detect_strikethrough": True,  # optional keyword, currently disabled
}

# Run the converter on sb0818E.pdf, requesting the "markdown" format and
# passing "output" as the output directory.
opendataloader_pdf.convert(**conversion_options)
opendataloader-pdf-hybrid --port 5002
opendataloader-pdf --hybrid docling-fast --format markdown sb0818E.pdf