{"library":"mineru","type":"library","category":null,"description":"MinerU is a robust document parsing tool designed to convert various input formats, including PDF, images, DOCX, PPTX, and XLSX, into machine-readable Markdown and JSON. It is optimized for downstream retrieval, extraction, and processing, especially for LLM-ready formats. Currently at version 3.0.9, the library is actively maintained with ongoing architectural enhancements and feature improvements, particularly in handling scientific literature and complex document structures.","language":"python","status":"active","version":"3.0.9","tags":["PDF","Markdown","conversion","document-processing","OCR","LLM-ready","LaTeX","HTML"],"install":[{"cmd":"pip install -U \"mineru[all]\"","imports":["from mineru.utils.demo_utils import parse_doc"]},{"cmd":"pip install \"mineru[core]\"","imports":[]}],"homepage":"https://mineru.net/","github":"https://github.com/opendatalab/MinerU","docs":"https://opendatalab.github.io/MinerU/","changelog":null,"pypi":"https://pypi.org/project/mineru/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":20,"avg_install_s":109.8,"avg_import_s":null,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/mineru/compatibility"},"provenance":{"verified_status":"install_fail","verified_at":"Sun Jun 28","last_verified":"Sun Jun 28","next_check":"Sun Jul 05","install_tag":null}}