{"library":"boilerpy3","type":"library","category":null,"description":"BoilerPy3 is an active Python port of Christian Kohlschütter's Boilerpipe library, designed for robust HTML boilerplate removal and main text extraction from web pages. It is currently at version 1.0.7 and is based on Boilerpipe 1.2 functionality. The library focuses on providing a more Pythonic interface, including type-hinting and snake_case conventions.","language":"python","status":"active","version":"1.0.7","tags":["HTML","text extraction","boilerplate removal","web scraping","content extraction"],"last_verified":"Mon May 25","install":[{"cmd":"pip install boilerpy3","imports":["from boilerpy3 import extractors\nextractor = extractors.ArticleExtractor()","from boilerpy3 import extractors\nextractor = extractors.DefaultExtractor()"]}],"homepage":null,"github":"https://github.com/jmriebold/BoilerPy3","docs":null,"changelog":null,"pypi":"https://pypi.org/project/boilerpy3/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":100,"avg_install_s":1.5,"avg_import_s":0.17,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/boilerpy3/compatibility"}}