{"library":"goose3","type":"library","category":null,"description":"Goose3 is an HTML content/article extractor and web scraper for Python 3 (requires Python >=3.9). It extracts the main content, title, authors, metadata (OpenGraph, schema.org), and images from news articles and web pages. The current version is 3.1.21, with irregular releases as fixes accumulate.","language":"python","status":"active","version":"3.1.21","tags":["web scraping","content extraction","article extraction","html parser","news"],"last_verified":"Fri May 01","install":[{"cmd":"pip install goose3","imports":["from goose3 import Goose","from goose3.article import Article"]}],"homepage":null,"github":"https://github.com/goose3/goose3","docs":null,"changelog":null,"pypi":"https://pypi.org/project/goose3/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}