{"library":"fastwarc","type":"library","category":null,"description":"FastWARC is a high-performance Python library, written in C++ and Cython, for parsing WARC (Web ARChive) files. It supports WARC/1.0 and WARC/1.1 streams with GZip and LZ4 compression, offering significant speed improvements over pure-Python alternatives such as WARCIO. FastWARC is part of the ChatNoir Resiliparse toolkit; it is currently at version 0.16.0 and under active development.","language":"python","status":"active","version":"0.16.0","tags":["WARC","web archives","parsing","performance","Cython","C++","data processing"],"last_verified":"Sat May 23","install":[{"cmd":"pip install fastwarc","imports":["from fastwarc.warc import ArchiveIterator","from fastwarc.warc import WarcRecord","from fastwarc.warc import WarcRecordType"]},{"cmd":"pip install fastwarc[fsspec]","imports":[]},{"cmd":"sudo apt install build-essential python3-dev zlib1g-dev liblz4-dev && pip install --no-binary fastwarc fastwarc","imports":[]}],"homepage":"https://resiliparse.chatnoir.eu","github":"https://github.com/chatnoir-eu/chatnoir-resiliparse","docs":"https://resiliparse.chatnoir.eu","changelog":null,"pypi":"https://pypi.org/project/fastwarc/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":40,"avg_install_s":2.2,"avg_import_s":0.06,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/fastwarc/compatibility"}}