{"library":"warcio","type":"library","category":null,"description":"warcio is a Python library (v1.8.1) for fast, low-level, streaming input/output of Web ARChive (WARC) and ARC files, adhering to WARC 1.0 and 1.1 ISO standards. It focuses on processing a stream of web archive records rather than entire files. Developed by Webrecorder, it includes features for both reading existing archives and capturing HTTP/S traffic directly into WARC files. The library is actively maintained, with recent updates adding support for reading from remote locations such as S3 and HTTPS URLs.","language":"python","status":"active","version":"1.8.1","tags":["warc","arc","web archive","streaming","io","webrecorder"],"last_verified":"Fri May 22","install":[{"cmd":"pip install warcio","imports":["from warcio.archiveiterator import ArchiveIterator","from warcio.capture_http import capture_http","from warcio.warcwriter import WARCWriter","from warcio.warcwriter import WARCRecord"]},{"cmd":"pip install warcio[s3]","imports":[]}],"homepage":null,"github":"https://github.com/webrecorder/warcio","docs":null,"changelog":null,"pypi":"https://pypi.org/project/warcio/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":100,"avg_install_s":4.2,"avg_import_s":0.22,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/warcio/compatibility"}}