{"library":"hojichar","type":"library","category":null,"description":"HojiChar is a text preprocessing management system for Python, providing a pipeline API inspired by Compose/Filter patterns to clean, filter, and transform text data, with built-in support for deduplication, JSON loading/dumping, and asynchronous processing. Current version: 0.16.0, released Apr 2025; follows a monthly release cadence.","language":"python","status":"active","version":"0.16.0","tags":["text preprocessing","NLP","Japanese","pipeline","data cleaning"],"last_verified":"Mon Apr 27","install":[{"cmd":"pip install hojichar","imports":["from hojichar import Compose","from hojichar import AsyncCompose","from hojichar.filters.document_filters import JSONLoader","from hojichar.filters.document_filters import JSONDumper"]}],"homepage":null,"github":"https://github.com/HojiChar/HojiChar","docs":null,"changelog":null,"pypi":"https://pypi.org/project/hojichar/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":null}