{"library":"tinysegmenter","type":"library","category":null,"description":"TinySegmenter in Python is a Python port of the original JavaScript-based TinySegmenter, an extremely compact (23KB) Japanese tokenizer. It performs character-based segmentation without relying on external dictionaries, achieving approximately 95% precision on Japanese news articles with segmentation units compatible with MeCab + IPADic. The latest version, 0.4, was released on September 16, 2018; the project is not actively maintained, though contributions are welcome.","language":"python","status":"maintenance","version":"0.4","tags":["Japanese","tokenizer","NLP","segmentation","compact"],"last_verified":"Sat May 23","install":[{"cmd":"pip install tinysegmenter","imports":["from tinysegmenter import TinySegmenter"]}],"homepage":"http://tinysegmenter.tuxfamily.org/","github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/tinysegmenter/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":100,"avg_install_s":2.4,"avg_import_s":0,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/tinysegmenter/compatibility"}}