{"library":"blingfire","type":"library","category":null,"description":"BlingFire is a Python wrapper for a lightning-fast Finite State Machine (FSM) based Natural Language Processing (NLP) library developed by Microsoft. It is designed for high-performance text tokenization, multi-word expression matching, stemming, and lemmatization. Known for its speed, it often outperforms other NLP libraries like Hugging Face Tokenizers and spaCy in tokenization tasks. The library supports various tokenization algorithms including pattern-based, WordPiece, Unigram LM, and BPE. The current version is 0.1.8, and the project maintains an active release cadence with periodic updates adding new features and models.","language":"python","status":"active","version":"0.1.8","tags":["NLP","tokenization","text processing","FSM","Microsoft","performance"],"last_verified":"Thu May 21","install":[{"cmd":"pip install blingfire","imports":["from blingfire import text_to_words","from blingfire import text_to_sentences","from blingfire import load_model","from blingfire import tokenize_with_model","from blingfire import IdsToText"]}],"homepage":null,"github":"https://github.com/microsoft/blingfire","docs":null,"changelog":null,"pypi":"https://pypi.org/project/blingfire/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":50,"avg_install_s":2.3,"avg_import_s":null,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/blingfire/compatibility"}}