{"library":"ceja","type":"library","category":null,"description":"ceja is a Python library that provides PySpark implementations of string and phonetic matching algorithms. It enables users to apply functions like NYSIIS, Metaphone, Jaro-Winkler similarity, and Damerau-Levenshtein distance directly within PySpark DataFrames, leveraging Spark's distributed processing capabilities for large datasets. The library is currently at version 0.4.0, with its last release in February 2023, indicating a slow release cadence.","language":"en","status":"maintenance","version":"0.4.0","tags":["pyspark","string matching","phonetic algorithms","stemming","data processing","fuzzy matching"],"last_verified":"Wed May 27","install":[{"cmd":"pip install ceja","imports":["import ceja"]}],"homepage":null,"github":null,"docs":null,"changelog":null,"pypi":null,"npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":100,"avg_install_s":2.7,"avg_import_s":null,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/ceja/compatibility"}}