{"library":"skrub","type":"library","category":null,"description":"Skrub is a Python library for machine learning with dataframes, offering robust tools for cleaning, preprocessing, and encoding tabular data, particularly for heterogeneous or messy datasets. It provides scikit-learn compatible transformers and a powerful DataOps API for complex data pipelines. The current version is 0.8.0, with regular minor and patch releases.","language":"python","status":"active","version":"0.8.0","tags":["machine-learning","data-preprocessing","tabular-data","scikit-learn-compatible","dataframe","categorical-encoding"],"install":[{"cmd":"pip install skrub","imports":["from skrub import GapEncoder","from skrub import TableVectorizer","from skrub import StringEncoder","from skrub import DataOp","from skrub import MinHashEncoder"]},{"cmd":"pip install 'skrub[polars,all]'","imports":[]}],"homepage":"https://skrub-data.org/","github":"https://github.com/skrub-data/skrub","docs":null,"changelog":null,"pypi":"https://pypi.org/project/skrub/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":50,"avg_install_s":18.3,"avg_import_s":8.5,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/skrub/compatibility"},"provenance":{"verified_status":"passing","verified_at":"Sun Jun 28","last_verified":"Sun Jun 28","next_check":"Tue Jul 28","install_tag":null}}