{"library":"collate-data-diff","type":"library","category":null,"description":"collate-data-diff (also known as data-diff) is a Python library and command-line tool designed to efficiently compare and find differences between rows across two databases or tables. It focuses on performance and scalability for large datasets, providing a fast and accurate way to detect data discrepancies. The current version is 0.11.10, and it maintains an active release cadence with frequent updates.","language":"python","status":"active","version":"0.11.10","tags":["database","diff","data comparison","data quality","etl","data validation"],"last_verified":"Fri May 22","install":[{"cmd":"pip install collate-data-diff","imports":["from data_diff import diff_tables","from data_diff import TableSegment","from data_diff import connect_to_uri"]},{"cmd":"pip install \"collate-data-diff[sqlite]\" \"collate-data-diff[postgresql]\" \"collate-data-diff[mysql]\" \"collate-data-diff[snowflake]\"","imports":[]}],"homepage":null,"github":"https://github.com/datafold/data-diff","docs":null,"changelog":null,"pypi":"https://pypi.org/project/collate-data-diff/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":50,"avg_install_s":14.2,"avg_import_s":1.02,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/collate-data-diff/compatibility"}}