{"library":"datacompy","type":"library","category":null,"description":"DataComPy is a powerful Python library designed to simplify the comparison of two DataFrames, supporting various backends including Pandas, Spark, Polars, and Snowflake. It generates detailed, human-readable reports highlighting discrepancies at both row and column levels, and allows for the specification of absolute or relative tolerance levels for numeric comparisons. The library is currently at version 0.19.5 and is actively progressing towards a v1 release; new features target the development branches, while the 0.19.x branch receives only maintenance and critical fixes.","language":"python","status":"active","version":"0.19.5","tags":["data comparison","dataframe","pandas","spark","polars","data quality","etl validation"],"last_verified":"Thu May 21","install":[{"cmd":"pip install datacompy","imports":["import datacompy\ncompare = datacompy.Compare(...)","from datacompy.core import Compare\ncompare = Compare(...)","from datacompy.spark.sql import SparkSQLCompare"]},{"cmd":"pip install datacompy[spark]","imports":[]},{"cmd":"pip install datacompy[polars]","imports":[]},{"cmd":"pip install datacompy[fugue]","imports":[]},{"cmd":"pip install datacompy[snowflake]","imports":[]}],"homepage":null,"github":"https://github.com/capitalone/datacompy","docs":"https://capitalone.github.io/datacompy/","changelog":null,"pypi":"https://pypi.org/project/datacompy/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":58,"avg_install_s":20.3,"avg_import_s":0.28,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/datacompy/compatibility"}}