{"library":"datafusion","type":"library","category":null,"description":"A Python library that provides bindings to Apache DataFusion, an in-memory query engine built on Apache Arrow. It enables users to build and execute high-performance queries using SQL or a DataFrame API against various data sources, including CSV, Parquet, JSON, and in-memory data. The query engine is written in Rust, and the library focuses on efficient, zero-copy data exchange with PyArrow. The library is actively maintained, with a current version of 52.3.0, and typically releases in sync with the core DataFusion project.","language":"python","status":"active","version":"52.3.0","tags":["data processing","query engine","SQL","dataframe","apache arrow","rust","etl"],"last_verified":"Thu May 21","install":[{"cmd":"pip install datafusion","imports":["from datafusion import SessionContext","from datafusion import col","from datafusion import udf","from datafusion import functions"]}],"homepage":"https://datafusion.apache.org/python","github":"https://github.com/apache/datafusion-python","docs":"https://datafusion.apache.org/python","changelog":null,"pypi":"https://pypi.org/project/datafusion/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":50,"avg_install_s":4.4,"avg_import_s":0.31,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/datafusion/compatibility"}}