{"id":327,"library":"pyarrow","title":"PyArrow","description":"PyArrow is a Python library for Apache Arrow, providing a standardized language-independent columnar memory format for flat and hierarchical data. The current version is 23.0.1, released on March 28, 2026, with a regular release cadence.","status":"active","version":"23.0.1","language":"python","source_language":"en","source_url":"https://github.com/apache/arrow","tags":["Apache Arrow","Data Processing","Parquet","Columnar Data"],"install":[{"cmd":"pip install pyarrow","lang":"bash","label":"Install PyArrow"}],"dependencies":[{"reason":"Required for array operations","package":"numpy","optional":false},{"reason":"Optional for DataFrame support","package":"pandas","optional":true}],"imports":[{"note":"Standard import pattern for PyArrow","symbol":"pa","correct":"import pyarrow as pa"}],"quickstart":{"code":"import pyarrow as pa\n\n# Create a simple Arrow Table\ndata = {'column1': [1, 2, 3], 'column2': ['A', 'B', 'C']}\ntable = pa.table(data)\n\n# Write the Table to a Parquet file\nimport pyarrow.parquet as pq\npq.write_table(table, 'example.parquet')\n\n# Read the Table back from the Parquet file\ntable_read = pq.read_table('example.parquet')\nprint(table_read)","lang":"python","description":"This script demonstrates creating an Arrow Table, writing it to a Parquet file, and reading it back using PyArrow."},"warnings":[{"fix":"Update your code to align with the new `pyarrow.fs` API as detailed in the release notes.","message":"PyArrow 23.0.1 introduces changes to the `pyarrow.fs` module, affecting file system operations. Review the release notes for migration details.","severity":"breaking","affected_versions":">=23.0.1"},{"fix":"Replace instances of `ParquetFile` with `ParquetDataset` in your codebase.","message":"The `pyarrow.parquet` module's `ParquetFile` class is deprecated as of version 23.0.1. 
Use `ParquetDataset` instead.","severity":"deprecated","affected_versions":">=23.0.1"}],"env_vars":null,"last_verified":"2026-05-12T13:05:15.962Z","next_check":"2026-06-26T00:00:00.000Z","problems":[{"fix":"Ensure that PyArrow is installed correctly by running 'pip install pyarrow' and verify the installation.","cause":"This error occurs when the compiled 'pyarrow._dataset' extension module, which backs 'pyarrow.dataset', is not available, often due to an incomplete or incorrect installation of PyArrow.","error":"ModuleNotFoundError: No module named 'pyarrow._dataset'"},{"fix":"Install PyArrow using 'pip install pyarrow'.","cause":"This error indicates that the PyArrow library is not installed, which is required for certain functions like 'to_arrow()'.","error":"ValueError: The pyarrow library is not installed, please install pyarrow to use the to_arrow() function."},{"fix":"Install the missing AWS SDK for C++ shared library or ensure that all necessary dependencies are installed.","cause":"This error occurs when the required AWS SDK for C++ shared library is missing, leading to import failures in PyArrow.","error":"ImportError: libaws-cpp-sdk-s3.so: cannot open shared object file: No such file or directory"},{"fix":"Ensure that all necessary DLLs are present and compatible with your system; reinstalling PyArrow may resolve the issue.","cause":"This error indicates that a required DLL is missing or incompatible, preventing PyArrow from being imported.","error":"ImportError: DLL load failed while importing lib: The specified procedure could not be found."},{"fix":"Upgrade or reinstall PyArrow using 'pip install --upgrade pyarrow'.","cause":"This error occurs when the '__version__' attribute is missing from the PyArrow module, possibly due to an incomplete installation.","error":"AttributeError: module 'pyarrow' has no attribute 
'__version__'"}],"ecosystem":"pypi","meta_description":null,"install_score":100,"install_tag":"verified","quickstart_score":80,"quickstart_tag":"verified","pypi_latest":null,"install_checks":{"last_tested":"2026-05-12","tag":"verified","tag_description":"installs cleanly on critical runtimes, fast import, recently tested","results":[{"runtime":"python:3.10-alpine","python_version":"3.10","os_libc":"alpine (musl)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.07,"mem_mb":2.9,"disk_size":"187.4M"},{"runtime":"python:3.10-slim","python_version":"3.10","os_libc":"slim (glibc)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.04,"mem_mb":2.9,"disk_size":"165M"},{"runtime":"python:3.11-alpine","python_version":"3.11","os_libc":"alpine (musl)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.1,"mem_mb":2.9,"disk_size":"191.4M"},{"runtime":"python:3.11-slim","python_version":"3.11","os_libc":"slim (glibc)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.08,"mem_mb":2.9,"disk_size":"169M"},{"runtime":"python:3.12-alpine","python_version":"3.12","os_libc":"alpine (musl)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.08,"mem_mb":2.9,"disk_size":"183.0M"},{"runtime":"python:3.12-slim","python_version":"3.12","os_libc":"slim (glibc)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.1,"mem_mb":2.9,"disk_size":"160M"},{"runtime":"python:3.13-alpine","python_version":"3.13","os_libc":"alpine 
(musl)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.07,"mem_mb":2.9,"disk_size":"182.7M"},{"runtime":"python:3.13-slim","python_version":"3.13","os_libc":"slim (glibc)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.07,"mem_mb":2.7,"disk_size":"160M"},{"runtime":"python:3.9-alpine","python_version":"3.9","os_libc":"alpine (musl)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.06,"mem_mb":2.7,"disk_size":"173.4M"},{"runtime":"python:3.9-slim","python_version":"3.9","os_libc":"slim (glibc)","variant":"default","exit_code":0,"wheel_type":null,"failure_reason":null,"install_time_s":null,"import_time_s":0.06,"mem_mb":2.7,"disk_size":"156M"}]},"quickstart_checks":{"last_tested":"2026-04-23","tag":"verified","tag_description":"quickstart runs on critical runtimes, recently tested","results":[{"runtime":"python:3.10-alpine","exit_code":0},{"runtime":"python:3.10-slim","exit_code":0},{"runtime":"python:3.11-alpine","exit_code":0},{"runtime":"python:3.11-slim","exit_code":0},{"runtime":"python:3.12-alpine","exit_code":0},{"runtime":"python:3.12-slim","exit_code":0},{"runtime":"python:3.13-alpine","exit_code":0},{"runtime":"python:3.13-slim","exit_code":0},{"runtime":"python:3.9-alpine","exit_code":0},{"runtime":"python:3.9-slim","exit_code":0}]}}