{"id":21732,"library":"pyarrowfs-adlgen2","title":"pyarrowfs-adlgen2","description":"PyArrow filesystem interface for Azure Data Lake Storage Gen2. Version 0.2.5, compatible with Python >=3.6 and Apache Arrow. Last release in 2021, low maintenance.","status":"maintenance","version":"0.2.5","language":"python","source_language":"en","source_url":"https://github.com/kaaveland/pyarrowfs-adlgen2","tags":["pyarrow","azure","adls-gen2","filesystem","data-lake"],"install":[{"cmd":"pip install pyarrowfs-adlgen2","lang":"bash","label":"Install from PyPI"}],"dependencies":[{"reason":"Required for Arrow filesystem abstraction","package":"pyarrow","optional":false},{"reason":"Azure SDK for ADLS Gen2","package":"azure-storage-file-datalake","optional":false},{"reason":"Authentication (DefaultAzureCredential)","package":"azure-identity","optional":true}],"imports":[{"note":"pyarrowfs-adlgen2 registers its filesystem into pyarrow.fs; no direct import from the library.","symbol":"AdlGen2FileSystem","correct":"from pyarrow.fs import AdlGen2FileSystem"}],"quickstart":{"code":"import os\nfrom pyarrow.fs import AdlGen2FileSystem\n\nstorage_account = \"mystorageaccount\"\ncontainer = \"mycontainer\"\n\n# Use DefaultAzureCredential (requires azure-identity)\nfs = AdlGen2FileSystem(\n    account_name=storage_account,\n    account_key=os.environ.get('ADLS_KEY', ''),  # optional key\n    tenant_id=os.environ.get('AZURE_TENANT_ID', ''),\n    client_id=os.environ.get('AZURE_CLIENT_ID', ''),\n    client_secret=os.environ.get('AZURE_CLIENT_SECRET', '')\n)\n\n# List files\nprint(fs.get_file_info([f\"{container}/some/path\"]))","lang":"python","description":"Initialize ADLS Gen2 filesystem and list files using PyArrow."},"warnings":[{"fix":"Use 'from pyarrow.fs import AdlGen2FileSystem' instead of 'from pyarrowfs_adlgen2 import ...'.","message":"The filesystem is not imported from pyarrowfs-adlgen2 directly; it is registered into pyarrow.fs. Import from pyarrow.fs as shown.","severity":"gotcha","affected_versions":"all"},{"fix":"Consider using native PyArrow Azure support if available, or pin pyarrow<12.","message":"The library appears unmaintained since 2021 and may not work with newer PyArrow versions (>=12). The Azure SDK dependencies are also outdated.","severity":"deprecated","affected_versions":">=0.2.5"}],"env_vars":null,"last_verified":"2026-04-27T00:00:00.000Z","next_check":"2026-07-26T00:00:00.000Z","problems":[{"fix":"Run 'pip install pyarrowfs-adlgen2' and then 'import pyarrow.fs' before using AdlGen2FileSystem.","cause":"pyarrowfs-adlgen2 not installed or not loaded; the filesystem is only available after installing the library and importing pyarrow.","error":"ImportError: cannot import name 'AdlGen2FileSystem' from 'pyarrow.fs'"},{"fix":"Set environment variables AZURE_TENANT_ID, AZURE_CLIENT_ID, AZURE_CLIENT_SECRET, or provide account_key parameter.","cause":"Missing or invalid credentials. The library requires either account_key or a combination of tenant_id, client_id, client_secret, or DefaultAzureCredential.","error":"AzureError: Client authentication failed"}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}