{"id":23491,"library":"dagster-duckdb-pandas","title":"dagster-duckdb-pandas","description":"Dagster library for storing Pandas DataFrames in DuckDB. Current version 0.29.3, requires Python >=3.10,<3.15. Part of the Dagster ecosystem, releases follow Dagster core versions (libraries version 0.x). Cadence: monthly releases alongside Dagster core.","status":"active","version":"0.29.3","language":"python","source_language":"en","source_url":"https://github.com/dagster-io/dagster/tree/master/python_modules/libraries/dagster-duckdb-pandas","tags":["dagster","duckdb","pandas","io-manager","data-lake"],"install":[{"cmd":"pip install dagster-duckdb-pandas","lang":"bash","label":"Latest stable"}],"dependencies":[{"reason":"Required for DuckDB I/O manager functionality","package":"dagster-duckdb","optional":false},{"reason":"Core Dagster framework","package":"dagster","optional":false},{"reason":"Required for DataFrame operations","package":"pandas","optional":false}],"imports":[{"note":"DuckDBIOManager from dagster-duckdb is base class; DuckDBPandasIOManager handles pandas DataFrames specifically","wrong":"from dagster_duckdb import DuckDBIOManager","symbol":"DuckDBPandasIOManager","correct":"from dagster_duckdb_pandas import DuckDBPandasIOManager"}],"quickstart":{"code":"from dagster_duckdb_pandas import DuckDBPandasIOManager\nfrom dagster import Definitions, asset\n\n@asset\ndef my_table() -> str:\n    import pandas as pd\n    return pd.DataFrame({\"col1\": [1, 2], \"col2\": [\"a\", \"b\"]})\n\nresources = {\"io_manager\": DuckDBPandasIOManager(database=\"my_db.duckdb\")}\ndefs = Definitions(assets=[my_table], resources=resources)","lang":"python","description":"Initialize a DuckDB I/O manager that stores pandas DataFrames in a local DuckDB database."},"warnings":[{"fix":"Change import to `from dagster_duckdb_pandas import DuckDBPandasIOManager` and update resource configuration.","message":"Upgrading from dagster-duckdb 0.x to 0.23+ changes I/O manager import paths. Use `DuckDBPandasIOManager` from `dagster_duckdb_pandas` instead of legacy imports from `dagster_duckdb`.","severity":"breaking","affected_versions":">=0.23.0"},{"fix":"Provide the database file path (e.g., `DuckDBPandasIOManager(database='path/to/db.duckdb')`).","message":"DuckDBPandasIOManager expects a `database` argument (string path) instead of `conn` or `connection`. Using a pre-existing connection object will fail.","severity":"gotcha","affected_versions":"all"},{"fix":"Use asset metadata or custom I/O manager configurations instead of the `mode` parameter.","message":"The `mode` parameter (e.g., `'overwrite'`, `'append'`) has been deprecated in favor of per-asset metadata or explicit overwrite strategies.","severity":"deprecated","affected_versions":">=0.28.0"}],"env_vars":null,"last_verified":"2026-05-01T00:00:00.000Z","next_check":"2026-07-30T00:00:00.000Z","problems":[{"fix":"Run `pip install dagster-duckdb-pandas`.","cause":"dagster-duckdb-pandas not installed or installed in wrong environment.","error":"ModuleNotFoundError: No module named 'dagster_duckdb_pandas'"},{"fix":"Instantiate with `DuckDBPandasIOManager(database='my_database.duckdb')` or `database=':memory:'` for in-memory.","cause":"Misunderstanding of the `database` parameter; users may try to pass a connection string or existing connection.","error":"The `database` argument refer to a different database connection parameter. The `database` parameter expects a DuckDB database file path or `:memory:`."}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}