{"id":24810,"library":"verticapy","title":"VerticaPy","description":"VerticaPy is a Python library for data exploration, data cleaning, and machine learning in Vertica. It simplifies the integration between Python and Vertica databases, providing a pandas-like interface and ML capabilities that run directly in-database. Current version is 1.1.1, released May 2025. The project follows a monthly release cadence.","status":"active","version":"1.1.1","language":"python","source_language":"en","source_url":"https://github.com/vertica/VerticaPy","tags":["vertica","machine-learning","data-science","etl","database"],"install":[{"cmd":"pip install verticapy","lang":"bash","label":"PyPI"}],"dependencies":[{"reason":"Database driver for connecting to Vertica.","package":"vertica-python","optional":false},{"reason":"Plotting backend.","package":"matplotlib","optional":true},{"reason":"Alternative plotting backend.","package":"plotly","optional":true}],"imports":[{"note":"Since 1.0.0, the API was restructured; vDataFrame is directly importable from the top-level package.","wrong":"from verticapy.core import vDataFrame","symbol":"vDataFrame","correct":"from verticapy import vDataFrame"},{"note":"set_option is now at the top level, not in a submodule.","wrong":"from verticapy.options import set_option","symbol":"set_option","correct":"from verticapy import set_option"}],"quickstart":{"code":"from verticapy import vDataFrame, set_option\n\n# Optional: configure display\nset_option('max_cellwidth', 50)\n\n# Connect using parameters (replace with actual credentials)\nfrom vertica_python import connect\nconn_info = {\n    'host': 'localhost',\n    'port': 5433,\n    'user': 'dbadmin',\n    'password': '',\n    'database': 'vmart',\n    'ssl': False\n}\ncur = connect(**conn_info).cursor()\n\n# Create vDataFrame from a table\nvdf = vDataFrame('public.my_table', cur)\n\n# Quick exploration\nprint(vdf.shape())\nprint(vdf.describe())","lang":"python","description":"Quickstart: connect to Vertica, load a table into vDataFrame, explore."},"warnings":[{"fix":"Run `verticapy.upgrade()` or consult the migration guide. For example, `from verticapy import vDataFrame` instead of `from verticapy.core import vDataFrame`.","message":"Import paths changed significantly in 1.0.0. Many functions moved from submodules to top-level or were renamed.","severity":"breaking","affected_versions":"<1.0.0 -> >=1.0.0"},{"fix":"Always provide a cursor or connection object: `vDataFrame('table', cursor)`.","message":"The database connection must be passed explicitly when creating a vDataFrame. It is easy to forget and assume an implicit connection.","severity":"gotcha","affected_versions":"all"},{"fix":"Be aware that operations like `drop()` modify the current vDataFrame; use `.copy()` if you need to preserve the original.","message":"vDataFrame methods mutate the object in-place by default, unlike pandas, which returns a new object.","severity":"gotcha","affected_versions":"all"}],"env_vars":null,"last_verified":"2026-05-01T00:00:00.000Z","next_check":"2026-07-30T00:00:00.000Z","problems":[{"fix":"Use `from verticapy import vDataFrame` instead of `from verticapy.core import vDataFrame`.","cause":"Importing from the old submodule path that was removed in 1.0.0.","error":"No module named 'verticapy.core'"},{"fix":"Use `vdf.select_('col1', 'col2')` instead of `vdf.select('col1', 'col2')`.","cause":"The `select` method was renamed to `select_` (with trailing underscore) to avoid Python keyword conflict.","error":"AttributeError: 'vDataFrame' object has no attribute 'select'"}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}