{"library":"apache-airflow-providers-apache-spark","type":"library","category":null,"description":"This provider package enables Apache Airflow to interact with Apache Spark, allowing for the orchestration and scheduling of Spark jobs. It includes operators and hooks for submitting Spark applications, executing Spark SQL queries, and performing data transfers. It's an active provider package, with version 6.0.0 released on March 28, 2026. Airflow providers are released independently of Airflow core, typically with a regular cadence to support new features and bug fixes.","language":"python","status":"active","version":"6.0.0","tags":["Apache Airflow","Spark","Data Processing","ETL","Provider","Orchestration","Big Data"],"last_verified":"2026-05-22","install":[{"cmd":"pip install apache-airflow-providers-apache-spark","imports":["from airflow.providers.apache.spark.operators.spark_submit import SparkSubmitOperator","from airflow.providers.apache.spark.operators.spark_sql import SparkSqlOperator","from airflow.providers.apache.spark.operators.spark_pyspark import PySparkOperator","from airflow.providers.apache.spark.operators.spark_jdbc import SparkJDBCOperator"]},{"cmd":"pip install apache-airflow-providers-apache-spark[pyspark]","imports":[]},{"cmd":"pip install apache-airflow-providers-apache-spark[cncf.kubernetes]","imports":[]}],"homepage":null,"github":"https://github.com/apache/airflow","docs":"https://airflow.apache.org/docs/apache-airflow-providers-apache-spark/6.0.0","changelog":"https://airflow.apache.org/docs/apache-airflow-providers-apache-spark/6.0.0/changelog.html","pypi":"https://pypi.org/project/apache-airflow-providers-apache-spark/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.9–3.10","success_rate":100,"avg_install_s":30.1,"avg_import_s":5.44,"wheel_type":"sdist"},"url":"https://checklist.day/v1/registry/apache-airflow-providers-apache-spark/compatibility"}}