{"slug":"spark-docker","image":"spark","title":"Apache Spark (Docker)","description":"Apache Spark is a unified analytics engine for large-scale data processing and machine learning.","category":"other","recommended_tag":"4.1.2","variants":["full"],"base_os":"ubuntu","size_mb":795,"latest_version":"4.1.2","eol_date":"2027-06-11T00:00:00.000Z","support_until":null,"warnings":["Requires significant memory and CPU resources — configure container limits accordingly","Cluster mode requires additional setup (e.g., Kubernetes or standalone master/worker)","Default configuration uses local mode; for distributed processing, set SPARK_MASTER"],"pulls":"1682267","homepage":"https://spark.apache.org","docs":"https://hub.docker.com/_/spark","tags":["data-science"],"last_verified":"2026-06-14T00:00:00.000Z","next_check":"2026-09-12T00:00:00.000Z","created_at":"2026-06-14T04:13:48.973Z","updated_at":"2026-06-14T04:13:48.973Z"}