{"id":28105,"library":"pysparkling","title":"pysparkling","description":"Pure Python implementation of the Spark RDD interface, providing a lightweight alternative to PySpark for local or small-scale distributed computing. Current version: 0.6.2. Release cadence is sporadic, with the last release in 2020.","status":"maintenance","version":"0.6.2","language":"python","source_language":"en","source_url":"https://github.com/svenkreiss/pysparkling","tags":["spark","rdd","pure-python","big-data","lightweight"],"install":[{"cmd":"pip install pysparkling","lang":"bash","label":"Install from PyPI"}],"dependencies":[],"imports":[{"note":"pysparkling is a separate library, not PySpark.","wrong":"import pyspark","symbol":"pysparkling","correct":"import pysparkling"},{"note":"Use pysparkling's Context instead of SparkContext.","wrong":"from pyspark import SparkContext","symbol":"Context","correct":"from pysparkling import Context"}],"quickstart":{"code":"from pysparkling import Context\n\nsc = Context()\nrdd = sc.parallelize([1, 2, 3, 4, 5])\nprint(rdd.sum())  # 15\n\nsc.stop()","lang":"python","description":"Create a local context and run a simple RDD sum operation."},"warnings":[{"fix":"Consider migrating to PySpark or Dask for production use.","message":"pysparkling is no longer actively maintained. It may not work with newer Python versions or receive security updates.","severity":"deprecated","affected_versions":">=0.6.2"},{"fix":"Check the official documentation for exact API differences.","message":"pysparkling's API is similar but not identical to PySpark. Some methods may have different signatures or missing features.","severity":"gotcha","affected_versions":"all"},{"fix":"Use PySpark or Dask for true distributed computing.","message":"pysparkling does not support distributed execution across multiple machines; it runs in a single process with simulated parallelism.","severity":"gotcha","affected_versions":"all"}],"env_vars":null,"last_verified":"2026-05-09T00:00:00.000Z","next_check":"2026-08-07T00:00:00.000Z","problems":[{"fix":"Install pysparkling with 'pip install pysparkling' and import as 'import pysparkling'.","cause":"Trying to import pysparkling as pyspark.","error":"ModuleNotFoundError: No module named 'pyspark'"},{"fix":"Use 'from pysparkling import Context' and create 'sc = Context()'.","cause":"pysparkling uses Context instead of SparkContext.","error":"AttributeError: module 'pysparkling' has no attribute 'SparkContext'"},{"fix":"Use pysparkling's Context without configuration, or pass options via keyword arguments if supported.","cause":"pysparkling does not support SparkConf.","error":"ImportError: cannot import name 'SparkConf'"}],"ecosystem":"pypi","meta_description":null,"install_score":null,"install_tag":null,"quickstart_score":null,"quickstart_tag":null}