{"library":"apache-beam","type":"library","category":null,"description":"Apache Beam is an open-source, unified programming model for defining and executing data processing pipelines for both batch and streaming data. It offers language-specific SDKs, including Python, to construct pipelines that can run on various distributed processing backends such as Apache Flink, Apache Spark, and Google Cloud Dataflow. The library maintains an active development pace with minor releases approximately every 6 weeks, and its current version is 2.71.0.","language":"python","status":"active","version":"2.71.0","tags":["data-processing","batch","streaming","etl","dataflow","flink","spark","pipeline"],"last_verified":"Tue Jun 09","install":[{"cmd":"pip install apache-beam","imports":["import apache_beam as beam","from apache_beam.io import ReadFromText","from apache_beam.io import WriteToText","from apache_beam.options.pipeline_options import PipelineOptions"]},{"cmd":"pip install 'apache-beam[gcp]'","imports":[]}],"homepage":"https://beam.apache.org","github":null,"docs":null,"changelog":null,"pypi":"https://pypi.org/project/apache-beam/","npm":null,"openapi_spec":null,"status_page":null,"smithery":null,"compatibility":{"summary":{"python_range":"3.10–3.9","success_rate":50,"avg_install_s":28.9,"avg_import_s":4.37,"wheel_type":"wheel"},"url":"https://checklist.day/v1/registry/apache-beam/compatibility"}}