dgadiraju
7/30/2017 - 6:39 AM

pyspark-rdd-parallelize.py

# Local sequence of the integers 1 through 999,999 (the upper bound of
# range() is exclusive).
data = range(1, 1000000)

# Hand the local sequence to Spark to obtain an RDD.
# NOTE(review): `sc` is not defined in this snippet -- presumably the
# SparkContext that the pyspark shell pre-creates; confirm before running
# this as a standalone script.
dataRDD = sc.parallelize(data)

# Fold the RDD down to a single value by adding elements pairwise.
# Left as a bare expression so an interactive shell echoes the result.
dataRDD.reduce(lambda running_total, element: running_total + element)