# Build an RDD holding the integers 1 through 10.
# `sc` is expected to be defined earlier (presumably the SparkContext).
numbersRDD = sc.parallelize(range(1, 11))
print(numbersRDD.collect())

# map: replace each element with its square.
squaresRDD = numbersRDD.map(lambda n: n * n)
print(squaresRDD.collect())

# filter: keep only the elements that are divisible by two.
filteredRDD = numbersRDD.filter(lambda n: n % 2 == 0)
print(filteredRDD.collect())
def doubleIfOdd(x):
    """Return ``2 * x`` when *x* is odd, otherwise return *x* unchanged.

    Args:
        x: The number to inspect; it is tested with ``x % 2 == 1``.

    Returns:
        Twice *x* for odd values, *x* itself for every other value.
    """
    if x % 2 == 1:
        return 2 * x
    return x
# Pipeline of chained transformations: apply doubleIfOdd to every element,
# keep only the values greater than 6, then drop duplicate values.
resultRDD = numbersRDD.map(doubleIfOdd).filter(lambda value: value > 6).distinct()
# NOTE(review): the collected list is not printed here; it is only displayed
# when this is the last expression of an interactive cell -- confirm intent.
resultRDD.collect()