diff --git a/python/pyspark/rdd.py b/python/pyspark/rdd.py
index 1330e6146800ccfc4d91ecffb8c0915aea4b59d3..be23f87f5ed2d936fe79b22eb0f1cdc70d35d195 100644
--- a/python/pyspark/rdd.py
+++ b/python/pyspark/rdd.py
@@ -163,7 +163,7 @@ class RDD(object):
 
     def map(self, f, preservesPartitioning=False):
         """
-        Return a new RDD containing the distinct elements in this RDD.
+        Return a new RDD by applying a function to each element of this RDD.
         """
         def func(split, iterator): return imap(f, iterator)
         return PipelinedRDD(self, func, preservesPartitioning)