Clean extra whitespace in the repartition docstring (python/pyspark/rdd.py)

gliptak · gliptak · commit 4e34b246985b · 2016-03-20T11:36:38.000-04:00
diff --git a/python/pyspark/rdd.py b/python/pyspark/rdd.py
@@ -2004,20 +2004,20 @@ def keyBy(self, f):
 
     def repartition(self, numPartitions):
         """
-         Return a new RDD that has exactly numPartitions partitions.
-
-         Can increase or decrease the level of parallelism in this RDD.
-         Internally, this uses a shuffle to redistribute data.
-         If you are decreasing the number of partitions in this RDD, consider
-         using `coalesce`, which can avoid performing a shuffle.
-
-         >>> rdd = sc.parallelize([1,2,3,4,5,6,7], 4)
-         >>> sorted(rdd.glom().collect())
-         [[1], [2, 3], [4, 5], [6, 7]]
-         >>> len(rdd.repartition(2).glom().collect())
-         2
-         >>> len(rdd.repartition(10).glom().collect())
-         10
+        Return a new RDD that has exactly numPartitions partitions.
+
+        Can increase or decrease the level of parallelism in this RDD.
+        Internally, this uses a shuffle to redistribute data.
+        If you are decreasing the number of partitions in this RDD, consider
+        using `coalesce`, which can avoid performing a shuffle.
+
+        >>> rdd = sc.parallelize([1,2,3,4,5,6,7], 4)
+        >>> sorted(rdd.glom().collect())
+        [[1], [2, 3], [4, 5], [6, 7]]
+        >>> len(rdd.repartition(2).glom().collect())
+        2
+        >>> len(rdd.repartition(10).glom().collect())
+        10
         """
         jrdd = self._jrdd.repartition(numPartitions)
         return RDD(jrdd, self.ctx, self._jrdd_deserializer)