1- from base64 import standard_b64encode as b64enc
2- import copy
31from collections import defaultdict
4- from collections import namedtuple
52from itertools import chain , ifilter , imap
6- import operator
7- import os
8- import sys
9- import shlex
10- import traceback
11- from subprocess import Popen , PIPE
12- from tempfile import NamedTemporaryFile
13- from threading import Thread
14- import warnings
15- import heapq
16- from random import Random
17-
18- from pyspark .serializers import NoOpSerializer , CartesianDeserializer , \
19- BatchedSerializer , CloudPickleSerializer , PairDeserializer , pack_long
20- from pyspark .join import python_join , python_left_outer_join , \
21- python_right_outer_join , python_cogroup
22- from pyspark .statcounter import StatCounter
23- from pyspark .rddsampler import RDDSampler
24- from pyspark .storagelevel import StorageLevel
25- #from pyspark.resultiterable import ResultIterable
3+
4+ from pyspark .serializers import NoOpSerializer ,\
5+ BatchedSerializer , CloudPickleSerializer , pack_long
266from pyspark .rdd import _JavaStackTrace
277
288from py4j .java_collections import ListConverter , MapConverter
@@ -47,15 +27,14 @@ def generatedRDDs(self):
4727 def print_ (self ):
4828 """
4929 """
50- # print is a resrved name of Python. We cannot give print to function name
30+ # print is a reserved name of Python. We cannot give print to function name
5131 getattr (self ._jdstream , "print" )()
5232
5333 def pyprint (self ):
5434 """
5535 """
5636 self ._jdstream .pyprint ()
5737
58-
5938 def filter (self , f ):
6039 """
6140 """
@@ -140,7 +119,6 @@ def add_shuffle_key(split, iterator):
140119 keyed ._bypass_serializer = True
141120 with _JavaStackTrace (self .ctx ) as st :
142121 #JavaDStream
143- #pairRDD = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairRDD()
144122 pairDStream = self .ctx ._jvm .PairwiseDStream (keyed ._jdstream .dstream ()).asJavaPairDStream ()
145123 partitioner = self .ctx ._jvm .PythonPartitioner (numPartitions ,
146124 id (partitionFunc ))
0 commit comments