1- from  base64  import  standard_b64encode  as  b64enc 
2- import  copy 
31from  collections  import  defaultdict 
4- from  collections  import  namedtuple 
52from  itertools  import  chain , ifilter , imap 
6- import  operator 
7- import  os 
8- import  sys 
9- import  shlex 
10- import  traceback 
11- from  subprocess  import  Popen , PIPE 
12- from  tempfile  import  NamedTemporaryFile 
13- from  threading  import  Thread 
14- import  warnings 
15- import  heapq 
16- from  random  import  Random 
17- 
18- from  pyspark .serializers  import  NoOpSerializer , CartesianDeserializer , \
19-     BatchedSerializer , CloudPickleSerializer , PairDeserializer , pack_long 
20- from  pyspark .join  import  python_join , python_left_outer_join , \
21-     python_right_outer_join , python_cogroup 
22- from  pyspark .statcounter  import  StatCounter 
23- from  pyspark .rddsampler  import  RDDSampler 
24- from  pyspark .storagelevel  import  StorageLevel 
25- #from pyspark.resultiterable import ResultIterable 
3+ 
4+ from  pyspark .serializers  import  NoOpSerializer ,\
5+     BatchedSerializer , CloudPickleSerializer , pack_long 
266from  pyspark .rdd  import  _JavaStackTrace 
277
288from  py4j .java_collections  import  ListConverter , MapConverter 
@@ -47,15 +27,14 @@ def generatedRDDs(self):
4727    def  print_ (self ):
4828        """ 
4929        """ 
50-         # print is a resrved  name of Python. We cannot give print to function name 
30+         # print is a reserved  name of Python. We cannot give print to function name 
5131        getattr (self ._jdstream , "print" )()
5232
5333    def  pyprint (self ):
5434        """ 
5535        """ 
5636        self ._jdstream .pyprint ()
5737
58- 
5938    def  filter (self , f ):
6039        """ 
6140        """ 
@@ -140,7 +119,6 @@ def add_shuffle_key(split, iterator):
140119        keyed ._bypass_serializer  =  True 
141120        with  _JavaStackTrace (self .ctx ) as  st :
142121            #JavaDStream 
143-             #pairRDD = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairRDD() 
144122            pairDStream  =  self .ctx ._jvm .PairwiseDStream (keyed ._jdstream .dstream ()).asJavaPairDStream ()
145123            partitioner  =  self .ctx ._jvm .PythonPartitioner (numPartitions ,
146124                                                          id (partitionFunc ))
0 commit comments