From d8e51f9dd21cdffb5f8eb1f6312b761529dbcb9b Mon Sep 17 00:00:00 2001
From: Ken <ugw.gi.world@gmail.com>
Date: Tue, 8 Jul 2014 18:31:41 -0700
Subject: [PATCH 01/69] initial commit for pySparkStreaming

---
 bin/spark-submit                              |   6 +
 core/pom.xml                                  |   2 +-
 .../apache/spark/api/python/PythonRDD.scala   |   2 +-
 .../apache/spark/deploy/PythonRunner.scala    |   1 +
 .../src/main/python/streaming/wordcount.py    |  22 ++
 python/pyspark/java_gateway.py                |   3 +
 python/pyspark/streaming/__init__.py          |   1 +
 python/pyspark/streaming/context.py           | 133 ++++++++
 python/pyspark/streaming/dstream.py           | 315 ++++++++++++++++++
 python/pyspark/streaming/duration.py          | 171 ++++++++++
 python/pyspark/streaming/jtime.py             | 116 +++++++
 python/pyspark/streaming/pyprint.py           |  28 ++
 python/pyspark/streaming/utils.py             |  18 +
 streaming/pom.xml                             |  14 +-
 .../streaming/api/java/JavaDStreamLike.scala  |   8 +
 .../streaming/api/python/PythonDStream.scala  | 152 +++++++++
 .../spark/streaming/dstream/DStream.scala     |  68 +++-
 17 files changed, 1050 insertions(+), 10 deletions(-)
 create mode 100644 examples/src/main/python/streaming/wordcount.py
 create mode 100644 python/pyspark/streaming/__init__.py
 create mode 100644 python/pyspark/streaming/context.py
 create mode 100644 python/pyspark/streaming/dstream.py
 create mode 100644 python/pyspark/streaming/duration.py
 create mode 100644 python/pyspark/streaming/jtime.py
 create mode 100644 python/pyspark/streaming/pyprint.py
 create mode 100644 python/pyspark/streaming/utils.py
 create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
diff --git a/bin/spark-submit b/bin/spark-submit
index 9e7cecedd0325..ac275b7696d5c 100755
--- a/bin/spark-submit
+++ b/bin/spark-submit
@@ -37,6 +37,12 @@ done
 
 DEPLOY_MODE=${DEPLOY_MODE:-"client"}
 
+# Figure out which Python executable to use
+if [[ -z "$PYSPARK_PYTHON" ]]; then
+  PYSPARK_PYTHON="python"
+fi
+export PYSPARK_PYTHON
+
 if [ -n "$DRIVER_MEMORY" ] && [ $DEPLOY_MODE == "client" ]; then
   export SPARK_DRIVER_MEMORY=$DRIVER_MEMORY
 fi
diff --git a/core/pom.xml b/core/pom.xml
index 8c23842730e37..43633dcb63f54 100644
--- a/core/pom.xml
+++ b/core/pom.xml
@@ -21,7 +21,7 @@
   <parent>
     <groupId>org.apache.spark</groupId>
     <artifactId>spark-parent</artifactId>
-    <version>1.1.0-SNAPSHOT</version>
+    <version>1.0.0</version>
     <relativePath>../pom.xml</relativePath>
   </parent>
 
diff --git a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
index f6570d335757a..e88a54d2086ea 100644
--- a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
+++ b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
@@ -252,7 +252,7 @@ private class PythonException(msg: String, cause: Exception) extends RuntimeExce
  * Form an RDD[(Array[Byte], Array[Byte])] from key-value pairs returned from Python.
  * This is used by PySpark's shuffle operations.
  */
-private class PairwiseRDD(prev: RDD[Array[Byte]]) extends
+private[spark] class PairwiseRDD(prev: RDD[Array[Byte]]) extends
   RDD[(Long, Array[Byte])](prev) {
   override def getPartitions = prev.partitions
   override def compute(split: Partition, context: TaskContext) =
diff --git a/core/src/main/scala/org/apache/spark/deploy/PythonRunner.scala b/core/src/main/scala/org/apache/spark/deploy/PythonRunner.scala
index 0d6751f3fa6d2..89f3fd47724fe 100644
--- a/core/src/main/scala/org/apache/spark/deploy/PythonRunner.scala
+++ b/core/src/main/scala/org/apache/spark/deploy/PythonRunner.scala
@@ -57,6 +57,7 @@ object PythonRunner {
     val builder = new ProcessBuilder(Seq(pythonExec, "-u", formattedPythonFile) ++ otherArgs)
     val env = builder.environment()
     env.put("PYTHONPATH", pythonPath)
+    env.put("PYSPARK_PYTHON", pythonExec)
     env.put("PYSPARK_GATEWAY_PORT", "" + gatewayServer.getListeningPort)
     builder.redirectErrorStream(true) // Ugly but needed for stdout and stderr to synchronize
     val process = builder.start()
diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
new file mode 100644
index 0000000000000..f44cd696894ba
--- /dev/null
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -0,0 +1,22 @@
+import sys
+from operator import add
+
+from pyspark.streaming.context import StreamingContext
+from pyspark.streaming.duration import *
+
+if __name__ == "__main__":
+    if len(sys.argv) != 2:
+        print >> sys.stderr, "Usage: wordcount <directory>"
+        exit(-1)
+    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
+
+    lines = ssc.textFileStream(sys.argv[1])
+    fm_lines = lines.flatMap(lambda x: x.split(" "))
+    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
+    mapped_lines = fm_lines.map(lambda x: (x, 1))
+    
+    fm_lines.pyprint()
+    filtered_lines.pyprint()
+    mapped_lines.pyprint()
+    ssc.start()
+    ssc.awaitTermination()
diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index 0dbead4415b02..7038c6422be47 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -82,6 +82,9 @@ def run(self):
     java_import(gateway.jvm, "org.apache.spark.SparkConf")
     java_import(gateway.jvm, "org.apache.spark.api.java.*")
     java_import(gateway.jvm, "org.apache.spark.api.python.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.api.java.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.api.python.*")
     java_import(gateway.jvm, "org.apache.spark.mllib.api.python.*")
     java_import(gateway.jvm, "org.apache.spark.sql.SQLContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.HiveContext")
diff --git a/python/pyspark/streaming/__init__.py b/python/pyspark/streaming/__init__.py
new file mode 100644
index 0000000000000..719592912e80c
--- /dev/null
+++ b/python/pyspark/streaming/__init__.py
@@ -0,0 +1 @@
+__author__ = 'ktakagiw'
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
new file mode 100644
index 0000000000000..c8ae9c4af85c9
--- /dev/null
+++ b/python/pyspark/streaming/context.py
@@ -0,0 +1,133 @@
+__author__ = 'ktakagiw'
+
+
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+import shutil
+import sys
+from threading import Lock
+from tempfile import NamedTemporaryFile
+
+from pyspark import accumulators
+from pyspark.accumulators import Accumulator
+from pyspark.broadcast import Broadcast
+from pyspark.conf import SparkConf
+from pyspark.files import SparkFiles
+from pyspark.java_gateway import launch_gateway
+from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
+from pyspark.storagelevel import StorageLevel
+from pyspark.rdd import RDD
+from pyspark.context import SparkContext
+
+from py4j.java_collections import ListConverter
+
+from pyspark.streaming.dstream import DStream
+
+class StreamingContext(object):
+    """
+    Main entry point for Spark Streaming functionality. A StreamingContext
+    wraps a L{SparkContext} and a JVM JavaStreamingContext, and is used to
+    create L{DStream}s from input sources such as text file directories.
+    """
+
+    def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
+        environment=None, batchSize=1024, serializer=PickleSerializer(), conf=None,
+        gateway=None, duration=None):
+        """
+        Create a new StreamingContext. The master and app name may be set through
+        the named parameters here or through C{conf}; C{duration} is required.
+
+        @param master: Cluster URL to connect to
+               (e.g. mesos://host:port, spark://host:port, local[4]).
+        @param appName: A name for your job, to display on the cluster web UI.
+        @param sparkHome: Location where Spark is installed on cluster nodes.
+        @param pyFiles: Collection of .zip or .py files to send to the cluster
+               and add to PYTHONPATH.  These can be paths on the local file
+               system or HDFS, HTTP, HTTPS, or FTP URLs.
+        @param environment: A dictionary of environment variables to set on worker nodes.
+        @param batchSize: The number of Python objects represented as a single
+               Java object.  Set 1 to disable batching or -1 to use an
+               unlimited batch size.
+        @param serializer: The serializer for RDDs.
+        @param conf: A L{SparkConf} object setting Spark properties.
+        @param gateway: Use an existing gateway and JVM, otherwise a new JVM
+               will be instantiated.
+        @param duration: A L{Duration} giving the batch duration (required).
+        @raise ValueError: if C{duration} is None (checked before any context is created).
+        """
+        if duration is None:
+            raise ValueError("duration must be set to a Duration")
+        self._sc = SparkContext(master=master, appName=appName, sparkHome=sparkHome,
+                        pyFiles=pyFiles, environment=environment, batchSize=batchSize,
+                        serializer=serializer, conf=conf, gateway=gateway)
+        self._jvm = self._sc._jvm
+        self._jssc = self._initialize_context(self._sc._jsc, duration._jduration)
+
+    # Initialize StreamingContext in a function to allow subclass-specific initialization
+    def _initialize_context(self, jspark_context, jduration):
+        return self._jvm.JavaStreamingContext(jspark_context, jduration)
+
+    def actorStream(self, props, name, storageLevel, supervisorStrategy):
+        raise NotImplementedError
+
+    def addStreamingListener(self, streamingListener):
+        raise NotImplementedError
+
+    def awaitTermination(self, timeout=None):
+        """Wait for the context to stop; a non-None timeout (even 0) is forwarded to the JVM."""
+        # `is None` rather than truthiness, so that timeout=0 is not silently dropped.
+        args = () if timeout is None else (timeout,)
+        self._jssc.awaitTermination(*args)
+
+    def checkpoint(self, directory):
+        raise NotImplementedError
+
+    def fileStream(self, directory, filter=None, newFilesOnly=None):
+        raise NotImplementedError
+
+    def networkStream(self, receiver):
+        raise NotImplementedError
+
+    def queueStream(self, queue, oneAtATime=True, defaultRDD=None):
+        raise NotImplementedError
+
+    def rawSocketStream(self, hostname, port, storagelevel):
+        raise NotImplementedError
+
+    def remember(self, duration):
+        raise NotImplementedError
+
+    def socketStream(self, hostname, port, converter, storageLevel):
+        raise NotImplementedError  # socket input streams are not supported yet
+
+    def start(self):
+        self._jssc.start()
+
+    def stop(self, stopSparkContext=True):
+        raise NotImplementedError
+
+    def textFileStream(self, directory):
+        return DStream(self._jssc.textFileStream(directory), self, UTF8Deserializer())
+
+    def transform(self, seq):
+        raise NotImplementedError
+
+    def union(self, seq):
+        raise NotImplementedError
+
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
new file mode 100644
index 0000000000000..b422b147d11e1
--- /dev/null
+++ b/python/pyspark/streaming/dstream.py
@@ -0,0 +1,315 @@
+from base64 import standard_b64encode as b64enc
+import copy
+from collections import defaultdict
+from collections import namedtuple
+from itertools import chain, ifilter, imap
+import operator
+import os
+import sys
+import shlex
+import traceback
+from subprocess import Popen, PIPE
+from tempfile import NamedTemporaryFile
+from threading import Thread
+import warnings
+import heapq
+from random import Random
+
+from pyspark.serializers import NoOpSerializer, CartesianDeserializer, \
+    BatchedSerializer, CloudPickleSerializer, PairDeserializer, pack_long
+from pyspark.join import python_join, python_left_outer_join, \
+    python_right_outer_join, python_cogroup
+from pyspark.statcounter import StatCounter
+from pyspark.rddsampler import RDDSampler
+from pyspark.storagelevel import StorageLevel
+#from pyspark.resultiterable import ResultIterable
+from pyspark.rdd import _JavaStackTrace
+
+from py4j.java_collections import ListConverter, MapConverter
+
+__all__ = ["DStream"]
+
+class DStream(object):
+    def __init__(self, jdstream, ssc, jrdd_deserializer):
+        self._jdstream = jdstream
+        self._ssc = ssc
+        self.ctx = ssc._sc
+        self._jrdd_deserializer = jrdd_deserializer
+
+    def generatedRDDs(self):
+        """
+         // RDDs generated, marked as private[streaming] so that testsuites can access it
+         @transient
+        """
+        pass
+
+    def print_(self):
+        """
+        """
+        # print is a reserved word in Python 2, so it cannot be used as a method name.
+        getattr(self._jdstream, "print")()
+
+    def pyprint(self):
+        """
+        """
+        self._jdstream.pyprint()
+
+    def cache(self):
+        """
+        """
+        raise NotImplementedError
+
+    def checkpoint(self):
+        """
+        """
+        raise NotImplementedError
+
+    def compute(self, time):
+        """
+        """
+        raise NotImplementedError
+
+    def context(self):
+        """
+        """
+        raise NotImplementedError
+
+    def count(self):
+        """
+        """
+        raise NotImplementedError
+
+    def countByValue(self, numPartitions=None):
+        """
+        """
+        raise NotImplementedError
+
+    def countByValueAndWindow(self, duration, slideDuration=None):
+        """
+        """
+        raise NotImplementedError
+
+    def countByWindow(self, duration, slideDuration=None):
+        """
+        """
+        raise NotImplementedError
+
+    def dstream(self):
+        """
+        """
+        raise NotImplementedError
+
+    def filter(self, f):
+        """
+        """
+        def func(iterator): return ifilter(f, iterator)
+        return self.mapPartitions(func)
+
+    def flatMap(self, f, preservesPartitioning=False):
+        """
+        """
+        def func(s, iterator): return chain.from_iterable(imap(f, iterator))
+        return self.mapPartitionsWithIndex(func, preservesPartitioning)
+
+    def foreachRDD(self, f, time):
+        """
+        """
+        raise NotImplementedError
+
+    def glom(self):
+        """
+        """
+        raise NotImplementedError
+
+    def map(self, f, preservesPartitioning=False):
+        """
+        """
+        def func(split, iterator): return imap(f, iterator)
+        return PipelinedDStream(self, func, preservesPartitioning)
+
+    def mapPartitions(self, f):
+        """
+        """
+        def func(s, iterator): return f(iterator)
+        return self.mapPartitionsWithIndex(func)
+
+    def perist(self, storageLevel):
+        """
+        """
+        raise NotImplementedError
+
+    def reduce(self, func, numPartitions=None):
+        """
+
+        """
+        return self._combineByKey(lambda x:x, func, func, numPartitions)
+
+    def _combineByKey(self, createCombiner, mergeValue, mergeCombiners,
+                      numPartitions=None):
+        """
+        Combine the values of each key: per partition first, then across partitions
+        after a partitionBy(numPartitions) shuffle. Elements must be (key, value) pairs.
+        """
+        if numPartitions is None:
+            numPartitions = self.ctx.defaultParallelism
+
+        def combineLocally(iterator):
+            combiners = {}
+            for (k, v) in iterator:
+                if k not in combiners:
+                    combiners[k] = createCombiner(v)
+                else:
+                    combiners[k] = mergeValue(combiners[k], v)
+            return combiners.iteritems()
+
+        def _mergeCombiners(iterator):
+            combiners = {}
+            for (k, v) in iterator:
+                if k not in combiners:
+                    combiners[k] = v
+                else:
+                    combiners[k] = mergeCombiners(combiners[k], v)
+            return combiners.iteritems()
+        shuffled = self.mapPartitions(combineLocally).partitionBy(numPartitions)
+        return shuffled.mapPartitions(_mergeCombiners)
+
+
+    def partitionBy(self, numPartitions, partitionFunc=None):
+        """
+        Return a copy of the DStream partitioned using the specified partitioner.
+
+        @param numPartitions: number of partitions; None falls back to the
+               SparkContext's default parallelism.
+        @param partitionFunc: maps a key to an int; defaults to hash() (None -> 0).
+        """
+        if numPartitions is None:
+            numPartitions = self.ctx.defaultParallelism
+        if partitionFunc is None:
+            partitionFunc = lambda x: 0 if x is None else hash(x)
+        # Transferring O(n) objects to Java is too expensive.  Instead, we'll
+        # form the hash buckets in Python, transferring O(numPartitions) objects
+        # to Java.  Each object is a (splitNumber, [objects]) pair.
+        outputSerializer = self.ctx._unbatched_serializer
+
+        def add_shuffle_key(split, iterator):
+            buckets = defaultdict(list)
+            for (k, v) in iterator:
+                buckets[partitionFunc(k) % numPartitions].append((k, v))
+            for (split, items) in buckets.iteritems():
+                yield pack_long(split)
+                yield outputSerializer.dumps(items)
+        keyed = PipelinedDStream(self, add_shuffle_key)
+        keyed._bypass_serializer = True
+        with _JavaStackTrace(self.ctx) as st:
+            # Wrap the keyed stream on the JVM side and build the partitioner for it.
+            pairDStream = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairDStream()
+            partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
+                                                          id(partitionFunc))
+        jdstream = pairDStream.partitionBy(partitioner).values()
+        dstream = DStream(jdstream, self._ssc, BatchedSerializer(outputSerializer))
+        # This is required so that id(partitionFunc) remains unique, even if
+        # partitionFunc is a lambda:
+        dstream._partitionFunc = partitionFunc
+        return dstream
+
+
+
+    def reduceByWindow(self, reduceFunc, windowDuration, slideDuration, inReduceTunc):
+        """
+        """
+
+        raise NotImplementedError
+
+    def repartition(self, numPartitions):
+        """
+        """
+        raise NotImplementedError
+
+    def slice(self, fromTime, toTime):
+        """
+        """
+        raise NotImplementedError
+
+    def transform(self, transformFunc):
+        """
+        """
+        raise NotImplementedError
+
+    def transformWith(self, other, transformFunc):
+        """
+        """
+        raise NotImplementedError
+
+    def union(self, that):
+        """
+        """
+        raise NotImplementedError
+
+    def window(self, windowDuration, slideDuration=None):
+        """
+        """
+        raise NotImplementedError
+
+    def wrapRDD(self, rdd):
+        """
+        """
+        raise NotImplementedError
+
+    def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
+        return PipelinedDStream(self, f, preservesPartitioning)
+
+
+class PipelinedDStream(DStream):
+    def __init__(self, prev, func, preservesPartitioning=False):
+        if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():
+            # This transformation is the first in its stage:
+            self.func = func
+            self.preservesPartitioning = preservesPartitioning
+            self._prev_jdstream = prev._jdstream
+            self._prev_jrdd_deserializer = prev._jrdd_deserializer
+        else:
+            prev_func = prev.func
+            def pipeline_func(split, iterator):
+                return func(split, prev_func(split, iterator))
+            self.func = pipeline_func
+            self.preservesPartitioning = \
+                prev.preservesPartitioning and preservesPartitioning
+            self._prev_jdstream = prev._prev_jdstream  # maintain the pipeline
+            self._prev_jrdd_deserializer = prev._prev_jrdd_deserializer
+        self.is_cached = False
+        self.is_checkpointed = False
+        self._ssc = prev._ssc
+        self.ctx = prev.ctx
+        self.prev = prev
+        self._jdstream_val = None
+        self._jrdd_deserializer = self.ctx.serializer
+        self._bypass_serializer = False
+
+    @property
+    def _jdstream(self):
+        if self._jdstream_val:
+            return self._jdstream_val
+        if self._bypass_serializer:
+            serializer = NoOpSerializer()
+        else:
+            serializer = self.ctx.serializer
+
+        command = (self.func, self._prev_jrdd_deserializer, serializer)
+        pickled_command = CloudPickleSerializer().dumps(command)
+        broadcast_vars = ListConverter().convert(
+            [x._jbroadcast for x in self.ctx._pickled_broadcast_vars],
+            self.ctx._gateway._gateway_client)
+        self.ctx._pickled_broadcast_vars.clear()
+        class_tag = self._prev_jdstream.classTag()
+        env = MapConverter().convert(self.ctx.environment,
+                                     self.ctx._gateway._gateway_client)
+        includes = ListConverter().convert(self.ctx._python_includes,
+                                     self.ctx._gateway._gateway_client)
+        python_dstream = self.ctx._jvm.PythonDStream(self._prev_jdstream.dstream(),
+                bytearray(pickled_command),
+                env, includes, self.preservesPartitioning,
+                self.ctx.pythonExec, broadcast_vars, self.ctx._javaAccumulator,
+                class_tag)
+        self._jdstream_val = python_dstream.asJavaDStream()
+        return self._jdstream_val
+
+    def _is_pipelinable(self):
+        return not (self.is_cached or self.is_checkpointed)
diff --git a/python/pyspark/streaming/duration.py b/python/pyspark/streaming/duration.py
new file mode 100644
index 0000000000000..ef1b4f6cef237
--- /dev/null
+++ b/python/pyspark/streaming/duration.py
@@ -0,0 +1,171 @@
+__author__ = 'ktakagiw'
+
+from pyspark.streaming import utils
+
+class Duration(object):
+    """
+    A length of time, in milliseconds, for a Spark Streaming application
+    (for example the batch duration passed to L{StreamingContext}).
+
+    Each instance keeps the millisecond count in Python and also creates
+    the matching JVM C{Duration} object. Instances are usually built with
+    the helper functions C{Milliseconds} and C{Seconds} defined in this module.
+
+    """
+    def __init__(self, millis, _jvm=None):
+        """
+        Create new Duration.
+
+        @param millis: milisecond
+
+        """
+        self._millis = millis
+
+        from pyspark.context import SparkContext
+        SparkContext._ensure_initialized()
+        _jvm = _jvm or SparkContext._jvm
+        self._jduration = _jvm.Duration(millis)
+
+    def toString(self):
+        """ Return duration as string """
+        return str(self._millis) + " ms"
+
+    def isZero(self):
+        """ Check if millis is zero """
+        return self._millis == 0
+
+    def prettyPrint(self):
+        """
+        Return a human-readable string representing a duration
+        """
+        return utils.msDurationToString(self._millis)
+
+    def milliseconds(self):
+        """ Return millisecond """
+        return self._millis
+
+    def toFormattedString(self):
+        """ Return millisecond """
+        return str(self._millis)
+
+    def max(self, other):
+        """ Return higher Duration """
+        Duration._is_duration(other)
+        if self > other:
+            return self
+        else:
+            return other
+
+    def min(self, other):
+        """ Return lower Durattion """
+        Duration._is_duration(other)
+        if self < other:
+            return self
+        else:
+            return other
+
+    def __str__(self):
+        return self.toString()
+
+    def __add__(self, other):
+        """ Add Duration and Duration """
+        Duration._is_duration(other)
+        return Duration(self._millis + other._millis)
+
+    def __sub__(self, other):
+        """ Subtract Duration by Duration  """
+        Duration._is_duration(other)
+        return Duration(self._millis - other._millis)
+
+    def __mul__(self, other):
+        """ Multiple Duration by Duration """
+        Duration._is_duration(other)
+        return Duration(self._millis * other._millis)
+
+    def __div__(self, other):
+        """
+        Divide Duration by Duration
+        for Python 2.X
+        """
+        Duration._is_duration(other)
+        return Duration(self._millis / other._millis)
+
+    def __truediv__(self, other):
+        """
+        Divide Duration by Duration
+        for Python 3.0
+        """
+        Duration._is_duration(other)
+        return Duration(self._millis / other._millis)
+
+    def __floordiv__(self, other):
+        """ Divide Duration by Duration """
+        Duration._is_duration(other)
+        return Duration(self._millis // other._millis)
+
+    def __len__(self):
+        """ Length of miilisecond in Duration """
+        return len(self._millis)
+
+    def __lt__(self, other):
+        """ Duration < Duration """
+        Duration._is_duration(other)
+        return self._millis < other._millis
+
+    def __le__(self, other):
+        """ Duration <= Duration """
+        Duration._is_duration(other)
+        return self._millis <= other._millis
+
+    def __eq__(self, other):
+        """ Duration ==  Duration """
+        Duration._is_duration(other)
+        return self._millis == other._millis
+
+    def __ne__(self, other):
+        """ Duration != Duration """
+        Duration._is_duration(other)
+        return self._millis != other._millis
+
+    def __gt__(self, other):
+        """ Duration > Duration """
+        Duration._is_duration(other)
+        return self._millis > other._millis
+
+    def __ge__(self, other):
+        """ Duration >= Duration """
+        Duration._is_duration(other)
+        return self._millis >= other._millis
+
+    @classmethod
+    def _is_duration(self, instance):
+        """ is instance Duration """
+        if not isinstance(instance, Duration):
+            raise TypeError("This should be Duration")
+
+def Milliseconds(milliseconds):
+    """
+    Helper function that creates instance of [[pysparkstreaming.duration]] representing
+    a given number of milliseconds.
+    """
+    return Duration(milliseconds)
+
+def Seconds(seconds):
+    """
+    Helper function that creates instance of [[pysparkstreaming.duration]] representing
+    a given number of seconds.
+    """
+    return Duration(seconds * 1000)
+
+def Minites(minites):
+    """
+    Helper function that creates a L{Duration} representing a given number
+    of minutes. (The misspelled name is kept so existing callers keep working.)
+    """
+    return Duration(minites * 60000)
+
+if __name__ == "__main__":
+    d = Duration(1)
+    print d
+    print d.milliseconds()
+
diff --git a/python/pyspark/streaming/jtime.py b/python/pyspark/streaming/jtime.py
new file mode 100644
index 0000000000000..41670af659ea3
--- /dev/null
+++ b/python/pyspark/streaming/jtime.py
@@ -0,0 +1,116 @@
+__author__ = 'ktakagiw'
+
+from pyspark.streaming import utils
+from pyspark.streaming.duration import Duration
+
+class Time(object):
+    """
+    A point in time, in milliseconds, for a Spark Streaming application.
+
+    Each instance keeps the millisecond count in Python and also creates
+    the matching JVM C{Time} object. A L{Duration} can be added to or
+    subtracted from a Time, and two Times can be compared with the usual
+    comparison operators.
+
+    """
+    def __init__(self, millis, _jvm=None):
+        """
+        Create new Time.
+
+        @param millis: millisecond
+
+        @param _jvm: internal parameter used to pass a handle to the
+               Java VM; does not need to be set by users
+
+        """
+        self._millis = millis
+        # The JVM handle lives on SparkContext (the same lookup Duration uses).
+        from pyspark.context import SparkContext
+        SparkContext._ensure_initialized()
+        _jvm = _jvm or SparkContext._jvm
+        self._jtime = _jvm.Time(millis)
+
+    def toString(self):
+        """ Return time as string """
+        return str(self._millis) + " ms"
+
+    def milliseconds(self):
+        """ Return millisecond """
+        return self._millis
+
+    def max(self, other):
+        """ Return higher Time """
+        Time._is_time(other)
+        if self > other:
+            return self
+        else:
+            return other
+
+    def min(self, other):
+        """ Return lower Time """
+        Time._is_time(other)
+        if self < other:
+            return self
+        else:
+            return other
+
+    def __add__(self, other):
+        """ Add a Duration to this Time, giving a new Time """
+        Duration._is_duration(other)
+        return Time(self._millis + other._millis)
+
+    def __sub__(self, other):
+        """ Time - Duration gives a Time; Time - Time gives a Duration """
+        if isinstance(other, Duration):
+            return Time(self._millis - other._millis)
+        elif isinstance(other, Time):
+            return Duration(self._millis - other._millis)
+        else:
+            raise TypeError
+
+    def __lt__(self, other):
+        """ Time < Time """
+        Time._is_time(other)
+        return self._millis < other._millis
+
+    def __le__(self, other):
+        """ Time <= Time """
+        Time._is_time(other)
+        return self._millis <= other._millis
+
+    def __eq__(self, other):
+        """ Time ==  Time """
+        Time._is_time(other)
+        return self._millis == other._millis
+
+    def __ne__(self, other):
+        """ Time != Time """
+        Time._is_time(other)
+        return self._millis != other._millis
+
+    def __gt__(self, other):
+        """ Time > Time """
+        Time._is_time(other)
+        return self._millis > other._millis
+
+    def __ge__(self, other):
+        """ Time >= Time """
+        Time._is_time(other)
+        return self._millis >= other._millis
+
+    def isMultipbleOf(self, duration):
+        """ Return True if this Time is a whole multiple of the given Duration """
+        Duration._is_duration(duration)
+        return self._millis % duration._millis == 0
+
+    def until(self, time, interval):
+        raise NotImplementedError  # not supported yet
+
+    def to(self, time, interval):
+        raise NotImplementedError  # not supported yet
+
+    @classmethod
+    def _is_time(self, instance):
+        """ is instance Time """
+        if not isinstance(instance, Time):
+            raise TypeError
diff --git a/python/pyspark/streaming/pyprint.py b/python/pyspark/streaming/pyprint.py
new file mode 100644
index 0000000000000..fcdaca510812c
--- /dev/null
+++ b/python/pyspark/streaming/pyprint.py
@@ -0,0 +1,28 @@
+import sys
+from itertools import chain
+from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
+
+def collect(binary_file_path):
+    dse = PickleSerializer()
+    with open(binary_file_path, 'rb') as tempFile:
+        for item in dse.load_stream(tempFile):
+            yield item
+def main():
+    """Print the first ten elements read from the pickled file named in argv[1]."""
+    try:
+        binary_file_path = sys.argv[1]
+    except IndexError:
+        print "Missed FilePath in argement"
+        return  # no path given, so there is nothing to print
+    if not binary_file_path:
+        return
+    counter = 0
+    for rdd in chain.from_iterable(collect(binary_file_path)):
+        print rdd
+        counter = counter + 1
+        if counter >= 10:
+            print "..."
+            break
+
+if __name__ =="__main__":
+    exit(main())
diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
new file mode 100644
index 0000000000000..71aa3376c6578
--- /dev/null
+++ b/python/pyspark/streaming/utils.py
@@ -0,0 +1,18 @@
+__author__ = 'ktakagiw'
+
+def msDurationToString(ms):
+    """
+    Returns a human-readable string for a duration given in milliseconds, such as "35 ms" or "1.5 s"
+    """
+    second = 1000
+    minute = 60 * second
+    hour = 60 * minute
+
+    if ms < second:
+        return "%d ms" % ms
+    elif ms < minute:
+        return "%.1f s" % (float(ms) / second)
+    elif ms < hour:
+        return "%.1f m" % (float(ms) / minute)
+    else:
+        return "%.2f h" % (float(ms) / hour)
diff --git a/streaming/pom.xml b/streaming/pom.xml
index f506d6ce34a6f..88df63592efee 100644
--- a/streaming/pom.xml
+++ b/streaming/pom.xml
@@ -21,7 +21,7 @@
   <parent>
     <groupId>org.apache.spark</groupId>
     <artifactId>spark-parent</artifactId>
-    <version>1.1.0-SNAPSHOT</version>
+    <version>1.0.0</version>
     <relativePath>../pom.xml</relativePath>
   </parent>
 
@@ -69,14 +69,14 @@
         <groupId>org.scalatest</groupId>
         <artifactId>scalatest-maven-plugin</artifactId>
       </plugin>
-      
-      <!-- 
-           This plugin forces the generation of jar containing streaming test classes, 
+
+      <!--
+           This plugin forces the generation of jar containing streaming test classes,
            so that the tests classes of external modules can use them. The two execution profiles
-           are necessary - first one for 'mvn package', second one for 'mvn compile'. Ideally, 
-           'mvn compile' should not compile test classes and therefore should not need this. 
+           are necessary - first one for 'mvn package', second one for 'mvn compile'. Ideally,
+           'mvn compile' should not compile test classes and therefore should not need this.
            However, an open Maven bug (http://jira.codehaus.org/browse/MNG-3559)
-           causes the compilation to fail if streaming test-jar is not generated. Hence, the 
+           causes the compilation to fail if streaming test-jar is not generated. Hence, the
            second execution profile for 'mvn compile'.
       -->
       <plugin>
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
index a6184de4e83c1..cfa336df8674f 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
@@ -54,6 +54,14 @@ trait JavaDStreamLike[T, This <: JavaDStreamLike[T, This, R], R <: JavaRDDLike[T
     dstream.print()
   }
 
+  /**
+   * Print the first ten elements of each PythonRDD generated in the PythonDStream. This is an output
+   * operator, so this PythonDStream will be registered as an output stream and then materialized.
+   * This function is for the Python API; it delegates to dstream.pyprint().
+   */
+
+  def pyprint() = dstream.pyprint()
+
   /**
    * Return a new DStream in which each RDD has a single element generated by counting each RDD
    * of this DStream.
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
new file mode 100644
index 0000000000000..2d8b1e468dc4c
--- /dev/null
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -0,0 +1,152 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.streaming.api.python
+
+import java.util.{List => JList, ArrayList => JArrayList, Map => JMap, Collections}
+
+import org.apache.spark.api.java.{JavaSparkContext, JavaPairRDD, JavaRDD}
+import org.apache.spark.broadcast.Broadcast
+import org.apache.spark._
+import org.apache.spark.util.Utils
+import java.io._
+import scala.Some
+import org.apache.spark.streaming.Duration
+import scala.util.control.Breaks._
+import org.apache.spark.broadcast.Broadcast
+import scala.Some
+import org.apache.spark.streaming.Duration
+import org.apache.spark.rdd.RDD
+import org.apache.spark.api.python.PythonRDD
+
+
+import org.apache.spark.streaming.{Duration, Time}
+import org.apache.spark.streaming.dstream._
+import org.apache.spark.streaming.api.java._
+import org.apache.spark.rdd.RDD
+import org.apache.spark.api.python._
+import org.apache.spark.api.python.PairwiseRDD
+
+
+import scala.reflect.ClassTag
+
+
+class PythonDStream[T: ClassTag](
+                                  parent: DStream[T],
+                                  command: Array[Byte],
+                                  envVars: JMap[String, String],
+                                  pythonIncludes: JList[String],
+                                  preservePartitoning: Boolean,
+                                  pythonExec: String,
+                                  broadcastVars: JList[Broadcast[Array[Byte]]],
+                                  accumulator: Accumulator[JList[Array[Byte]]]
+                                  ) extends DStream[Array[Byte]](parent.ssc) {
+
+  override def dependencies = List(parent)
+
+  override def slideDuration: Duration = parent.slideDuration
+
+  // Wrap the parent's RDD for validTime in a PythonRDD; None when the parent has no RDD for it
+  override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    parent.getOrCompute(validTime) match{
+      case Some(rdd) =>
+        val pythonRDD = new PythonRDD(rdd, command, envVars, pythonIncludes, preservePartitoning, pythonExec, broadcastVars, accumulator)
+        Some(pythonRDD.asJavaRDD.rdd)
+      case None => None
+    }
+  }
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+
+  /**
+   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
+   * operator, so this PythonDStream will be registered as an output stream and there materialized.
+   * Since serialized Python object is readable by Python, pyprint writes out binary data to
+   * temporary file and run python script to deserialized and print the first ten elements
+   */
+  private[streaming] def ppyprint() {
+    def foreachFunc = (rdd: RDD[Array[Byte]], time: Time) => {
+      val iter = rdd.take(11).iterator
+
+      // make a temporary file
+      val prefix = "spark"
+      val suffix = ".tmp"
+      val tempFile = File.createTempFile(prefix, suffix)
+      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
+      //write out serialized python object
+      PythonRDD.writeIteratorToStream(iter, tempFileStream)
+      tempFileStream.close()
+
+      // This value has to be passed from python
+      val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
+      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
+      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
+      //absolute path to the python script is needed to change because we do not use pysparkstreaming
+      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath)
+      val workerEnv = pb.environment()
+
+      //envVars also need to be pass
+      //workerEnv.putAll(envVars)
+      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
+      workerEnv.put("PYTHONPATH", pythonPath)
+      val worker = pb.start()
+      val is = worker.getInputStream()
+      val isr = new InputStreamReader(is)
+      val br = new BufferedReader(isr)
+
+      println ("-------------------------------------------")
+      println ("Time: " + time)
+      println ("-------------------------------------------")
+
+      // Echo the helper's stdout; always close the pipe, reap the process and drop the temp file
+      try {
+        var line = br.readLine()
+        while (line != null) {
+          println(line)
+          line = br.readLine()
+        }
+      } finally {
+        br.close()
+        worker.waitFor()
+        tempFile.delete()
+      }
+      println()
+    }
+    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
+  }
+}
+
+
+private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
+DStream[(Long, Array[Byte])](prev.ssc){
+  override def dependencies = List(prev)
+
+  override def slideDuration: Duration = prev.slideDuration
+  // Wrap prev's RDD for validTime in a PairwiseRDD; None when prev has no RDD for that time
+  override def compute(validTime:Time):Option[RDD[(Long, Array[Byte])]]={
+    prev.getOrCompute(validTime) match{
+      case Some(rdd) =>
+        val pairwiseRDD = new PairwiseRDD(rdd)
+        Some(pairwiseRDD.asJavaPairRDD.rdd)
+      case None => None
+    }
+  }
+  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]] = JavaPairDStream(this)
+}
+
+
+
+
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index 4709a62381647..ffd7f88fd9dd1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -18,11 +18,13 @@
 package org.apache.spark.streaming.dstream
 
 
-import java.io.{IOException, ObjectInputStream, ObjectOutputStream}
+import java.io._
 
 import scala.deprecated
 import scala.collection.mutable.HashMap
 import scala.reflect.ClassTag
+import java.io.{IOException, ObjectInputStream, ObjectOutputStream}
+import scala.util.control.Breaks._
 
 import org.apache.spark.{Logging, SparkException}
 import org.apache.spark.rdd.{BlockRDD, RDD}
@@ -31,6 +33,8 @@ import org.apache.spark.streaming._
 import org.apache.spark.streaming.StreamingContext._
 import org.apache.spark.streaming.scheduler.Job
 import org.apache.spark.util.MetadataCleaner
+import org.apache.spark.streaming.Duration
+import org.apache.spark.api.python.PythonRDD
 
 /**
  * A Discretized Stream (DStream), the basic abstraction in Spark Streaming, is a continuous
@@ -601,6 +605,68 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
+
+
+
+
+  /**
+   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
+   * operator, so this PythonDStream will be registered as an output stream and there materialized.
+   * Since serialized Python object is readable by Python, pyprint writes out binary data to
+   * temporary file and run python script to deserialized and print the first ten elements
+   */
+  private[streaming] def pyprint() {
+    def foreachFunc = (rdd: RDD[T], time: Time) => {
+      val iter = rdd.take(11).iterator
+
+      // make a temporary file
+      val prefix = "spark"
+      val suffix = ".tmp"
+      val tempFile = File.createTempFile(prefix, suffix)
+      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
+      //write out serialized python object
+      PythonRDD.writeIteratorToStream(iter, tempFileStream)
+      tempFileStream.close()
+
+      // This value has to be passed from python
+      val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
+      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
+      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
+      //absolute path to the python script is needed to change because we do not use pysparkstreaming
+      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath)
+      val workerEnv = pb.environment()
+
+      //envVars also need to be pass
+      //workerEnv.putAll(envVars)
+      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
+      workerEnv.put("PYTHONPATH", pythonPath)
+      val worker = pb.start()
+      val is = worker.getInputStream()
+      val isr = new InputStreamReader(is)
+      val br = new BufferedReader(isr)
+
+      println ("-------------------------------------------")
+      println ("Time: " + time)
+      println ("-------------------------------------------")
+
+      // Echo the helper's stdout; always close the pipe, reap the process and drop the temp file
+      try {
+        var line = br.readLine()
+        while (line != null) {
+          println(line)
+          line = br.readLine()
+        }
+      } finally {
+        br.close()
+        worker.waitFor()
+        tempFile.delete()
+      }
+      println()
+    }
+    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
+  }
+
+
   /**
    * Return a new DStream in which each RDD contains all the elements in seen in a
    * sliding window of time over this DStream. The new DStream generates RDDs with

From 1367be52f80ee55a1b0cb1070b8fb02cf258c0be Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Tue, 15 Jul 2014 15:41:52 -0700
Subject: [PATCH 02/69] comment PythonDStream.PairwiseDStream

---
 .../apache/spark/streaming/api/python/PythonDStream.scala   | 3 ++-
 .../scala/org/apache/spark/streaming/dstream/DStream.scala  | 6 ++----
 2 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 2d8b1e468dc4c..fe67250604d8e 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -129,7 +129,7 @@ class PythonDStream[T: ClassTag](
   }
 }
 
-
+/*
 private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
 DStream[(Long, Array[Byte])](prev.ssc){
   override def dependencies = List(prev)
@@ -146,6 +146,7 @@ DStream[(Long, Array[Byte])](prev.ssc){
   }
   val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]] = JavaPairDStream(this)
 }
+*/
 
 
 
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index b24109074e816..d9d5446b62e9f 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -620,10 +620,7 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
-
-
-
-
+//TODO move pyprint to PythonDStream
   /**
    * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
    * operator, so this PythonDStream will be registered as an output stream and there materialized.
@@ -644,6 +641,7 @@ abstract class DStream[T: ClassTag] (
       tempFileStream.close()
 
       // This value has to be passed from python
+      // Python currently does not do cluster deployment. But what happened
       val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
       val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
       //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???

From 88068cf8439991b17c244d65af3192b49968583f Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Tue, 15 Jul 2014 17:19:20 -0700
Subject: [PATCH 03/69] modify dstream.py to fix indent error

---
 python/pyspark/streaming/dstream.py                             | 2 +-
 .../org/apache/spark/streaming/api/python/PythonDStream.scala   | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index b422b147d11e1..a512517f6e437 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -172,7 +172,7 @@ def _mergeCombiners(iterator):
         return shuffled.mapPartitions(_mergeCombiners) 
 
 
-   def partitionBy(self, numPartitions, partitionFunc=None):
+    def partitionBy(self, numPartitions, partitionFunc=None):
         """
         Return a copy of the DStream partitioned using the specified partitioner.
 
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index fe67250604d8e..389136f9e21a0 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -91,7 +91,7 @@ class PythonDStream[T: ClassTag](
       tempFileStream.close()
 
       // This value has to be passed from python
-      val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
+      //val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
       val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
       //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
       //absolute path to the python script is needed to change because we do not use pysparkstreaming

From 94a07879007d6e6157b7f5b59a04284996f5623f Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Tue, 15 Jul 2014 21:08:43 -0700
Subject: [PATCH 04/69] added reducedByKey not working yet

---
 .../src/main/python/streaming/wordcount.py    | 10 ++++++-
 python/pyspark/streaming/dstream.py           | 27 +++++++++++++++++--
 .../streaming/api/python/PythonDStream.scala  |  6 ++---
 3 files changed, 37 insertions(+), 6 deletions(-)

diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
index f44cd696894ba..3996991109d60 100644
--- a/examples/src/main/python/streaming/wordcount.py
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -1,6 +1,7 @@
 import sys
 from operator import add
 
+from pyspark.conf import SparkConf
 from pyspark.streaming.context import StreamingContext
 from pyspark.streaming.duration import *
 
@@ -8,15 +9,22 @@
     if len(sys.argv) != 2:
         print >> sys.stderr, "Usage: wordcount <directory>"
         exit(-1)
-    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
+    conf = SparkConf()
+    conf.setAppName("PythonStreamingWordCount")
+    conf.set("spark.default.parallelism", 1)
+
+#    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
+    ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.textFileStream(sys.argv[1])
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
+    reduced_lines = mapped_lines.reduce(add)
     
     fm_lines.pyprint()
     filtered_lines.pyprint()
     mapped_lines.pyprint()
+    reduced_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index a512517f6e437..e144f8bc1cc09 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -29,6 +29,7 @@
 
 __all__ = ["DStream"]
 
+
 class DStream(object):
     def __init__(self, jdstream, ssc, jrdd_deserializer):
         self._jdstream = jdstream
@@ -149,7 +150,7 @@ def _combineByKey(self, createCombiner, mergeValue, mergeCombiners,
         """
         """
         if numPartitions is None:
-            numPartitions = self.ctx._defaultParallelism()
+            numPartitions = self._defaultReducePartitions()
         def combineLocally(iterator):
             combiners = {}
             for x in iterator:
@@ -211,7 +212,6 @@ def add_shuffle_key(split, iterator):
         return dstream
 
 
-
     def reduceByWindow(self, reduceFunc, windowDuration, slideDuration, inReduceTunc):
         """
         """
@@ -254,8 +254,31 @@ def wrapRDD(self, rdd):
         raise NotImplementedError
 
     def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
+        """
+
+        """
         return PipelinedDStream(self, f, preservesPartitioning)
 
+    def _defaultReducePartitions(self):
+        """
+
+        """
+        # hard code to avoid the error
+        return 2
+        if self.ctx._conf.contains("spark.default.parallelism"):
+            return self.ctx.defaultParallelism
+        else:
+            return self.getNumPartitions()
+
+    def getNumPartitions(self):
+      """
+      Return self._jdstream.partitions().size().
+
+      NOTE(review): modelled on RDD.getNumPartitions; confirm that the wrapped
+      Java DStream really exposes partitions() before relying on this.
+      """
+      return self._jdstream.partitions().size()
+
 
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 389136f9e21a0..719dd0a6a53c2 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -129,7 +129,7 @@ class PythonDStream[T: ClassTag](
   }
 }
 
-/*
+
 private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
 DStream[(Long, Array[Byte])](prev.ssc){
   override def dependencies = List(prev)
@@ -144,9 +144,9 @@ DStream[(Long, Array[Byte])](prev.ssc){
       case None => None
     }
   }
-  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]] = JavaPairDStream(this)
+  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]]  = JavaPairDStream.fromJavaDStream(this)
 }
-*/
+
 
 
 

From 69e9cd33a58b880f96cc9c3e5e62eaa415c49843 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:07:42 -0700
Subject: [PATCH 05/69] implementing transform function in Python

---
 python/pyspark/mllib/_common.py               |  2 +-
 python/pyspark/streaming/dstream.py           |  3 +-
 .../api/python/PythonTransformedDStream.scala | 37 +++++++++++++++++++
 .../spark/streaming/dstream/DStream.scala     |  3 ++
 4 files changed, 42 insertions(+), 3 deletions(-)
 create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala

diff --git a/python/pyspark/mllib/_common.py b/python/pyspark/mllib/_common.py
index e609b60a0f968..4b723693f43e3 100644
--- a/python/pyspark/mllib/_common.py
+++ b/python/pyspark/mllib/_common.py
@@ -164,7 +164,7 @@ def _deserialize_double_vector(ba, offset=0):
     nb = len(ba) - offset
     if nb < 5:
         raise TypeError("_deserialize_double_vector called on a %d-byte array, "
-                "which is too short" % nb)
+                        "which is too short" % nb)
     if ba[offset] == DENSE_VECTOR_MAGIC:
         return _deserialize_dense_vector(ba, offset)
     elif ba[offset] == SPARSE_VECTOR_MAGIC:
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index e144f8bc1cc09..3365c6d69c1a2 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -172,7 +172,6 @@ def _mergeCombiners(iterator):
             return combiners.iteritems()
         return shuffled.mapPartitions(_mergeCombiners) 
 
-
     def partitionBy(self, numPartitions, partitionFunc=None):
         """
         Return a copy of the DStream partitioned using the specified partitioner.
@@ -231,6 +230,7 @@ def slice(self, fromTime, toTime):
     def transform(self, transformFunc):
         """
         """
+        self._jdstream.transform(transformFunc)
         raise NotImplementedError
 
     def transformWith(self, other, transformFunc):
@@ -264,7 +264,6 @@ def _defaultReducePartitions(self):
 
         """
         # hard code to avoid the error
-        return 2
         if self.ctx._conf.contains("spark.default.parallelism"):
             return self.ctx.defaultParallelism
         else:
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
new file mode 100644
index 0000000000000..ff70483b771a4
--- /dev/null
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
@@ -0,0 +1,37 @@
+package org.apache.spark.streaming.api.python
+
+import org.apache.spark.Accumulator
+import org.apache.spark.api.python.PythonRDD
+import org.apache.spark.broadcast.Broadcast
+import org.apache.spark.rdd.RDD
+import org.apache.spark.streaming.api.java.JavaDStream
+import org.apache.spark.streaming.{Time, Duration}
+import org.apache.spark.streaming.dstream.DStream
+
+import scala.reflect.ClassTag
+
+/**
+ * Work in progress. NOTE(review): `parent`, JMap and JList are used below but not defined here.
+ */
+class PythonTransformedDStream[T: ClassTag](
+               parents: Seq[DStream[T]],
+               command: Array[Byte],
+               envVars: JMap[String, String],
+               pythonIncludes: JList[String],
+               preservePartitoning: Boolean,
+               pythonExec: String,
+               broadcastVars: JList[Broadcast[Array[Byte]]],
+               accumulator: Accumulator[JList[Array[Byte]]]
+               ) extends DStream[Array[Byte]](parent.ssc) {
+
+  override def dependencies = List(parent)
+
+  override def slideDuration: Duration = parent.slideDuration
+
+  // NOTE(review): gathers each parent's RDD (null where absent) but parentRDDs is not used yet
+  override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    val parentRDDs = parents.map(_.getOrCompute(validTime).orNull).toSeq
+    Some()
+  }
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+}
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index d9d5446b62e9f..67977244ef420 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -561,9 +561,12 @@ abstract class DStream[T: ClassTag] (
     // because the DStream is reachable from the outer object here, and because 
     // DStreams can't be serialized with closures, we can't proactively check 
     // it for serializability and so we pass the optional false to SparkContext.clean
+
+    // serialized python
     val cleanedF = context.sparkContext.clean(transformFunc, false)
     val realTransformFunc =  (rdds: Seq[RDD[_]], time: Time) => {
       assert(rdds.length == 1)
+      // if transformfunc is fine, it is okay
       cleanedF(rdds.head.asInstanceOf[RDD[T]], time)
     }
     new TransformedDStream[U](Seq(this), realTransformFunc)

From 72bfc66074b2f35224f116759e0a47204a138f24 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:12:53 -0700
Subject: [PATCH 06/69] modified the code base on comment in
 https://github.com/tdas/spark/pull/10

---
 core/pom.xml                         | 2 +-
 python/pyspark/streaming/__init__.py | 1 -
 python/pyspark/streaming/context.py  | 5 +----
 3 files changed, 2 insertions(+), 6 deletions(-)

diff --git a/core/pom.xml b/core/pom.xml
index a59fc9fc035d7..6abf8480d5da0 100644
--- a/core/pom.xml
+++ b/core/pom.xml
@@ -21,7 +21,7 @@
   <parent>
     <groupId>org.apache.spark</groupId>
     <artifactId>spark-parent</artifactId>
-    <version>1.0.0</version>
+    <version>1.1.0-SNAPSHOT</version>
     <relativePath>../pom.xml</relativePath>
   </parent>
 
diff --git a/python/pyspark/streaming/__init__.py b/python/pyspark/streaming/__init__.py
index 719592912e80c..e69de29bb2d1d 100644
--- a/python/pyspark/streaming/__init__.py
+++ b/python/pyspark/streaming/__init__.py
@@ -1 +0,0 @@
-__author__ = 'ktakagiw'
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index c8ae9c4af85c9..40e9d98942e2e 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -1,6 +1,3 @@
-__author__ = 'ktakagiw'
-
-
 #
 # Licensed to the Apache Software Foundation (ASF) under one or more
 # contributor license agreements.  See the NOTICE file distributed with
@@ -41,7 +38,7 @@
 
 class StreamingContext(object):
     """
-    Main entry point for Spark functionality. A StreamingContext represents the
+    Main entry point for Spark Streaming functionality. A StreamingContext represents the
     connection to a Spark cluster, and can be used to create L{RDD}s and
     broadcast variables on that cluster.
     """

From a7a0b5ce72e9bad14880f2285544d11d725f0f14 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:17:02 -0700
Subject: [PATCH 07/69] add comment for hack why PYSPARK_PYTHON is needed in
 spark-submit

---
 bin/spark-submit | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/bin/spark-submit b/bin/spark-submit
index ac275b7696d5c..fa022f707e572 100755
--- a/bin/spark-submit
+++ b/bin/spark-submit
@@ -37,6 +37,16 @@ done
 
 DEPLOY_MODE=${DEPLOY_MODE:-"client"}
 
+
+# This is a hack to make DStream.pyprint work. 
+# This will be removed after pyprint is moved to PythonDStream.
+# Problem is that print function is in (Scala)DStream. 
+# Whenever python code is executed, we call PythonDStream which passes
+# pythonExec(which python Spark should execute).
+# Since pyprint is located in DStream, Spark does not know which python should use. 
+# In that case, get python path from PYSPARK_PYTHON, environmental variable. 
+# This fix is ongoing in print branch in my repo.
+
 # Figure out which Python executable to use
 if [[ -z "$PYSPARK_PYTHON" ]]; then
   PYSPARK_PYTHON="python"

From 0a516f5a31bfb5f5d3ac58139af820ad8bb50a5a Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:19:13 -0700
Subject: [PATCH 08/69] add comment for hack why PYSPARK_PYTHON is needed in
 spark-submit

---
 bin/spark-submit | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bin/spark-submit b/bin/spark-submit
index fa022f707e572..ec4e10787cff0 100755
--- a/bin/spark-submit
+++ b/bin/spark-submit
@@ -45,7 +45,7 @@ DEPLOY_MODE=${DEPLOY_MODE:-"client"}
 # pythonExec(which python Spark should execute).
 # Since pyprint is located in DStream, Spark does not know which python should use. 
 # In that case, get python path from PYSPARK_PYTHON, environmental variable. 
-# This fix is ongoing in print branch in my repo.
+# This fix is ongoing in print branch in https://github.com/giwa/spark/tree/print.
 
 # Figure out which Python executable to use
 if [[ -z "$PYSPARK_PYTHON" ]]; then

From 57e3e52191464f6b8f8ec53a6452dcf86d4704a6 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:24:08 -0700
Subject: [PATCH 09/69] remove not implemented DStream functions in python

---
 python/pyspark/streaming/dstream.py | 102 ----------------------------
 1 file changed, 102 deletions(-)

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index a512517f6e437..6ab9c500450aa 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -54,50 +54,6 @@ def pyprint(self):
         """
         self._jdstream.pyprint()
 
-    def cache(self):
-        """
-        """
-        raise NotImplementedError
-
-    def checkpoint(self):
-        """
-        """
-        raise NotImplementedError
-
-    def compute(self, time):
-        """
-        """
-        raise NotImplementedError
-
-    def context(self):
-        """
-        """
-        raise NotImplementedError
-
-    def count(self):
-        """
-        """
-        raise NotImplementedError
-
-    def countByValue(self, numPartitions=None):
-        """
-        """
-        raise NotImplementedError
-
-    def countByValueAndWindow(self, duration, slideDuration=None):
-        """
-        """
-        raise NotImplementedError
-
-    def countByWindow(self, duration, slideDuration=None):
-        """
-        """
-        raise NotImplementedError
-
-    def dstream(self):
-        """
-        """
-        raise NotImplementedError
 
     def filter(self, f):
         """
@@ -111,16 +67,6 @@ def flatMap(self, f, preservesPartitioning=False):
         def func(s, iterator): return chain.from_iterable(imap(f, iterator))
         return self.mapPartitionsWithIndex(func, preservesPartitioning)
 
-    def foreachRDD(self, f, time):
-        """
-        """
-        raise NotImplementedError
-
-    def glom(self):
-        """
-        """
-        raise NotImplementedError
-
     def map(self, f, preservesPartitioning=False):
         """
         """
@@ -133,11 +79,6 @@ def mapPartitions(self, f):
         def func(s, iterator): return f(iterator)
         return self.mapPartitionsWithIndex(func)
 
-    def perist(self, storageLevel):
-        """
-        """
-        raise NotImplementedError
-
     def reduce(self, func, numPartitions=None):
         """
 
@@ -210,49 +151,6 @@ def add_shuffle_key(split, iterator):
         dstream._partitionFunc = partitionFunc
         return dstream
 
-
-
-    def reduceByWindow(self, reduceFunc, windowDuration, slideDuration, inReduceTunc):
-        """
-        """
-
-        raise NotImplementedError
-
-    def repartition(self, numPartitions):
-        """
-        """
-        raise NotImplementedError
-
-    def slice(self, fromTime, toTime):
-        """
-        """
-        raise NotImplementedError
-
-    def transform(self, transformFunc):
-        """
-        """
-        raise NotImplementedError
-
-    def transformWith(self, other, transformFunc):
-        """
-        """
-        raise NotImplementedError
-
-    def union(self, that):
-        """
-        """
-        raise NotImplementedError
-
-    def window(self, windowDuration, slideDuration=None):
-        """
-        """
-        raise NotImplementedError
-
-    def wrapRDD(self, rdd):
-        """
-        """
-        raise NotImplementedError
-
     def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         return PipelinedDStream(self, f, preservesPartitioning)
 

From c9d79dd381ee001eb5920ca865b5dc72f8b46a7f Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:35:59 -0700
Subject: [PATCH 10/69] revert pom.xml

---
 python/pyspark/streaming/pyprint.py | 2 +-
 streaming/pom.xml                   | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/pyspark/streaming/pyprint.py b/python/pyspark/streaming/pyprint.py
index fcdaca510812c..6e87c985a57e3 100644
--- a/python/pyspark/streaming/pyprint.py
+++ b/python/pyspark/streaming/pyprint.py
@@ -1,6 +1,6 @@
 import sys
 from itertools import chain
-from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
+from pyspark.serializers import PickleSerializer
 
 def collect(binary_file_path):
     dse = PickleSerializer()
diff --git a/streaming/pom.xml b/streaming/pom.xml
index 88df63592efee..2239ad9c8579c 100644
--- a/streaming/pom.xml
+++ b/streaming/pom.xml
@@ -21,7 +21,7 @@
   <parent>
     <groupId>org.apache.spark</groupId>
     <artifactId>spark-parent</artifactId>
-    <version>1.0.0</version>
+    <version>1.1.0-SNAPSHOT</version>
     <relativePath>../pom.xml</relativePath>
   </parent>
 

From 8f8202b5c9bfccfb42f7027e7e8079b4b5807f02 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:38:26 -0700
Subject: [PATCH 11/69] revert streaming pom.xml

---
 streaming/pom.xml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/streaming/pom.xml b/streaming/pom.xml
index 2239ad9c8579c..03102c5e836bf 100644
--- a/streaming/pom.xml
+++ b/streaming/pom.xml
@@ -76,7 +76,7 @@
            are necessary - first one for 'mvn package', second one for 'mvn compile'. Ideally,
            'mvn compile' should not compile test classes and therefore should not need this.
            However, an open Maven bug (http://jira.codehaus.org/browse/MNG-3559)
-           causes the compilation to fail if streaming test-jar is not generated. Hence, the
+           causes the compilation to fail if streaming test-jar is not generated. Hence, the 
            second execution profile for 'mvn compile'.
       -->
       <plugin>

From fa4a7fc1b0643bfbe48b24e3897d65bce3332e64 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:44:14 -0700
Subject: [PATCH 12/69] revert streaming/pom.xml

---
 streaming/pom.xml | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/streaming/pom.xml b/streaming/pom.xml
index 03102c5e836bf..f506d6ce34a6f 100644
--- a/streaming/pom.xml
+++ b/streaming/pom.xml
@@ -69,12 +69,12 @@
         <groupId>org.scalatest</groupId>
         <artifactId>scalatest-maven-plugin</artifactId>
       </plugin>
-
-      <!--
-           This plugin forces the generation of jar containing streaming test classes,
+      
+      <!-- 
+           This plugin forces the generation of jar containing streaming test classes, 
            so that the tests classes of external modules can use them. The two execution profiles
-           are necessary - first one for 'mvn package', second one for 'mvn compile'. Ideally,
-           'mvn compile' should not compile test classes and therefore should not need this.
+           are necessary - first one for 'mvn package', second one for 'mvn compile'. Ideally, 
+           'mvn compile' should not compile test classes and therefore should not need this. 
            However, an open Maven bug (http://jira.codehaus.org/browse/MNG-3559)
            causes the compilation to fail if streaming test-jar is not generated. Hence, the 
            second execution profile for 'mvn compile'.

From 6e0a64adc334cb8d158e827fa4a0b4e816903460 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 12:15:06 -0700
Subject: [PATCH 13/69] sorted the import following Spark coding convention

---
 .../streaming/api/python/PythonDStream.scala  | 120 ++----------------
 1 file changed, 13 insertions(+), 107 deletions(-)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 389136f9e21a0..9d4eebaadc4c7 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -19,42 +19,28 @@ package org.apache.spark.streaming.api.python
 
 import java.util.{List => JList, ArrayList => JArrayList, Map => JMap, Collections}
 
-import org.apache.spark.api.java.{JavaSparkContext, JavaPairRDD, JavaRDD}
-import org.apache.spark.broadcast.Broadcast
+import scala.reflect.ClassTag
+
 import org.apache.spark._
-import org.apache.spark.util.Utils
-import java.io._
-import scala.Some
-import org.apache.spark.streaming.Duration
-import scala.util.control.Breaks._
-import org.apache.spark.broadcast.Broadcast
-import scala.Some
-import org.apache.spark.streaming.Duration
 import org.apache.spark.rdd.RDD
-import org.apache.spark.api.python.PythonRDD
-
-
+import org.apache.spark.api.python._
+import org.apache.spark.broadcast.Broadcast
 import org.apache.spark.streaming.{Duration, Time}
 import org.apache.spark.streaming.dstream._
 import org.apache.spark.streaming.api.java._
-import org.apache.spark.rdd.RDD
-import org.apache.spark.api.python._
-import org.apache.spark.api.python.PairwiseRDD
-
 
-import scala.reflect.ClassTag
 
 
 class PythonDStream[T: ClassTag](
-                                  parent: DStream[T],
-                                  command: Array[Byte],
-                                  envVars: JMap[String, String],
-                                  pythonIncludes: JList[String],
-                                  preservePartitoning: Boolean,
-                                  pythonExec: String,
-                                  broadcastVars: JList[Broadcast[Array[Byte]]],
-                                  accumulator: Accumulator[JList[Array[Byte]]]
-                                  ) extends DStream[Array[Byte]](parent.ssc) {
+    parent: DStream[T],
+    command: Array[Byte],
+    envVars: JMap[String, String],
+    pythonIncludes: JList[String],
+    preservePartitoning: Boolean,
+    pythonExec: String,
+    broadcastVars: JList[Broadcast[Array[Byte]]],
+    accumulator: Accumulator[JList[Array[Byte]]])
+  extends DStream[Array[Byte]](parent.ssc) {
 
   override def dependencies = List(parent)
 
@@ -70,84 +56,4 @@ class PythonDStream[T: ClassTag](
     }
   }
   val asJavaDStream  = JavaDStream.fromDStream(this)
-
-  /**
-   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
-   * operator, so this PythonDStream will be registered as an output stream and there materialized.
-   * Since serialized Python object is readable by Python, pyprint writes out binary data to
-   * temporary file and run python script to deserialized and print the first ten elements
-   */
-  private[streaming] def ppyprint() {
-    def foreachFunc = (rdd: RDD[Array[Byte]], time: Time) => {
-      val iter = rdd.take(11).iterator
-
-      // make a temporary file
-      val prefix = "spark"
-      val suffix = ".tmp"
-      val tempFile = File.createTempFile(prefix, suffix)
-      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
-      //write out serialized python object
-      PythonRDD.writeIteratorToStream(iter, tempFileStream)
-      tempFileStream.close()
-
-      // This value has to be passed from python
-      //val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
-      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
-      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
-      //absolute path to the python script is needed to change because we do not use pysparkstreaming
-      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pysparkstreaming/streaming/pyprint.py", tempFile.getAbsolutePath)
-      val workerEnv = pb.environment()
-
-      //envVars also need to be pass
-      //workerEnv.putAll(envVars)
-      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
-      workerEnv.put("PYTHONPATH", pythonPath)
-      val worker = pb.start()
-      val is = worker.getInputStream()
-      val isr = new InputStreamReader(is)
-      val br = new BufferedReader(isr)
-
-      println ("-------------------------------------------")
-      println ("Time: " + time)
-      println ("-------------------------------------------")
-
-      //print value from python std out
-      var line = ""
-      breakable {
-        while (true) {
-          line = br.readLine()
-          if (line == null) break()
-          println(line)
-        }
-      }
-      //delete temporary file
-      tempFile.delete()
-      println()
-
-    }
-    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
-  }
-}
-
-/*
-private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
-DStream[(Long, Array[Byte])](prev.ssc){
-  override def dependencies = List(prev)
-
-  override def slideDuration: Duration = prev.slideDuration
-
-  override def compute(validTime:Time):Option[RDD[(Long, Array[Byte])]]={
-    prev.getOrCompute(validTime) match{
-      case Some(rdd)=>Some(rdd)
-        val pairwiseRDD = new PairwiseRDD(rdd)
-        Some(pairwiseRDD.asJavaPairRDD.rdd)
-      case None => None
-    }
-  }
-  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]] = JavaPairDStream(this)
 }
-*/
-
-
-
-

From 25d30d531d8eefc477bd2540ad5f7a22d2b89010 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 12:19:42 -0700
Subject: [PATCH 14/69] add empty line

---
 .../org/apache/spark/streaming/api/python/PythonDStream.scala    | 1 +
 1 file changed, 1 insertion(+)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 9d4eebaadc4c7..4c98f1c993317 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -55,5 +55,6 @@ class PythonDStream[T: ClassTag](
       case None => None
     }
   }
+  
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }

From 6d012f7f96e2355d035e12d1310c68de32ed329c Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 15:40:42 -0700
Subject: [PATCH 15/69] remove unused import in python

---
 python/pyspark/streaming/context.py           |  9 ------
 python/pyspark/streaming/dstream.py           | 30 +++----------------
 python/pyspark/streaming/duration.py          | 17 ++++++++++-
 python/pyspark/streaming/jtime.py             | 24 ++++++++++++++-
 python/pyspark/streaming/pyprint.py           | 19 ++++++++++++
 .../streaming/api/python/PythonDStream.scala  |  2 +-
 6 files changed, 63 insertions(+), 38 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 40e9d98942e2e..d3ff16fca764f 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -15,15 +15,6 @@
 # limitations under the License.
 #
 
-import os
-import shutil
-import sys
-from threading import Lock
-from tempfile import NamedTemporaryFile
-
-from pyspark import accumulators
-from pyspark.accumulators import Accumulator
-from pyspark.broadcast import Broadcast
 from pyspark.conf import SparkConf
 from pyspark.files import SparkFiles
 from pyspark.java_gateway import launch_gateway
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 6ab9c500450aa..cd28184274c9a 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -1,28 +1,8 @@
-from base64 import standard_b64encode as b64enc
-import copy
 from collections import defaultdict
-from collections import namedtuple
 from itertools import chain, ifilter, imap
-import operator
-import os
-import sys
-import shlex
-import traceback
-from subprocess import Popen, PIPE
-from tempfile import NamedTemporaryFile
-from threading import Thread
-import warnings
-import heapq
-from random import Random
-
-from pyspark.serializers import NoOpSerializer, CartesianDeserializer, \
-    BatchedSerializer, CloudPickleSerializer, PairDeserializer, pack_long
-from pyspark.join import python_join, python_left_outer_join, \
-    python_right_outer_join, python_cogroup
-from pyspark.statcounter import StatCounter
-from pyspark.rddsampler import RDDSampler
-from pyspark.storagelevel import StorageLevel
-#from pyspark.resultiterable import ResultIterable
+
+from pyspark.serializers import NoOpSerializer,\
+    BatchedSerializer, CloudPickleSerializer, pack_long
 from pyspark.rdd import _JavaStackTrace
 
 from py4j.java_collections import ListConverter, MapConverter
@@ -46,7 +26,7 @@ def generatedRDDs(self):
     def print_(self):
         """
         """
-        # print is a resrved name of Python. We cannot give print to function name
+        # print is a reserved name of Python. We cannot give print to function name
         getattr(self._jdstream, "print")()
 
     def pyprint(self):
@@ -54,7 +34,6 @@ def pyprint(self):
         """
         self._jdstream.pyprint()
 
-
     def filter(self, f):
         """
         """
@@ -140,7 +119,6 @@ def add_shuffle_key(split, iterator):
         keyed._bypass_serializer = True
         with _JavaStackTrace(self.ctx) as st:
             #JavaDStream
-            #pairRDD = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairRDD()
             pairDStream = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairDStream()
             partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
                                                           id(partitionFunc))
diff --git a/python/pyspark/streaming/duration.py b/python/pyspark/streaming/duration.py
index ef1b4f6cef237..5982146e69026 100644
--- a/python/pyspark/streaming/duration.py
+++ b/python/pyspark/streaming/duration.py
@@ -1,4 +1,19 @@
-__author__ = 'ktakagiw'
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
 
 from pyspark.streaming import utils
 
diff --git a/python/pyspark/streaming/jtime.py b/python/pyspark/streaming/jtime.py
index 41670af659ea3..32ef741051283 100644
--- a/python/pyspark/streaming/jtime.py
+++ b/python/pyspark/streaming/jtime.py
@@ -1,8 +1,30 @@
-__author__ = 'ktakagiw'
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
 
 from pyspark.streaming import utils
 from pyspark.streaming.duration import Duration
 
+"""
+The name of this file, time is not good naming for python
+because if we do import time when we want to use native python time package, it does
+not import python time package.
+"""
+
+
 class Time(object):
     """
     Time for Spark Streaming application. Used to set Time
diff --git a/python/pyspark/streaming/pyprint.py b/python/pyspark/streaming/pyprint.py
index 6e87c985a57e3..1aeb8e50375ed 100644
--- a/python/pyspark/streaming/pyprint.py
+++ b/python/pyspark/streaming/pyprint.py
@@ -1,5 +1,24 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+
 import sys
 from itertools import chain
+
 from pyspark.serializers import PickleSerializer
 
 def collect(binary_file_path):
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 4c98f1c993317..76b88385e095a 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -55,6 +55,6 @@ class PythonDStream[T: ClassTag](
       case None => None
     }
   }
-  
+
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }

From 1e84f41b30404b46e0afc1c905a6dcfd523bca78 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 16:23:08 -0700
Subject: [PATCH 16/69] initial commit for socketTextStream

---
 .../python/streaming/nerwork_wordcount.py     | 22 +++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 examples/src/main/python/streaming/nerwork_wordcount.py

diff --git a/examples/src/main/python/streaming/nerwork_wordcount.py b/examples/src/main/python/streaming/nerwork_wordcount.py
new file mode 100644
index 0000000000000..2e5048ccad213
--- /dev/null
+++ b/examples/src/main/python/streaming/nerwork_wordcount.py
@@ -0,0 +1,22 @@
+import sys
+from operator import add
+
+from pyspark.streaming.context import StreamingContext
+from pyspark.streaming.duration import *
+
+if __name__ == "__main__":
+    if len(sys.argv) != 3:
+        print >> sys.stderr, "Usage: wordcount <hostname> <port>"
+        exit(-1)
+    ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
+
+    lines = ssc.socketTextStream(sys.argv[1], sys.argv[2])
+    fm_lines = lines.flatMap(lambda x: x.split(" "))
+    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
+    mapped_lines = fm_lines.map(lambda x: (x, 1))
+    
+    fm_lines.pyprint()
+    filtered_lines.pyprint()
+    mapped_lines.pyprint()
+    ssc.start()
+    ssc.awaitTermination()

From a61fa9e0a590c5e30f650fc24df81deed4e09d78 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 16:27:28 -0700
Subject: [PATCH 17/69] fixed input of socketTextStream

---
 .../python/streaming/nerwork_wordcount.py     |  2 +-
 python/pyspark/java_gateway.py                |  1 +
 python/pyspark/streaming/context.py           | 25 +++----------------
 3 files changed, 6 insertions(+), 22 deletions(-)

diff --git a/examples/src/main/python/streaming/nerwork_wordcount.py b/examples/src/main/python/streaming/nerwork_wordcount.py
index 2e5048ccad213..67dc28f7bf7f0 100644
--- a/examples/src/main/python/streaming/nerwork_wordcount.py
+++ b/examples/src/main/python/streaming/nerwork_wordcount.py
@@ -10,7 +10,7 @@
         exit(-1)
     ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
 
-    lines = ssc.socketTextStream(sys.argv[1], sys.argv[2])
+    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index 7038c6422be47..cea7d0975e5d1 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -85,6 +85,7 @@ def run(self):
     java_import(gateway.jvm, "org.apache.spark.streaming.*")
     java_import(gateway.jvm, "org.apache.spark.streaming.api.java.*")
     java_import(gateway.jvm, "org.apache.spark.streaming.api.python.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.dstream.*")
     java_import(gateway.jvm, "org.apache.spark.mllib.api.python.*")
     java_import(gateway.jvm, "org.apache.spark.sql.SQLContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.HiveContext")
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index d3ff16fca764f..5dcc9ba35a653 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -19,7 +19,7 @@
 from pyspark.files import SparkFiles
 from pyspark.java_gateway import launch_gateway
 from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
-from pyspark.storagelevel import StorageLevel
+from pyspark.storagelevel import *
 from pyspark.rdd import RDD
 from pyspark.context import SparkContext
 
@@ -83,26 +83,9 @@ def awaitTermination(self, timeout=None):
         else:
             self._jssc.awaitTermination()
 
-    def checkpoint(self, directory):
-        raise NotImplementedError
-
-    def fileStream(self, directory, filter=None, newFilesOnly=None):
-        raise NotImplementedError
-
-    def networkStream(self, receiver):
-        raise NotImplementedError
-
-    def queueStream(self, queue, oneAtATime=True, defaultRDD=None):
-        raise NotImplementedError
-
-    def rawSocketStream(self, hostname, port, storagelevel):
-        raise NotImplementedError
-
-    def remember(self, duration):
-        raise NotImplementedError
-
-    def socketStream(hostname, port, converter,storageLevel):
-        raise NotImplementedError
+    # start from simple one. storageLevel is not passed for now.
+    def socketTextStream(self, hostname, port):
+        return DStream(self._jssc.socketTextStream(hostname, port), self, UTF8Deserializer())
 
     def start(self):
         self._jssc.start()

From a8c9fd5120204a96ae47520ec734212fb23a3af9 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 16:27:28 -0700
Subject: [PATCH 18/69] fixed for socketTextStream

---
 .../python/streaming/nerwork_wordcount.py     |  2 +-
 python/pyspark/java_gateway.py                |  1 +
 python/pyspark/streaming/context.py           | 25 +++----------------
 3 files changed, 6 insertions(+), 22 deletions(-)

diff --git a/examples/src/main/python/streaming/nerwork_wordcount.py b/examples/src/main/python/streaming/nerwork_wordcount.py
index 2e5048ccad213..67dc28f7bf7f0 100644
--- a/examples/src/main/python/streaming/nerwork_wordcount.py
+++ b/examples/src/main/python/streaming/nerwork_wordcount.py
@@ -10,7 +10,7 @@
         exit(-1)
     ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
 
-    lines = ssc.socketTextStream(sys.argv[1], sys.argv[2])
+    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index 7038c6422be47..cea7d0975e5d1 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -85,6 +85,7 @@ def run(self):
     java_import(gateway.jvm, "org.apache.spark.streaming.*")
     java_import(gateway.jvm, "org.apache.spark.streaming.api.java.*")
     java_import(gateway.jvm, "org.apache.spark.streaming.api.python.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.dstream.*")
     java_import(gateway.jvm, "org.apache.spark.mllib.api.python.*")
     java_import(gateway.jvm, "org.apache.spark.sql.SQLContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.HiveContext")
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index d3ff16fca764f..5dcc9ba35a653 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -19,7 +19,7 @@
 from pyspark.files import SparkFiles
 from pyspark.java_gateway import launch_gateway
 from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
-from pyspark.storagelevel import StorageLevel
+from pyspark.storagelevel import *
 from pyspark.rdd import RDD
 from pyspark.context import SparkContext
 
@@ -83,26 +83,9 @@ def awaitTermination(self, timeout=None):
         else:
             self._jssc.awaitTermination()
 
-    def checkpoint(self, directory):
-        raise NotImplementedError
-
-    def fileStream(self, directory, filter=None, newFilesOnly=None):
-        raise NotImplementedError
-
-    def networkStream(self, receiver):
-        raise NotImplementedError
-
-    def queueStream(self, queue, oneAtATime=True, defaultRDD=None):
-        raise NotImplementedError
-
-    def rawSocketStream(self, hostname, port, storagelevel):
-        raise NotImplementedError
-
-    def remember(self, duration):
-        raise NotImplementedError
-
-    def socketStream(hostname, port, converter,storageLevel):
-        raise NotImplementedError
+    # start from simple one. storageLevel is not passed for now.
+    def socketTextStream(self, hostname, port):
+        return DStream(self._jssc.socketTextStream(hostname, port), self, UTF8Deserializer())
 
     def start(self):
         self._jssc.start()

From ce7d426ffb4f8c8bcc384fa96d733b18aef4a6f5 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Wed, 16 Jul 2014 23:29:37 -0700
Subject: [PATCH 19/69] added doctest for pyspark.streaming.duration

---
 python/pyspark/streaming/duration.py | 242 +++++++++++++++++++++++----
 python/pyspark/streaming/utils.py    |  20 ++-
 python/run-tests                     |   1 +
 3 files changed, 233 insertions(+), 30 deletions(-)

diff --git a/python/pyspark/streaming/duration.py b/python/pyspark/streaming/duration.py
index 5982146e69026..06a169e5215ac 100644
--- a/python/pyspark/streaming/duration.py
+++ b/python/pyspark/streaming/duration.py
@@ -42,29 +42,80 @@ def __init__(self, millis, _jvm=None):
         self._jduration = _jvm.Duration(millis)
 
     def toString(self):
-        """ Return duration as string """
+        """
+        Return duration as string
+
+        >>> d_10 = Duration(10)
+        >>> d_10.toString()
+        '10 ms'
+        """
         return str(self._millis) + " ms"
 
     def isZero(self):
-        """ Check if millis is zero """
+        """
+        Check if millis is zero
+
+        >>> d_10 = Duration(10)
+        >>> d_10.isZero()
+        False
+        >>> d_0 = Duration(0)
+        >>> d_0.isZero()
+        True
+        """
         return self._millis == 0
 
     def prettyPrint(self):
         """
         Return a human-readable string representing a duration
+
+        >>> d_10 = Duration(10)
+        >>> d_10.prettyPrint()
+        '10 ms'
+        >>> d_1sec = Duration(1000)
+        >>> d_1sec.prettyPrint()
+        '1.0 s'
+        >>> d_1min = Duration(60 * 1000)
+        >>> d_1min.prettyPrint()
+        '1.0 m'
+        >>> d_1hour = Duration(60 * 60 * 1000)
+        >>> d_1hour.prettyPrint()
+        '1.00 h'
         """
         return utils.msDurationToString(self._millis)
 
     def milliseconds(self):
-        """ Return millisecond """
+        """
+        Return millisecond
+
+        >>> d_10 = Duration(10)
+        >>> d_10.milliseconds()
+        10
+
+        """
         return self._millis
 
     def toFormattedString(self):
-        """ Return millisecond """
+        """
+        Return millisecond
+
+        >>> d_10 = Duration(10)
+        >>> d_10.toFormattedString()
+        '10'
+
+        """
         return str(self._millis)
 
     def max(self, other):
-        """ Return higher Duration """
+        """
+        Return higher Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_100 = Duration(100)
+        >>> d_max = d_10.max(d_100)
+        >>> print d_max
+        100 ms
+
+        """
         Duration._is_duration(other)
         if self > other:
             return self
@@ -72,7 +123,16 @@ def max(self, other):
             return other
 
     def min(self, other):
-        """ Return lower Durattion """
+        """
+        Return lower Durattion
+
+        >>> d_10 = Duration(10)
+        >>> d_100 = Duration(100)
+        >>> d_min = d_10.min(d_100)
+        >>> print d_min
+        10 ms
+
+        """
         Duration._is_duration(other)
         if self < other:
             return self
@@ -80,20 +140,52 @@ def min(self, other):
             return other
 
     def __str__(self):
+        """
+        >>> d_10 = Duration(10)
+        >>> str(d_10)
+        '10 ms'
+
+        """
         return self.toString()
 
     def __add__(self, other):
-        """ Add Duration and Duration """
+        """
+        Add Duration and Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_100 = Duration(100)
+        >>> d_110 = d_10 + d_100
+        >>> print d_110
+        110 ms
+        """
         Duration._is_duration(other)
         return Duration(self._millis + other._millis)
 
     def __sub__(self, other):
-        """ Subtract Duration by Duration  """
+        """
+        Subtract Duration by Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_100 = Duration(100)
+        >>> d_90 =  d_100 - d_10
+        >>> print d_90
+        90 ms
+
+        """
         Duration._is_duration(other)
         return Duration(self._millis - other._millis)
 
     def __mul__(self, other):
-        """ Multiple Duration by Duration """
+        """
+        Multiple Duration by Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_100 = Duration(100)
+        >>> d_1000 = d_10 * d_100
+        >>> print d_1000
+        1000 ms
+
+        """
         Duration._is_duration(other)
         return Duration(self._millis * other._millis)
 
@@ -101,6 +193,13 @@ def __div__(self, other):
         """
         Divide Duration by Duration
         for Python 2.X
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_2 = d_20 / d_10
+        >>> print d_2
+        2 ms
+
         """
         Duration._is_duration(other)
         return Duration(self._millis / other._millis)
@@ -109,46 +208,121 @@ def __truediv__(self, other):
         """
         Divide Duration by Duration
         for Python 3.0
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_2 = d_20 / d_10
+        >>> print d_2
+        2 ms
+
         """
         Duration._is_duration(other)
         return Duration(self._millis / other._millis)
 
     def __floordiv__(self, other):
-        """ Divide Duration by Duration """
+        """
+        Divide Duration by Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_3 = Duration(3)
+        >>> d_3 = d_10 // d_3
+        >>> print d_3
+        3 ms
+
+        """
         Duration._is_duration(other)
         return Duration(self._millis // other._millis)
 
-    def __len__(self):
-        """ Length of miilisecond in Duration """
-        return len(self._millis)
-
     def __lt__(self, other):
-        """ Duration < Duration """
+        """
+        Duration < Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 < d_20
+        True
+        >>> d_20 < d_10
+        False
+
+        """
         Duration._is_duration(other)
         return self._millis < other._millis
 
     def __le__(self, other):
-        """ Duration <= Duration """
+        """
+        Duration <= Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 <= d_20
+        True
+        >>> d_20 <= d_10
+        False
+
+        """
         Duration._is_duration(other)
-        return self.millis <= other._millis
+        return self._millis <= other._millis
 
     def __eq__(self, other):
-        """ Duration ==  Duration """
+        """
+        Duration ==  Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 == d_20
+        False
+        >>> other_d_10 = Duration(10)
+        >>> d_10 == other_d_10
+        True
+
+        """
         Duration._is_duration(other)
         return self._millis == other._millis
 
     def __ne__(self, other):
-        """ Duration != Duration """
+        """
+        Duration != Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 != d_20
+        True
+        >>> other_d_10 = Duration(10)
+        >>> d_10 != other_d_10
+        False
+
+        """
         Duration._is_duration(other)
         return self._millis != other._millis
 
     def __gt__(self, other):
-        """ Duration > Duration """
+        """
+        Duration > Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 > d_20
+        False
+        >>> d_20 > d_10
+        True
+
+        """
         Duration._is_duration(other)
         return self._millis > other._millis
 
     def __ge__(self, other):
-        """ Duration >= Duration """
+        """
+        Duration >= Duration
+
+        >>> d_10 = Duration(10)
+        >>> d_20 = Duration(20)
+        >>> d_10 < d_20
+        True
+        >>> d_20 < d_10
+        False
+
+
+        """
         Duration._is_duration(other)
         return self._millis >= other._millis
 
@@ -162,6 +336,12 @@ def Milliseconds(milliseconds):
     """
     Helper function that creates instance of [[pysparkstreaming.duration]] representing
     a given number of milliseconds.
+
+    >>> milliseconds = Milliseconds(1)
+    >>> d_1 = Duration(1)
+    >>> milliseconds == d_1
+    True
+
     """
     return Duration(milliseconds)
 
@@ -169,18 +349,24 @@ def Seconds(seconds):
     """
     Helper function that creates instance of [[pysparkstreaming.duration]] representing
     a given number of seconds.
+
+    >>> seconds = Seconds(1)
+    >>> d_1sec = Duration(1000)
+    >>> seconds == d_1sec
+    True
+
     """
     return Duration(seconds * 1000)
 
-def Minites(minites):
+def Minutes(minutes):
     """
     Helper function that creates instance of [[pysparkstreaming.duration]] representing
     a given number of minutes.
-    """
-    return Duration(minutes * 60000)
 
-if __name__ == "__main__":
-    d = Duration(1)
-    print d
-    print d.milliseconds()
+    >>> minutes = Minutes(1)
+    >>> d_1min = Duration(60 * 1000)
+    >>> minutes == d_1min
+    True
 
+    """
+    return Duration(minutes * 60 * 1000)
diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
index 71aa3376c6578..b1fa1e227b0a1 100644
--- a/python/pyspark/streaming/utils.py
+++ b/python/pyspark/streaming/utils.py
@@ -1,4 +1,20 @@
-__author__ = 'ktakagiw'
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
 
 def msDurationToString(ms):
     """
@@ -12,7 +28,7 @@ def msDurationToString(ms):
         return "%d ms" % ms
     elif ms < minute:
         return "%.1f s" % (float(ms) / second)
-    elif ms < hout:
+    elif ms < hour:
         return "%.1f m" % (float(ms) / minute)
     else:
         return "%.2f h" % (float(ms) / hour)
diff --git a/python/run-tests b/python/run-tests
index 9282aa47e8375..0d977770fc160 100755
--- a/python/run-tests
+++ b/python/run-tests
@@ -60,6 +60,7 @@ export PYSPARK_DOC_TEST=1
 run_test "pyspark/broadcast.py"
 run_test "pyspark/accumulators.py"
 run_test "pyspark/serializers.py"
+run_test "pyspark/streaming/duration.py"
 unset PYSPARK_DOC_TEST
 run_test "pyspark/tests.py"
 run_test "pyspark/mllib/_common.py"

From e604fcba9cbe97ee981d8ec14fd8d9207aaaa275 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Wed, 16 Jul 2014 23:36:33 -0700
Subject: [PATCH 20/69] fixed typo in file name of network_wordcount.py

---
 .../python/streaming/network_wordcount.py     | 22 +++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 examples/src/main/python/streaming/network_wordcount.py

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
new file mode 100644
index 0000000000000..67dc28f7bf7f0
--- /dev/null
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -0,0 +1,22 @@
+import sys
+from operator import add
+
+from pyspark.streaming.context import StreamingContext
+from pyspark.streaming.duration import *
+
+if __name__ == "__main__":
+    if len(sys.argv) != 3:
+        print >> sys.stderr, "Usage: wordcount <hostname> <port>"
+        exit(-1)
+    ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
+
+    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
+    fm_lines = lines.flatMap(lambda x: x.split(" "))
+    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
+    mapped_lines = fm_lines.map(lambda x: (x, 1))
+    
+    fm_lines.pyprint()
+    filtered_lines.pyprint()
+    mapped_lines.pyprint()
+    ssc.start()
+    ssc.awaitTermination()

From 57209798d09cd72c4c6a9f28f63e7f7fbc89c68e Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Wed, 16 Jul 2014 23:39:25 -0700
Subject: [PATCH 21/69] delete old file

---
 .../python/streaming/nerwork_wordcount.py     | 22 -------------------
 1 file changed, 22 deletions(-)
 delete mode 100644 examples/src/main/python/streaming/nerwork_wordcount.py

diff --git a/examples/src/main/python/streaming/nerwork_wordcount.py b/examples/src/main/python/streaming/nerwork_wordcount.py
deleted file mode 100644
index 67dc28f7bf7f0..0000000000000
--- a/examples/src/main/python/streaming/nerwork_wordcount.py
+++ /dev/null
@@ -1,22 +0,0 @@
-import sys
-from operator import add
-
-from pyspark.streaming.context import StreamingContext
-from pyspark.streaming.duration import *
-
-if __name__ == "__main__":
-    if len(sys.argv) != 3:
-        print >> sys.stderr, "Usage: wordcount <hostname> <port>"
-        exit(-1)
-    ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
-
-    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
-    fm_lines = lines.flatMap(lambda x: x.split(" "))
-    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
-    mapped_lines = fm_lines.map(lambda x: (x, 1))
-    
-    fm_lines.pyprint()
-    filtered_lines.pyprint()
-    mapped_lines.pyprint()
-    ssc.start()
-    ssc.awaitTermination()

From 571d52d935565e88fc05d564d45aeb7020134b86 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Tue, 15 Jul 2014 21:08:43 -0700
Subject: [PATCH 22/69] added reduceByKey (not working yet)

---
 .../src/main/python/streaming/wordcount.py    | 10 ++-
 python/pyspark/streaming/dstream.py           | 26 +++++-
 .../streaming/api/python/PythonDStream.scala  | 85 +++++++++++++++++++
 3 files changed, 119 insertions(+), 2 deletions(-)

diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
index f44cd696894ba..3996991109d60 100644
--- a/examples/src/main/python/streaming/wordcount.py
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -1,6 +1,7 @@
 import sys
 from operator import add
 
+from pyspark.conf import SparkConf
 from pyspark.streaming.context import StreamingContext
 from pyspark.streaming.duration import *
 
@@ -8,15 +9,22 @@
     if len(sys.argv) != 2:
         print >> sys.stderr, "Usage: wordcount <directory>"
         exit(-1)
-    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
+    conf = SparkConf()
+    conf.setAppName("PythonStreamingWordCount")
+    conf.set("spark.default.parallelism", 1)
+
+#    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
+    ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.textFileStream(sys.argv[1])
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
+    reduced_lines = mapped_lines.reduce(add)
     
     fm_lines.pyprint()
     filtered_lines.pyprint()
     mapped_lines.pyprint()
+    reduced_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index cd28184274c9a..f0a3342876e4c 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -9,6 +9,7 @@
 
 __all__ = ["DStream"]
 
+
 class DStream(object):
     def __init__(self, jdstream, ssc, jrdd_deserializer):
         self._jdstream = jdstream
@@ -69,7 +70,7 @@ def _combineByKey(self, createCombiner, mergeValue, mergeCombiners,
         """
         """
         if numPartitions is None:
-            numPartitions = self.ctx._defaultParallelism()
+            numPartitions = self._defaultReducePartitions()
         def combineLocally(iterator):
             combiners = {}
             for x in iterator:
@@ -130,8 +131,31 @@ def add_shuffle_key(split, iterator):
         return dstream
 
     def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
+        """
+
+        """
         return PipelinedDStream(self, f, preservesPartitioning)
 
+    def _defaultReducePartitions(self):
+        """
+
+        """
+        # hard code to avoid the error
+        return 2
+        if self.ctx._conf.contains("spark.default.parallelism"):
+            return self.ctx.defaultParallelism
+        else:
+            return self.getNumPartitions()
+
+    def getNumPartitions(self):
+      """
+      Returns the number of partitions in RDD
+      >>> rdd = sc.parallelize([1, 2, 3, 4], 2)
+      >>> rdd.getNumPartitions()
+      2
+      """
+      return self._jdstream.partitions().size()
+
 
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 76b88385e095a..83e4eaa8b5e4e 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -55,6 +55,91 @@ class PythonDStream[T: ClassTag](
       case None => None
     }
   }
+<<<<<<< HEAD
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
+=======
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+
+  /**
+   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
+   * operator, so this PythonDStream will be registered as an output stream and there materialized.
+   * Since serialized Python object is readable by Python, pyprint writes out binary data to
+   * temporary file and run python script to deserialized and print the first ten elements
+   */
+  private[streaming] def ppyprint() {
+    def foreachFunc = (rdd: RDD[Array[Byte]], time: Time) => {
+      val iter = rdd.take(11).iterator
+
+      // make a temporary file
+      val prefix = "spark"
+      val suffix = ".tmp"
+      val tempFile = File.createTempFile(prefix, suffix)
+      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
+      //write out serialized python object
+      PythonRDD.writeIteratorToStream(iter, tempFileStream)
+      tempFileStream.close()
+
+      // This value has to be passed from python
+      //val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
+      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
+      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
+      //absolute path to the python script is needed to change because we do not use pysparkstreaming
+      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pysparkstreaming/streaming/pyprint.py", tempFile.getAbsolutePath)
+      val workerEnv = pb.environment()
+
+      //envVars also need to be pass
+      //workerEnv.putAll(envVars)
+      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
+      workerEnv.put("PYTHONPATH", pythonPath)
+      val worker = pb.start()
+      val is = worker.getInputStream()
+      val isr = new InputStreamReader(is)
+      val br = new BufferedReader(isr)
+
+      println ("-------------------------------------------")
+      println ("Time: " + time)
+      println ("-------------------------------------------")
+
+      //print value from python std out
+      var line = ""
+      breakable {
+        while (true) {
+          line = br.readLine()
+          if (line == null) break()
+          println(line)
+        }
+      }
+      //delete temporary file
+      tempFile.delete()
+      println()
+
+    }
+    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
+  }
+}
+
+
+private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
+DStream[(Long, Array[Byte])](prev.ssc){
+  override def dependencies = List(prev)
+
+  override def slideDuration: Duration = prev.slideDuration
+
+  override def compute(validTime:Time):Option[RDD[(Long, Array[Byte])]]={
+    prev.getOrCompute(validTime) match{
+      case Some(rdd)=>Some(rdd)
+        val pairwiseRDD = new PairwiseRDD(rdd)
+        Some(pairwiseRDD.asJavaPairRDD.rdd)
+      case None => None
+    }
+  }
+  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]]  = JavaPairDStream.fromJavaDStream(this)
+}
+
+
+
+
+
+>>>>>>> added reducedByKey not working yet

From 3b6d7b01c3cd4d0ad9ac0ffde0032805b64560be Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Wed, 16 Jul 2014 11:07:42 -0700
Subject: [PATCH 23/69] implementing transform function in Python

---
 python/pyspark/mllib/_common.py               |  2 +-
 python/pyspark/streaming/dstream.py           |  2 -
 .../api/python/PythonTransformedDStream.scala | 37 +++++++++++++++++++
 .../spark/streaming/dstream/DStream.scala     |  3 ++
 4 files changed, 41 insertions(+), 3 deletions(-)
 create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala

diff --git a/python/pyspark/mllib/_common.py b/python/pyspark/mllib/_common.py
index e609b60a0f968..4b723693f43e3 100644
--- a/python/pyspark/mllib/_common.py
+++ b/python/pyspark/mllib/_common.py
@@ -164,7 +164,7 @@ def _deserialize_double_vector(ba, offset=0):
     nb = len(ba) - offset
     if nb < 5:
         raise TypeError("_deserialize_double_vector called on a %d-byte array, "
-                "which is too short" % nb)
+                        "which is too short" % nb)
     if ba[offset] == DENSE_VECTOR_MAGIC:
         return _deserialize_dense_vector(ba, offset)
     elif ba[offset] == SPARSE_VECTOR_MAGIC:
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index f0a3342876e4c..5766cca39bdee 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -92,7 +92,6 @@ def _mergeCombiners(iterator):
             return combiners.iteritems()
         return shuffled.mapPartitions(_mergeCombiners) 
 
-
     def partitionBy(self, numPartitions, partitionFunc=None):
         """
         Return a copy of the DStream partitioned using the specified partitioner.
@@ -141,7 +140,6 @@ def _defaultReducePartitions(self):
 
         """
         # hard code to avoid the error
-        return 2
         if self.ctx._conf.contains("spark.default.parallelism"):
             return self.ctx.defaultParallelism
         else:
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
new file mode 100644
index 0000000000000..ff70483b771a4
--- /dev/null
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
@@ -0,0 +1,37 @@
+package org.apache.spark.streaming.api.python
+
+import org.apache.spark.Accumulator
+import org.apache.spark.api.python.PythonRDD
+import org.apache.spark.broadcast.Broadcast
+import org.apache.spark.rdd.RDD
+import org.apache.spark.streaming.api.java.JavaDStream
+import org.apache.spark.streaming.{Time, Duration}
+import org.apache.spark.streaming.dstream.DStream
+
+import scala.reflect.ClassTag
+
+/**
+ * Created by ken on 7/15/14.
+ */
+class PythonTransformedDStream[T: ClassTag](
+               parents: Seq[DStream[T]],
+               command: Array[Byte],
+               envVars: JMap[String, String],
+               pythonIncludes: JList[String],
+               preservePartitoning: Boolean,
+               pythonExec: String,
+               broadcastVars: JList[Broadcast[Array[Byte]]],
+               accumulator: Accumulator[JList[Array[Byte]]]
+               ) extends DStream[Array[Byte]](parent.ssc) {
+
+  override def dependencies = List(parent)
+
+  override def slideDuration: Duration = parent.slideDuration
+
+  //pythonDStream compute
+  override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    val parentRDDs = parents.map(_.getOrCompute(validTime).orNull).toSeq
+    Some()
+  }
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+}
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index d9d5446b62e9f..67977244ef420 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -561,9 +561,12 @@ abstract class DStream[T: ClassTag] (
     // because the DStream is reachable from the outer object here, and because 
     // DStreams can't be serialized with closures, we can't proactively check 
     // it for serializability and so we pass the optional false to SparkContext.clean
+
+    // serialized python
     val cleanedF = context.sparkContext.clean(transformFunc, false)
     val realTransformFunc =  (rdds: Seq[RDD[_]], time: Time) => {
       assert(rdds.length == 1)
+      // if transformfunc is fine, it is okay
       cleanedF(rdds.head.asInstanceOf[RDD[T]], time)
     }
     new TransformedDStream[U](Seq(this), realTransformFunc)

From 04af0462cd17a875d5a98c809ad7dece517c232f Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Thu, 17 Jul 2014 16:27:05 -0700
Subject: [PATCH 24/69] reduceByKey is working

---
 .../src/main/python/streaming/wordcount.pyc   | Bin 0 -> 1566 bytes
 python/pyspark/streaming/dstream.py           |   6 +-
 .../streaming/api/python/PythonDStream.scala  |  87 +++---------------
 .../api/python/PythonTransformedDStream.scala |  19 ++--
 4 files changed, 29 insertions(+), 83 deletions(-)
 create mode 100644 examples/src/main/python/streaming/wordcount.pyc

diff --git a/examples/src/main/python/streaming/wordcount.pyc b/examples/src/main/python/streaming/wordcount.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..db93702361f47f57988ea82c213aae522e7a9f81
GIT binary patch
literal 1566
zcmb_c+invv5S`tmX_F>xdP%Qb`WW$$yrZfDRUlD`3MEBIE2LoJN!i4Ek?qh#;suqD
z<A3-7n6a}d5{L(2H};Otj6G*APU%~t_Uz(oe+Y}GLf<De%)0<U(k}o75P3NS6+jX~
z6hgqd5~va+Wr)gtT?VxRNd=;cU$1~#g)3YGS%FCi`fY$!K!9-#ZUd03Fe!ol?2vUR
z%QXmJTwtBuk~&BMunf24y#d&O@dn7MQ}ALFWDVpx+!7V6fUL8LB*Ugd1KJlxTYy_I
z-d?yQ>q9y>+5y~w@h->>_~JZ8Ex;Cx_dsqI$i71kKsF2H5bzMjM}Q%7h>o4XJ*F4n
zK8zO<nJlE^r9>3&dpnXIIEg}|#P-`;l<D|8J(q1tH`o$QLQ21=(xRUWJvq<Pk%yWL
zS&brz(`$k)&aBt)_D6P&=D{ElaXJ{pAuY^3nqC`mjgL=mGA)PMG_@zEGS)b>nVz57
z12T9uw;!@}dGH%DJZD35$VV`Rj>M6eD%+ujPzqISlGsr$lgW?>I^S}tg^jax$SNMp
z;hctP(DaEa?*gX;_S>wwv}|<ZLs((ET*W^{G;0$EZZchxa3+#mq3Ieu>~fgh+)?kE
zA}QTvlpRuWK2DWL-b-<|OR}K>zmlsFO7$Rqlgg4A({btd9G1bVIK_XX)mx{dTQvSa
zhqw@<QCQG%$-ZOKW6J-5#a_Xp{g5Qre`ao6-m)C2n3?X80&Jb8eC~UJ%iVMN;QlDk
zWeGZ@=f>=Dh3(OAO^QZYbZjaT91NU$g{kG968ie1<$oh%C2H+3oW-`snC0*d+NXJb
zNn1T{w04!?K9YZFJZ6S=gYAjV^H`y8am%IUG8(sGq=bDbaz|y947`H9jACU`y92z4
za-rpWn$Q-`3VrjXg12du(;-^!crO;am|Z^4b(~s9!C0ZK<vT5IL~O56)3tW@=dQ9&
u`upBbGC5Uv#>Fxnn(9F_YzEDs7S@AS(4e<Uqggr*_kwNrZicm>cz*!UkyX3^

literal 0
HcmV?d00001

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 5766cca39bdee..4e18cbacf3eba 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -118,11 +118,9 @@ def add_shuffle_key(split, iterator):
         keyed = PipelinedDStream(self, add_shuffle_key)
         keyed._bypass_serializer = True
         with _JavaStackTrace(self.ctx) as st:
-            #JavaDStream
-            pairDStream = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream()).asJavaPairDStream()
             partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
-                                                          id(partitionFunc))
-        jdstream = pairDStream.partitionBy(partitioner).values()
+                                                      id(partitionFunc))
+            jdstream = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream(), partitioner).asJavaDStream()
         dstream = DStream(jdstream, self._ssc, BatchedSerializer(outputSerializer))
         # This is required so that id(partitionFunc) remains unique, even if
         # partitionFunc is a lambda:
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 83e4eaa8b5e4e..d305797bb4a0f 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -55,91 +55,34 @@ class PythonDStream[T: ClassTag](
       case None => None
     }
   }
-<<<<<<< HEAD
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
-=======
-  val asJavaDStream  = JavaDStream.fromDStream(this)
-
-  /**
-   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
-   * operator, so this PythonDStream will be registered as an output stream and there materialized.
-   * Since serialized Python object is readable by Python, pyprint writes out binary data to
-   * temporary file and run python script to deserialized and print the first ten elements
-   */
-  private[streaming] def ppyprint() {
-    def foreachFunc = (rdd: RDD[Array[Byte]], time: Time) => {
-      val iter = rdd.take(11).iterator
-
-      // make a temporary file
-      val prefix = "spark"
-      val suffix = ".tmp"
-      val tempFile = File.createTempFile(prefix, suffix)
-      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
-      //write out serialized python object
-      PythonRDD.writeIteratorToStream(iter, tempFileStream)
-      tempFileStream.close()
-
-      // This value has to be passed from python
-      //val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
-      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
-      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
-      //absolute path to the python script is needed to change because we do not use pysparkstreaming
-      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pysparkstreaming/streaming/pyprint.py", tempFile.getAbsolutePath)
-      val workerEnv = pb.environment()
-
-      //envVars also need to be pass
-      //workerEnv.putAll(envVars)
-      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
-      workerEnv.put("PYTHONPATH", pythonPath)
-      val worker = pb.start()
-      val is = worker.getInputStream()
-      val isr = new InputStreamReader(is)
-      val br = new BufferedReader(isr)
 
-      println ("-------------------------------------------")
-      println ("Time: " + time)
-      println ("-------------------------------------------")
 
-      //print value from python std out
-      var line = ""
-      breakable {
-        while (true) {
-          line = br.readLine()
-          if (line == null) break()
-          println(line)
-        }
-      }
-      //delete temporary file
-      tempFile.delete()
-      println()
-
-    }
-    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
-  }
-}
-
-
-private class PairwiseDStream(prev:DStream[Array[Byte]]) extends
-DStream[(Long, Array[Byte])](prev.ssc){
+private class PairwiseDStream(prev:DStream[Array[Byte]], partitioner: Partitioner) extends
+DStream[Array[Byte]](prev.ssc){
   override def dependencies = List(prev)
 
   override def slideDuration: Duration = prev.slideDuration
 
-  override def compute(validTime:Time):Option[RDD[(Long, Array[Byte])]]={
+  override def compute(validTime:Time):Option[RDD[Array[Byte]]]={
     prev.getOrCompute(validTime) match{
       case Some(rdd)=>Some(rdd)
         val pairwiseRDD = new PairwiseRDD(rdd)
-        Some(pairwiseRDD.asJavaPairRDD.rdd)
+        /*
+         * This is equivalent to following python code
+         * with _JavaStackTrace(self.context) as st:
+         *    pairRDD = self.ctx._jvm.PairwiseRDD(keyed._jrdd.rdd()).asJavaPairRDD()
+         *    partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
+         *                                                  id(partitionFunc))
+         * jrdd = pairRDD.partitionBy(partitioner).values()
+         * rdd = RDD(jrdd, self.ctx, BatchedSerializer(outputSerializer))
+         */
+        Some(pairwiseRDD.asJavaPairRDD.partitionBy(partitioner).values().rdd)
       case None => None
     }
   }
-  val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]]  = JavaPairDStream.fromJavaDStream(this)
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+  //val asJavaPairDStream : JavaPairDStream[Long, Array[Byte]]  = JavaPairDStream.fromJavaDStream(this)
 }
-
-
-
-
-
->>>>>>> added reducedByKey not working yet
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
index ff70483b771a4..bc07e09ec6d03 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
@@ -1,3 +1,5 @@
+/*
+
 package org.apache.spark.streaming.api.python
 
 import org.apache.spark.Accumulator
@@ -10,11 +12,8 @@ import org.apache.spark.streaming.dstream.DStream
 
 import scala.reflect.ClassTag
 
-/**
- * Created by ken on 7/15/14.
- */
 class PythonTransformedDStream[T: ClassTag](
-               parents: Seq[DStream[T]],
+               parent: DStream[T],
                command: Array[Byte],
                envVars: JMap[String, String],
                pythonIncludes: JList[String],
@@ -30,8 +29,14 @@ class PythonTransformedDStream[T: ClassTag](
 
   //pythonDStream compute
   override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
-    val parentRDDs = parents.map(_.getOrCompute(validTime).orNull).toSeq
-    Some()
+
+//    val parentRDDs = parents.map(_.getOrCompute(validTime).orNull).toSeq
+//    parents.map(_.getOrCompute(validTime).orNull).to
+//    parent = parents.head.asInstanceOf[RDD]
+//    Some()
   }
-  val asJavaDStream  = JavaDStream.fromDStream(this)
+
+  val asJavaDStream = JavaDStream.fromDStream(this)
 }
+
+*/

From ae464e0c0f2f87bae309d7f6bdb1a5a4a3cd646b Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Thu, 17 Jul 2014 17:09:23 -0700
Subject: [PATCH 25/69] edit python sparkstreaming example

---
 examples/src/main/python/streaming/network_wordcount.py | 8 +++++++-
 examples/src/main/python/streaming/wordcount.py         | 1 +
 2 files changed, 8 insertions(+), 1 deletion(-)

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index 67dc28f7bf7f0..77fca7ff7657d 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -1,6 +1,7 @@
 import sys
 from operator import add
 
+from pyspark.conf import SparkConf
 from pyspark.streaming.context import StreamingContext
 from pyspark.streaming.duration import *
 
@@ -8,15 +9,20 @@
     if len(sys.argv) != 3:
         print >> sys.stderr, "Usage: wordcount <hostname> <port>"
         exit(-1)
-    ssc = StreamingContext(appName="PythonStreamingNetworkWordCount", duration=Seconds(1))
+    conf = SparkConf()
+    conf.setAppName("PythonStreamingNetworkWordCount")
+    conf.set("spark.default.parallelism", 1)
+    ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
+    reduced_lines = mapped_lines.reduce(add)
     
     fm_lines.pyprint()
     filtered_lines.pyprint()
     mapped_lines.pyprint()
+    reduced_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
index 3996991109d60..9ff8bc5ac9ab2 100644
--- a/examples/src/main/python/streaming/wordcount.py
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -13,6 +13,7 @@
     conf.setAppName("PythonStreamingWordCount")
     conf.set("spark.default.parallelism", 1)
 
+# still has a bug
 #    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
 

From d01a125a8bc9f3f2e33d1c90adaa47755fbc6049 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Fri, 18 Jul 2014 17:58:58 -0700
Subject: [PATCH 26/69] added count operation, but this implementation needs
 a double check

---
 python/pyspark/streaming/dstream.py | 27 ++++++++++++++++++++++++---
 1 file changed, 24 insertions(+), 3 deletions(-)

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 6fbd5b6f88089..3f23e65712368 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -1,5 +1,8 @@
 from collections import defaultdict
 from itertools import chain, ifilter, imap
+import operator
+
+import logging
 
 from pyspark.serializers import NoOpSerializer,\
     BatchedSerializer, CloudPickleSerializer, pack_long
@@ -24,6 +27,18 @@ def generatedRDDs(self):
         """
         pass
 
+    def count(self):
+        """
+
+        """
+        #TODO make sure count implementation, thiis different from what pyspark does
+        return self.mapPartitions(lambda i: [sum(1 for _ in i)]).sum().map(lambda x: x[1])
+
+    def sum(self):
+        """
+        """
+        return self.mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
+
     def print_(self):
         """
         """
@@ -63,9 +78,9 @@ def reduce(self, func, numPartitions=None):
         """
 
         """
-        return self._combineByKey(lambda x:x, func, func, numPartitions)
+        return self.combineByKey(lambda x:x, func, func, numPartitions)
 
-    def _combineByKey(self, createCombiner, mergeValue, mergeCombiners,
+    def combineByKey(self, createCombiner, mergeValue, mergeCombiners,
                       numPartitions = None):
         """
         """
@@ -74,6 +89,12 @@ def _combineByKey(self, createCombiner, mergeValue, mergeCombiners,
         def combineLocally(iterator):
             combiners = {}
             for x in iterator:
+
+                #TODO for count operation make sure count implementation
+                # This is different from what pyspark does
+                if isinstance(x, int):
+                    x = ("", x)
+
                 (k, v) = x
                 if k not in combiners:
                     combiners[k] = createCombiner(v)
@@ -143,7 +164,7 @@ def _defaultReducePartitions(self):
         else:
             return self.getNumPartitions()
 
-      return self._jdstream.partitions().size()
+        return self._jdstream.partitions().size()
 
     def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """

From bd20e179a4c151f5442a9497a0bdfe206b1ffc70 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Sat, 19 Jul 2014 18:58:01 -0700
Subject: [PATCH 27/69] fix map function

---
 .../python/streaming/network_wordcount.py     |  2 ++
 python/pyspark/streaming/dstream.py           | 32 ++++++++-----------
 2 files changed, 15 insertions(+), 19 deletions(-)

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index 77fca7ff7657d..a1458e06f13d2 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -19,10 +19,12 @@
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
     reduced_lines = mapped_lines.reduce(add)
+    counted_lines = reduced_lines.count()
     
     fm_lines.pyprint()
     filtered_lines.pyprint()
     mapped_lines.pyprint()
     reduced_lines.pyprint()
+    counted_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 3f23e65712368..caa62d44a9069 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -20,21 +20,14 @@ def __init__(self, jdstream, ssc, jrdd_deserializer):
         self.ctx = ssc._sc
         self._jrdd_deserializer = jrdd_deserializer
 
-    def generatedRDDs(self):
-        """
-         // RDDs generated, marked as private[streaming] so that testsuites can access it
-         @transient
-        """
-        pass
-
     def count(self):
         """
 
         """
         #TODO make sure count implementation, thiis different from what pyspark does
-        return self.mapPartitions(lambda i: [sum(1 for _ in i)]).sum().map(lambda x: x[1])
+        return self.mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
 
-    def sum(self):
+    def _sum(self):
         """
         """
         return self.mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
@@ -65,8 +58,9 @@ def func(s, iterator): return chain.from_iterable(imap(f, iterator))
     def map(self, f, preservesPartitioning=False):
         """
         """
-        def func(split, iterator): return imap(f, iterator)
-        return PipelinedDStream(self, func, preservesPartitioning)
+        def func(iterator): return imap(f, iterator)
+        return self.mapPartitions(func)
+        #return PipelinedDStream(self, func, preservesPartitioning)
 
     def mapPartitions(self, f):
         """
@@ -74,6 +68,12 @@ def mapPartitions(self, f):
         def func(s, iterator): return f(iterator)
         return self.mapPartitionsWithIndex(func)
 
+    def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
+        """
+
+        """
+        return PipelinedDStream(self, f, preservesPartitioning)
+
     def reduce(self, func, numPartitions=None):
         """
 
@@ -92,8 +92,8 @@ def combineLocally(iterator):
 
                 #TODO for count operation make sure count implementation
                 # This is different from what pyspark does
-                if isinstance(x, int):
-                    x = ("", x)
+                #if isinstance(x, int):
+                #    x = ("", x)
 
                 (k, v) = x
                 if k not in combiners:
@@ -166,12 +166,6 @@ def _defaultReducePartitions(self):
 
         return self._jdstream.partitions().size()
 
-    def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
-        """
-
-        """
-        return PipelinedDStream(self, f, preservesPartitioning)
-
     def _defaultReducePartitions(self):
         """
 

From 84a021f9e7409f8baffd731989d87b124918fcf7 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Sun, 20 Jul 2014 14:31:55 -0700
Subject: [PATCH 28/69] clean up code

---
 python/pyspark/streaming/context.py           | 41 ++++-----
 python/pyspark/streaming/dstream.py           | 85 ++++++++++---------
 python/pyspark/streaming/duration.py          |  1 +
 python/pyspark/streaming/pyprint.py           |  9 +-
 .../streaming/api/java/JavaDStreamLike.scala  |  2 +-
 .../streaming/api/python/PythonDStream.scala  |  4 +-
 .../api/python/PythonTransformedDStream.scala | 54 ------------
 .../spark/streaming/dstream/DStream.scala     | 21 +++--
 8 files changed, 89 insertions(+), 128 deletions(-)
 delete mode 100644 streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 5dcc9ba35a653..a4900191d1730 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -22,15 +22,15 @@
 from pyspark.storagelevel import *
 from pyspark.rdd import RDD
 from pyspark.context import SparkContext
+from pyspark.streaming.dstream import DStream
 
 from py4j.java_collections import ListConverter
 
-from pyspark.streaming.dstream import DStream
 
 class StreamingContext(object):
     """
     Main entry point for Spark Streaming functionality. A StreamingContext represents the
-    connection to a Spark cluster, and can be used to create L{RDD}s and
+    connection to a Spark cluster, and can be used to create L{DStream}s and
     broadcast variables on that cluster.
     """
 
@@ -71,13 +71,16 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
     def _initialize_context(self, jspark_context, jduration):
         return self._jvm.JavaStreamingContext(jspark_context, jduration)
 
-    def actorStream(self, props, name, storageLevel, supervisorStrategy):
-        raise NotImplementedError
-
-    def addStreamingListener(self, streamingListener):
-        raise NotImplementedError
+    def start(self):
+        """
+        Start the execution of the streams.
+        """
+        self._jssc.start()
 
     def awaitTermination(self, timeout=None):
+        """
+        Wait for the execution to stop.
+        """
         if timeout:
             self._jssc.awaitTermination(timeout)
         else:
@@ -85,20 +88,18 @@ def awaitTermination(self, timeout=None):
 
     # start from simple one. storageLevel is not passed for now.
     def socketTextStream(self, hostname, port):
+        """
+        Create an input from TCP source hostname:port. Data is received using
+        a TCP socket and receive byte is interpreted as UTF8 encoded '\n' delimited
+        lines.
+        """
         return DStream(self._jssc.socketTextStream(hostname, port), self, UTF8Deserializer())
 
-    def start(self):
-        self._jssc.start()
-
-    def stop(self, stopSparkContext=True):
-        raise NotImplementedError
-
     def textFileStream(self, directory):
+        """
+        Create an input stream that monitors a Hadoop-compatible file system
+        for new files and reads them as text files. Files must be wrriten to the
+        monitored directory by "moving" them from another location within the same
+        file system. FIle names starting with . are ignored.
+        """
         return DStream(self._jssc.textFileStream(directory), self, UTF8Deserializer())
-
-    def transform(self, seq):
-        raise NotImplementedError
-
-    def union(self, seq):
-        raise NotImplementedError
-
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index caa62d44a9069..a640df7394bcf 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -2,8 +2,6 @@
 from itertools import chain, ifilter, imap
 import operator
 
-import logging
-
 from pyspark.serializers import NoOpSerializer,\
     BatchedSerializer, CloudPickleSerializer, pack_long
 from pyspark.rdd import _JavaStackTrace
@@ -25,64 +23,86 @@ def count(self):
 
         """
         #TODO make sure count implementation, thiis different from what pyspark does
-        return self.mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
+        return self._mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
 
     def _sum(self):
         """
         """
-        return self.mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
+        return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
     def print_(self):
         """
+        Since print is reserved name for python, we cannot make a print method function.
+        This function prints serialized data in RDD in DStream because Scala and Java cannot
+        deserialized pickled python object. Please use DStream.pyprint() instead to print result.
+
+        Call DStream.print().
         """
-        # print is a reserved name of Python. We cannot give print to function name
+        #hack to call print function in DStream
         getattr(self._jdstream, "print")()
 
     def pyprint(self):
         """
+        Print the first ten elements of each RDD generated in this DStream. This is an output
+        operator, so this DStream will be registered as an output stream and there materialized.
+
         """
         self._jdstream.pyprint()
 
     def filter(self, f):
         """
+        Return DStream containing only the elements that satisfy predicate.
         """
         def func(iterator): return ifilter(f, iterator)
-        return self.mapPartitions(func)
+        return self._mapPartitions(func)
 
     def flatMap(self, f, preservesPartitioning=False):
         """
+        Pass each value in the key-value pair DStream through flatMap function
+        without changing the keys: this also retains the original RDD's partition.
         """
         def func(s, iterator): return chain.from_iterable(imap(f, iterator))
-        return self.mapPartitionsWithIndex(func, preservesPartitioning)
+        return self._mapPartitionsWithIndex(func, preservesPartitioning)
 
-    def map(self, f, preservesPartitioning=False):
+    def map(self, f):
         """
+        Return DStream by applying a function to each element of DStream.
         """
         def func(iterator): return imap(f, iterator)
-        return self.mapPartitions(func)
-        #return PipelinedDStream(self, func, preservesPartitioning)
+        return self._mapPartitions(func)
 
-    def mapPartitions(self, f):
+    def _mapPartitions(self, f):
         """
+        Return a new DStream by applying a function to each partition of this DStream.
         """
         def func(s, iterator): return f(iterator)
-        return self.mapPartitionsWithIndex(func)
+        return self._mapPartitionsWithIndex(func)
 
-    def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
+    def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """
-
+        Return a new DStream by applying a function to each partition of this DStream,
+        While tracking the index of the original partition.
         """
         return PipelinedDStream(self, f, preservesPartitioning)
 
-    def reduce(self, func, numPartitions=None):
+
+    def reduceByKey(self, func, numPartitions=None):
         """
+        Merge the value for each key using an associative reduce function.
+
+        This will also perform the merging locally on each mapper before
+        sending resuls to reducer, similarly to a "combiner" in MapReduce.
 
+        Output will be hash-partitioned with C{numPartitions} partitions, or
+        the default parallelism level if C{numPartitions} is not specified.
         """
         return self.combineByKey(lambda x:x, func, func, numPartitions)
 
     def combineByKey(self, createCombiner, mergeValue, mergeCombiners,
                       numPartitions = None):
         """
+        Count the number of elements for each key, and return the result to the
+        master as a dictionary
         """
         if numPartitions is None:
             numPartitions = self._defaultReducePartitions()
@@ -148,42 +168,27 @@ def add_shuffle_key(split, iterator):
         dstream._partitionFunc = partitionFunc
         return dstream
 
-    def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
-        """
-
-        """
-        return PipelinedDStream(self, f, preservesPartitioning)
-
     def _defaultReducePartitions(self):
         """
+        Returns the default number of partitions to use during reduce tasks (e.g., groupBy).
+        If spark.default.parallelism is set, then we'll use the value from SparkContext
+        defaultParallelism, otherwise we'll use the number of partitions in this RDD.
 
+        This mirrors the behavior of the Scala Partitioner#defaultPartitioner, intended to reduce
+        the likelihood of OOMs. Once PySpark adopts Partitioner-based APIs, this behavior will
+        be inherent.
         """
-        # hard code to avoid the error
         if self.ctx._conf.contains("spark.default.parallelism"):
             return self.ctx.defaultParallelism
         else:
             return self.getNumPartitions()
 
-        return self._jdstream.partitions().size()
-
-    def _defaultReducePartitions(self):
+    def getNumPartitions(self):
         """
-
+        Return the number of partitions in RDD
         """
-        # hard code to avoid the error
-        if self.ctx._conf.contains("spark.default.parallelism"):
-            return self.ctx.defaultParallelism
-        else:
-            return self.getNumPartitions()
-
-    def getNumPartitions(self):
-      """
-      Returns the number of partitions in RDD
-      >>> rdd = sc.parallelize([1, 2, 3, 4], 2)
-      >>> rdd.getNumPartitions()
-      2
-      """
-      return self._jdstream.partitions().size()
+        # TODO: remove hardcoding. RDD has NumPartitions but DStream does not have.
+        return 2
 
 
 class PipelinedDStream(DStream):
diff --git a/python/pyspark/streaming/duration.py b/python/pyspark/streaming/duration.py
index 06a169e5215ac..a7f1036e4b856 100644
--- a/python/pyspark/streaming/duration.py
+++ b/python/pyspark/streaming/duration.py
@@ -17,6 +17,7 @@
 
 from pyspark.streaming import utils
 
+
 class Duration(object):
     """
     Duration for Spark Streaming application. Used to set duration
diff --git a/python/pyspark/streaming/pyprint.py b/python/pyspark/streaming/pyprint.py
index 1aeb8e50375ed..49517b3e5c247 100644
--- a/python/pyspark/streaming/pyprint.py
+++ b/python/pyspark/streaming/pyprint.py
@@ -21,16 +21,22 @@
 
 from pyspark.serializers import PickleSerializer
 
+
 def collect(binary_file_path):
+    """
+    Read pickled file written by SparkStreaming
+    """
     dse = PickleSerializer()
     with open(binary_file_path, 'rb') as tempFile:
         for item in dse.load_stream(tempFile):
             yield item
+
+
 def main():
     try:
         binary_file_path = sys.argv[1]
     except:
-        print "Missed FilePath in argement"
+        print "Missed FilePath in argements"
 
     if not binary_file_path:
         return 
@@ -43,5 +49,6 @@ def main():
             print "..."
             break
 
+
 if __name__ =="__main__":
     exit(main())
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
index cfa336df8674f..a2b9d581f609c 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
@@ -59,7 +59,7 @@ trait JavaDStreamLike[T, This <: JavaDStreamLike[T, This, R], R <: JavaRDDLike[T
    * operator, so this PythonDStream will be registered as an output stream and there materialized.
    * This function is for PythonAPI.
    */
-
+  //TODO move this function to PythonDStream
   def pyprint() = dstream.pyprint()
 
   /**
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index b730a98bfdbf7..05ccc23e9f422 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -71,7 +71,9 @@ DStream[Array[Byte]](prev.ssc){
       case Some(rdd)=>Some(rdd)
         val pairwiseRDD = new PairwiseRDD(rdd)
         /*
-         * This is equivalent to following python code
+         * Since python operation is executed by Scala after StreamingContext.start.
+         * What PairwiseDStream does is equivalent to following python code in pySpark.
+         *
          * with _JavaStackTrace(self.context) as st:
          *    pairRDD = self.ctx._jvm.PairwiseRDD(keyed._jrdd.rdd()).asJavaPairRDD()
          *    partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
deleted file mode 100644
index 9e2d261776ff6..0000000000000
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonTransformedDStream.scala
+++ /dev/null
@@ -1,54 +0,0 @@
-<<<<<<< HEAD
-/*
-
-=======
->>>>>>> 69e9cd33a58b880f96cc9c3e5e62eaa415c49843
-package org.apache.spark.streaming.api.python
-
-import org.apache.spark.Accumulator
-import org.apache.spark.api.python.PythonRDD
-import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.rdd.RDD
-import org.apache.spark.streaming.api.java.JavaDStream
-import org.apache.spark.streaming.{Time, Duration}
-import org.apache.spark.streaming.dstream.DStream
-
-import scala.reflect.ClassTag
-
-<<<<<<< HEAD
-class PythonTransformedDStream[T: ClassTag](
-               parent: DStream[T],
-=======
-/**
- * Created by ken on 7/15/14.
- */
-class PythonTransformedDStream[T: ClassTag](
-               parents: Seq[DStream[T]],
->>>>>>> 69e9cd33a58b880f96cc9c3e5e62eaa415c49843
-               command: Array[Byte],
-               envVars: JMap[String, String],
-               pythonIncludes: JList[String],
-               preservePartitoning: Boolean,
-               pythonExec: String,
-               broadcastVars: JList[Broadcast[Array[Byte]]],
-               accumulator: Accumulator[JList[Array[Byte]]]
-               ) extends DStream[Array[Byte]](parent.ssc) {
-
-  override def dependencies = List(parent)
-
-  override def slideDuration: Duration = parent.slideDuration
-
-  //pythonDStream compute
-  override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
-<<<<<<< HEAD
-
-//    val parentRDDs = parents.map(_.getOrCompute(validTime).orNull).toSeq
-//    parents.map(_.getOrCompute(validTime).orNull).to
-//    parent = parents.head.asInstanceOf[RDD]
-//    Some()
-  }
-
-  val asJavaDStream = JavaDStream.fromDStream(this)
-}
-
-*/
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index 67977244ef420..fc7a2055025c1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -623,37 +623,36 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
-//TODO move pyprint to PythonDStream
+//TODO move pyprint to PythonDStream and executed by py4j call back function
   /**
    * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
    * operator, so this PythonDStream will be registered as an output stream and there materialized.
    * Since serialized Python object is readable by Python, pyprint writes out binary data to
    * temporary file and run python script to deserialized and print the first ten elements
+   *
+   * Currently call python script directly. We should avoid this
    */
   private[streaming] def pyprint() {
     def foreachFunc = (rdd: RDD[T], time: Time) => {
       val iter = rdd.take(11).iterator
 
-      // make a temporary file
+      // Generate a temporary file
       val prefix = "spark"
       val suffix = ".tmp"
       val tempFile = File.createTempFile(prefix, suffix)
       val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
-      //write out serialized python object
+      // Write out serialized python object to temporary file
       PythonRDD.writeIteratorToStream(iter, tempFileStream)
       tempFileStream.close()
 
-      // This value has to be passed from python
-      // Python currently does not do cluster deployment. But what happened
+      // pythonExec should be passed from python. Move pyprint to PythonDStream
       val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
       val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
-      //val pb = new ProcessBuilder(Seq(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath())) // why this fails to compile???
-      //absolute path to the python script is needed to change because we do not use pysparkstreaming
+      // Call python script to deserialize and print result in stdout
       val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath)
       val workerEnv = pb.environment()
 
-      //envVars also need to be pass
-      //workerEnv.putAll(envVars)
+      // envVars also should be pass from python
       val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
       workerEnv.put("PYTHONPATH", pythonPath)
       val worker = pb.start()
@@ -665,7 +664,7 @@ abstract class DStream[T: ClassTag] (
       println ("Time: " + time)
       println ("-------------------------------------------")
 
-      //print value from python std out
+      // Print values which is from python std out
       var line = ""
       breakable {
         while (true) {
@@ -674,7 +673,7 @@ abstract class DStream[T: ClassTag] (
           println(line)
         }
       }
-      //delete temporary file
+      // Delete temporary file
       tempFile.delete()
       println()
 

From d042ac61dafe536d3eedee9307fbca854c7f6135 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Sun, 20 Jul 2014 15:32:20 -0700
Subject: [PATCH 29/69] clean up code

---
 bin/spark-submit                                   |  4 ++--
 .../src/main/python/streaming/network_wordcount.py |  7 +------
 examples/src/main/python/streaming/wordcount.py    |  2 +-
 python/pyspark/streaming/dstream.py                | 14 +++++++-------
 .../apache/spark/streaming/dstream/DStream.scala   |  3 ++-
 5 files changed, 13 insertions(+), 17 deletions(-)

diff --git a/bin/spark-submit b/bin/spark-submit
index ec4e10787cff0..a297714c67da0 100755
--- a/bin/spark-submit
+++ b/bin/spark-submit
@@ -42,10 +42,9 @@ DEPLOY_MODE=${DEPLOY_MODE:-"client"}
 # This will be removed after pyprint is moved to PythonDStream.
 # Problem is that print function is in (Scala)DStream. 
 # Whenever python code is executed, we call PythonDStream which passes
-# pythonExec(which python Spark should execute).
+# pythonExec(which python Spark should execute). pythonExec is used to call python.
 # Since pyprint is located in DStream, Spark does not know which python should use. 
 # In that case, get python path from PYSPARK_PYTHON, environmental variable. 
-# This fix is ongoing in print branch in https://github.com/giwa/spark/tree/print.
 
 # Figure out which Python executable to use
 if [[ -z "$PYSPARK_PYTHON" ]]; then
@@ -53,6 +52,7 @@ if [[ -z "$PYSPARK_PYTHON" ]]; then
 fi
 export PYSPARK_PYTHON
 
+
 if [ -n "$DRIVER_MEMORY" ] && [ $DEPLOY_MODE == "client" ]; then
   export SPARK_DRIVER_MEMORY=$DRIVER_MEMORY
 fi
diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index a1458e06f13d2..c6ededc24db21 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -11,20 +11,15 @@
         exit(-1)
     conf = SparkConf()
     conf.setAppName("PythonStreamingNetworkWordCount")
-    conf.set("spark.default.parallelism", 1)
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
     fm_lines = lines.flatMap(lambda x: x.split(" "))
-    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
-    reduced_lines = mapped_lines.reduce(add)
-    counted_lines = reduced_lines.count()
+    reduced_lines = mapped_lines.reduceByKey(add)
     
     fm_lines.pyprint()
-    filtered_lines.pyprint()
     mapped_lines.pyprint()
     reduced_lines.pyprint()
-    counted_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
index 9ff8bc5ac9ab2..ee52c4e178142 100644
--- a/examples/src/main/python/streaming/wordcount.py
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -21,7 +21,7 @@
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
     mapped_lines = fm_lines.map(lambda x: (x, 1))
-    reduced_lines = mapped_lines.reduce(add)
+    reduced_lines = mapped_lines.reduceByKey(add)
     
     fm_lines.pyprint()
     filtered_lines.pyprint()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index a640df7394bcf..08de8dbe9d542 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -22,13 +22,15 @@ def count(self):
         """
 
         """
-        #TODO make sure count implementation, thiis different from what pyspark does
-        return self._mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
+        pass
+        #TODO: make sure count implementation, thiis different from what pyspark does
+        #return self._mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
 
     def _sum(self):
         """
         """
-        return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
+        pass
+        #return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
     def print_(self):
         """
@@ -85,7 +87,6 @@ def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """
         return PipelinedDStream(self, f, preservesPartitioning)
 
-
     def reduceByKey(self, func, numPartitions=None):
         """
         Merge the value for each key using an associative reduce function.
@@ -121,7 +122,7 @@ def combineLocally(iterator):
                 else:
                     combiners[k] = mergeValue(combiners[k], v)
             return combiners.iteritems()
-        locally_combined = self.mapPartitions(combineLocally)
+        locally_combined = self._mapPartitions(combineLocally)
         shuffled = locally_combined.partitionBy(numPartitions)
         def _mergeCombiners(iterator):
             combiners = {}
@@ -131,12 +132,11 @@ def _mergeCombiners(iterator):
                 else:
                     combiners[k] = mergeCombiners(combiners[k], v)
             return combiners.iteritems()
-        return shuffled.mapPartitions(_mergeCombiners) 
+        return shuffled._mapPartitions(_mergeCombiners)
 
     def partitionBy(self, numPartitions, partitionFunc=None):
         """
         Return a copy of the DStream partitioned using the specified partitioner.
-
         """
         if numPartitions is None:
             numPartitions = self.ctx._defaultReducePartitions()
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index fc7a2055025c1..f539bc9aa147d 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -623,7 +623,7 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
-//TODO move pyprint to PythonDStream and executed by py4j call back function
+//TODO: move pyprint to PythonDStream and executed by py4j call back function
   /**
    * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
    * operator, so this PythonDStream will be registered as an output stream and there materialized.
@@ -647,6 +647,7 @@ abstract class DStream[T: ClassTag] (
 
       // pythonExec should be passed from python. Move pyprint to PythonDStream
       val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
+
       val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
       // Call python script to deserialize and print result in stdout
       val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath)

From cc2092b09868b82f0d495a786028190f74db7a4a Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@Kens-MacBook-Pro.local>
Date: Sun, 20 Jul 2014 15:33:34 -0700
Subject: [PATCH 30/69] remove waste file

---
 examples/src/main/python/streaming/wordcount.pyc | Bin 1566 -> 0 bytes
 1 file changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 examples/src/main/python/streaming/wordcount.pyc

diff --git a/examples/src/main/python/streaming/wordcount.pyc b/examples/src/main/python/streaming/wordcount.pyc
deleted file mode 100644
index db93702361f47f57988ea82c213aae522e7a9f81..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1566
zcmb_c+invv5S`tmX_F>xdP%Qb`WW$$yrZfDRUlD`3MEBIE2LoJN!i4Ek?qh#;suqD
z<A3-7n6a}d5{L(2H};Otj6G*APU%~t_Uz(oe+Y}GLf<De%)0<U(k}o75P3NS6+jX~
z6hgqd5~va+Wr)gtT?VxRNd=;cU$1~#g)3YGS%FCi`fY$!K!9-#ZUd03Fe!ol?2vUR
z%QXmJTwtBuk~&BMunf24y#d&O@dn7MQ}ALFWDVpx+!7V6fUL8LB*Ugd1KJlxTYy_I
z-d?yQ>q9y>+5y~w@h->>_~JZ8Ex;Cx_dsqI$i71kKsF2H5bzMjM}Q%7h>o4XJ*F4n
zK8zO<nJlE^r9>3&dpnXIIEg}|#P-`;l<D|8J(q1tH`o$QLQ21=(xRUWJvq<Pk%yWL
zS&brz(`$k)&aBt)_D6P&=D{ElaXJ{pAuY^3nqC`mjgL=mGA)PMG_@zEGS)b>nVz57
z12T9uw;!@}dGH%DJZD35$VV`Rj>M6eD%+ujPzqISlGsr$lgW?>I^S}tg^jax$SNMp
z;hctP(DaEa?*gX;_S>wwv}|<ZLs((ET*W^{G;0$EZZchxa3+#mq3Ieu>~fgh+)?kE
zA}QTvlpRuWK2DWL-b-<|OR}K>zmlsFO7$Rqlgg4A({btd9G1bVIK_XX)mx{dTQvSa
zhqw@<QCQG%$-ZOKW6J-5#a_Xp{g5Qre`ao6-m)C2n3?X80&Jb8eC~UJ%iVMN;QlDk
zWeGZ@=f>=Dh3(OAO^QZYbZjaT91NU$g{kG968ie1<$oh%C2H+3oW-`snC0*d+NXJb
zNn1T{w04!?K9YZFJZ6S=gYAjV^H`y8am%IUG8(sGq=bDbaz|y947`H9jACU`y92z4
za-rpWn$Q-`3VrjXg12du(;-^!crO;am|Z^4b(~s9!C0ZK<vT5IL~O56)3tW@=dQ9&
u`upBbGC5Uv#>Fxnn(9F_YzEDs7S@AS(4e<Uqggr*_kwNrZicm>cz*!UkyX3^


From a778d4b675ae765cb24553e9c1eb7f36f7709279 Mon Sep 17 00:00:00 2001
From: Tathagata Das <tathagata.das1565@gmail.com>
Date: Wed, 23 Jul 2014 15:43:11 -0700
Subject: [PATCH 31/69] Implemented DStream.foreachRDD in the Python API using
 Py4J callback server.

---
 .../python/streaming/network_wordcount.py     |   4 +-
 python/lib/py4j-0.8.1-src.zip                 | Bin 37662 -> 37673 bytes
 python/pyspark/java_gateway.py                |   2 +-
 python/pyspark/streaming/dstream.py           |  44 ++++++++++---
 python/pyspark/streaming/utils.py             |  21 ++++++
 .../streaming/api/java/JavaDStreamLike.scala  |   8 ---
 .../streaming/api/python/PythonDStream.scala  |  38 +++++++++++
 .../spark/streaming/dstream/DStream.scala     |  60 ------------------
 8 files changed, 95 insertions(+), 82 deletions(-)

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index c6ededc24db21..2bbb36a6b787e 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -17,9 +17,7 @@
     fm_lines = lines.flatMap(lambda x: x.split(" "))
     mapped_lines = fm_lines.map(lambda x: (x, 1))
     reduced_lines = mapped_lines.reduceByKey(add)
-    
-    fm_lines.pyprint()
-    mapped_lines.pyprint()
+
     reduced_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/python/lib/py4j-0.8.1-src.zip b/python/lib/py4j-0.8.1-src.zip
index 2069a328d1f2e6a94df057c6a3930048ae3f3832..68d7267c733da88cfdc5d9b97e24327013ec766d 100644
GIT binary patch
delta 11395
zcmV-}EPT_RrUI#^0<dmB4fK5XL}gLcTM#V(0OXT<KOldsInYzAInYyecnbgl1oZ&`
z00a~O008BEYj@j5lIVB+3XHtxkjzjRJCoUm&NBDP5}hcq9xGAKX1zWjL^dT@B)|Zm
zWNyy<_pL|2(I6?unSEh*ViD-BuCA`GuBxuCei0pfbr4O8X_ns|MmM832mgp~_V)Mp
z&x+}4E~0<Bh_bvEWjd*&r>wq@irbH3QdjUcN~0gr$25AEmGvr}M`!8eKFdWkD~m;x
z?p?0yBKJSWdwcKFGD~mgqKfMKw2l_p-F+QR=4o}$4b=A{`r+MKRMlxI+f4Ill}|-k
zO^Q<Nb*a_!bOA_5$3^}q@;Za2rbUz&bySK;u~>hIe2TcY0;vja6VSND3IaaPvj;I>
z_W;M^Qlzz*Mga9hOrk&cqpx4S{HMLW!*o^O7v*8}8o=I*xmc{Dlk`sHX;vZ8_Nebk
zGF#QFQY1-~EtUl!u*x$avPk9`l5$@4qx7~a=BrvHTw;%FPKx;)s0+QRRMn~YWhM6H
zk9mJ_cL%*zKZ}a1E!WdxqAJw&dI>0%s!$~mr2bV*9z@O6s@3hXEGDATja?Q?k@us^
z)61c*u$GO~_dpb66jgXcFZ$8dTY#yGKZ*3A6tg{r*f$?zpzaa|S{5kN{7&?v`?N~y
zy8OBy-KLeO>JqzU>ddk{ooD|cO1H7=bS8h^s83dL=tf-t@l@%rtZ$Dn<j5ZKQ<BIR
zNwT-MhdfY4=d1br`!t`<McI`kj^*#(;a&vKRLml=$m%XobJiywE2r`sK1%?zx0eH)
z<en==0|#txPXWFY^;`H8-t8lP`@J}wPE|1*0#_kOEp_9MFcXqHVAZE|z2Dp0dwqZN
z=FRXbxjy~3A=LWj<v;!X-pTOI(aqaYa&&TXHN3ut*PT~i|3mx|{_j;sf4#i88o{Tp
z|MKTQ|Jl6!dG!6od2)Gm@vlGICBD%mj*s5HeSLKNV{$#bdIt?39Ul)bN6F~)Y<O{l
z#s9K*`SUkFB-cNlUM9yEZ{H4&N2h-m=Y&P@Lx;<cu5Pdcm8iS#J8MyO`cY?%|EcLe
z<w|ruKzH|WScnEZxZRJBi{vpAPklMs2{4u%C77M3^sXWavrH!sFiWDMjF<<irI=*1
z3?}{UIvShmW0Z7IgMa}12;oP0x)2q>K!JuI4wq?}E+W<bA@HlvzYxOHeKrNTCuz!T
zlNm!Ie_2sKcD1aCzv`Lh6-DS@$v??to`EC<vMapf#Qj92QMdwsLNO51?@ot5!SJ1(
z9i5*f=SOG5=#Th1IXy#mNv>~Rdtd+ELDMvpO`&Gz-}4UqBdSTd6iF_gKwjpeYYn9?
z<iZ&OeAUk75%B33ghe0Iyn3RE=n^EZV3|oIe?_|T-yYQ{1*`yh@|ez70_%x7v0rr=
zV&4PUkIsu+@PBPM4mip8AR?#9$Fxj9xZZaSmygN}*VcjxNDhJJ@9AEYf`5YK0ImSh
zT7h7h;6fKW41wh<K>Ga$W_oC2md&vnBz1m$`BxA;<$gRX%0*gtEs5GQ_2YC2Yss{$
ze`*Il6;+JC<Bvs_>mSps#L1<9gV>)_4-*0dZS?xifbGZepZNa~xdUYPKkdWd>V^X?
zn>v$KSpwk?N?0XfA#!VOK^c}tSb4-O`_zy2tNXMRgo58XK>=FvIDjl5h-U4`W|0Cb
zKEcecy7;%XxLACEUu?dB5o2zcr>lH&f3GHN7rA`!5+{F&RR;U}eHJGA7t*O%*45zs
z2Sd+kCK4D&K%*YK0X;<+wt7nqfZQ5?$8C&R1%#=^YM@jlT!Dyq95UCDZc<1@S<Ay}
z5*nylaTJ}-K!xL?pin8SjA({hIVy5uc`p{INvX2Ys#096L^1dL(98g69RI#te}D4>
zeud^P^7$G%fM}=X8V3Rkz&G9WQ;M1{Xpx|oO`{a$c3$KM@FJh4<&@_SY8NoPP#tvM
zdsH<LA5>@*m=q{Gn+fE!Xl&SKj4Cj#F3^3!`Y@sAG^?SI`s#F24=Hz3|0Hs3pteUT
z=7d9}Y+9B$7@+NZs>?Kj_oR#he<)OO@Lz({b(%9HbziLJu!0I}%!m?%!B|%qN7S^a
zQ3RsWK2}JK<DQM1#gK<c;PD97{&C-QNHV<QK2Y`NbF78(F4uU~_b?=Ka8yZzS<$#v
z(L;uWR;*is1}!YE%~y+Ckp2a;hvEN9l#gmal<drA)E~ut8Uy(PWT+>%f4R*U(VH}z
zTO0`13`lVVMKU3_fqT+Ig0=)k3FZhh`mihuP!^AASg<ZF3VH<qegkQ)CAos6k$P*`
zhdax2-WU#ym*KmCLaq`^7Lp36C4ZzuHk!oyeH?xeO8W=8kS(x2kU(Vyfj`{^JA&$@
z49ju3CPeo?D2mxEq$|p{fAxBBZ~(;)U}oQz#e>KXmf2G5J7}t+pgNFrm7QP}J)Vl&
z)m;~bB$~N*nk~ulR2{WRt&|11#sD>e4rG3*Pkk_6r^TuspfyH6vYh_bqjQ4uXMrX+
zYnLoy%~+A~%T{bR7h=jHp;|4q3i!g4q!pu+5TpTG{#`^ZW=wD`f1Z*W)pL}Sge_QF
zhfvXhX+Ot>AM|qe7W5-}mEgi|R+K9NR-bqjtdLU)(yOP@*c2Z}()biCBP7JJoU0?8
z*fU^K62iO=%vN)n{m~e#^@6b(%y2c6OO_g(g5^BP5eDmN^QJwP1|*X62}r&ouhT47
zf{mK6Ya0ByBL1c1e+PFI2BMVxcjSke6mL$4Z%=&XnqPi5B;9(WYHe_j6W{|J7hB0T
z7=D%>?10}%DOS@_fdKRPA~_qLy#}*Uw!^|W5hSy?T<`tM5AAZTlNXYlFtu=O8Kdae
zSAXrOiRN_5^t#_dA<5YSxW#Ih`Mgz$-$0GNC#%{<#+f2=e=b$q=2AZ*Jj|537WJ0d
z1Wf46BV@!eL1~>*te$|TgmVT3h(I-nTeuaI6s8=N0b!lp<qKsff-Ec3x}YUPF1?d9
z$2ADlg97B!yhx{J(fylDIY8a6L;dFBY^XsI?uAkoO*1$_?HLNoH_1pGKKoUdAobfP
zqc>aBPmr@ff3SKTFN<Q{+uL0jT>lM(fzxMQtsx?QtBm*`B_h74VAx$K;1^Jw?+Z^V
z@VnL}HU(VC0GSBI+gt<ZNSeFr-_ENldg8_rvM7MiQ<dp`pRxr<3JJ0n@mGqdaLX~d
zxB%`v!YP-c%UsP^iCac0u+%kvS!Jb|f*C*t-&83-e^W-wtu;w)h5nhcg~8ZWE#fw%
zi)^)RMVCB+TE>|`L!xUzb6BK};dT}#ibr6EsJ<n|tSbwJ+9DO(@{s1!3>`uh(iHjz
z76O%1vj!+@540ozh_1(MDh*Ww)}_8g;!vAz%J5gvHVze5xR5xsm8V7zago6l2CNj?
zREWCB7h&t@msL7vgOsL7U+!KVV<m^a3Vt7Dlf+3Ye>jht><0BA-@Y^zqs6MKZTdTe
zZqRgJu5?O}O83Oa$3;vw9SAMCAr_CoD8E7PcUGOso?XnkgnH`)Q4<102QJg|q7q&F
zFYZ4YuKySO3M@k3D{{?q5ykds#ew~UTVTZ#@)WwDK1~EUM_e{nRS%;JQy0BvV}d>&
zE8*wxe^6bnE!$Lrh#6lw0MuMGRIU13PgXap`xTgLPkER3`m`u$b{I>7B!#j#TvYlw
zef8iUM%M-ebXeiBOP@VZvDb(A`um$va&_|4)ibC8!m+$f??fVZRV7b!eV4mg*bnz!
z5R4KHUq?@Z<z@~G&a~5$3uI$A5?FNsT5Y0te=fV#0<@)MDsbo5YZSNqN&yo(`lG|T
zo2ro00dO(sD)D15{lfs1ve6ap)}5Y@l8e_r439_2=?N{-9z0kiVBO1sBCx0$PnkU`
z_-s<#KsUR9#$462Veqs)vi8aFZBu{U8HhDXJJ$jARe%P&b9tlhweuZ5n|M!>8tSx9
zf6HT*Kcq16OhRQCwJqj8Tz=92Nuz0(s?gZVwZ22@8!y%A1TiI9w!|2Y3|4Ibx-M4H
zLtZ?w%Nc%^%0zp2hFgSlfo2@9OtL3dYy!29!U@F#<A4zaU~6W;EFf1{Z9_p?KnKg5
zC;kO06i={n^rZ@y&VjKo{-Op|F6t^<f092gLD$PBggR|piciaVHpxJ2Nta_G%}z;#
z+chbDh?4Tq9&4H_Q93pv$eQULNnSHX9X+?a!NM7an{#I1x5!+t9OKa_qyiC6R*S`&
z;wid?y+{*FLHVps5(+_RgdV6;>4el|8K-bN2T(wg!K>B^a^q_=)FcrY1hlR3e}ufO
zvJ?nbSh1yx0)E^!s>x2P(INrk_M1$YYFXq}hAfPmXdrk}jD@g9t5Oz?rB*sqK{0e{
zTpB394=NDg%*+<76s(Ymj{iBB3iAFMXbX|%mD#H~Fun~^dnV`>=O}{3YF=kc45Fgu
za6+<<yub~oJHc&LxG98=2XxG{e^*@)MsjNs<`ckb?%)ulpV0InY-y>ECZK&4i|CMb
z;ju-Kv6^){K8oGJw5^k};%F=O3WPH{V=4lDA*-=bMpJRj!*^SNB5<ER3S$IPFxf0c
z_4;;I%UvsqJCJ_qs-0}sDD|bw8~TIv%IhqZ<|%JCp(wabCl6I@d2SlBe+YC_UWW%>
zluVzz;R6bX>9Yu?nL9x7>uQ_6|7JjY_lDJ#x`U6@n`EPG*~lL_6f#D{kc2j~(C`H_
zB1%oOh7fx`?B<5+7N{1m*tBpWW+@B<(wB%3HyScTX>82dvq{Y)$--733HQVo<I0v_
z)7<dZ9=*a@c=+@`)O()~8A2?r{XymasI-b}Q*=E6hSTwfvQ}^qk#Ukv6n}~40oG(i
z*!qWC$nUcin4(^}6)1=hO3}Y+&yn>M;p!%?c$XWF4b;8Z1Z@tUi~6Z3AEfI|TllOF
z=-P3|EQ<|&(;!0uU<!F4>9V`4BG!bFFdy1oZFuqgSw-||){`W9p=wJV;#djch8EGl
zs39)9Hc#~p3pF<nJRa$X`F|nQZcMv@JNEi614{<wr{D3uRlc{uYOn@Q?weZmo~2GJ
zoRo&8LtH#orQMGlR|{QK`_H9%pu7vbj*}SF^2csj$qe2`Jp?^<9-;31=!!N1a4Q(b
zR6<=?QUf0NEPbbPYk!{21PdGKJX5hVcjRZ3&XbygT?!i#hpwmy27fFa2gOr>_q{p3
z)8vaA^zJnW*mh7jA3QNfp+x?u`|={dKmi;KKiGz-VokYmj(*rRt<_-$@%ZA0cV}w!
zY_~J%DoRbdbvT6G%h41x?TJ*-C~gPFx&)QuRE8w2QuI8^!nY1%*cuwUg~wX`s+y~u
z#F$t1F?-g=c0Vf7=zot;-%Y#3Uo%)t$@G)4P%3!3*(%YovAjDPVN|PdLy%pFL#nh}
z(<*u+q1iN>J3X_)Y;=$0)(?<Xz;v6M&41k|S%N!Zd2R#Uu}1#OOplUn5nM^_nbNwK
z<uG$tsBRF8n<q#%lf%<kBVN#o1g6-;o0?u1c#3UB-gW&3;C~FSt}d?3xax>iE?{P?
zw0#?5Te>|^${Lf09U8X0wOEJdD(^2#gAS)Fn+uUP>aYxMTc<F2f$ha?M&}u7s3q>q
zWULFh3N%H$)#MRk=UIt&E0`r9Bb0=YD*?Aks#8?ZCJJL_w5m#)iE6`1D&~kZ)IoVc
z9uOEB4Ehgip?}$bAnoTuDi5^Qnt?-0Il=8tI&RT@*{2F#OlgpNcGJJq<2cp>tV|5F
zah1m>=ngP*#CHiO<3z2~7Rp`a4N74kdWs3P^8gtf&*G4#rqD2_jsmBd;{S=(qoIe=
zQD6e3xAUyJ7t`mNj2l6Hd4o~y!T1(oX4#C;#An%sa(|b%3fhF|fO#x3T)#*?GtCiu
z{B8!J?Bqc9R{mDo9!GDI)AQk|ufASi;8~l|)$r)7=fc^jas7^#<r7AF$U|SaTgNlQ
z;qiI8xSgiaQ`z^usRN4yu2guA|J+sz$;Js-2Kc`6dF|GS4iv<!JdNe}jkTA3jH5OV
z4t?0}kraa^VRzfCyWV!i+3^n;_%$pi3%!$|Q6LHyVT`K4Gat}HNt4P^B!9eelfsCT
z*d9K|CvPb0JME2g-_X0ou^%eXK0p6f#%)7<5mujN+!~A42KG6|t!2^Lpf(z}&`vk#
zkn&H<_)%cW6{T=6W1(y(L)Qg4sM_cFR<6;5u4FpE2QqhY6Z_=ir}N~yqtWoEBX{F8
zhII&ceLJgqcJPlKPdIF4vVYBtrb=uU1uvo#Izo*R?0+zYDtShmBm+prwLU<i$ISKA
zv|8r>71p?l7i(DKRz#M=%Kv?g@c$A6**(y3>~`*O!x;u@W7B%5rhz(8v610*6sZ#u
zVNEydFv9!8gI6Ei>TWNNT%x(XkWr*PZz_CGe#?s0&y<6p$(R#tT7OQVc_KI%f;>NP
z_YYRl#j;*|uw-X$1vKgGc95K+je1&q-C3n0VX?;<SYH?s+vzmTr&eDaK8;u{Nep5f
zlFwB(rO*PxeBWD^*_dZMb`>LS{)dJZ&>@thrctrEixFZxP-y#hcG42I!s(bTb}J6E
zxz)TRCsxfds&we9n}5Y3R?)RRciYp1v5n*C4YZdRPg?aQCjeKI`@ForiHqqQ43Oow
zDrD3WUldLYpH$>)6e-gMO6jy4+y@iS&}O4@l&JzxTH#Lq;bTiW6Gu^u>wo~bA2cxb
zgYn;P5fhd(Fb#%H4Sno9aM;{xk^|81Vb-x&a9hza=>~It<$s%D#avb1B@VyQZ%~<P
zSX5eIm;&Ao8{k<fp8@=7@0`G_qtE8NH9mM?z4;bh81R;u06sPxg0xJUxKAkK1bh-_
zH8l26rC{W$jfL(h;<A|(O#l*GT_m2Qc_M#d`++unaxv$r>ZWQxgiKQ?HmI+5snm=1
zDr#hQuW<`2)qg|dYuK$CYM}u<Ts2tD_sVuvslMsEy&asOdZcB?S01xsJd`&Pq;iIC
zD`GG0kThj_(YMh{7vCTnjzgYi3}e^cZEKd`Kdy7roml!CzDmr&noft0sW!;@zHzX}
zuooTCv1g+~<by?V(*|Zq*_a0-B;vdx4%*v}>Y2`JEmkTpMK`<tcTHdsfZVceZ7n=n
zN?Y_oa_Z@gIakyG9tOuX2A!}@C;9}n!P!riVb*<?gPYfV>oh3qNbC&7h)E3bBImqX
z){z0ok*_eIlP}dqpYblslRi~Qe>t#&5|KPhi%87TrDiUdh5}#;dr;Ky529cHYKZtC
z)<JW{Kl)}uzx}0ndtDg=-l*u3%iyGDZ^J=rJ7p)6L8!6jEY79_ucgD*Ap6OrAJI`c
z4J8ya545lX=7EChM5{G@<TUp@Vr}gPd*Tzw4}jvj@WF3I3X~vyd2YiSf6Qa%sM}ru
z6`g$}2ZqZ(4fU<-Gig8(>Sh&x>pNo3T|D{FFw57*AkGYo7DX#0M(yt}(Ch_Ew$4x*
zuKWJ(s|oD{6RoO2W`faHO+=oSSz#x3VPF#&UbLYr5~$N+MJI1Sd3Y+bTDuY{dQ_ex
ziCsh4q3V0=_6JN)Weh#Ge}Q;_ys>O@xq;X?T;~vg2R1Y38N*!Tpylx$k5iCwHXr?U
z1;EZp0erC<KJ5FPqyR0N#_q>`@%fEMel3!B$=zw^&%&pvI6h0c*(w(Uq?O|t#F2J^
z-P!Ae(Ep-^2|1ixX~I6Jfqx3Yg70~J@ho6hWn1i0^?uZG#a^cuMb0)wof3F*vf`TC
zY03!3RyUl^0V4O!Qv`N%SmGELK&M_+2M!<D)#~D!>{Yi~37TEA-V5cdu?2|)*0Ilf
zP6yhhU`vxpS1u<wMP$;upt70Kf~wOw8BOnoo#1^3ob)wWHLavg8QJ<k{?()|N|KYF
zS1JLplgU>jF$nmp;TxI$a-)>TVkG3Hc-)p;(RBH@i+T0obELd2z0f-#MR@dW^h#z9
zz~3OzQL2+2SRa3{{+w9xdUP~8Jx(rxn5X}$=Qi?AtNSLb3)m${#%c^X(7HmasC)eO
z==z!v4X9ccrYuIB5&Jt7J%svi!YmxSw>fLY?yH``f~KFl<^`4re_IxFa=3}kWVTf_
zAv<xfO}TAj6N}p2-Hp}a0&4O2ENP1x&B9M$99j<K-7<f<_)c4EqssCSU7TN!u5OM;
z7gsyX=`ZLh(v^OL`u3ZYDV~>MhY^l$<GezvbLW!t;5HXy`N3I^DUl5=MjWCbvjJNR
zGrm`CQzN4C&-k^itGdDe)+_60EvbFV*$ax17pM4T)>jat3?9v@rh?1BWQjqfqAn@n
z@X20FDgJ-sGfZ~eY*m7!vqg@LOq3MG(<p|reOl-vW&$~KK2~!6^ECr}w03ZF{^L2u
zm~2xIY?Q)UK!cd=#eNsL;+Ta}F#zbtKOTKI44NLc6p&qOlR9?4>=n!2bJwf5YMWN`
zu%%=caj6IJ%KzqHU?4_7ki!pQOupo5DHlfB^PYdT<^AsLT_&Cyes7eI{Ar9~V8xS)
zOLt=Y{OcW1&}hkGA22rJkfL{_uv8vnlYYuGdAc*X8xAZloh3be<Tr}+q_Tu%wSC(=
zB(_))l){T&F-gMG?0Hs!YCwt{XGY@zn5n&07Lscutt|gGF{8n8r|KXDhF8P$<00vs
zm^FV@*N;6<ryuWfUGSN9I<qa=!m>2Gh0fxK1BK(>(?`2KP~@u9v4FAfEmXiKl$18h
z??svMUW*6EnBweFJdK{H3f|LU0=AJ+F>OSF2VzvVAP>@vf<f+9^R(m`D7m7C{D>CG
z2NwOFv4T89=zUoU@7i>RF#^z9Quuu->8pPou1(P^6$pjg|2F9>O%eAn%ca!Pwq*5?
zhef1+pUekOC^;KgZ5ve5NTC20TSJz}1lIvej;oxXi!{si<v$ouy#y->!`$j8K{0VA
zWsD`RQ)_SWtEd55WthMP!j8dp^UA9<6uBi`bgY^Nj!yV73}cCQS%%pum@=da@78~=
zgl*^bjtSx=1N2a7LxNOs-MHJd$oaM-j7FuN@)9d0P+u;G5|M3-VrVI(s%LUfl4Q8D
zJAlC`Xbf*Oad2Y4A!XmeG&`k34u_;1*d{)um_r5Z8*NKWixD){?Tv|FFgYWbWSq)`
zq3DtpIIC7{(iBB?35M)JF`H@TqUe8-JQFI<A0<aAYMJN*zRp&a&RDU#9w1kKD}yC(
z7&tTEGx*DT(0U<`TakoTqEe3}9APh8kSA_9C`P>#cu!M;d2pTE7F3_q-!0qoty}Z%
zISq^pKAjmv$4G;5-^zn60nnK_WOOGN908f~=`I6Ar|+i`R6F?LGhak#KJ$M?y&Pl5
zC+a3KlQ9P~&aLk5DOta1NoP_o@(!LhrWC~UqIg&>Ww-@hMzGc=7NnI-n}|6@gBxHf
zLzLcp>mhCQSu_bxLjvp<snlDjP3tm-XthKUO)agX`;1~vbzq3KXUS<#aUQ1+rVOEC
zb#qQv63k}Vgp`ElAw8cd5BYzzo>8wUwpk~>aRb8};DW5$JeQ|{spS6_!ZNu$(Jxfi
z<a(AR`%XLwr5-fU=;TFK<D4a0S%J}B?m?fs<dkx8XD)HaPZn$(IZ+qdkycsZSy$d#
zp%Gh}D=%0Rtzv!DksV$(O(cKIdzQ)q#sijp(hP77L6B~ev#Lf`lU#o!oQw}9-<g6z
z6GL{R3KGP~lg3agy6fZmO)+8GwsNUmud7-tVtFuolr6*=pqy2D+_ezl@it%$I0>H;
zP+2J_w+*+d-Z*O+IHc(7S+*X<1Ad7!=Mq$+ZqJW1YRoNEp8R*tK89}^hPGoH=A)bE
z%-tAqSa|~&HwO9i{PKTh1p52=yW!Pnc(p;B-2??uH^^*pYWuN-`c&vMjc2#Gr6S14
z4H>Ez%x2lx=W~JKC2a%k^k{Pg3~cuynoq%aC)da5j+r&v0%oN7+I5Vou;dK@2o~%%
z__Fs5!_?W<x3n_5q7{`%Fs*)g+vwrLKImg^6B;`waN=`5>ezo};0%a`V3<za|0cD3
zCy!ST_hRImYXc~}wbQn1;d5MI$TpMEN2-y!X{Q7sFQVhQz)Me;QL!ok@FU%IN=J~8
zhH4)nAaS2L1n6;8SNU0tH|WT0gz&B79oQv>u~OHEfdxtTB$B>Kw=zAc`#NEvIWh%A
zUad-DR$Q`nC?0>7Z&h5Rc$6up+q9^HHrUZ*fc4bUX|0<O@u4*M99=_K5}K+0oyhTm
z9CTfg-YU)B1z(UWue>5xm_nVJ?vhr9i#T*u10z-9RzUHrD0|H%oKwtS(13uYW9OMy
zmrsHQqI#8!=6T3fp8bLWMtpDyxFecopl9UJcdX5hSvP+vqvNcMx@7a`++(9!Q<c;J
z%ci}+Va20{?=b388|;QiE9bB>c1fS(Z%f#-`MyclwS{u}_-c4G8YWbB+b&3B%a_F8
z-zMzM%2WQ_ZPRAVdw97E2lkpZFdScCImX>w>iAJjc#15Nv)xWG|J4-4eUAER)i&p8
z4(N;KkZ&#Ioiq~;NJ1BifiiB)5j)#Ix?k+`cwUH<+4Gg+&eBS;T{*S9Fe!8UoI(N_
zlh0olf5Rd$U6Cmejj7iAS0CQP=ip4T`*lR*`e$?NuXR;)tP6Z=(o|>?w4S8LU>s|(
zP>X%J#RrPgn$VVc{#ho}5vCBXN$P5Volu;^(bd(FpD(=Wn~qdDp2)lGWCmukcQb;U
z8%d*ytA#bp4qzQb5xC_?*J*b1kAvSc&f>EKe}$c6LS12vW1Hy3KjeVAHnv)AO*1be
zuuPL;Q%;q1RVjyi<(Jqk^6fZ~gw93u(014`gW6^z?_1cpOf36c9uS6ZkvO29b)ngH
z#8<zwav(FBx2#7kDw{u&?b#DIYrdG)&FgT3*;)N^+t&^Him<KAw-)+LmiRwD<_$Hy
zf2l2hslnD`Sc-OgXXEVk{c~Mqi(;NM^1(1<rIdp(-{6AT#BUpk^m`asEnb{0m}sj?
z)7GR{=~MFPuq(ecd0{gh9T_iy6l$fA=?$})-9>W~vAnuH^Ro@`F3;H9a22p1LYVL1
z*|pORL^NNBcQ)~W?^N<KP{;%6L3~2~e~uj_m~|G+xy{NQle6?eW`lBWn4Svj3N*?f
zY2SH<4=R(^P8Ml*P97SWJVxdOX}gq)Iv+?<r#2C#0m<hxtxPv`JJQ`GmKE%&#6~8&
zi*M1yeZ<WOMr0utMM+t<=h-5oc1oE?y(sX$gthW<8#Tna;~==RX>pWu8`mg&e;XHC
zp*DfLvr>Q|WjorvRziH`+->Hb@5SN27xSeY{KphDo@I(Rhvafs4~PVUk?a~iVgsh?
za-N0~0iW;}lywLb0Kqt=x0DoKTB;ben>SfR-y8{Z$|3`l*476pm>fiEgO`)v(BqE$
z3c-Cd*|Eb26W1NcUwW@+md$I*e<~`}esPQK(E(lYt2af_q0C)Ie>_{m%Rc^P{rfuQ
zAXJ*Pw{+SC-UhagG?{5xW>V8m8~GFHvJJ;?q4x@1+pChR4k5)alzfx}CwG_RW@#-i
z3$(WL+&kS=du^}+<{f>qx`EZrh+&o=Rhz=Mt#F7(i_BCQI-X&8kxC<oe_%{<D18U2
z-y_+O0mcNu%jPS6hgz!%r_XiKbZDIF3Y#;7==<T@%N<NAe5k1Oyl**OXdb|(5pK32
zdX%4ri6z-SaNfDKis8)-wOWlce1408MgdIzkbvp=<pzS|nw~cfn*)6R_t1W802fe$
z^c<1Ze6yvstqVf0bk6A6e;ELADkn5iKksydcN`TDWJ<Z>Cu9cEh1)G%-Qo@hE_GQ(
z`2W-LWt~XIg>#;+^2xn6Mkn)1<|uxNYE%iMeLvXW@AJ~9f8lCeEbD6U{)4NEPcxB#
zs*RUDg>>S#)S4I4rF{J|BP7K@Q9u)^A?R54VoU;e7}?gOav@uvf4?2O8{3BBp@51;
z)?+48Q*T6}jZ!-=xTtr4y;_P1FG4k`g<yy-@5KVQ3{-hqxnmy#NqC7wirW$@Ddsmn
z;8$q&0@qbz7sx!D@XbNt3Dycy#7H~E05Cu{KS0fFnwHaOUQ9SsIv%B-DgBf1vhrZ_
z9E8E0krG!&<7!>Sf0!gW`!vR_7FHC|%cpO@a+`J_t@5cT8=cl1b|^ES%b!}gX&Hq8
z^_V#i^)Xjm|HY@eOrv6{uLYy)tyBm{*J;unMb@w}Tt$!P%AB>)mBvP$;k*Z9g~&MW
z`8Znhq+x*(LM9V6PY6<4pcbj`u4q6r!QB5rr4eq$$K#`if6Th@m{5>z<n*&9lDA%2
zftq%x<XD=IVf{pfQh36LF1At3Z;2cuZ~8Xj3{e%a22L=m8&yF<E%CA|yO+!E?d`pw
zluWOWj(?1<FNepcZ%&VOpseSe@MC4s{PA2|bf=n|XI>{B<akZ8w5^MFG+uNESLG$~
zyiu7-z3T=_f3d0p_L>&WGU-OiNhxfnyyb#eiqg7UPG;@c9!5#-n8u-s=LAQ#<jUV1
z@`%kUAzjQJGNZB&nmC2j$$6n7xp2;V_vdV}aG#U;2nW<k5*5f3>n|-qmciX5!B>tK
zEl!pd3|7~z$$CaF*2CjDxt?`qr8O!2)@1f3zTEj>e{-ypxbQ`UcUr2IkmBR2Vvg(n
zq|7Kl507Uce^L~leIEc_t7Qi#;87LaPcEi{wzAchnlSl_$@x)|xklm|MC05!V96O=
zOw8ycU10`S)JLWwopY2x>~;>X(!?V+bUSA=ySL6C-AwMiJt@6A$Zq;$voe{~#kTKV
z4z+bLe`C4IyS=#KuVY!Ae5o4;9B}Zf#=k&(>noct-X>Vv0hU}1Z?1<p_nXe$S6lN4
zJ1yR3U<d4wTmK8Czo$_Q`A)xhrhDekvvhr{uE3-?k4j%MBhq}ej8@D4=MIQ0JCK>S
zWR^7!0RWchg-SP_;K)3!ylR9NWp1F$h21;vfApeeiNz@L^Lg8TRPtrgwY}afkf@F0
z=*R};i&Fb!hjeKoa&m9O3j+4_s?XDo>_%;9Iu72VTsu$m#*-2)Eoq%Yk|n@zSw1Ve
z9YvZ*(uPKj(;qhgyOW6rw)>Z0!e$08FLyUA0E7MO%fD{P($LJ_?X-KxVgtPf-Coa5
ze;0=ja%e(f7qFT%YkzRbNfXw-9Y7H-lmR21;;Ec|ggM6eFPi_9Gau@s)0hA0Y9#uw
zqS60ad>fHIk*>7M<a&7ZZg`a(9Ul)bN6F~)Y<O`q@;Zr+O02pOX?!@BY~vH^oE2U7
zBs&(a?cJQxj}mhYm^~^yu>;A(3D<nNe=^I52Dae>68mwkms0%d--OB9CN<Pf>`;d`
z7j7y@VH~$jOihW|j_lUJ!rmg>a6e|~*>Iz$|FowVR*!eTi48k&zeKpUfB9FV>efB*
z?F4iLk)7=QDa~jBq9iLeZ9I_|CdKB2^qXKC<<5?(@z=~^`Mf2QZkd}qdkay+e+-m2
zva~L*s1sur#`)US8C7(vZSqM>_1~LU6BR>o0{yk<yJ@-v*09E%M!`#VY<aZpDwOuJ
zLA}>K?|_fYXs*UXCF-;&-{hU=Pn|8(rHMF-!5G!OMpT6yLrPl|{G_|-c{MCa%UYsy
z3b<KntPYk{=1O&9WN&kOvsc62fArmuamE(>&DE+syPIPv8|=4P%dLj2TI1+n&+Ku{
zr=+p-zmpxlN!<=l!ed)rq|>#1=uh6bT5Y;ln`IhKz9ui54XLKSMkKH<TjASQ8X$_>
zkDP+yvmrR$zEbzwDAe%uy>{_nHjQ6jwW*%?xHr`FC3?N)q{Nh(jJixYe}w*2jEv>C
z>gttHbgX*9`TgmF14&ky0-jxC_SW5|{JV)9Rda<orXr&7CW&0%V%G3VZE>u=e#eEr
z`4%30Xjjwf%6CUsuaCYPLO<SO>WZCv7376r$*GtdJ@7sE^+O1;HuXlW>%8xGlRxD4
zg=u88v|eGf?TRdOYCT5~e{<{njF*<URcX-<1Uob=t!#y()96=6U##5m)(Tf%$Q$qE
z6>)*9=<(U*UOQ7RaP628;1*Z13|G9#Z0R39v$&e>4Nk6xqnoSq<ZO6-4P2#5Tk|qE
z!rI#|4c%WWwIELr?I?rDe_KU%E^U6*ZJA`v+;_P7-{f9>gHZP?e+JkJ%Fw5?-mqgI
z*nqcju`jA{72&Oy@ivuWzT^ry)QP%fW)`2sWTj45gf4_^JRRw-rxUqeOx!hU2^O=u
zN&nQ%;)eUI5n}H1xlWI$<&DNGB%aA2(i?~s|3KmWF5TGgABYa1F{FAs+)Tr`Dua-I
zxdlE0aY;Z1t<^#Qe@Jv7BaByMjDduxW1zqN6P+PfnMU+>OG|{`5mi~U(3IoMXb=br
z7+cs$k}1e)mQJjV8U^E?nNXcjlW@>|H02a0V>U<h{ay4)K^dF2#xg>WkWwdmD7?&z
zDyyQdya`FhmnmQx76pe%j4L|{ng~$Q>20;TtwgQj)~4B{e>RXbgN;d!fD9S;qcJXx
z>UR%ckc|Kw&?WkqSJG@4n<S7dO7SBWLKTOk!+0ykl{6U-(5l>`!u#iIH*K0wf9Vbl
z=XEYV$vZz@nu(4*)XPgF;P+@s7fCXUNIoPgG`8mKC{|rOolf0ax{^MM#fK{GYgd5p
zib=-VIn|L;e-$lip|+EiOucpYPj!OghB__j6EJiY<^DK`UNyfWxsh$4DVfnseU>t!
zktH(&d819U2VqAmZR(AE%A6X7s`kwX(3|;Zg4UX$hU<jyBg=bSxYap<khGC)A*pT)
z|9k@Ag)o^#2OBy}zvhhD0j9oQ3jy{plHqk)WfR&xZ3Qt!TcvyaLzGFes$t@&yb@p{
zyZHfGHprV`TJI&Y<D9##rO<Vcp+!G`^Fwm|<LRX`4^A)6uhs1*MFrNzV^&fi5-AGi
z&HG@@4?u}0JOZFVP^r<?jkGa9_RuMApk*g`G!j&a{{&D=0|b+?kr=bnY>Ffe^nCY3
zWl_~z5G?=z<dbTVE)lFb&{K7I3jhHG^#K3?1QY<1sgW!J!jsmKRRL;~ERtOTZIg<U
RQ~}JB-;y~735x>-21)<`

delta 11422
zcmV;PEMe2BrUIU(0<dmB4caZ2LqsxE&IK(10Hl+9KOle1KDbiMKDbhKcnbgl1n2_*
z00ig*008BE`FGn!lJM{PD=_lDM>0cU>`Z14y=A^nmgq!@b*w}=oAvsE5ZRPqkpKgL
zlDT>Fzi%CVqd`)RGkaloViD-BuI{d`tE;PDL<e6TM3Z8g<#&hC&FIa+KjNFc{r&y3
zV!E1(s4jn^EU!hGPU`3>tM8-Y_M@286}*ko=!f(%joxKty-MfNSvtATauLnSViBc#
zm+QL7{g3h9-n+ES(%ZSHqWV6qqeXUiUq_R9THSL4^}UFGcy|_6by~_c(>z+`Q&Cov
zq7-{wYV|x_0MgNMkw1#O&Y-Dj5#>c4m10sX79xM2BJQm~s)E}DG;XnifRFR+LCn`Z
z!11^gX)UG^Ks^zY=+FJ=>z6P8X>ac^UDfwRc^JJ0u=ipv7VGFFy%TwwRXAvS)b}Kr
zt?E@Nk|fF&%K{Ks<rxgJNah(1<-F=g>1|caSG7pE#2(k26!STZF7&2SRj1;YmDrO%
z=EZ;A9rRlLEGn+HTu+OMs!-SKC7@KQLX|*}`d2Y|5H(k;R=3Ntn21U@c3CV%-j6O%
zFNeCqS~gPO!=NCcsKO(9(T}d)0!&r>Nu&>@nC&UVzWEr#=q_QRWq~ry??gYkPph=9
z%dh*<ZCZ({F0ost&MeE*dG;TobQ`-)XX1a2`eYS{Zqx+~o+|y7_3aU+9LYm|N)q`Z
zN%r>kkOr#gd^MkcpXSrKD7$iqWBI#xxEH}Q6|+bzvbqbSIqMURl~ef*pCy3V+sgq?
za?cf`fdjU;rvTrH`Yrqk@AeVD{a&0-r>d9@fvXUtmb&prSP97;km^&q-tX=0y}o~W
z^JaLJT%Z2i5Ndt%@}K^G?_~Jq=;rMxIXXGH8eU(+>&~mM{~>+}|M#k+zg}Kkjo{PQ
zfBEyD|7>3VJo^6PJh{BO_}8E965r?&$4779zCJqsF}WUIy@Q62j*o|zqhxe?HoUmO
z;(yt@{P~+7lItH&FO%bow{M5XqtkzjbHXC{p~K}zS2x&!O4Qx=owcYs{iw6X|J3xK
zawR$+pu2lGEi?u^x!sSCi{vpAPklMt2@sZ?C0L!O^sXWfvrH!suu7t$jF<+hrI=*1
z3>N+EIvShmW8`#DgMa}12;oP0x)2q>K!%1N4wq?}E+W<bA<(PPzYxOHeKrNTCvM7Q
zlNm!Ie@Rh4cD1aCzv`Lh)rio)l75oOJOfS&!>;g-6ZaF9M&=6i3B`a(zdIfN1k-nR
zc65G{oFAPHqd(&7<n#>5CAq$N?S1`s2TjvZHiep<f6qJckEkZ;QY5)}0)Cl`t~Hgq
zkPBxB@KrmPM?j}v5Egw*^XiEfqB|gQ1!5+Ve<RYB|MsXxDL?|`$zwWS39KjT#D3Lf
zh<y)WKRPdR!T+`4IN&7R1B;v{AJZ}c=6c^XR6Z&*l&u97kQ4&q@9AEYf`0<%0IC4i
zS^;C3prDH#g23_>ApQOW6Fsys%jVb(;yS;+{3|e?azCCG<sz-S7Dw%w`f<7hSu*Xa
zf7*dhMHS=k_+ydf`o}aYadGM2!1m|V!-T*<8@;|WVf%6XC;op#?f}XCPx~;ry5T^}
zrp{zlmN4)KB}hpSL~hM3D1&GO$s=ajr+&0w-KV7>6#Ui+3XB!c1MmWZXk<q=ixgP#
z308L1#lJ1#V$lJ9vFQS4jHzLsuJXyfe_F6zr1HT_T>K?g8SL-(nVINcI8Mc~t_JTv
znDLxuB7u1XH0r?{&{KpVtGCnu@U8K8+{TzyKv-I=21-@JWr&E!AyXacCWS<lwLGjQ
zp@FIuN73mFR5&gQ3YEgjux6;0qar7k_hNyXlqwsoDn-SL6?4xI%?g0V@$bv^e>Xqi
zS7`1cpRb_<h;~}8aU!q)eA7)orKstG772RUG)j?g=S6-1FY;+xPI>*Hb^+51)j{XI
zM^yvyL4`(vNnvDXGl7&AjSbn1Q3WRH0^Jv^4-<M$vl<GiuTCfRlyW!qPa2L5qwS3p
zQ^FyRY+9B$8KCWas>?Kj_oR#he<)OO@Lz({b(%9XbziLJAVGySXEYLo!B|%qN7S^a
zkp-gCK2}JK<DQM1MUaO$z~d3f{&C-QND{oFK2Y`NbF78@F4uU~_b?@La#Tr#S<$>z
z(L;s<tw^^74O&=Ko39qP!2Js*4@3WzC?C~?DBhXPs6UGOGzRho@KBF$e{-8JqBm(a
zw<r*-8Q|gwig-e71NXRv1Z^>l63h`M^kG>Rpe!EKv|wEl3R(gHy#Y7ZoLoWDNWC@W
z!=2?dZwv><%h26GAy<hdGf4&1;y;oj8%^T<K2AR{rTqh4$Yxj{h@mopz@M(bj-Waz
z!*X7(3DNxzYQ$_3(iLUfe_9?K96+%HSlPE_@gVYpWwsRi4w|Ycs1C$kWhYogkEh~x
zb=O5EiDvGdCQGtBRY&ciR?32uF)*4i4rG3*Pkk_6r^TuspfyH6vYh_bvvY#$XMrX+
zYnRMo&0LZ3%T{bR7h=jRp;|4q3i!g~q!pu+5TpTG{#`^ZW=v2Pe@{t`>N(0u!WJya
zAyjl=+0Rk%gI><wf__A=5)|x4qFf2E`oyDPg`7%|UOkP*ruaCL#;0H&At8?CS{>oS
zo&k{(6J|LuTg_?pM`N(o3&v(JLun>OmYSS``8@Fv2J30_rak5c#FFy~aK0k1(=1nv
zjhe7)8vMB;{-yW_e|HonqLlr2_=i~(Z%&7APkiN?Uw$_v-Fl;HZE%khpaYy2Tgf&U
zewH5WfZs_eR?AU=0Q2}FIUAn62D4GN!^}7l#Iv|u@BPaU?R>417jigZY2n;5M$xaY
z{@PIs&FPfsb-!hVBxMVr7OP#R^HwE(!)Ww9Uez`;&JvMpf2rEGmiiIlVV2ajsJE;p
zAVOyyAt8<lO6!th^#n8}Tr<c(1gb&Y!mXI3u;i!=Fzf6tUnoNncv+d&1&ItPdM9a)
zG6>Xz0{GLsNT){V{!Nw~pl;Wpesgg))Sw9WLMe-;8C;<D3I*{^JQAnRe$^#N{r1J^
ztrqnY_$&-qf4z>EMKSN~?amCY{|3y!>9elZU=hESNBoas5nq%s?9LSM3n<R_g~t{6
zU8{&q0ar3WCPL9R*T6NB=C1tPS*oHZZX6+r0tmfSdA#paw%|x1LDC}nN)Z)qIVKku
zz@109<Wh8*s}(D8%SZ*5y2dZ7tQ1o)1IXZ;D&=R&e`vY2CaJB^Ka;mG7`v)9xJ~XN
zTWyo*l15O=I1^|{bS-EOiL?>i&dfy72&@p*x1^YLWuZ`8q+(kh(tMhsL#V<rg}#A>
zK;_h`fswT*S`GlPuE%UD4OIiy9es(!p*G!=;jf@=oGPqvA#rFcPmLa;kU<FpRtjw@
zL|vq?7IpN?DxI@IN=u|Kcdw4Ik~6*vejj<0#YroFD36-#2K6D|zBCo1#j2|9@plHg
zF{b-c(kVtN-4h=l7ctp%z_jFsSUduw{06<>S#>IVb}{P`>a7bzEeK#8D5mE{CA#=u
z+<!Dw|1bCzNQAyu<eKLqitN#f1N#TJz=|iNDRe=7nh0`^xMZ%X9!3|YE_%(z1bsYK
z%+H~Jp}JgKwy6XWGrn>HsJUpUTJ^V{tZr8KD=^od@-FZ7X;#qeFqQ;P3T1J+sPuFC
z>cKyZt_=w2u)<@PK6{{IuMhF{_cx>D>g1=ZXN(3g$MQD46N%hal{C@yUG7G(AMU*%
z7$q9Mj-CYKW)1>p+UZFF+1QN)QeA*no9LZ?%Wky*Z7G=w-1+qy#Vx;5z=Dqc=#cKF
zD&%wkTnxI3{TNLDFaV`&bcMThr{|;O;`I;1<56;YLL%CO2SNhmUJfGyLe+T6>{-EQ
zli~)t*#$J_s-6vlr|proPlj)s`s>a>tXbN*4ydmJG}xWX8-1^x?(o?}dvd6uPW!Td
zJZAnw3KOp+REAO8V(LTji~diVO}kWu##XNN9a7&|RHqZflz7<^V>mL9+5mK2tfGg!
zcw(0`{3?}+_U;U~2<HOLIF?MZCsu3%wU5jR*#qN%5d>gsW<V^!S6FRBMp{4z%bXYf
z1u7IzAUXO{g-ho^SQvj%gDMwwl`YACAD5u(WfMZ3HZH}d<vg2Yz_z5zv5;n`9E967
zDSe2N^3WdZF;}c~Y*>)B(mQf^%^Y>~+VUm~R~T;2nTg-RbG>qmN28DmL^xS37Hf*9
z=oYq+CX#~kS)C*lg3t&(P^HodsmU@<;dTz7U`Ph9S}Vwnugy@CL|_omw#E~G^0LZO
zz*s?IOBV(FxNTIEomR6&494v@nK0F|$g2!V7&p;?@uV0FVa-;hEE-F#be4i5=+wA0
zkbfUkz`&W9Em$d7Arl?{b1)U;{WZ`QBF!taS94%|8>IG3&@IkU1dG+Y&XyQNMa|)Y
zWF2{d8%}qE+p2I=2ptdTm}jqlx*&|?)+DSafYsc=AxJ-==|k9(sE#I}eHDx7kagj)
zH6UZP>U4Y*yMt+4CuPOaR_qlBXLiO^1o}c&W21~7#W7FcZ2^kFeflVj5lF#gvlP|q
z+f^-httjq5`lYM(VY6nbFJ0cy9~`f|&QfWf@^%xlg4=ZRP{o$#rm>2DKsRMMJn*7q
z`s58CP&iDVSum~K0kU6L+w}c61KPVcq^{H*e5Bqa8)eHz{=lh_F(PJ2Xfq29Uoa!0
z)HG`bV$X-&+;H6j)dCiq7EZ)0g=xU?r9p@r4Vgh{Y|PoKNv$MF!d4&&_rz!8%9dZ#
z+VEtLmT(px{`ep2z0U_3A(qzupmKjyTE(?TbUgur)A5J0R&WxLaFYQ}6n_WJ1FVM?
zVe21mA-~U7V2XO>R-hn4C`JFOJxA74gsYpl>|Jg+Hc<Cs6SO&aF6yVEe2}g;ZQ-*z
zplin+BNiL_ra^`Rz!dT@q|5HEidYjy!gOeNwc*9{R~3y<vz{EH7pk_@A&wOjZfFq=
zj2i5+YtvNUkWh2;z@w3Vn13EZ?Z&hlxMQ#HGO%QjfBGHoTjhHjtOjf1<i4p@?^)`!
z!bxdZI>f~zRoeZ?QCjGt+J7$91La*{IZkX)^B=oq#WQ#t^$_&bd4#(2qs!U|z^z~y
zQweopaSeFjv-F+Ht^Ij66U=O+^GwCg+>xJAI!|f}b}4K~9J-<+7=N&I9Ar-c+V|G@
zPKz&YjCZd&!M20K`QWiR3MKMq-RBnp0t(<@=)pEb6=}+ibM(WmNmhpm#G{KJ-kqu0
zv)#_5t0*<;)}at~FGo|*v?o$QqqrTI>k?FsQyG%9O40Ku3*S0~VQXmY79MN$t7=L)
zi7`v|F?-g=c0Vf7=zot;-%YzjUo#M<WctZiC>1>2Y?a2bA>JL0FsfC!A@DB5AywL~
zX%)SZ&}^E`ot{}?Ho8Z0>j#Eaz;c_K&41k|S%N!Zd2R#Uv1b0uERT|H5tO9%N@?B8
za)>$1R5!52%?l)($?0jxh!-T0z!aN!OVjHDFR`u2yRP2=oPXif)y0*WR~@m+1<Z<-
zwr_)NOScDdS!43BL&N5`7U|Gh<^5%8(BX1rb0N}39hSju>l79*kiD4A=sZIWwZxrS
zjCCQUK$FE=O&%e3o|SmFf>i=MLU9Nw3Aj~KouYy^Q5Z9$RaMeVR2xoGF-N4K4)P1~
zfWXvX(0^D9&42y_$9^uP@<6iIOdMLu32t}Naf|NDK2`8yN`ut1oBpL9$FUwDWg?)B
zQXZe6JHV_F-zA`o6D6lDl)K6sl)^;x6cK9Y0TMW##UV{ip<zxP1x_=?{}Zi8GagDu
zfd!D>&a>)XOrK{mZUpt^4Mw#G<6DH8Wivt(pJf-yU4PyxXcM9X=CR07evx`+nj`Y~
z-3&t6$${*x{H?Y<j@~4v=fhE7eZ9WGvo@ov;n7*og|kuP`W-FHCyexvhrV#Pj#q|5
z<MVWJJ58gfvhRCS2i6d{T;VzXb6Y7S8z*2H;QPv_wOhkFkP)-;G?w!>)?W58&e}LQ
z^<le5PCb@{-EFh(dfOFe$3I};*C0+7T7q+Hi}XR@frD<RyzTU(m%Cb7i|P(fV;$uY
z1=U2wgoH3gRp6Nq=%E~w%uytNy>gSnu#?!HKF23-M%H)Q8|S_m?-s{?s6hMr{975f
z4faJ?eU@=+ELt1b=NPw^MQelFXxu_O-JnCtKP}@&fhkv%!okdivYpJhF33UEzQ(sw
zjh=MH(*ZsVa~C(UPcD8sPrf@E4SzavH%?=aL%8ePS=F<Hf9!b7VJne;Z6-8TVlyjv
z5uMNxYK&n2gDF(WGup%%fGe)`0TMlDuBWEeGXJlz##Ovn!y30DvK&(W?_-4jml(+I
zfrewZbB7zwFi;zt<e^#y>OjRtg4a=`PDq5c+^oY0?+*`NeQ>M0y*P3Q&FzJZBJFug
z;d}C1R;+%e90X0qoM6*`ath7UfP*2(>jQWHK#DGw_1c3aJ98_bNoTi%_!Mo_lkjy{
zm5zkP9%o>EVMJ`F(=?x2eR23SVzuO85aAGiuCghG77*t9o>*pMp7Gd~jkNh68d^Yy
zP?DNP#pW(Xi19?B?c3Q&OV|phW473>ILzi&^OBrcHOHvZp|5U#7K>O#*Y@0PPZP#A
zj-xlwUS2$D)t8(ATutut^8O|Y(>E9(%WqZ4sKvf0oEAQ*$k!-RrVEtPX*akJCZ3_q
zM&&3|1)#LTo&3Yc7I!9!q8Qf!0dPNPVC)Cuzuh7xEN5UE44WGI*m>Zvxz!{Gpx?u)
zW47S7qGQqx=KRWkH^Yj#s=P}aexu)@GSwhdT40z0-VPh!St*|Z{Aur;z^bFq=DamN
zcwoKx7F`(dmWTj8HXMQ^CQaNYlyL$+iLx3Rd#F+{a@EE{_Y`s2JQPg;5?fs)o}_sq
ze_{K9HvQpZ%2U-%)qV(>CR1#TzS^ZyFWRf9nc2O@El8?=hsM{iTQ$@|19-S<u$u3c
z?W$6J(|3D2I6?JD^Nz1PV#RnUZy`wK4Bb{lUfLmP%Jiadqn9qeK{OnPJgpeUuD#pV
zD#3qT=cc=`^f!E!n1eN)4j)r(4CnjC!5%|ibVSEqjS7(u)`*)nFiXnDJQyJs=M{0#
z-gZ>abXIFtQGq48+4a9`0*e6TmThZG@Mtb=jTa85Uf!5<MNQyga9(533F~yCPf#12
z{bU(N?lT|UEcdO`psXXYGZZ5xF~p0U^Gd8E0gxkKVL&Hes*OJ5UBr_>RY-q6u!9nj
zJWGp6%+aN0E|-P^U<!Ls)btOcU;k<b@j<ME=8Avx&4hmYqIi2<83W#^=nj{`Nv+<7
zgVuJ+P9}p;W6f2ZO$S~}hpj>OlSx0KqjDNbC}tkU!U~v&5mYByt>q(^x#tmUYd6>v
ze}Mb|D6R`1{8l7G363wXZFql!dCVMj+Y6wgvv1_UaOtO^zIA;f4Jbn0tm1Edht0Xd
zlMf9ue{D?S%)n?-v_fpu{{8~ZUa(~A47uUD@9(~v&`vPXsv3AE7;V)=<Y}1|c48L>
zHi79y8@eKfIxSXo@&=TLr!uRxE0Ll{<vEhrHI$uEeUIJ#fa$4>p~rtV5KoXdmrW`+
z5F3Z<oB`m8&CGemFx5C{d349~6eOI@M}J)guyaxXpRI-u`#vWrK#Qia`*B}<e&dl}
zYskCg?zHn~;nP$cpQYSv<%@x#mGc?Ik#>RI)$4@N|Du@*Ih<T>!ak^he+t2Z?|FRj
zEMQk<TkKNxe$;W<UZ+ME&NfAz5_od5;+osXlo5=rZaAF-MDClX2<+yt#4!p$r(RVD
z4j<Un>f)O0RkvCRnq9Nr3+1e_8HohevCn%>2im1zbCXI}E+;ufWYW8!vYC-U)#;p!
zrgy_m@V*01`kJhoR??=7Y<(F1)ub*;;*+0ODgm^U%2y*XF!-zC8=3xcBbUcw#N;J=
z+?HI?bosZldG+CQxV+81&^sVmc=T=bN@fng-@wt4tCJpBAAd`KPONx6IvSlGCzmjo
zr~j(gHquV3`zEXl*d>U^Y79Bhx<ad{d;Iq3`kD|8s9F}L%to9U`#WSkg!*s7EF8PH
zIcvr4QqN#P%g>d00TJPE%VJIrH_@5Qwu&ZXCl0nLw{7gfqIP$8W3{+|f*zlq?{u{`
znk)~`#rgH<>VM{VbaA!An*4&E9$o1-s9(QH8RB&ncKG1zG|n5eI%h69k8M+!$`6h>
zr9?C&OgO|qX7jZKE5284QzN4C&*-(uMcv?kYsvUoBC$_7cR{i7;taoxd;~Vg;L$8<
zDyR%hmKa1TYLXHLpX{}i;y*sa<i^cX#RxiE_|V8iIe$?+j3Ox8Cxt#<9w3KL$BIvX
zzGTNoOZS`eAI~vHWSe-mQ3^}(#$dJ=`(5~oW7bK*4$zN(Jo;`JG#zX%AiLJab?koG
z635;%*HT!uP0~1Q=@=m_<v2_3H~#_?F@ga({1C?EOG-N_*ksRp)|U0Vvv-+zYWS^@
zKk}zBhJSGtPb#k5iP7_~XFx`yIg5Qj*sw#2zLCsQd3;U!D9>c+&g5=3ki2wu^z@P4
zDAJ3{VwTnRZR-%*Vnt3eFMh>C66R*l)9O_NlI1un8V|5c?X9j5Un6d1`KO5(4URii
z2QDzY8lE2yNoT~Yr@DUZc`E&QmFt4fq|=#eNq-iWrPwWW7CxLPocEqSn(cuiSDTLI
zi+yjO0zRRnvRMxHe#Uzx9vovzvq$hWdZH?L&xQ%OMnc834+S1*QQ3YxNHYrNxLeKB
zl4F>pL=X7^tsx&+<M#{+@(iZ;WjVZSlNrJYKx;|C_ocY6c9=F<uT&rua{t@7uQVmx
z!+$83QcK&Cl|vr(kp6kvCH9z-vjNq%!6c(pC;-LQkR>ufIbiW|m9uk^X1Tt+2Lqy)
zVC7(#TKyy_rp=^$vDkHL?G1hvH9)Hj5hx(+7+N<kyh<aHTiiv*nrYzZL?6R6mg|I2
z8_UdrqzdoWu7qvp<&FvBB?I(OX+wfkaev*o+qB5}wjzusrJk~gl^m!q#i2xGn@|ji
zLaKTu_Y{eTE4u>-jDo)KMiK`n_WM!x988l_I>X@%DF>#BPbua=0sBVV64PP?O?7)?
zq8CiA2qqb)B4H@Hqy^5Z6`M3eQC)%|dr-_~nz$(XBhQ4&(?`ioidrV>fUmPvrGGO{
z?5+n$$!}$#WQV`A@|Q%`xR3j3O{u8|tryz36^UsjDs@Q05%RJHd18ixTGTs%_bert
z$JV(mLG?-f-Lk#jy0z|}v%t9C)0shZjAJnFTY0P{06O!Agzn^WBOp^gon?UN^!qe}
zY6m`iW{U=z&umdI$Jp_Sx(Uo=ynn%rajUy~O15uW(wWeUyo0BODTVO7C>~Zz87@JW
z39R*r18F7GCSXp{+y<D+@T51-dN?-vESZF-Ap!P_RO&6%rgfP@v|1vIrk2*xeMT{(
zI<UjqbL6z8xQ^2YQ-)Bnx;dvS1!l8sLP|pOkeyGIhkV-3sMi#mtP|I`fq&f%a6wXS
zo~u*9RPufcVVNAB#xGRX<Z6~B`%XLvr4BUE=;TCJ<C>+hvI3jE+<`uI$tC6D&Q#*g
zpDfroGNLY|BdxN+v#Pu`LNm5BS5~klTE+UPB0Ie7F_H8w?@1~Pm=6&9q#2+LL6B~e
zvZ_W>lT;*}j14AVnSwzJLw|Oo3J!?jCyl98<F1d}H`#<~+scJ@y{>Aph~>fRQMM3g
zfO1ypdDl#Y=i7ia;3RxXAZ4YD+&0~+dgH8Q;E<uOXW4obPxvLSoJ&xNx;;NmsIj(C
zdGg;m`w+fq7}`#4n2&CrGIwLcA>|EV+!*51^UIqN=<nz6hF7EE)qe(Ub`umt-5|3i
zs>zQ9)TcV1X*|2dEfqmVUdT|pU^dFeKAj5;FIgLCr$?J3U|_os(R>QVE4e;Kch0QU
z7BC~t*REq!g*k5kK(Ju9L6^N}7^cp)yrq@d6|JaBf@$@`+XfFG)<GY08`Ic10TZ9o
zQO70&XE-bb!{fyLZ-0)K@8t37;a-e<b8P^HgZtZdEqsa#Oxflk^pR?$UfL<a$BXEA
zF7VRQWmK$60Q^XImC_L+97DB_5a77aoC5SXs;l@c!W(pCHbMB-@ebUQ!dR*6zrcc|
zdk#t8q+6Aq)P0*EXpT$)kyooy7>P^P4#l(bt%!>hk0RxC8-Es6&;~o23?NS}oz}X^
z5Fbio&(Se-rJz~r--#SAxIxzy>8;Z2UGN3B^2#c5g(=jj=`LwyD8!+w8W^b(w*rc1
zMcHeLa840_K@$R&j-4l7T^<P<i0V}?n&%l;dG-qi2=T!qppIyofu4~=-?273X5FNU
zj<YiAlFgrUkAID7O;u6@ESvTMhYgP!zQd?XZLk|6t(?Qg*d=`qzb)a;=KCUD*B0{W
z<E!D(XqZshZMz_iEn8xLf19v1E6@0Iw@sTd>tS&h4$L(&FdQFXImX>w==f1Bc!~^?
ztKCiz|J4-OeUAER)wbqo4d{#FkZ$CiG7}CcLKljGGJkHY5j$Hyx?k+`bY6&)+4Gg`
z&eBS;UAeTpFeh_+oI(N#dyX!@VrIQ{tJ|Iu%O-gLs{i$ev2<O75SXsW6o|%D>;0<_
z@8NTBCE5KtqT%{yb8D}4)pM*1d~4E7=pkr536H@v)?}d;`*Mp96uC8_E%Wp<PpBhI
z0bCQ;)qemxp*V-5tE(eF-*?kD9jS7>kayY146J1DW&=03kwz1xg*D9%U>!sexTQze
zX?F9EgWogG;<Ffqog+eBL5*{pXyG4nKwTSKt+tk#m(f?IIk87hm2_1phkE6g*e&wy
zIFLlnMfA{i*f4?GW+U%g*ttk7`&=IIg>Df$pnslqq1koBSGTirATyG;$fFjO&7aBk
z?1!5*Urfv9b+|$7tbV!e>jr&A*w*D+3w<U@{2!n5hML~gmcP_w>p3h%yS=k<_4@v~
zuChfj&l&k(7_w5zfthb`!EB<pjf3=i7+5V{oGqAWt4fcpNsrQ}<j-MOerxi<W;!`C
zUVj29&`KfG6J|5Ji{>U_dG&hcXA9t6p0T;1Dqul`FyFzmYo`l{XuS~aY@z|*spMsl
zkO#_x_=Nl&J8&@TESGZ|l{+VA>4VJX<lGQF71kAIlmXJdvkV_pCas+;((ar*GBWv#
z%<0i~sT6fSkYrA6B1!|2&sSQRYUp;OyMIY6E7(hkjZAhI-=c~8h?^0N$U-cNlCosa
zvqeVjlrj%`QQ&<CYvtoMYKU`3L2zf&qA2G!tx@<kEwn=I0q)L90fv<AX!lwP(Uo&I
znR`ALr~h8emvZtSQ_y&pDc<~%%UwMfBw&nW*YFV;FjbfHG?d8qgufuKLzn;v=6@-@
zrKIlCQpKp<yh$SZ=0{jl)-XV6ZGDh}$w8zxc)9q^c-)a+A-HcQJ9Zdh;<*F)OYil}
zvUyEeL512cZm~T&peug$rYJg;dCTaJXKQ%b$G@z9U#A>|N{jZEPOHG%z}Ar-W)jOh
z)U?w^{sg)#!|_|_y+YUas-)B*q<{E@;*WCT<nEH(EUo2bf7W)MdncP}uMJkfyrWN6
zH?X>yG0f7VYE$^O6%O%e4Ko#nj%OHNq|yK)7?a#d-(l+aNH%1E@qplE@s+*<t<{9n
z=dx%yG)`rO&6z>;{qXJO4ki^oR8)H2x10_%4`9;>H`@?B%1^_@l4Kt^uYcTH#n9%4
zTCK(zKEK64qW~s<O2G8|audOEP0yQ$%>lmud&Yii02hn~={X{+`DRLMTNjvK>722%
zGx*_BPH3Ti-suMKI4K^elzhccs0^$Nw_Ccp#T^bz>avXR|0nTfohU}ZIZs#l<X#)2
zlX)d`48KG*s)X6TAMEe<S%38DUnq@>WnB&4e{fatX(kd-wehm1kWT!TTJu7>l&@cA
zbfg$43TPrV1Rcv>j7i`QBHNl&E@bQTw_|r>+l+W9prVnrm<Oq;HzLzUuALWL)H{G)
zEyaX|P)%wf7^2I2vA`_@Rh}ew>|-DYULuj=wuDM*`OOdb6`H+3xqoWx0+}ZhzBwp7
zfvg}!jI>h>00U(61Jul>X*rGN#e_4R<5B3D(mx3=D~~m=L73bbDRFf)uGUqINshBm
zW87+CMG?Jx`t~ZfX$R6OpNg{4X-#2=GIP27sg;|SSqO|C6X&5mri$`ke5%VdDwg_M
zFS?#eg>ZD8Cf!+N4SyTMRrGwW%vl><X>8OP&RZ~6h>YW&kE69t8WtEKWHL$ff*_>@
zYLWWxvIaC0%>5ly8sS!ayghoztP6_?1?fgkKWia*^2!R-v_mDw(tHf-Cn}V}V?J~-
zjUs-F<rsd`w+GG)sv4|;6U^#HRS;84yzI#C<*<8udoL)Z(tqot;~%5z%i;0qo6}<*
zDC>DA{8(8ue>@i#-HGPriPwn(IbM@2ZR?^OjThaaRe4D`Z&apH@4A3etg3*$rdhL0
zno)963EL@exgeIJwC;wJSvR(aQIb2Raj4=s!I3Sw?l*@#VzY`#7jtKrQP~GgoI>j4
zx=@i^xaPh4Z-2H}xX;O4gcE8dc?#rt^+ijNWN<f0@Ri|3i<4yqlht)=vYye4_4Ig7
zu4kQDX-z7>H5t8$FLyrJ6ze1&d=cTDlu8m(d|Xw`QSML5i~{uVcm~oZMd8``{OMXO
zJ2(N4s^ETdF%`6xt+v#J$u~^SkCMzaV%NYL=gt93&VRsSVn!$F3Nx^xJ~9>QoTCI{
zw{v(ECLXb&+clfnxpn^MW^(TBN#)&1cGDLd$z)Ow+rD=>)z-y|<tp#?;)cJDd3Exo
zZVYh1!LJ(s0`{%1T)udlU~LCjay7iU9^%?>I(J`f%>(STc$<M8utRSAFO<HXW-;VD
z{o<MGnSVad()F#n!jj@VDt$?eNb}V)S}p&dJ0Y^{KxWF4S<*NJ07#-2D&2H~Bk{D-
zs$p7`d4VnmcJHjyLd{}}QRL_2w*9E&%cN^}y;UGl8^_U+4a#Sw_Q?+E(nRFs-i8+h
z?CVvZrybdi+R$_yyft#|G|d}NinX+)We#zc0Drw@`K;)6)X+q7Y-rXveQ^V@yO?-l
zyMGBLTxQ_%a&|)kFxkJp{Ogu13(f4?PP=!^HqdL(?e*+*Z}=dECKPr7(xh4YgFBqG
zVD0SwYT!Z{EYc~S%IQa#BaHu|^-nqPp*}i&`Jb*vq7M>{{@3E$i1dkcrClc1!>f10
ztAFI^_;`3ZN=Bz=!;71d*GYU-V$_XD<HNaN8=p|;tmwKX*|BhK@8*+!l$dM0>{;Q3
z9Y_XFxaP~15g!`Zh6_aO$GIL#(W`%xC2O11Q2StqI<&cPQ$Y&jxNTwTk(ljBZVfE#
zEy4}=TZWzuH*)$<dx~K7c=waoumkr)gnw)Mmv=R)ZrualK7bA*vXiwxr5OnzO0r^)
zjmPrBL$Nub{3h5&xwE5ce3@A+pC>ZumbkgIw-7bVKzXA|t9V777_%tO*RIZ}qFZf~
zPhzV7-YiX248;lb*BakV%OxPg8g~)}FUhg_(YC8h+RFy@UiZ8MJ~AV@nh%v|(|;QI
zCha_b>1<gpO~jE6#;EQ!qAKJZQre;5C*4iYt6_0k))Jjlz|B%)b+D{5SE3Ukdz;&v
zy&CSO?}m&sHsfzftM=?{j-_m{-)1eh8nQ~p(Z8PA<C;%NW9NS-JA9M69bSaTHor)x
zYx~fjyfL-fbT2mZG+ca5S~eR}O@DojhQPWkg>Oq~fGBQ1ateyihTwGjO5IPRP{Y&r
z+Qoy}G=6>6rh4Mz-Z0ab==GY55>sL_>N4dJ`cpA7mfxzYQ$o?P>IvuPrwa<?u*wwf
z>>9JT?l$GmP2{YaE66bw5rsEN<oXt|h9$K{vHJQP7y9N~bnu~FO{**49e-WDKKgD5
z{dkM1D|YTxkQRa^r($mO!1vtO4<W?b)Egz&dEf6Qf5`0%&&X(Ly@F`l6<6ledX6CG
z*7+GPt#GT-q8$i!Xjod=3P-2Wua3SLx#P(SmtV*m>*N)0fve>4+2vk3Q!a3Am|@@+
zRWc7(w8>=YA3n3Fn(qBgu78H3o2&EWY<PVQRHaK>>oPaY+S@J--9Ia}AdeC4$b-m#
zTSay*Y<|^kS!B)JcewfAq+WdkQ1>ea*b2&wPiMVh$3CzDZ{uQLG~p`3TQAdXD#d(B
z6;h}Zb<4yoK8eXnovsL7=-7BV(p^s{a=n<iYt#}fVs(@LshhzK^?zA2#MI|got{z4
z8;w^$Jd;4AHxMiSfx`RUabv%KAUc5Nkm~Jlvkc>^3_|+l7WfRr<p45htq%G}q5~OW
zydq-^Bt#tp{q3LV47tiQqPJUGBK(f1%9@#`oM%RZKv2Ng!cKBbK~}SLVr|qY823zs
z>V%qvgYKg#r#Kn2Ie((>-=a?n%Gk6umJxb{lsef%;bmS_Srv8VO-3@lOaardC^$@F
zT-iy`L|_!1-d3yIO4KTDZJJGL14$FunD_|rka0g6qi9sWd-#HE1fYN}jgNUH&4#f_
z0?DitKVl(NafmyNw_;pLlkotp$}K9qf4+9prU~_z?!a(f=YQgpytCt_S?Jh9EnXS{
zzeiKL2$D%e(jkpPV{6WiV%5dd>C~;IE9s+He5lgCHU;Rem}H!tQynQ)(V`Y=J6Xxp
zTX+9dCm3$1({g+QhOQd9KMtZ-&96AzNH)-v%xI=QOCHh4l9>U&(Wcphu%neW^~OGB
zPK`oU`{n}Z&42teL2J!W!*#;<k>oup-0GY_NZQD@kW{yQfBpdAg)W&j4mNaHe$5rL
z15ABA76R;HB*W{p$|kgX3T%qDO85AOD3fAU!@^N{CBQ^>^8+$(kT<!s-YaCsId@x2
zq3a$)i+=v*hvfRl(@SL@oL-z?tJ_P83apLCtfW9BQYaM6oA<$*A7CV&@CbkcL8V4l
zH`2xc-b1IjVJthrqmiIW{3lRL0|b-2kr=byY>Ffe+AWtuL^4#)1uXyoq?2`#E(FXz
sxKfjVjUSW7ks1NFli`t70bi3hl3f8}la-QG0l|~%k~s$ciU0rr05{ZGF8}}l

diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index cea7d0975e5d1..671c0d426677a 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -76,7 +76,7 @@ def run(self):
         EchoOutputThread(proc.stdout).start()
 
     # Connect to the gateway
-    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False)
+    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=True)
 
     # Import the classes used by PySpark
     java_import(gateway.jvm, "org.apache.spark.SparkConf")
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 08de8dbe9d542..0ba2b4b38a281 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -43,14 +43,6 @@ def print_(self):
         #hack to call print function in DStream
         getattr(self._jdstream, "print")()
 
-    def pyprint(self):
-        """
-        Print the first ten elements of each RDD generated in this DStream. This is an output
-        operator, so this DStream will be registered as an output stream and there materialized.
-
-        """
-        self._jdstream.pyprint()
-
     def filter(self, f):
         """
         Return DStream containing only the elements that satisfy predicate.
@@ -190,6 +182,38 @@ def getNumPartitions(self):
         # TODO: remove hardcoding. RDD has NumPartitions but DStream does not have.
         return 2
 
+    def foreachRDD(self, func):
+        """
+        """
+        from utils import RDDFunction
+        wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)
+        self.ctx._jvm.PythonForeachDStream(self._jdstream.dstream(), wrapped_func)
+
+    def pyprint(self):
+        """
+        Print the first ten elements of each RDD generated in this DStream. This is an output
+        operator, so this DStream will be registered as an output stream and there materialized.
+
+        """
+        def takeAndPrint(rdd, time):
+            taken = rdd.take(11)
+            print "-------------------------------------------"
+            print "Time: %s" % (str(time))
+            print "-------------------------------------------"
+            for record in taken[:10]:
+                print record
+            if len(taken) > 10:
+                print "..."
+            print
+
+        self.foreachRDD(takeAndPrint)
+
+
+    #def transform(self, func):
+    #    from utils import RDDFunction
+    #    wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)
+    #    jdstream = self.ctx._jvm.PythonTransformedDStream(self._jdstream.dstream(), wrapped_func).toJavaDStream
+    #    return DStream(jdstream, self._ssc, ...)  ## DO NOT KNOW HOW 
 
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
@@ -209,7 +233,6 @@ def pipeline_func(split, iterator):
             self._prev_jdstream = prev._prev_jdstream  # maintain the pipeline
             self._prev_jrdd_deserializer = prev._prev_jrdd_deserializer
         self.is_cached = False
-        self.is_checkpointed = False
         self._ssc = prev._ssc
         self.ctx = prev.ctx
         self.prev = prev
@@ -246,4 +269,5 @@ def _jdstream(self):
         return self._jdstream_val
 
     def _is_pipelinable(self):
-        return not (self.is_cached or self.is_checkpointed)
+        return not (self.is_cached)
+
diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
index b1fa1e227b0a1..84f1dadeba03d 100644
--- a/python/pyspark/streaming/utils.py
+++ b/python/pyspark/streaming/utils.py
@@ -15,6 +15,27 @@
 # limitations under the License.
 #
 
+from pyspark.rdd import RDD
+
+class RDDFunction():
+    def __init__(self, ctx, jrdd_deserializer, func):
+        self.ctx = ctx
+        self.deserializer = jrdd_deserializer
+        self.func = func
+
+    def call(self, jrdd, time):
+        # Wrap JavaRDD into python's RDD class
+        rdd = RDD(jrdd, self.ctx, self.deserializer)
+        # Call user defined RDD function
+        self.func(rdd, time)
+
+    def __str__(self):
+        return "%s, %s" % (str(self.deserializer), str(self.func))
+
+    class Java:
+        implements = ['org.apache.spark.streaming.api.python.PythonRDDFunction']
+
+
 
 def msDurationToString(ms):
     """
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
index a2b9d581f609c..a6184de4e83c1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
@@ -54,14 +54,6 @@ trait JavaDStreamLike[T, This <: JavaDStreamLike[T, This, R], R <: JavaRDDLike[T
     dstream.print()
   }
 
-  /**
-   * Print the first ten elements of each PythonRDD generated in the PythonDStream. This is an output
-   * operator, so this PythonDStream will be registered as an output stream and there materialized.
-   * This function is for PythonAPI.
-   */
-  //TODO move this function to PythonDStream
-  def pyprint() = dstream.pyprint()
-
   /**
    * Return a new DStream in which each RDD has a single element generated by counting each RDD
    * of this DStream.
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 05ccc23e9f422..751b7504f1cea 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -56,6 +56,10 @@ class PythonDStream[T: ClassTag](
     }
   }
 
+  def foreachRDD(foreachFunc: PythonRDDFunction) {
+    new PythonForeachDStream(this, context.sparkContext.clean(foreachFunc, false)).register()
+  }
+
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
 
@@ -85,5 +89,39 @@ DStream[Array[Byte]](prev.ssc){
       case None => None
     }
   }
+
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+}
+
+class PythonForeachDStream(
+    prev: DStream[Array[Byte]],
+    foreachFunction: PythonRDDFunction
+  ) extends ForEachDStream[Array[Byte]](
+    prev,
+    (rdd: RDD[Array[Byte]], time: Time) => {
+      foreachFunction.call(rdd.toJavaRDD(), time.milliseconds)
+    }
+  ) {
+
+  this.register()
+}
+/*
+This does not work. Ignore this for now. -TD
+class PythonTransformedDStream(
+    prev: DStream[Array[Byte]],
+    transformFunction: PythonRDDFunction
+  ) extends DStream[Array[Byte]](prev.ssc) {
+
+  override def dependencies = List(prev)
+
+  override def slideDuration: Duration = prev.slideDuration
+
+  override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    prev.getOrCompute(validTime).map(rdd => {
+      transformFunction.call(rdd.toJavaRDD(), validTime.milliseconds).rdd
+    })
+  }
+
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
+*/
\ No newline at end of file
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index f539bc9aa147d..d8dbdf59e7ff1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -623,66 +623,6 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
-//TODO: move pyprint to PythonDStream and executed by py4j call back function
-  /**
-   * Print the first ten elements of each PythonRDD generated in this PythonDStream. This is an output
-   * operator, so this PythonDStream will be registered as an output stream and there materialized.
-   * Since serialized Python object is readable by Python, pyprint writes out binary data to
-   * temporary file and run python script to deserialized and print the first ten elements
-   *
-   * Currently call python script directly. We should avoid this
-   */
-  private[streaming] def pyprint() {
-    def foreachFunc = (rdd: RDD[T], time: Time) => {
-      val iter = rdd.take(11).iterator
-
-      // Generate a temporary file
-      val prefix = "spark"
-      val suffix = ".tmp"
-      val tempFile = File.createTempFile(prefix, suffix)
-      val tempFileStream = new DataOutputStream(new FileOutputStream(tempFile.getAbsolutePath))
-      // Write out serialized python object to temporary file
-      PythonRDD.writeIteratorToStream(iter, tempFileStream)
-      tempFileStream.close()
-
-      // pythonExec should be passed from python. Move pyprint to PythonDStream
-      val pythonExec = new ProcessBuilder().environment().get("PYSPARK_PYTHON")
-
-      val sparkHome = new ProcessBuilder().environment().get("SPARK_HOME")
-      // Call python script to deserialize and print result in stdout
-      val pb = new ProcessBuilder(pythonExec, sparkHome + "/python/pyspark/streaming/pyprint.py", tempFile.getAbsolutePath)
-      val workerEnv = pb.environment()
-
-      // envVars also should be pass from python
-      val pythonPath = sparkHome + "/python/" + File.pathSeparator + workerEnv.get("PYTHONPATH")
-      workerEnv.put("PYTHONPATH", pythonPath)
-      val worker = pb.start()
-      val is = worker.getInputStream()
-      val isr = new InputStreamReader(is)
-      val br = new BufferedReader(isr)
-
-      println ("-------------------------------------------")
-      println ("Time: " + time)
-      println ("-------------------------------------------")
-
-      // Print values which is from python std out
-      var line = ""
-      breakable {
-        while (true) {
-          line = br.readLine()
-          if (line == null) break()
-          println(line)
-        }
-      }
-      // Delete temporary file
-      tempFile.delete()
-      println()
-
-    }
-    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
-  }
-
-
   /**
    * Return a new DStream in which each RDD contains all the elements in seen in a
    * sliding window of time over this DStream. The new DStream generates RDDs with

From e185338e1b13d92f66356c0a966e5b5c59e69f0c Mon Sep 17 00:00:00 2001
From: Tathagata Das <tathagata.das1565@gmail.com>
Date: Fri, 1 Aug 2014 14:39:18 -0700
Subject: [PATCH 32/69] Added missing file

---
 .../spark/streaming/api/python/PythonRDDFunction.java     | 8 ++++++++
 1 file changed, 8 insertions(+)
 create mode 100644 streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonRDDFunction.java

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonRDDFunction.java b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonRDDFunction.java
new file mode 100644
index 0000000000000..88f7036c3a05b
--- /dev/null
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonRDDFunction.java
@@ -0,0 +1,8 @@
+package org.apache.spark.streaming.api.python;
+
+import org.apache.spark.api.java.JavaRDD;
+import org.apache.spark.streaming.Time;
+
+public interface PythonRDDFunction {
+  JavaRDD<byte[]> call(JavaRDD<byte[]> rdd, long time);
+}

From 54e2e8c5e4e7c5a65e9b8f1d90142902ed95160e Mon Sep 17 00:00:00 2001
From: Tathagata Das <tathagata.das1565@gmail.com>
Date: Fri, 1 Aug 2014 14:40:37 -0700
Subject: [PATCH 33/69] Added extra line.

---
 python/pyspark/streaming/utils.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
index 84f1dadeba03d..c60ecd1ed607a 100644
--- a/python/pyspark/streaming/utils.py
+++ b/python/pyspark/streaming/utils.py
@@ -17,6 +17,7 @@
 
 from pyspark.rdd import RDD
 
+
 class RDDFunction():
     def __init__(self, ctx, jrdd_deserializer, func):
         self.ctx = ctx

From fe8619882c5f2f5631ee7d1326e9558256753ca4 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Fri, 1 Aug 2014 18:29:15 -0700
Subject: [PATCH 34/69] add py4j 0.8.2.1 but server is not launched

---
 LICENSE                                         |   2 +-
 bin/pyspark                                     |   2 +-
 bin/pyspark2.cmd                                |   2 +-
 .../apache/spark/api/python/PythonUtils.scala   |   2 +-
 project/SparkBuild.scala                        |   2 +-
 python/lib/py4j-0.8.2.1-src.zip                 | Bin 0 -> 37800 bytes
 sbin/spark-config.sh                            |   2 +-
 sbin/spark-executor                             |   2 +-
 8 files changed, 7 insertions(+), 7 deletions(-)
 create mode 100644 python/lib/py4j-0.8.2.1-src.zip

diff --git a/LICENSE b/LICENSE
index 383f079df8c8b..e8e52800de12f 100644
--- a/LICENSE
+++ b/LICENSE
@@ -514,7 +514,7 @@ The following components are provided under a BSD-style license. See project lin
      (New BSD license) Protocol Buffer Java API (org.spark-project.protobuf:protobuf-java:2.4.1-shaded - http://code.google.com/p/protobuf)
      (The BSD License) Fortran to Java ARPACK (net.sourceforge.f2j:arpack_combined_all:0.1 - http://f2j.sourceforge.net)
      (The BSD License) xmlenc Library (xmlenc:xmlenc:0.52 - http://xmlenc.sourceforge.net)
-     (The New BSD License) Py4J (net.sf.py4j:py4j:0.8.1 - http://py4j.sourceforge.net/)
+     (The New BSD License) Py4J (net.sf.py4j:py4j:0.8.2.1 - http://py4j.sourceforge.net/)
      (Two-clause BSD-style license) JUnit-Interface (com.novocode:junit-interface:0.10 - http://github.com/szeiger/junit-interface/)
      (ISC/BSD License) jbcrypt (org.mindrot:jbcrypt:0.3m - http://www.mindrot.org/)
 
diff --git a/bin/pyspark b/bin/pyspark
index 69b056fe28f2c..39a20e2a24a3c 100755
--- a/bin/pyspark
+++ b/bin/pyspark
@@ -52,7 +52,7 @@ export PYSPARK_PYTHON
 
 # Add the PySpark classes to the Python path:
 export PYTHONPATH=$SPARK_HOME/python/:$PYTHONPATH
-export PYTHONPATH=$SPARK_HOME/python/lib/py4j-0.8.1-src.zip:$PYTHONPATH
+export PYTHONPATH=$SPARK_HOME/python/lib/py4j-0.8.2.1-src.zip:$PYTHONPATH
 
 # Load the PySpark shell.py script when ./pyspark is used interactively:
 export OLD_PYTHONSTARTUP=$PYTHONSTARTUP
diff --git a/bin/pyspark2.cmd b/bin/pyspark2.cmd
index 0ef9eea95342e..2c4b08af8d4c3 100644
--- a/bin/pyspark2.cmd
+++ b/bin/pyspark2.cmd
@@ -45,7 +45,7 @@ rem Figure out which Python to use.
 if [%PYSPARK_PYTHON%] == [] set PYSPARK_PYTHON=python
 
 set PYTHONPATH=%FWDIR%python;%PYTHONPATH%
-set PYTHONPATH=%FWDIR%python\lib\py4j-0.8.1-src.zip;%PYTHONPATH%
+set PYTHONPATH=%FWDIR%python\lib\py4j-0.8.2.1-src.zip;%PYTHONPATH%
 
 set OLD_PYTHONSTARTUP=%PYTHONSTARTUP%
 set PYTHONSTARTUP=%FWDIR%python\pyspark\shell.py
diff --git a/core/src/main/scala/org/apache/spark/api/python/PythonUtils.scala b/core/src/main/scala/org/apache/spark/api/python/PythonUtils.scala
index 6d3e257c4d5df..52c70712eea3d 100644
--- a/core/src/main/scala/org/apache/spark/api/python/PythonUtils.scala
+++ b/core/src/main/scala/org/apache/spark/api/python/PythonUtils.scala
@@ -29,7 +29,7 @@ private[spark] object PythonUtils {
     val pythonPath = new ArrayBuffer[String]
     for (sparkHome <- sys.env.get("SPARK_HOME")) {
       pythonPath += Seq(sparkHome, "python").mkString(File.separator)
-      pythonPath += Seq(sparkHome, "python", "lib", "py4j-0.8.1-src.zip").mkString(File.separator)
+      pythonPath += Seq(sparkHome, "python", "lib", "py4j-0.8.2.1-src.zip").mkString(File.separator)
     }
     pythonPath ++= SparkContext.jarOfObject(this)
     pythonPath.mkString(File.pathSeparator)
diff --git a/project/SparkBuild.scala b/project/SparkBuild.scala
index 599714233c18f..7fca8f8c2b328 100644
--- a/project/SparkBuild.scala
+++ b/project/SparkBuild.scala
@@ -382,7 +382,7 @@ object SparkBuild extends Build {
         "org.tachyonproject"         % "tachyon"          % "0.4.1-thrift" excludeAll(excludeHadoop, excludeCurator, excludeEclipseJetty, excludePowermock),
         "com.clearspring.analytics"  % "stream"           % "2.7.0" excludeAll(excludeFastutil), // Only HyperLogLogPlus is used, which does not depend on fastutil.
         "org.spark-project"          % "pyrolite"         % "2.0.1",
-        "net.sf.py4j"                % "py4j"             % "0.8.1"
+        "net.sf.py4j"                % "py4j"             % "0.8.2.1"
       ),
     libraryDependencies ++= maybeAvro,
     assembleDeps,
diff --git a/python/lib/py4j-0.8.2.1-src.zip b/python/lib/py4j-0.8.2.1-src.zip
new file mode 100644
index 0000000000000000000000000000000000000000..646bbd532d5883943bbb25f33d505918a6f41394
GIT binary patch
literal 37800
zcmagEV~i)jvo$=nZQHhYZ2iWzZQHhO?3g>YZF9%A-~Hdb_d)U`w?B0HL)Yn~Q`KFk
zPASTOg24d&XJGjPi~ZN)|DV8t@PHgV*{m1=s?b27_Ly5Lfs|V+t{$*Jz+g|nKtNz<
z|28WAFLQQ^Xwm=E9O=K!_4O_7EM4^V85}(S3u$FVLPhKUjr1QxD4_o!kujW@{O6E-
za3COr|3)&lw{<Xd`5$m<Rj1>!nUH!O&`6(v5|vfS(_vf@0j19y-T-3UusxW|F@n}x
zBj3Ot4M=0Z#!Iu8IXt6}Y<oYx-97hE>eL>SIi;s>W3*An$KhsmVd*OIc_2VJtg<+7
zMNFuCwX`8LiuGLuR)S<NGP@691qY72C89{WgZu|u6w5rb73=Gk0pjlEu3#sJ+(nb>
zN^`;qKq7aT4{}*Awv-uIJ%sy2oEFC&j5yblXTZluRLOwm>bJ(6k4vzz3j6OfQms+)
z6KVCoqv83t&@-A~pN9pt!H^cBv@*b^5T@r1M@*Ynuy}utEiWxgAF&_Lpunrq--B$f
zzeaw=&Zo}@V)~~I6p~i+brN*ZHwVBQa(cpr3}`Xuh{wOxb1iY)TK}2jrU?GLL1yum
z?Ldc3cf>B<(njg*3;CE`nZt8`BFWExc$?7LrzoqtmR|~W)|enKek`kI0X3c!wS(r=
z%p~fLoj-F@uo)xoF7YnLBaeQqtNKxWbL^P+qGaDSt$W;h0UThjk6+l8ZeMgJwNCv0
zdR|*Q*Ju~1e7!Xr=0Akb+P!<XCndV6m^~3C0DgK5<KNPG%q(2vFuh?DAZT$2;<ED4
zZg<BlK_2h0Q5N&b_)C2&Z*4>Bf2T5xb;4AZNm|nOJubp4uMelN!&91FVTk($`X4v^
z-_8T?{wiGw3IueG1O$Zq-_B!ZX=i9->1FElKlsm;x~=t+5Yl&^KJyad&bY23a*9yD
z8Z}f;z={INYPX5gx?2;j8)tXkfxo*OX9wAfvbGqSt$;4Y!}}B~>lS~8K!!*a3j-#!
z4<CP~fOFF6-X4)xaibQ|T9D=#(+LVZ6W4wc^fx$rNf0(Dj$CQUzO(XlYS{}oCk8t=
z7zOKs2*nxsg!UknS7D;&l#rCiARAw9-(h$>fw<Cul{QswAM;|XP~b6)UL&~lNUQ?&
zYE{TOU7c;MBL}FSnzVKWc{z#$1sAy4fNa2YEK19;=3GQjDLqv^Z40~4k5(z>^r+R-
z5uZFjQ>kOx+(|u)DoUiZeCHi>(lNGQa(b4z<&X@-i)xURYqQV|VoSIU$!bP4Slbo~
zsCvbtA7vf9`?x}>EX35>rt1bdp1G`(V>xXLgG??H$vI6g=5VY!9|MgU>_9+G4^{(%
z3fh^)Xdz43VPzOJRppRK72~s9r@Y0WGurxq0&ZsoNxFxMPO^(En)`hU8ahwKy`H(p
zo~KR#Vc8)tHS}%58e6TkO0Ju7h_B1Yl-%LKhg}LUw6ABySYh-q@5n*~rcAMAOo&E?
zxPC)C1FeId>Yie02LjSf4&L{+5XzO4fU1_FOBiVx?=Z0xydo;Xsw1hPxaDP&9S>pu
zf|K!qBRsII*m2JLdQ*!;PWmr6TXtWgO{*J|^fuJ3&4Em&5;eRqZc>kZryYbXqHL1M
zD%yEoiBVQ6nT$`J=ijU?_NriNYj0Lj#+}C{Gqg|JU)wA!*OXn~_>$zZmjP#1PVvcZ
zNPY+F<{-ag-Qb;YWLzUR_iRP}HircyGNwB9j``@VOmEfBIe$25-ZtM3_|b+qG$qc%
zkiGOqi0M>X9j)D_nf>sfbO363$z%gaBrT;86)ai~2z03STU|pW7+*1Pto@<8CM>gD
zV$D%+3OIpf-IoV>MI;zI3g^|7Yr+iXs|v38sr+A&N*ih}t&(lJk*?hEt*|Q4(pPd}
ztA9fah2Kq}%d--^TaC0`W6gTE+YE1<mamq$&Z!GqO}7@3W?b+si&}<xbKrR4+H12z
zC(c`3Vq_mq+tuQa+a}a@<gV&X{o#F6*cms}&fWhTYUA@>Scc+TP3`)Nl+ppGSxVKi
zrC{3dd3WOHo9Wwq_2zo$DX;fr=&ILPu-$O;<>JI{b^3Y*(QbvH?2=?$4(eb*fe$x%
z+n->I!3Lejaj;sjuX1;yyj#c0vl+C=!=Do*)UNCe|NoA89rKy$1~?#~ACZ4Q*?-5p
zm7$xVzOlWHjj6GVrM;c={}lQ<7xuW^2tU`oBI$m&?XIyUe+UtTn}j$nc1qJFkpIBa
zbq=ex9(!!u#n=-_`H20zkXDXLK13aoZPF=%irGY#P(^)4rkK6Qbo+cK$sKAU>0URz
z9C9-LMAGNlwQX|8ntM`dkSqZ3O8dcjW)Hz4ifI!~`ucY6X%Tt{6=j=<;?~%XENPU}
zhA+2yv<;%qE-Pk$aT$YB=t~`5G3x5G!)=nx>0;hwr`AlS&5ULqm~dTqa*IW8;k1Nz
zv<Vv2>)tPyuXpUqn`WJ{$k)w#@5!_y6zNtkIsK?f2uj#OJy94lZ)P9p6hdyA3_7Bc
zV~&-8R51LoOi1<(H_UyKMhx?y^_5-7%nN<1G!-6Vg30CItiUl&n-X8`8Hy@TF9;TI
z&BH6>&&Cr3E~u2wcmRhrD}w$6vWLe}=3aP9aNqR8ZIW9+he73hlS%3rqvlM#{?KI|
zf32s(Wt;@w;Iv-OJ}NcjMHkG|NgmQcYS@#nB-(M(Y5*wa%v0)<o(OK`=%nYy%_<m_
zdc-|#3J;s>>%iJ2F&F5F!KzmAkEhT&oso+O)lpN2p$7RjZ~1+L157;-m_ZEW^H8ij
z_ZA~48paOn@<9TzjUMEoeMY`UBvJw2Uc@9QCS<bxzC~DFbe(9CRv4fepi;o;pytp;
zL=V1<==)u>EO`aTAoW=+&4Tct$Y*DV<@MtR#&&}-A)timYw@qj^`I-mgu1_OV`7at
zpbbV0nJ^ch(26MX2AhdoY*-KZ=80i&Ne^j|)tU0hubgPs#XOmpE(?{;?B$q|k%W+`
zwULVROhuT;Lph(B&+IRGgdzKp1q~l4w+TcSSepqdm4`gSo}++cmuRt6G$bRYu(?H;
z!UbiwWWj-<qstfh4D+yb5Z=XiH2EgVqlt;YG>j`Oy^&t09PwokVnhTuSib`av1+?a
zlydfUOqx`g>FJc|8qePq4}PGm^+c=G&#zFOcacw`T5@DL*gCY*YIIv_0JbYLv|y5(
zLK@$nZV|w0Nns;Swa{In2Qr=lQ)s<hb0DYt>;JCB26f^S1Bvdz#8wzCfeMoc?$?@n
z3I?_IaOGBSz+yy3Ak+wIU<Bot2>p}$2uJ}4FS<wV>z}!WtMv(C&}$^K5Jn?i!bY;i
zLAz}J+Qyf4bVO%EDdJ~<{8r~G21--~Iz5Ett>8X49V>Ecg`8}p#)x`R(OvBt8xX>p
zLHCZ3aTG6G2?I7_kqc<D<-$*d>$1~2z16E9iJIhLePt^Oq3wPBp5DvFb(`<A>y5TM
zkmX8}IRT4@K2XW&B%n@R7<g*5r>~RfJ0nIoZjRP^<?9_?{8cUDCP)QdU{v@B8P{RW
zG19FjQpUnAO6s&R2-$C&7^@#U+j#yZy!>Xw|Fw7@>qVmANx<jQ6*_wL45)D)jqF$Z
z^daIO!gcFsR8(REWTod$X$Xf8V<Z<RE&?28gTz=e%S~T<hrK3EdM+XFHd)wA5CyBs
z%5o9L;@@e)ZtJ(8pj9(kV?tuxEILy`E)&UW0_bn1^2<82P|*@{&*D05?7~!wt)@2?
z_3f_OuE97aZB9ViBhS~-v2CPVVSQ??O8CuyvX{9r4s(MbCu=|veg?p%${;UfIGZ4F
zH&*Xf5B)a9BN!i{3!eg7pBJbcwhg8WIS08rq%Bbcf)O1L=eI8fnS-zz!tlMU!N6wX
zH!*d^YX($}Pp~Hu(Ne?Sa5GkoOD4UGmfd2pgaRgB6?(N%*6kT)O;7CrucQ>?aD*na
z6OPMq$)~8SXP$Ja0Z{~$RX7YE%xa7Rb%!>2Kg(DUEmduSPtbsNmQ1qV=r|?|Uwj|V
z1^Uv%hL%4+8xL^3j?x>!^iXW>-0k`a-?Y3(7JgTt^e!+Sl%NprVR7r>b>k`|6;LY>
zS+%SFX=?yj2H6+GdcK141g@fdG1$VM7(lVmg;X0hM5>urTt>2MGqHt}qaMo#0gqld
zf1{F<m<+V#Oo{BbZ_Ytr9Np?^3c01$sa6p-!rK1u@IK-9{M*^t{<{75`u-V`86EBq
zc%Y!yk9Ehxtn^qm*-HGlL?3P!fuh?_OlK;w{usRM*P}Y$IA5t3K#+)FU`#96Jsi{c
z*I@CZ7MWS+?-zJw;DJ;ug|Av6BpQ<5cd*vHly%k0j`8mNuzpp0F9YM(M6Jn&#7GIs
zQHeoFHkPm+7qTg?Qu*I6E%cy{-`yC6rK*8K@XA0RF`%atAdzY{&Fj>(%mc}R@5k6n
zXUpR4aP<SwRC?Vf8?assdMV3Lcs8{Yt|Hr!(G+ahpi8t&iP@2P%P0Xb?(A5~IwJ2|
z<++ea$N1f;>Ui+eKs<YDmmjzA@z_4S>N8X#%Cn=S(v&D;Xuh6SV7&G0N?N)Tg?($U
zqpYI8L5m-fu-vOyqEpP#^oXZ)iA@L4UdY(=71c4achVN#`}bWQ$@ZE>YHCz|y|V@T
z6+0)w8xxWn;45aECFE#1%-H~DAI5D1yTG6jh#e?aB9h8QoJu97FN)11SiXhP)IZP>
zlL~Hmovc*H`pjrOfq<UAOjVB>66_R<npBXB1$hH7$Dkb{t!d2`(!%a8^a3d=6!M#C
ziOtbF=<KPi(!Esg&@0vw=|b%Se^b0(u{N2p(*jjDwTup}Zfv-arf_5D@gq#|k+apq
z45Mnqz6aNbInDP#I@k4HI}nI(9fLAILvS!U4mL>bKovk5Q&ZXVMqCW;d@B%oU-ASf
zmAN=h+{U@JtUQrN#vKo@ZSE?VesL%Vfpk@jt2nV_7yzvVH8>Jj3J|M2zIP^obu^~s
zPE@1j)Xc-2ulaNW(G@tp+F*=LVpG{UoGdOkE+t1Tzu`^EEIFd+Kp-PZVPRi?5Kb=Y
zUgXM;eII}p)L!Uoqi#PHgY>wA+tgv}^=9OpAuoz{qzoI_R$8(*sA<dFTH(*0P;bjz
zWl;!8wiVKUafr^YWfK95Z$)+RRA&KW0m=3^V)8WT11TJ>hHZ6A`fUx@={VzT+sRzT
zLR&9-XG?E~@TBK13#Za$<Rt;{<=3B%fj6BWSS`1JjErYFcCZL716)M+NJ-+l^;S1w
z9Wmt8raJz1X~R4^%n3L?R!wwq&1G4@iRaPlNQv(Umc7+~G^iO)uh%d@S1qc?DXP8x
zNlQUg*ScSZVa@v^50;uD-Mpz5Ro8*Tr01h=KxbbrH}=XF&4jne#qe?5CutA&69(=~
zi;%5=fj>+HDOPjoYlBxtOdv<L!!bvTV^OE%x7{<((Dj>OvpsBh7Q(fL#JbXSxu|8e
z>D4oc-L?r|YM-#h*4EZLz4#&daK2q<LOGk8>&MaV`*7=1cxL(sX4T%m^_&?_Uj=K=
zyh#;bFqI5jL;_};PJ73Sc-lh25t$azxuC3#e^QuDK94IK8`!ZmK<7dJ)!oI<&4sIn
z6X?L`V9)gnAQg3J8KkvfrnK5kR$Ag{RmOolMB4;Dtwp+x(Ka>sL3eldkqoK1H{nL^
zT8aK7n%+8{biE)wkyYA#VuUAHxxD6wtV0M`Hu++;Y}~2wlviASaj*WYO7Qnq+Au#X
z(P3PhjGai0Utrr#UZX?P(a<|NEMONGfcrH|LM2*r05CiYZsMX@&!qF{t1n*ex(Cbb
zc4__F7}?4%WGl!}kJ!CQ;6v8=;Q7=r!xi5M@g3Vb@nRm2+Nqq`3!hNtsO(8>k*s|2
zc_2LXf@ER#H|R!=ymHNm2Xk;Y9JBaiH4ag*IL*8wzrir&FLckJjy>!@7%p#;kPja8
zl6BEynLNTvv*{CR5!5m<l=*4C?w2|gng((tS$kT9$t$7NWz`bsCj~9_Dgxk_axFtF
zF)3uhMO^g5s*u+!XNu_|^H(KF9*djiobSXgix+y(0yEX5PYR;x$L?pg;qZDtSdo{K
zJx8=CjIF!RWX(s3bvwW-xbbpE@D{aRHUy0`czd-`9mg2%qQhmL!2pIqqS+vaTl+kQ
zf<K!+$uiMNIM9z(3C^O$_NDzH%DAi0Y=YzvQLRR1awb!etA7!V6uw~U8_d-8vE17@
zY53RTXgD&Lk+#g%6k(Vjwb#-H&eRS`QX8(R_4$(=iN_`X@QeK6nauw6+Z&5e7lUH%
z@BEx^_I^5<FmifL+<ICAR}W#jS2xaJa0KF9<V}&Z@;kuVm*~m`#SuCh=r^WlLa!z2
zAPm<UaK?h<X^l2+A+7+FN*LQrQ_|d^`}b?S`=9{qn-k07bi8|eMUb1dA4<t83yJO9
zCY%&<<95cqaE&cQs(rT&Crx)*({M&a<7TV}AAufT+$>`&&dO&xxUKOI;s2&U#eN^6
zxt0|!a`Zqz8XZ7DX#W=lGB<QFbvN|<Z~C(kwEX|7z+L%TyB~@>ow|R))KHutJt}Wu
z*Ks1|&b?TX#nF2|Mu^59%Ki;NT2C=Z1cDD(U=sM)Rf+d27FIrNNVW+w;U}5X)!o+B
z)dlG4K9TUe9uQ@rEz<S!#@LD5BYY$8US8eY<fAVx>xjA{n|jhuxF|~~X!;VOw+Ti{
z>Gp3@#rDV$E}rVDtyH@Z<d!CX&|%Kk&|xTbx_A7(iQf9z*xmF_Pt)|`#RRDCmb*5O
zU0+{Vuqae}+ZFa;&b!~t6jjN~tXpJBRQu3OSShC%F_xLlE`l52<72)Rk6plJWnn1k
zEh$k`3>y*OQ<Ln%l+d)x2_0h4LcMa$5)AolgX6`^B(50Y05733M}BWb_xQZs=RZFq
zETTVF@x|zYu6Z+KM!UKs?L_iT)8Mu6pZg?DsXbMpNuiiVn*u}C+{1}$l0CqUI_W(X
zJ+{*Pt=1ybF^adAk9xxk!}L<AtWvpqkiHxzd^os9@T&F0Kv&oPT|O)dsJM7SQKSJB
zN)t(bRcG);WK{#IH%&EVMN4u2(4~>wh^3dO|I#(2$F00ER7_A--AC>|6;rndE~EJ-
zTL@R4dPXzS|5^&4*Bua@1ToFpjns3=SF_Yj*MBbBY(@d-8nwyhYNnMxTndVwak%Bq
z4B<YF(;#eDz+&+M-eE5`NoBc{!aq~U?!}TWudayURp;NV1b#TC%bk@*oFYE%-CrCS
zgUo5n5;aU*;flF0kYiI--r)1e1J*Yuf#scM(Tf8?TmO^;?MA-Se?s3pBlmvU3FgWJ
zm~lbWi6!Y>KLq=wC9eZi^B11{-0g3krn5N*tB>9vcf%Afs?&cSU%V*?IVCvlCC2B+
z$Cq#4arE5veBThi(r^9ic-}9LhnJxQeBaUqf8J*Q9>*8kGtMMWR!94P%`@DkGC2A?
zK3`oFAKoNi>@V|Lyq>;#cyLRLmzxhp<I;VncTW=bzB6=ue?PKt_jr7`dGPUcb5YU-
z5%TExxwr=7SBT>G-qeUKpNZwNf0vj2q|na40c~#&S{5?zjmP?X>5#=|dYq51%LmjS
z(e<D6mAa!lW|;DL1^`gdO^4VN>4(X(P3uqXSLfGM2}!GialpX#B%lN*7DFq5AXwNw
z9ol6lU63oE5d-x?zeADouA9dB8&oI;Q?kF3hl*$aQGU2UrD(CA-@C<e&+4umH@(wU
zozWHA{PQIhgnzWu9(zx-{w_z%^(Ofxjq`!Z!wmkuy{5dTq=}tEKShlKPWE%>`2;Sz
zxx766B;yw3!4>x(S{*;bPLgr*ec1STzd^_<E3|=O=l#iZ-y>9#TPT%ux&!-U!E9hp
z?M#3*hq?vurc0=kzGwVhMx`fcL;Zqj4HJDPN&9iD6sHcbJ{dRW(TA>~JRkByXC2Ce
ztjEm7?AZI+aKLj&QVXn=OU_?l0S@yZ#GSxP#l8*)M^9*i(Oy~XrUL&7Sw>)mzN`l^
zW9px-ypbhIs{=ZFA<R%LjMd~AwL>a@JwDbC)J*yK(o|wt;Aw3)SY5g)m)ZMS)L2IF
zp{Wx1zWz})>G)=zmexUf=d3^HeqthKniFq3kzMoa{h|E!7rh3OdQ|ve>ge3xZ9YC1
zpa*a1YEcS4H36hCZ9<aUl-C<~u(uh&dQ;gb8KwDNihW$wqM~IG<@p%kfX&;mtkWqQ
z3`-aQ17iHO|0Ia{ybe={6QNS{dv;DxzF3)#wl_mCCd#B}nAZ318vic#-#<c|?8NE%
zF$i<YiUf;*oU4Ge7b-vwOWRcj?b{pKb-*>oz%b-*>Z3A6NOvY72$wx48$v@-!hmeZ
z3V~qJ6pWHLC%SM{O6WpU3k&~Mi$^Zd(1i($)}gv?0jMl3_TYH=oTKBl!29XZ@qfbi
z3;oM*|Axa8U{QXILkR-g$GQEe62-zCkxkSmSB!@3qjv;(OOju9oPtRoMa<N#s4G1h
zf+#HjBMU>yn+;vkY+*BI7SqUL`)kg(KZv#Pgsr+TA?LzHS%KPJ<)>tSjcH>?l9?Ru
zV64nEG8x!teza4T)I&j;Hb6uZ>W7@GVKFDO^23NdyjD%aS)5cDE5<d{QB*D(=Z!)7
z#W-}ReYeH23F;mR(t{6#*l>##KMAa^0?{St4bPf5d754CiC;D{2M>T^sK#awcud$A
zqFtaDUc$gw{#!jvZ^I3q9A5Y%of2;)f;Ko~wnQlAiv#)wg4Nch>5$D>#A(UVMuoIQ
zu*QRgb{EnEzjcU#(mc#0J*S;97jCK<pz0~R802b6xv+^ahigOZ^`V%+rfd)Y=3wqQ
zjSC-q$Kt}NI0i5pmsJLCd5u3B6F>6kjbB8RwfqsnY{XuHG^&s#x-F+A7gfwHG2>=j
z4LSXWWH;h~K8tF!?Iy&-6KVj}SZ_1EBf1YZZAJS)$f}|mqaD&UrPN5fQ5e2DXGoJp
zIn$jdKdY!Jf7YNy7PDhv%3(q(si;)oS9C5Pt|BPd5f^OC`CeIc4uZ7^+~A%poHCv^
zNz9shx66TLHqBG4P1Dlw*>6~gnwNrF0Ez`;E?O~{bs)@3x?OP<Eedhf-H1@^3UU>c
za0Dgu;GlaX@k-q*vujPE1%5B|K%?tafllfxpI<{Glu(vKpCTh0YS5`6)mdl7ay=O6
zLY`7{*7}~udVCLRz@Bp8P4-U9$_c{eXGVdz82>8cH-j8Xet@p;A*oxWQ_qRbs<+1Z
z>>&9r#e#B2qbN%Ga>t6$M7Ng@w^#6C&e8W{C8PE!MzV9bp%jATVr=EIWBMdJ+XU`S
zruw~73<4bWDCWe$=M4{2W)t4wND^V`*m3=lPPl=sP04uVFt9MtVH#7UulLnbjFGiS
z{V(~Ogp!)T5TaN6BYRR?H5fL3>N!<qYnDS!vZ~x-OaDYNFi2Nvtz@q$CloTnBO-!_
znzBMZd=DKV-ENi;2$d4t9;(eOWjL;cy|=Qi+oMQBe%r`W3%kL3w8JaqycHrOKouZ3
z9qnS}w!LdQ4t(y0f6j?%{)80ez?jl(k<|}wRj0Vt8!2({xL#)zv}COxvty+s7&to+
zuzc~|NcDHSdpooL>81}ZN8rK=9^=m1bLfW(<4!YU;Cc$EH(<y|-(xFax5ciOdQU2A
zRFo>~FHSqh!q)bS+m7748fRPr8*qqT5#P)Ub+sK?1d$Z7ZfOKe+ZH7$R$s0}`;szS
zRdp(j<D}$s>fq-C4ec=6k^jPDne=HUi<Vujl$Ff=>=8BG$ZsonyX5LIwM{oCDMBjU
z9Oxw?BiO881hyfqtf)$CAhf@p=&8*b=+La9O{^!wvJ_a^1OZ%SbDWCs6**e;OpVW?
zlfXb}PZ@HhVOD*e#f*tuOFY>NujtLODxv5MWC*s$mGi&0bR5iqpF-mBi?FC|@V~mG
zPii6;P|n6de;d~v#nc7u{vt>Y)4G1I(o?HcXy_jj_;8p(LD~-tZA4?+*tg*03_7E1
z%74f;aCGMY1)V6SI4r<BqD?C^YSsX>@PE$;agMm?UpquaO8*&Bh>sSacJBL^+-v%S
zZM?#7j5eLCK3^JPpq|&liqb<F;J5S7MoSO9>hl${ss1p&qDzMKsGD@1kVIW7d4qOC
zB92E<mQXkI`{qD3Mzx##t|Ab}EMv%;90Bv?Q=6JCEbP?LmaYVwH}^RPQ*@qJY&j>C
z*W9kTRxc>yKW5H{uu_}5WJ&{*hcR{Rtax;OKkpZe`3(<sT0dZ%F5q48u1EO3y1NsT
zRGm!tJC7Ns4{vhwQJ(C63$P%1iTgSo=GXobWROyE%X5!x!|A-{P?r09iwO55Rj3L!
z!3@>66<ZxPAt|Y{ugS1Zi4TnqobL2A9^uTcN@NA1Z@8d(Ex!K|5fo`eT-_tj-Ah24
zLC>F)kAS?KvRTag)*v~+moXeUP;NP6>{7GeJh=~oWgVRDZ&VJvSou|Ai$a)vw$sIo
zP>tqB2SP+G2-#}xq`T|5Tj!uT>eYB*7|+$@ea0Iiv}{+BB9ypgbR}Y&KAX>i%|<DW
zYNHeVO~UJlwkwaYY-Bq9{4{B>E^ff@=zs4rrh<)in0~49^iJ+R@qtdk`v`CHW#n<U
z&=sk($a5c8K|Jtj1~wAxEjq?#LL$aoKg&s|e;~*(>LngO^+2gJ5#8flg>Xu=QR%Py
zQSvdb^$^AKV!1m<?pX@#dU{K1x{^+6$bC0C5yGMp*``siDRf$VTnv-i$2dGaRtfy>
z)~@jZ^e~A)vxBx<ojSb3d8!f}ba}Pt;VeFegMpor$dUpdHA-l1YPK9y)k+r;qsB**
z_FPaZtfc<x6`1=WYt|()<WtJ#+Pjdc>P9pswY7#)OAx;;j;e9_>U9!`!{=<(3@gne
zKp0s}xp|+5@?%=PS+z1wEV&wwj4-l`l`QsHFCvY>p6nDx4O(+T<TDaa1`Nvwjs<Mu
z-&F1rZYB<R6mJR(M03I5VJkgzna8H0zYfBUF<pJhWxV~i01uoH2*~EKCT?9M@q1a6
z71TZ}f^DP{Ld7Ry8_ViA3L;<h=+gw#{RVa-<CgPgNc8N$Gd@bw{&|c`bSQJT5mm5v
z5iR557=mGDg<V_Vpg!Mssu&c>Z?h(};fqZGeSGy8tMEo~^|N7<StX_1_8cKzUDu3q
zW!^nEYGcr*%e~?geYBi0dZ5k3$8Fz3@mV6ej}QVYzgd5?6XckmuH|CeCft}xUqUB}
z`)#6AvP}v*?i*;ih*x3;aiI#Gs*iANgz{nyb_746+e3*ftSYR=ZnFc48MQ2E93#9)
z?|cGw%1C5Rch-`05}8d$mV<&1$8VQ6_F8!Rn|a=x&~U-;@b|d~;fPXKriv-TR1C)}
zWL<@Tz2@+u8uT1dGCcC$z!|b1C&5W)RNtN=!8H*~v_9bnpbJB>wfAuCv74r2h+@4C
z^s#9q>G|IC`ov?j{Rs*N?{vyo_$B^wuv&z?==Vx0!jf@0>sLC2(~YmVbqw75GT|_t
zA+&p@l1UGB;TmXCL!Rb8RsmASi~0aIfoU(N2)&98<uEQa*>++vHYTh3$+fb|JmSK?
zg@F>J-Aw!;8&`|edvV=8lS0YD-)HV!=BYP!b2v4T$&h7g-R6;tFqGtmmb)17s%J~2
zquU~w%Wlrp1XLFwH-|$I>^}|KYJ9=*3W&n;xe`>of}J(7KwB_j%&Cf)7^?x00y3MG
ze2e+!to>8sII}5>Q~2xHrFSJ1jOhbmLjtrDuD~)c!I#uRA3Hd^mUmCMhugOD^|l2L
z0v<MTJ`taqFK=Q20U%shUiIioVp;cncvtn-8`Xng2lK=Kc<$2Wx|w+rASJ`)LJ=xE
zy_i~Z1C_cUaS&n36`EwU@=;8y)WS0*)E<AJo}7&XHooN*!0yf+$$WEZ+*%WR<)>OS
zPgvNK?H1W%R-c)4PMKSf;_cc5z#07~EJ%hZ)#l&^x)UQ*CfUhVTf~N#E!tc^PTkkd
z^Cw9NFx7yhZ7$)xUkHq&Y(Y;t;hx5^KjfQxrqo35$y?Q>tgzCBXAH`^f@*Jd2{mTs
z<c$#A1-X$a4pZzbJa+cU*wEhpKH~&3_i%M}H2n+s7<B?}GAg~^G}v6Y4Afbv;Io;l
zf2$SaX;ypF(WG%{*U{9CXjTq4y=~_S9fmbwG-K_&Q~X8mXpUj5JEmJOeo#vhkHo7W
z)1}={158lJ6|x204nWB*3PMoAVkHFtl;u<*<&~KvN(vF~VH*SbmiAf#>d~^kAmhGt
zB=-ZKwOAc1s3|?Bq%c_y()p|QxRW6&%{kv>_~Q)ug(gIWaNRw9g8l+EiTfl6D9bMi
z*cRf^S}Ve!&I3d%Vj(5>Jha2f*h9lQ($U&)mwxgq__OX5Szzb_9^LW)FGlZtsg9%-
zvvo{WtXTS_Q*^n=S+8W>ih1{H!nsKBOz~o2ADEHmW!xn3yRyV7xp-qc6T9bYho^E*
zUIKVeORE>KU9qg4I0U(_x?H&Azjqazd_)itJ?Y^TE<8-R*aQ?X+ZNfpXuNyaT@By^
zC(-ka1=~VJ792scfP3nEwEnQyfMPSlDj0M78{3)^9@fMLs}QbuADKw4IcB@9ZZmN4
zJ_CdHhFzHyx;xm}CJI1xSt7YlY|1lwbyTOdR9xTotSAvAvdXE-TA+&8!E_md@TUZm
z-Zk3RDviGM#}*-2%Uz#Exx_D@L@+m>KlcoW2_3to5`iqzB2vTgo^39ktQ}2{y^DJr
zZ*d-O8?7OtTj=NaraNsK=!Yy*Qn!g0w*>k|Iaymab5z7m&^Mz(!YhBXWAA>*WEP<z
zm@%YWn~b;$LsUJp_oP}qmeA%Q+!|&W^9>1fyzcY8{k35G+#loTx*8M+DeuVz@bkWo
z#*N~&qO6;VsE~6s1!2xZ>o$tdJ_%-sq;?I<<p8%IXzk+7JO9<P(qe!3fw9$ji)L?j
zoFttjKK>Dqe)W$Gy4*40a^rPx-@gWFX|NPjofO(GS(Cio@LqC^tWV2!h2H<#@2^I*
zb8W+vxGw1EPS`2dwWs!xahr@9o=wTkm&!z~(ULFp#Bopr^Yq<2BfKn%Htl{k7@ygK
zu~^`~A`%dTd}@B{td{ofGm2-O>zPAsU9_xHsBPu)!RgU*Vv2Bx5L91J(Se0}@U_=A
zGtIkOOO0(_C&W<}3Rg@@5+6Qi@QSz-Exg`bmy%wCDL0N=qZgd|tMrf*qrv`Bv0z)r
zbrIcj|NE+QG;bu<b}N2I$lLR-L`<Ir#DU#&X7VJvJ+ns`Qq!+mN1Xmy?7I0@%Ckp2
zQCYVjC2p$Um+2eMmWReWlLn~t`1(lSwY8m93GJ;N0V?1_7}S^->*orC*^V1@(LiH)
z4s#K7b-tEj{qB=M4ZjJz4gD(Gj_E|b2S;rRaIE`zgZl-MSQ#c)3LZwims<~<m)eNk
zm;XEtUBmNkW9NPtyn2{zKOX{Y9|^T*JV+$DS#tLg!V)(~sigMH2oV6|^?O6(G>?QK
zJG=;5$f!E{k<v16On=R<K+eBC<6hNOr3F)@Y#a@@xK6%uDf*el%FM0K5teuP*P-=V
z4USbIFrN;)#&p}nNR{gB<F){TydvL1*CA}Y#ysJKHk2~guO{@wbPmZZmhIDv)6!^r
zB=}Jx1=_F%>zmdV>083p_A>^$FL-_OzanzwgD)z$gKs^Kg`)|Wy3-Bn#Ue++><4A=
zF~yC{%Hk2jo?>{-ZMyTUxy#C`29b6gUpF`mq(B|VYa1ILZ0W5du;D6<_AwJh6t_%V
zb-oGE7cND0^0+x)b9iRE<^t`WyKQ!XjWI(bijNthn2anl)wcN10dQ|Hpq+2Zw$0c#
zjb9KoJ)K!yoh)Mclos;466sW!9ncNnq3`pYM0Z*+txn{iwuQ?k6R&t1X`rs6g+A6X
z#JSyOI_$v(o4I#6<T|TXXCx+*UQ>{6NF+(-Qpk}Vol7xzi%3AShKNyF-@=cR`qM-L
z5w425cXeIZ{}dD29X<8;08X0DK~o3i>NdlIme|JRaiS#+XLR$$z|{rA>f|qzh3M0$
zoG_I8%<zVKyuXHE%W`VgZ)2v{nnN2K@XtepM7zLI7Xy&J=;Mk(hm+R0I|e1J5?jxB
z6{pv@*i1U_mJ#+13MIh8R5LW+E6!^<e?0F^4gc1~O66c<(FdtT#BS{B7i_?0+2j&)
z>b!g|svmAZ(`W%eXTeHqvm*HDn+D=e2l^<Ox+{LE4=I)pN7?NJ+}^61wQ!Ipy;O8b
zEV!eanyc;_w+R{m(H5UJAPk`%O`9f9zz>Za^Oys97_mC%Gt06gXc27R@qt5|KcwoX
z17G67^_f@i%k<1bL(Gv_UiwXA=IeVduj1TiOy#;YGx%f$9X5qz*ZMFsH9H9eb1hKU
z|M9}de9vcRB@RxWlv{&fzqKdUxaE&#+yRdP@Qq|ty%fbwKJ#olWKf@{^kpZbuWkvH
z#Te|Khb?jo9rbud_t_!H;2lDoE>)lR9fSVS($z`sIai|<ZnR$UE{tL4AWiJ!dG?(>
z6Us)jxwe-|xsNNsAdfF<@Z*o02s4l(wCQLZkby?Ew5>X#58@9-#SMQ)(6B9{U`3Xd
zN6xHgpt3P*E<ERw7hm{eNa`^QOld2pCP%BKBHk$g_hY4uN$%(dF6(VcOK9KP+wq(J
zFrNVPP?C@``Ac?Jq6{evW^1kIQ_2wj#L{o|#1j9HJ0z&n)8&azwlFN?n9)&bzVpr3
zLx|*NM6(JSWS!q&TBt>64M1vf@2Cy4nadVcdTPgs-G|iJ*>20A9_xxRiPb*((?a}X
z^@izuu-t};<4|-kWQ)J3u2`ML0{A;@8VvjVY5MN&_PvuhbzG#bVs72x@oHF#<^9eH
z>pt?q{=I3hADOI9LZW!_@CXIs;ZdJmTe#7-1ut|M=?_?gdo1yXhk8ZA@Th(K?>gxD
zfE07X3B0MyhTdPlB`SVsrUvYSvx7}9d-ieYERO$d+8VguD}*q^Md0elg$0RSwJajG
zQY*w<_7}PN`X2ZPc5uE4g4X$cyTNr8tm)+Fh^iZ<9k|8cgYArg!&81lu*UbxbvHQ|
zHJXvZo6^X;HK0@aPmUZMb*vmjKU~Z&Pv4y$ScS_yx3%F2Dx`k^ve0i*V&|7XpI=%q
z^qo$x%3K%)x$gPJhDgrReDh3zoMaY8U#e`aL{+~__c?@hIbV0RRDZ~@yCn<<gctAe
z@&)7j5OgB?NpCEzrr>1LutX<fvyF1{FI!R$1O@sbB6e`2e%x9mDM=6Aq!7HK3T#NZ
z8<7c!B)l$Y&#o4aeSMmz{GGqQxOr-AQQvJ-1{!^hnKq++)!6&8pp4Cv4g`b*zrRnj
z4d>Dfoq^X|IA%;=CU-(@C<*AZt6QbS5wrDTEEr0?(@u6jVP%J)AdYT-VI|K}gUUFn
zKX+Nb&2{m5r$?5L2;<yKe6xx7E*wbdx;W;9eWkFBS+JQmkYZrD{SyR|G^<FdP-kbF
z3Wr$F^gziNYwL9Je-TAJ7Byy=wrs~!47F->Cr?G|-z9`}tUpY_RRNDX<)FuMo|m=q
zp&wWe)z*Nrl86T%$}b1P!qtVHjQ(06WBzXZz55a;?*rL+5fp5qhy*2tk#<JI;KHRy
zF6`!71BHmT{@vp2xGU(V*hh)B!!vm!mU*{d3pq+9;UnsZ!>@!c3vXf<KvY<?q`e2v
zi|#iS%tm_C_-C1qe!Wup`m`_@+IkFf<(1zU(i39wqYH1RWeIBlO2|4A{Jo>SPN3hi
zQIA@P>gao=y^f8kz3q^pG^LeXHlfRx0`Z@;cbAdmOtRy4Ku@1%GTBUS68W#>SO3}$
zL(nDJq(g}}h>IhmST<+h>W6Y<Vr`_TdCAj~gWeN?Qvevl*&?zj_v8E(8fBfVy(Pxm
zYqjT5#TjNvw+dazkya=xg|<_x3%xmmG)Ebc4mbC!6doF7*!9qEk>mu-`gBL0|CnCQ
zsUU9)ft+NMV|Y$Y5-?km40`8K>JAi`h)F}C<m7M=3<Yx%>i9?6oGXXeR6+BOdALBf
zVAn#|NGqnGvYnU0tKXuoAj#2&EUZXIYp+Jj7xjg%N@gw$F=|~F6;l)IUbdpI5Y4u-
z!t{vfl}8)E12%K*6tMMHo6zn9a#r(6p2(gD?W3a-^C@hNz|cm*Tq`=vBK<lMXCth)
zZ#)?3Majgj69n9n+eKfcaDIc~pRcA*_;P@$$HtY5Ejr2tahQj$s1H&g(=K@`?;r)j
za(qz)5g`vI!djsdG>|T7S@4EJ{p1vbpI>nqN&$u$R<E<Yt+Ii*m?S^0c!Uq9FVrw~
zB6e4=CH+G$ZQZz{UQm)Is|U@k%gEfPI>zmrwL9D}pRP^L2M=AZU!rVR$WhzOFmDw}
zm!+j8@q*3WV6DJ92_1Aub;u)6D2pvJeEv5lDSOInJtQRLZ>@el72?}_9dg}SV@O=d
z@eZ410Bn-gLs1<_*+PT{)Fd4`n_pogg+&+Lx-;GqRa#}BxOzt;&MIAOs_Wtatl7Cr
zx{fl#wJiDd=Xg*ouMJHkg;XlKUfxNQR#ro)RNi2c#qz3q`MQN!d}N7z=0+`@fq=m#
z<v7p_64;rzT#XeOyOh`fG_f%V6%AH1lL=?lUI3QgLWVT^HP5$1vRp=M?Ox34MHNPL
zPs}6J1jYfJ;tUP{O;+Ts4{kj~PKW~XRSj0_W|=m?US|hk%j@}=PCM=Zx_2nm8Ja|C
z>j@td*BUmI@+a4s=d3!6_$Myx{S-ppC7u^wc?W2ud&$Ae&yyA8?dx;<){3obgJ{|=
zD5wJ0q%|kuV`lt4>y0(lyse#_L{gpU>;o4re)FG-6lkb77Rce%j12<O`i8VzUI1EZ
zZR~O~rDY4uzTgv!UrICO2?`Vheh8uKmS32`<0q1)YNp=2)dgL)j5y0k>En%LJ7p_t
zd=lXRCbfHrphMGy1Q(C`(#x&YlQ>!(4#{&r-2#mEjB3gIc1z8`WSSj5CsBnAYgZoe
zi?QgiqmOTLvO*&j=rwVHb}?5R@0V*F(q8*)4oEXs)ny^ZK0FUg7q!oY2QrYPL5(Vj
z$Q%(hJMDOO%I=j^DO6bO-!U{K&lZ}{bw{a9Vn}cKqfW^?I}>@&w~8ROH6_!4ucai*
z+N0`MMLl@8)nd8|vr2zbr>W-9GTJ2V(v3fRC0i_>1epV9=SwcK%Gh=Xa{%}l(MWCJ
z;ijTXjy8uGO-Er=kgT}ec9G*h;LxH^G?>${E7g1-*!&o86l97LY|}zBV}&;w+3-zv
zDe9vd*uy0cCtJp(S}LhaK$B(LeOD*NVOLC1mGB(DN>Wk3fc}(#1~-cVZRQ-Tu-g*n
z3-sU+#D+nqZo9!Oa6wT#zkK9$YegdFc|UIOVZhtF?`MOUA;NjXYlb;;a)bJ*!sh9q
zA6vDts`)U3yX6=AXtmUOYJu{Yk}t%{+OZoVO0X4TQ5}xpG%SV}ybbs4UA*aJvFeXs
z(^aBvrpin{{9*H?Lr0NZb7p%(XT7M^-fm6N;OYNR?`9N?DLupC2t12Y4YZJL+39`1
zB@lpAPui{{#rf^e5jj$O`RJ>=XN~$Ijwozxf$(@zPXSxHmac76Fjfm~o5>a8DS~e(
zd!N<*8{$+{1t9Z!dVW5pAT-x3CsBpRc%&=O0!q6s({cczy=ZY@XDHVMs^M(}wh(&8
zGi~?nc)OVs?ia<Hhi@~E5WRTVA@}%~kVQxrSGTq`Efdp7XGFJALO#_+j5^%wIK4;v
z=)#exsx<nv(6-(Xq-9xLpshZbRP((fh6`w$#7&4lx^SJH`o}r*MWsyAVm)3<l*6B5
zbFjfK&4*dOWOW~+q3QLwwGQ_Y+)z8sp8heC?5@{m2G__-MeAE9x%Q+U?dpAIWcgzA
z#HcjdXiu!MpUH$g1(bEyAZT6G9vAYgO|f39hD)1iUMrPA8?~-dV*Yfn>~qDUV)`|$
zqzlZ5B~4^RX4=dRQ%?RN<FhT|clX?&1usE%iYG8UNyr;Qnl7)Ol;}mMg*htxt2jAh
zNvw+}!U1Zd`(<B$&19*(7oWTQ%mO5~-pn{a5M51P3`WYDQfUY>RO*5(x`daqJ~c+1
zJQ%LUw4-<ivPiG$muRKXeW*RH3r4B-pX^6daBu2{r18H8+NzF(cT7RZnh|13%4^@A
ztz#9r$`oc)FtUA(Y8-Z?VO&xwL6q4TV%%q6;`@(&6`>oTc(c;LQ7N_-FIv#^smXNn
zuE4`*y_gTBIiI6wWO=4hl@U&!Rgl48F^P{jJx!2R=T3QHB+>b|m`AQqs6hRErEMvu
zB34zWKiQm8qU8ml?56ObDJvV0&>5GaR>A4fyD_8q>*zrzW{t+-$l?Qh3B8Y+vvk?3
zXk{7|4+j|A#h{G`nD$XczY2k3KRsH*()m9p-(OrO<SUvj?9bluy5RBf&kW0KGsCmw
zH^%aW*1hrmgbL8QxYkKu^Ms)FDt;=-=kVz!g_pKW30UEubV!i^ylv}2&hdR4I|G-e
zV+_}r0NHk~8rMkiD@-berygO~Vl)iYLCo`iU06(eB^rrAV<5qBN|vg9ri%fgi<n}T
z+-$!i!<I9JAFpn&juB|k1yohFcG`5*IS>sN9XL1l_$L&84JVlpLKVzu4bS}z)2f}o
z7U&fhCWWN%mlk^Z^g-?Slbg*BpGN5M=QZyAmoJG2AK@h~=g_S3tbmuP^Q8M-B^0%%
zplVg*yZsvYvm3|RMXrBG+68(saG0ji);<Vtr<;cS{nPBLNsQodm{VTu<5ZVAKi-uj
zJgZ-X1sJf|MSOno?s_`YZ^y;_FPVHV>R?fpjL6FPxjjMlGfnG3r!%EiKP-cskjlw|
zgc%HeGA~|=h&roQjs~^y>FuJyyWUou??`bTs(2=NDFrvtl5}+jmf>7%s3Og1AX`z+
zh?uHq(z~IL6cmu>cHI*ni02V08a0YSGjXlHyRUBX4Dtdf#vJSGzMU4{hkk}Z8It4?
zgJcro5EL4>$x2(a(39nQ0vR#OpnglfZ3MY^zzG@8O+-?cIJDAzVm|kJc8rmrr=u!L
zRVZI{&UPcJy|1Lg&0Rrrqf((B%hzhR%na>2Wp*Su_kL*qiH>*86dzVT!7lOfoCqa#
z%W^SKB)4%<pMU6Jakq6TZ9q2XN|?|fX1R9v#jAB)nCpWgM%~E61cRnmj2?1NXD`Sy
zK!H)R4AFM%iajN6VyQrdS%}H;TM)T_rkzw;bW6pPd19u^r&5QBe^V@@6Z^!NWd1BO
zN6f)iW!C^5&0Kz}A}UMs*x%T;S@!n!W~3U~{7)N9@x|o+-C6dc@fFpDCZ&(Qrm8<5
zDkiz53#$65WZ7k%R90(hhs>dv)E5mS&221<@8vNg^>7u;sdX0nB$WWUL`OsHeHye8
zwKT0}DI93?c5KoVbF2*dtYe&wR8PbDF>*FQwljlwFlInN^596Bay9h+Xn_5O{Ai<S
zUw|?NN4^5xl>y0PV^=GPEVx{X<V4$;UOWw5R_$`dgu8fib@33pBhS^mlznn|<q~V8
zck9hSrN){4TP#G%X<1(K+Y!J#>g%s;c2p3)%9<cB4m&H)B;xsQa{|^?6?8H_tU9OE
z%A<@*0mOqXD6PC2p$lrA!;4ABO_p+pom)Z+2OWDqrds0sjB@%XcW|rAV>oQ#i(?V|
zG~jXC26(ecr#<;{M1_+#IWp94bLUu9J5z5GK;ZrX?~VU(e&k%r<k;6=hw}sST<hGY
z-z8Vy3QE_3v!jFPc*Pm}r>+%(!d<ItS_pBCSaZ~TqFlHMt1;K_c?nxK-~8-d?Rbe?
zFkafc7R9nhOT7B{$C*+z4S#ITm&Jzk4-k-)%dgUGaR;(IH7$18=z|8uRwvHLvYjQm
zRxB~UAfU}S=~meZ(Cb=|$c=VF{Plmbm(}iN0)?EYe4ed`d|!{wljTC<b_KlLN53}d
zs{EqQZHb1AOwKEkIrN-%+H6#NaTrCC@vo+lyCvL!?cpI*+#hl*;JiS6)?FqtpyaQ~
z$zHq2?gd%My=L!G8_-$^$2RNH{2@qcHsUteHMy)7!S+EZ*cExsA_xYwRf^n$+8n(Q
zVc0iDt)G+-(DUN?^q)v}6#ljOQ-Au_Sjk;U^#xNW{w^=hF6p?q`0(^%6BjRzu6AtC
z+#!k3-L(id0lYsYchIIYQTL<caiP}Ul^I@2M)xoqO#`sJ3Aq6d)9JKLz7__!EI8}&
z$#wGc)%jZKrE*pkzV*NGH*`E!CD}GH$_OIY<BnGP1_Vg95*#=mZ6uK|1+R#0mk!Bg
z8x0{*Rzj>l*1>QAZFzzAghJuS>+7U>3o#r-FsnxKv7`3`zZ$p)hbh*?+nc(rKKYw8
z1nehEnp2%mY>2HY0$GMtE}s9j)P%X_*6C&{dA4oP<PWL-bbE3t37}EV>0A47(x>+k
ztVkwdOl_Dx6x(*BZcIWP>%H`V3b2@^Wg()oP2#*!T=Dsz*=RDz4JE=qD{WbO0LHjW
zPR08bI<xZtg9puY<UDNw*`*`rMw+F=dK{Zx;hWjDIM;<YVG*nxhxXTMSNkORa_a`Y
za@uwPlVt*lA1|x;Y60@t<e%KfTe$-_4`hPPPm<i<S2F%Aq0Y<e1;We<gTt#Orp`pm
zDXSJxHJ5TZJ(a*k?O&0<6n$90$~V<%4AVs5?RTwF5ycl@j{(`Ik@4C0Rh07=9GK)I
zr>0A$W5mtnMdoz9fQ}rIorZJh(d6O)FDDICd1#K<bqV)u5HCt6wI@%kP!f_Cib$PV
zl9gL|Tcw(rlVg$HoE2C?p5^Aw`|0`Ri(>n*x%f7$PNNe&a7$thCz`+F2tKpEUq~V~
za$QOvJoz8nM~EG{fr%+;D>)XMPS=^*7u-P^+Aro^Tqm_6(Hul;zYQ%-VexXsdwF<N
zyhk@_b^M4`EGBZ2Vf-kY!|mi#EGNM4v2Y;ll*k_(#Ij}6zK>a>tEiDZo!IfVb#f`q
z2QRD(XmmHU(mM=Sb{s9Kh+9*F_{5t@5lKF3(YrBuX6p{p#8zVR!^3~%&X=jj4;Zlw
zXsK8Qa-YIbKl*^XVxx24M$kjr%wFtZhI7~vsh93LO^q-JhfPZD)I(UNIP&7yRu^M+
zW+|_6O2MKvwhR27Y`Si1ox(ESeX15&tu%|7C-zvOMYTX14hYA(ckww}KOnn6Ef6Yq
z5E2!!)k~2U7~A?Ni5MUggsmOtdQtErpbpWoi%E$muq^C<B;CgVCCI*83kUn|qJWht
zwqrh49Izm~5e&B_SEt6TQq+qA@&0ym5>?J6GCVdyIqsqHjAi6pqyzzKD&xf!4X;yV
z<#RK{j&x5wQvlke#-D{=S>VO`F>YBSops?kQ3JHx9kuFB>7@yK+blUNP$|^4j8~}J
z1V=`k!<7m@_dD=2C?R0x*mzI!<*){5kntKcK_g-`#|Yk-HX|LW)H|S-33`$)|6aGn
zLg=UTq<gM9=Q|||WG_n$o@YgSM)>gEVrtVeQ<Ov($>KS#tfp=a*E<&;SL-wBcNz@+
zs^$kS;BEBem}2KD+R_Q_B@tUn`b@8jy!`X}LwHB6I0d130O`x9@MF~*dN}SlL{<{=
z^pg2FDUK2g>mH{TyEjs6+d|pSTH92mQiWBya^TLCAaZjW9J|h_FQL><@j&eebVy06
z4Xjiqb<_JJa37pXCOZO$i-zAcdK0KDelRw$+kEoAtClG$4?j4Em_(`f=dTp0hAPAT
z42S6kT*3s;U|IU*tkbDy=QwSd!ZQNhXur?%KS%E$i!!AIIeIzz)h_=ZXYbf0TDNTJ
zrfu7{ohxnIwr$%sR@%00+qUgosamH_RqcB3-KSOE`v*pwAEHOh5z*rrk|LlRBSxx;
z#7K}(C(|GL)9?&Pa_*q~0eOmrmDuG*0Jr&CTMVhc_m;&GNWYQ)WzGH%oPj;FQmif<
z0084(d-neVBiK9IIoti+PW_*@?EeCc(2Qkex5@F)=?hB#A+R!HMPgIed1r%Wk3%Z6
zTJO`c2%gDbVzQxH7$z_-(Jk`xF&&RWD(SdMdlOg?G3Mc5%0WNgVq?`}U_6;bbDtD1
zJno3j)L>jmU`jbYq>BKmaR(B|q8mw?`o|f2$f`kVJ(1>R#og~k6Zu@7pIIF8vyj9n
zw?PjLWuGO<T8Meeq*7%MoMvW>YTtO;aKz$m(si^|VxlVCB+FRB8!NQ0LI$lfnuoE6
zoFGHg8?FHsl2VTu>9zp$kkW!ST~2@jnq(V!LPG)!+_)3M5K6g;g?2^5ZR5eCUW@Z6
zqhv_#fJL1N&Jes_8CZsyFc@_R^N<mCJaG7%tl$$-CBZh)tVP*u5+otM_*e+69yDA*
zG7(iGs5e8|451!w{JD86pebUnwZNCGTmgwJBSakWEU*X@+_#(q^W(_QybG*{wzwu;
zv`XeP9?0tb75NxYCwOXLv`I$&#7!RFXT}^XT|!#4@8YRSMmIY<M_o1T#vkQ25qd%(
zF<!*WQKFxRMVuC!$8<O;+<nI~?V96}2T6D{*vuFm+_%A47sJ?GTwes;0_le7L;^y}
zuz=K;cd~u~W{LlOLF>~K><<W#jgif`y-faq5P;;E1O0K~#@5a3FV|0!jRH^-{&a|0
zz)(f2Yi)7$EwgAx*;o3FS2P8_Hi&qeI+0^Jz)1K_UJ7#G@>ZE68o*ogO1|M=pWwcr
zv#BQCH{ItRt=(=r)Aph><57!^yEDFi@0aU#b*Hi)-SwBxde3BaF3x^_#u|Kx>@#y}
z2^Gh1W=XF*?jU13X9vxjxgP9k09Ix#%lNQib@t3yo`>V+SF)zJG8nrpC5<~*CGa0N
z%hTN2ADvdjajSN=)l#n&ZtUqEcddeZ_%=o^Yn?6*xPrjjAsKzy*R3?obUU+K<?LR3
zXdnJyKpm?$!t|gmtQfGh&yRgAbfSd;o7fk{pbXgCIxyPZ4Z<&9S(`ij^g0KaWbCAp
z<u?5mTM^t>=;>Q6o=Fn7-MRn<r8m-iw*1*y7WX(CD>imj_~kaRw_u>FYb_()-+JAb
zfrDr$zs_W$go0e{w%04?i*+OXC&oHm?C7<dN`J4dWX;Re|A1I#wkPdaE1y}wX72!_
z8VtIHd{XCM)kCT8fe-LcwQP+Wla%=dBJVtZ+&D+ddHI6}Q)(Yf?V4EhoR&KQNW=L^
zPna$GA2@@lJLtMRRsO*6-jzkz8z+xn#@X6=-FeZVD@+*~?v9em95H}dbVmukCQ$@V
z=4yW7tr3uCaOcJ?)!1(Jo7h-|XxYQ|3EliDTc+ao2Ut{dYn+_l%y-+)YPahbtB|J@
zgnTW#32p=4VUvHYYVaGnJtV#h+?+2GeWn=bR=d&HF6<DfSkS2yM@iVb=x%q|U18%p
zDEX+ljl~XGKVU0s3^Rx->I})fRC(wK{b1<sEQ@HQ8_K`~kdPt>!ftbu;Wq$eu@8$O
zsB(UYfIcw~MnVe<l3t@S_C@1wp~?ljCWLch|FjBswJE5dq$MXvA!h>=4aBs^2C*=`
zL&Rgml?j%F`<NQ?Ig~B2MMhZV*R+a}RO(^Bdd2ckfOU#WXa^)(KwuB!4@4^bJ9Qe9
zJpZE7-(Qdq>GGWj!1@vsl+Gel6nRS(fn?WF(#er>n+t9e76x6&n)dus1AhiS(yO<(
zLO^eoD;@&t0=YkeMcuCkBykgIO9V5Sik%1=R^dGxA!^@=O+jY`rwGpI=#Jpgc|6YY
zN7`xABOXpE^P#{%U-Bb4N0TI_5S|86N(RzOk?spJb4w!BPCQpOg~~8eCP-7zAX<$z
z*IMl!2R%vrHuqO}03ayhv~p(0-i71~gJwpid}y5M&{=@8Xi`^vD3^KBVUjjHX>$2Z
z>NkNZ9B?N*h>I+KP%8@|!fD5Ogfj`yW8@kWTO*wruK%@$6ekN?ul<{4zvAEt!Lwc5
zQZOv?7Qs@%o|SMSaD7qaQs6zxvod0eO8QIyQqn{n`GyV+m*~;(1?HN63U2=0P@rDj
zB^VwaAt--}M1=?ver2vJL{=@HlZz{}&PLqlOd2qh04BgUT<A17W)G-?FK{PUki97Y
zj~PZJifqN`%s-g!(T9wi>P!o1SY2=g@`=AIukfxzYY#a=yQt=D-8d-#H@hg0-vi9W
z5nbG30EvMw<ZT+$S&8w*o#(L#HVW9SjmLblr?+*}9({k5uGX=A!r*>q&H)ffDt^s1
z+4E9W@qqP=9eqpLPBy=*=E(^Zm-j=s&<298UfOleAB{`7L$!f2swgjkDZbo%xJ+vb
zABq)AbL30gPR4VkG0Mpibi~w9ftWwNZWv0I#QW;YX+*QKKhj^$oJ&V&yYAemj?%?x
zJ8~AAXo`Rg^8-e>!pQtRb~eHeH*|VkXz{^?h$u75o0aZ|jIQ>;w|6S#Q3^Sko<FuE
zd#Me+{6QLl6~L{Z5wOj*qSLc9o~Tzg^;dR8{-0N*Q1f(G`KzHTNID*~rCon^P|ACY
zi8<7ff@gC2N@)}~606&WW%}Mh)XK|ZsBAqU&L@iD%aAvfUlm9zTa@!lhoP!InTf=#
z5g_P#31CXf>7T@SpoHXns<f~Yb3ASOQ-~CO8gb$*(JBTs;H=f~o<j?o90!qfb9B!R
z3Q|dKc#Z*qOG%B`c9ThRAF1KgFoLRxH+1)mNJ+D&u*eR2LgNl4jsc8{=1F;jTsGM+
zHWao!C34DGw7CcqoY@$Pf={{N7;waBX6M<$Frz7^@rzT+7+T)O93avJT}(gqMnjy@
zIA^$yY##FB#4je^dXYxu${-j7#t!+haCn7E;TQ3I;}Om|a=$iBhfsU-kgbYTdgtFu
z8U`~>aw>lF>Sv;6Zx&e-*kzIIx0ii21^khKabu>&RXm4a$<c>PfW$z8Hlu`)6B&f?
zv#WO-TIx#JZ{eyNVI?-n*PM^GlE3(Lj*WaKb;5ZdGwx{&Qu6x#eUg;k%%g&;CLx~e
z8Lw}OQCG#DQTafi&;}4}udHd14V6gOh%IC^jsZQ_>l7c&*w4*&=<LwkGc1HU9=49b
z+=p)poa!9DP^P$ue_F&7%S++UIQ3}&SeIZ=(CQ=76NH4)xQK5`ANgKO(az%eMTaM%
zTq`<HCP#TPIQne8I@Oom@YCDI;@R!1VV|z%0p+7@rIhL6!~4#{P#zZ;cX?mmxNV{m
z`WDo#V4RPNvX)K^AL`a<&urYMdArM2x15Y+86LTm;_&GZQ6H9|2PQ(V-hxw!x9~8b
zeD&FMoPK`2UYSK1;I~RF&xN@?-Es6dj@}7u7M&+Ti!84aJ21q**;XC(@nBkxlzaxM
z*Wx|O=%|62pFDe1L*B847PDyfRKz;H#=Pz28(#ZEP`qa)$<rZjX>;#+qwgCPK>{4@
zgT^DUfOy-+z?}!^bl`Eo++d*e%W5WioJ!8IftXn_yQmyGll4%KkeHKQUcf@kP)Q+C
zO}0Cn<)M_vft0nt&?HKo*9&ubshK39QoLr|ZJ7vD3=wU=j+(kLyQbx*S@<em0p})P
z5!6D-+oY<3)&xVr(xJr=rvP?Rk64Nq#VMAdZ*>H5o6E$ZnOa<89$7x3xI#ev!vpy(
zi%BjX*HUR~5e8*9mvrZR_H4!Jd2YRqL0WTWE1)qvF(&kP1I}0*T_BCjPdh~5rW;he
z8VeH}(+qMAUF_rjQU6&>J(r4>d}K~0AoMLqFmC(L{!{-N$}6I4<>Cl@_;X&kulu}D
znXc+60Wg#KA9dXf#+sdXM=buqa8k046zUmO-~s$jbYutT#JBI*!&R`n+xTOAUj6J3
z??1<nQS`Xsk-tT;sGuz40`Z!RCif1SiovE9S==r|rhc$J^7#V1=ey(hdOshC8%_(*
z8&;3M@h3llp=>QH;5|t~;p^RGpDOnz0)(4BHX=;W{s8)|@YXpjKSk$zkMj2*)2N`f
zCxJiEe|5C5d72yGZ=@3c85D|3J%e&$poBKF3Xh5Q8m9}Q8kuYavnvPXQPv_y*3FTW
zlujTcwFgY~;|mHv2j1Y4Mw^RJ>tC3_Y1LmR<z2^vG6Dpx5L04eskBe?W0oKK<0y56
z;h@?ma!{#5qh}mh>&5hE>`35YLY#%F$xvWAxTKg&)HfbfxhVL#rwtV>4xwWlC#$`^
zuA+p6Uhz@;)MON9R?<r)4B3m7o`w?fz}VreqCaS@>9tjwX0O*`A4=JFuN6BKC6Ff1
z;EsLAck11#V=_@Y*y(BC1AA!+6*#MAZpx*6;!Vg~>j_bn*CbUI@@SS50amDrVQH%`
z8HBICpuR|XjqV2uE^M64%pyrh`uHZ-NdOLpi=HcWAiBg2`$lbnSQ5ZT7eYj<f{D*p
zI2DcVV3A{0QK}=E8C{p1U2QYPommY?`LpbyLCjiZh0D3q<i6nuW$%|`tg5glZy*(q
zDE)YozXBeNoWoe7zp9w1A8VA5;BW0F+ITi~7>$?gJF#(z$4|CW^@EhgX}5do$lzNu
zv`T~QvK~_M=idbtuJu1EY<=)N&}UmhMbG!l!`6dIr|BdP3I>O*aq$F34gP!kMqiVu
zfvH_Qp-T%wtU+53PV=on;9ib;I94^lDef`ED5wT5-KKvI6%l6rNHAwNW%}R*KmF_J
z45(p=){qeeo~)IIP*cPvDMgs>!9xjV2gUb1s*^*gDJB<PveFOI{x}4m^RJ8|x>Q0g
z1qUwzAoLCVoWw?eA)E+?NcUX5&m-;jvilu6Y2P+Yqx-!XJ)FCDgeu%V?yEfyRyWl2
z1xl)rR;Q!mmcBj{yLJhUOT8eRqEg|Slcv4Px2dQJJ(~olp}*{Idrii6mMKDM4ut~M
zN#%hoA%`S#Zi0!8{-OVmd+LAk|F*pU$^V1?pDV=9CQi;y|49M-LHqwm0Yv-fA^*Qv
zfP72X()2(801F@h0C@jA&(Oo!M9<0D(ZbeD?>|2C|8SKKQJ%EjWI*V;q*njXZx0U<
z9m{9flfq&bL2LrGd`(0f64hL1qEIANi+z@OkNs9pODrC{Ar6F_T)r|lYdcb((w!AH
zT+p^VG3@r_^SWdfFqI)Jnxd+pk)(VmU`Ykx;V7gMT(1e*ORsg74UX+#Jq87%mC(?;
zF2KDKu=T$~yokLdKDFIk0?^PDB4ex&Y6qejM`;(q>HD1Bf~<Zj?}_wA#ml2Wm86gw
z?}FrVyXQq19Tf;&u%VWmE`$ptP}s|EtAXrIG~rgALU$b?>h%PND}4+l7?$QJa>3+M
zUT0jddtjm(KG>xVUc}=;tF*ZR=`{wi9My&10QzVZF>UZ_`Zf{@DR=LiVjyDFG!on@
zpr1TfnLV|M%NC>=oIJOX`u!f2f4e1F8;WoR%Y7e~moIZY%3MD`bMz;9V!ko%G}!3=
z{LzxrET-DIP=%JC#~zUS8I@=j1dpK{YrgqSadE{QQH&QHuWJxkXWmv%c-j~T*9{T=
zu^|RLwo{5O+h5W2Av=n9U4Lc(?C#RyK^uHU@Y?Dg!Nz@;@&l}5U`{8;;GkFkfO*t?
zW^UoZ43tW_jCVZbPT(W$T<XppBJKyAoz3LsgPpIffb{hq`t9wzVw9Z`|1p{#7&fFA
z3JsbuvB6(kiZc`3NUmtgbg;3*9B4<N_NQh%gt(Ww@EigCe!P8<w;`MO)6}E8hj*Ai
z(-+`3Rmqt=j~s+Z8t=u8T-j~7+aLCS_HY_LK1e|SQUyT}0saQz|6pVOr#Ai<Tk!uT
z2$$8it^Nj~->V*BN7x!o`WgyYK%ZpGFPM)072X&^<M%DDlxpcj^p0L%a=*>z4dbsD
zA;U}A-p-Hhu&Z_JlPXjOV8#SaPNT@KtR#Cx8k|#J>ZxL7DI`V{Istyy>nV9Y1t#KT
zvJgrXdC3K9>J&ne97jxG)N;V#;2dN$3rZ;9rUm<K&Bs9QZ9F6XEGQ@ND@lO`fP-o!
z$d=VnY(5DmvIV|8toL_PE<8UY$ZWO(&hu?YK<RncELR+I(I*VzetVq}j|9{}%!m$)
zD_Y#ZRn_8lhx>Z(i}N>kxt$tue+F%a>TwBjXOkvCTT2+LkOdT@!lh+`M9*#Am-=AM
z1d*_&7C$$Cb@J1dLPkw2Vs$LJjJ{o0k3hQIVFxh;QC_>|Ea)V8Ep(bFLs8e%Y84xd
zFAdg{RNTh0eUBZAuDgUouZyx@^}AP5F=sf?ZwW@!Y0Q1D(X5fapWc8P&G)$iXaO5h
z{@Et}yp&FZ3ph*Z5Y!`MSG)3aH~bb}yIck`a`Jm@LBp+3RwenT>HYP00yhs1R<Wlc
zUNumC?pZ$E<u!p^nFdrE{xi!mILZUEXs!))sj!5F;Qd!G?-9u@z5_YFjc717Vepok
zfH@HFec{srX(@>ND!*Sx%h;!UhTr-`RnjzrnDG5jrI%#i*i$OrY<Io4HhBm_AC&JU
z9NE;*&YtT&MrmyRLXtEqSBaThwgvHKPe>!#`>Z!MYn``{2C$jhMN8u;pHY$I<DDRW
zq86yy0tW5I%=YqFl~zfBW}sk&$%0qGuKUVpEO%cwb<lA(l_0J@>N9?g_oIxPaID$C
zzg`nECKtE6c?S6{kCgd?9NjDtT$={00&Za-m%cRszdjRj%tf_K$K6d!j}@x=A8wfR
z2f#YnOGoi;|DJe_K&a(CULLpSBY!Er`^Lm)(ZAjE1{^hU-vmUK#ZPy`)AR~t8!+Q*
z(Y=xPo>6$C0^75~@tWnh$}t@(emNZUm5`TI{kxAAst22lr!v(#I8#G(=m+>OX?bd{
z2@5QuwgLQ=))P1Y0Pa7f_1_VG29Ayf9{<pmcz^l7Ls-P9Y}#({Blx_kRb_)?k2klG
zc!UQl1KH9Q6GF+RK;<ukfgPCpoZnzg?7FS6M+=#M0dfCwI+?oCs5Q|Tkq1z!BXJP+
zWf15%g*$KIwi$ezP<%#<qIR4P_5_C8kBwf#B0>`%9GFT87ZN<DQYi<Jlt3V>mnVq{
z6zKw)00s?oI7fJ)GRmRK;~W@c9!#zzK)eSkf+=vx_)Zs#Hl$o!Jz^*bM2PmGE#^;6
z9>4kA_A$d2U0qvDy_Q_?irzlT$5J$#0OncFmmIHs^z!6;<IIZ#{#jv&Canrr=75Fr
zQ%|?gLmC1L-tJ(6_~li76X;+&D?M$)HT2maes>x_H}3dkWNHZ|d+zz3E0B1n->-}y
zcGBh2#3O~IsZ7I~osgD>&XgG+79rOolVi)1`-c4RWy?eMT`h)}OD1H;Me4TOP<$)n
zBkZ*Z!{>ts$7`32NLr+K6A~k`n)hea)9zTG-OKEh8t^PUoTSX7KO=c)w0z@Ox80M~
z7zt`vLn|)_Sqn(d;I1kgI&Repp-kvUAgYbRFnjpQ+Ss%*!X?2R27AvngXy6r*Y4NB
znxn^L0jXF85~qqg(g4$jrOIZZNxLTwd8l4MGq=t-AX4YGE{nLN+RJ6=(2*q^R654+
zW*N?KJ_t({L=eQ{)!|T$x74!YsUKaLs#HY)0!5xemAO2-_Gzei1g^{hfubidp1u}F
zvud<O51c6)4pz9+@cl^&*4Pc<1D&FbdI<n6h@eNW(#Um=5Qng<Zdtp8%bo}9nhmNC
zzKCYG?yMu!b>qz^$hipM<qX#&mPtzFmwGf~<vdxz{q!*;B-i;5i8fvuLVv2M1C4S|
z@5MCV>G{cH`Gf3q!{OEYtBDlyG5eSTb-tSUH>7#`xes#3o1-2R^Z2Ry7oiL1WE>?C
zJXNv}zOhQ+wIs-nb+zfR-_eQ-C&=_F&w`k!rUV!3!oa8tYUv(2{(j?&_T~nJsyn0@
z&61jZubi}`5Snmu<~y5mt`6>S(lh$MWc8l)A-vV~;Vb-CQVX~M00jR=Rz?Qa)`kW~
zR{u~ITFbwO!)R#9VRNGR{#|Ffi;u{RO_Xm@>`Y(_PM#DLAhFR<U~x3f)=#fD<HaMW
z__O=E<`i)%NMK!jW9g>M8sS5i8#n7>&XyIEPoRzj?+^->&(CeMbm`0;Gh)Y)x~knJ
z)TusZb&#YV@N$>UAYCYmjA0fCKIULr9}Vh&BODYD9bqV{bAvcqnh0?vW)obB_-Z7P
z9bAxL4^~faLD42v5Z>T1;+tB<vXHC5BV&O?=K*Wa8{}Jn&g3WooQMQ<l}PDo$2=e}
zPlo%j$Ck=pOrj7<uHDsMuY(t?Zb}2x$jRtxcZchGqF?RRHD(^GZ^NfyS=b1g9^H?K
zhh~=j0amGqf(pW6Ny+z&Zx@?g*nb+}#FmcJq!4U26j5Vze($wn&ceealn@-{54=b4
zWRMijO;okg2^MH(LAE*EW2a+FrIKaS^u7VRUr3_&SZ1aaBxNG{Lh;T7A(Y#pt~kS1
zt4Y1|>Rb1{h@dU%m~fEpAEFAp<_qQ@wP#Se3B3a5G}aejwkJZFIU2vm;H<cfnMv#H
z;1KX4J3qPz`N!U~hc7d4obu1t-5Z7soaourr!xmu-26WHmlG3~oWCc_%G06T;J$fN
zDQHMpu1GMb<f-t><<y*HxJ|biX)j1Xn=yqql+&$Qz|9x#(k37D^9ypB4!#)TAApEB
z7@oKajE1+T&^9K}s@UWEp~YoW;ZF_hdA1IV!p(278F9%nJT9TuvRyGtkM_)Lt@qPx
zh#|n`snb{NkS~;lmrY%}(nr_M&1pACey>-M>K)nG0;Fs}@eCpYX;J-}NmHLUwpvG_
zE2o=kEAYclN~TEN{49KMOAN6@@J{HlzI9tvtpZKt;<b{y?S8?%kO28ek@<9`zB~$6
zgA4q1=0l(gLTjQ47zYtR&2ZQr*>p3~rCRw`6*r^B<Kka!B+2GQe0|v>2_Dytmctac
zp7}1&qAb$hc+6nOl;ty_D!5^S>n_<#MS@A39dj)T5Uh&~HUrk^>Zxzb^jge7G)l4w
zg5w}S&k9?62<qlU2Tw<TCJu*SVPP&t$~vlxI|?kQUu$Jf0<N^XaYq&ks-c#Vz~;=T
zSahelj%%eZbjoq~D=kgK9Wutt2jpi_tlhQNC_AAB5Q$VwubI&_K()-;D{d`gGKkBt
zYCH+4ty-;{nT8T1o!XC0L{*slJiUs0ChiW74w}tM=t^(LE}9ftf#s;5seBS*8ytIj
zw>zk`orolpNCc%M6zNYaen6|(vm01Bo2&byg~g96RH-6%TO5JoT)Ztem6I@@u7Bxe
zXl8*&9#MY`gxs<cE($C9H<swxrh3A$?h{f}Rz%z#^eq)lVmQ~c9!IaFHNs3EWr{+4
zTR31(mqw{39Db?2R6l-cy?QNzU4mg8!09*Xrf($@V{6E?*U)uZOjkUfZ;=W6LNWX8
zOgz1N*I2sh`2{eJg#J2Iuhr=I+Okfuut9K^z6rN8q46r*mitiQy7B;z=kP{IQHUiS
zGK~N0yfi30A>n?2gsiruEUx%vE)w*CgSZ~P#9m5Fjabp)#F|=st*qDXGARwBe$_vv
zBnuJ}P*#H!tl_?VC{@)wDp90#!i(N|_MOQ9g1no|l<s$1-X)4drW258Fx@hr+{O_L
zalp)inZv0E7M3J9frSo0J71DI8Od)6kG&;LlZ{|6>2ixd?!%>tQI{eFl#6In97MLR
z|6~^JQ;9=&E!~J0m>91Nq&1rg2)J~eO(Tnjt+)PR+KJ#WGM@V2)eO~ue9GPe1W;s{
zOF}mF-hhd@1?LIfJ{MBAOoa;b`*8wMHQvbyeT}O`i5$nOv{B`RL)P%<$szZhe%G{r
z?qjea$d0i3H0RH+gDJftz+yp)13&?>T)C^C>JBbZY0z#~!#xEtH9H<_{K~H0a1zL?
zcCFjZZcUPoes?mcC+droY~#35rCgZBryLN?bsMVbhVqJ5(eARbbOTGz{tJgP?=wl*
z$Ro&r*hOqdFdg};3cz~rWX;kX>_a-7Qid<Oa*p%V?O$@raoy0&Ypu@sfk3eHC>1Bj
z@L*aKb?Qe+)e+@HLpnKg@k?6xy4|S_#VO{Q$@<$^XrmxR6t896Pmrb#Z@ZT@o<BP;
z6VbmPcvGG4mz){^8_4)!S~*8qh!Rx7cX_Hd<5puyP{@SS>*c4GG2;d0`|6+c(MrPn
z%LQ@^ZuYqO;2rw+CexJV$S4NiT<rRz`!(bK@@$owDuk*1sJq20)thTJFc0Xt)u_$=
zC>MHeba_=58kCtRW=b#ReAc~w0vO+~Rl{`0XoDK&7xSI<yWNkbl5epl9z{|ha&yt3
z*>p18TcVapZCpvjf<@{H#C44ze-M+6QJc$6`qx-U5om>%5y4Ir{L+EhsMx>nBdU-D
z;%5NAHEE>?QIc`2R;z&Ny(q0-m}9_HZly8dmh{v=e45TV086GE*pLm{nafo4-=P0h
zo#D0Cgt?{MX7rE%01^!V0Pz1!b^agFwtp07-GP7m+k4G(>AE>G|MQN5eGcB2EC?#!
zfcv{Jhl&YxvY9Sdyz`vV$3AsWF&Gwz20+qur)+i}{o}7YxbHwRJTaxD`9S>0(3YE-
zo7roSZvDd{j-!9+*)DGEV}5;y+WOo)bA=NYGiE&*<d?@Zj^WK~cysTMQt6{wN93u1
zyD%9`^y!pQ6suTzNPpnki#2Mkpy}q24owgP8TBqG*wo8bddO0gXRvHRpVsgc8Uk(r
zr%7yQo^IfaruX$&ZELK*W>wdkPH4bj0YtEDUag1}5Uwx~7gRPqjjX@y%+=#$f0<aQ
zTB%=SSYcNGxQN^UN&37cQ8_f!J<bw?3P+5)5D;D`G#Q}KMIEF|4~hTe+_O=Zj|*1@
z(LuV1gkRca&}=9&O)3j2L(w<wB_exfm67ORe2o{$m-%xz`dcg1!_;&6>G#M$m$eX=
z(O=sM=qGb`;S25BQ%((XbnDzpl=;OyJ-RicfkE6>!&*-JR90jhG#FXf>>*q~euU#i
z`&67j2quFWQ8;v<TGH%PM7>hWr5NKgt|>UP2#vfO4u^o{8$S2%8GHLj1A8Mqz3u2R
z#(KDqFJChjjMyc#N~f>5pw^eoBzW?d=kYUG7VreXjcn{(;MLV6dL{O!^T6U=0TDdk
zxqcNLc%0_V>w8^`(EHOT{K%HD-|vq@&&_mWEGEoA4`KRBW_W9e(6{PkZgCv8Cv2fY
zymCKnL2cZ;4UMNX`*OO<<|jJ%0QrQajgRH2A+(U>Rj%W;z2B0$dI^)2h@71r?<NdH
zh13tNk8ZbPXVd=LyV}3uLWLZCM|ul306ZCv?gn2=ON08YWX&P5k`6_|OY~0;ksfRO
zS>AwkyrD5+>~m=zf&7Z2NX;9YHGOrwd0DDOsw0C7`{U$OitsUk@Ar+{pR~h9Z1>Wf
z$wl%fk8krjv+*>`;KkA)1R~-wh(n3&aVO7;)Iw@(0kHxjZU@yDU8b9Ku|Do{%b&%$
zY&$r=G5@l4Ah2Co^oAGrc2<+>GsjSB;uNDuW??X;qfw;n{nJNN88Pqp^z&etV<NaR
zr|!*B5)dIAsYt-pdH3!G8@AWi$MFPcLghJO)rCI^a)hMW#y-NQRq--F32zZv0A<67
zx%(%=l7S_+m_?vn7eg72Mp~-Hrm~)k*a&(=5W7uAH@IM$Y{?jaFrB$z_c;+1QL@1I
z6E4%!ReuP62;}hjA7DN7!xI)l<K5!MDYWaQ?e~QsO2=A3U@Hjv9f3g}OZ$xK^S+fW
z`F)k-AJ7<)c)ub4q`mjS#KaRogU8+IKvZrRUdfI2R17x->EEf(hYZQ?7g?!N-pI|h
z%h#sTJQiDJNFm6|JyiGCn<u|9T>v^=SUs%;wzxu?&brHFa}FxsAcG_HKdO(7@y0+r
z7kd%=4US!<Ve@8NitVEf2aV-RsUDGkQU{tN!hg3H<n%m-dgwC5j_&UU%>nbqjv`>I
z{W?5rnZ3!6f5^yLw7EAxO{l^7o}Fba4IL5`BEywe5Y29+gY)+`r*I~qG>KiN5}idp
zPhh6t)Ci5REj7eO@H3I5Tu?(T;xyvJ`@p<g3-d$JdAxFjt6^Xj{xZHWjf=a$n-6aA
zuA#~UmPreM@0B^M6Nt?QyaNY?ei`jCW_Zzg^9$q|@g;E=Co|#`=EoN$zl(oJJ8Qm}
zP4?ibWW0iPO7~K8be2wsEtWX}mY2s)7+q6jPf=z4A~7uCRFuhQl?Ma+RmI=LN}<D?
z9_NIlqcz;vt)|%uilw&07OwSxJVLzSj7@PB_{gsv$O!@Xd_WU;HbDGGhsgj=M*zXe
zAO{d|YLF8MgaeAu*3uenD5R)G2fc5$YS2t2^QUU-h`~!V_7=|^dK8*S6$hmqQFUg1
z*#PzAGa&sC*QoZ9WPLTV%yax^GJy3s5xOR_(um@dYS4raGHn|cgrAzT$@2}_4pA5q
z&D~6j1w~MfkhVLD81m3XDmn;kLl7f-!-%gVQn;3?o+|Q&W`0R^=dDn6m$ZTTB9N3I
zQjVvEAmFfSAYP^!#*wmQS)<+su6fmFtW+QSvO0YDR;swXEL)2#REH@uXklLuCVwVQ
zl@J*jsBAjCZy+oiMR^t(%n3-;m^0>*-T!2SZ;2%HlosX@O8hx<9AP-pQOacD)wnHY
z=;W5H{y7YOo#9Id%r|)0NyOP#-dRo@b+|tAfdL<9TX$eBd~?#2SCFGpwWFggOJWzr
zHEYnyH!)rQEf@b0`I@?h@N+aSk?XZ1-*$-T%hTu16(Lk$jTlcyy5y<M#N)BLOXlQ8
zX-O|iC6S^BMz$ZXt)5V|Vln~|u~8W&1N&hGXrVA}9bNG@(%?o1#0};(v5XJ3&zHXq
z6;(36SLkIn1-k+nd09P$*+|zCa`TvEm*h2KuhvmSzyUGlRoME=I8gZ`u1p7KTxx|L
zR82Bk<7wkUcImCLX$$oAcPV9C1=>Vz`Cf(NOQ5NivWXU&ntFR~aI1*rwUZ$w4z*Lz
zLlZv<y9v`AhtpmJ<pN_G;0JTGbP3#I;5QkJR0dZU3eN^u%rtXQAlPn{%yuF#nFy?J
zkJep`*kIvzHDh$Z{Pk?*I?QW03Jb6|f*MG(1INo~y?WaLe)GgWQKK7XN7&E-Kf^*)
zWgKf%-A{nx<osW9aTxy9t|d+`|IG<j#nlJ!qtC~@UIPUTw=CkUc>0G8fJ}WxZB|JK
z4IiRGV37KUO6<t*lKFNJ;qiPbghW!P{uz?dQAdeF1ZqEUSo$|g5E1OKk7i!`LSsHf
zy|F>)b%9VrfHoMsbLQdeV4Lg`ik6FCob&kpUTZ*VbY9ogrQ86$Vl3l2msHPH(GZ^s
z9p_MAE`@E8EmdxdpNZT8iHw|EtByS1HzQ7g7b($4C1xeMgEPr`-hXIErFLvWnGpGs
zW+|Siua}5bd;R2hE5&P>?E~9&Zj{U>`Hq@2PfRnk%i&Rx<~kw?6Jr{p&A3maDzf28
z2S``CZ2S!B%gU)u*_g-$69;MQ>|-`}lshiAeh=j338QGYllGQmwsfN}#pypwr_TM}
z`d;j?yubV9%FC|%vp*T8>iMP0I^yA+GqeFDVCjVbV-+?F)nu2wH{R_AP(l&40o`FO
z>Lpb84ytp}uI};Tmj;U|z^hYQS>&ZShqpeCktfc*tPv<y8HS*IFeLjcC@(~I9u=R|
z?dw2X*J7=7)U_OxzPR&vCvq`1jydV=!~D>m{jvfYJc>YDPd<020rc^Z&s*Jn05P{|
zhbt7>9S^U78a>uQ`u969mH)z@I2Gu-H_Wn*F<o3nYIYdxq%!q-5;3aWOI8vrJ~c|V
z`LP)CPYDY$uD|a*^+VLIzmUn(X0eojml1OZ^0B!I6YMkU)pAJv#%+sjsm^O@-d29m
zt}Z1jrcFwXuKr6p8A!#+8WHV(b0qd^ycyFSr=_BuCmwEhPN60r6<?Kd#d<?fEFj;E
z|JJMa*a7{%Zr9_o{?nGIqLDRZ)F7j@6ok`cg4f04zU=34SHTOXr>%g9&A@pj@VzI}
zOIrz>r_$u1^%Fq!Rg`yZ{oLq9T|2>(-;NZ?tr#*A6_mzZ!ExeSvYpn(wjH{bv(63&
zr-uSbISW7J<nq_BlGz(~YBTa^+o6p=YkAUULf%i3*z0)j>#SPOR^KUA<83E%6Lcpv
zB)1o};s3-OpGY6h8%c4({+sUmi=IwtzPNb$7>nOR)z^a+3nxG&xc=z5;VIdOL5dD3
zBFdc7zss*gb_sv$U3ryE7c8&MF}YboVzc)rrTL*!t3<sta34JMjh{CiQaDmB{89&%
zK~*W-p9fmlvr8RO8;ck!P>ZT<83ZqQkLqOfOU|D#{O}a^Ze=tGCC5)z?0)w0?E_)Q
z5`x?as67v@5y{M{&F*{(87lmoRp^V@)^Ja7UF!3>Lab^~=*^^OZ#s4P4E%%ld}vkR
zXygW0C?kYjj-q331S=nI)p|t40=upncC8kx{v&2hn-6vke0r^H4eV-A^h$X*!jDIJ
zm9%Tclg@zc(p^r$5wcmM-|Kn7ar*>J(h)x2H}6W80dEwrgGZNY;cRI9H|qg1wF!UT
zrceyA*gy{sT3)1_B^L^Lb_vhQW1Op~VL>oFq?yWq2GwvP5gEaFGO9gNj|^6}`g6Ey
zd4X{Ep7X^x5eyz(yj8J;^E$n7x|}2jlhcJ<{4xVy5p+p1PHG#Oj#7xU`Am)~s7R)X
z`Oe2s?-GfPN)QDnR(t0h=jy;?e{Z|g?}OH0tzk~uWl<oddOuK3D=A0PMa@|QtzX)G
zeYtFB8qHNrIWEbV(Pt7i;DstAZeuqrnnoR=N4$e#?$7aW0^zkVV`U;;!O>J0PjN+)
zMMJ}C1haA$A>ufbVAkJn5y94&4dL&Me2LX_e?c_LmK#;m-k3O%c`AjZX$85#1QoG6
z<j#f8f^lle3Wwf&1=@<cby{8f6ZGo`7QavoR=0l2N8_3g-$fkx%zpJsN4g}2J+)a1
zH>0cA`I<m0_F!X-=~anhz7pzOWN5xw13Z>-JxZY?_M*oEd3_8d<nnL37quC4`ho*i
zxr7xyS(ZdW%AHGN<~Yc-BVZx6^oulG$2>TOjH1riZ<&VWQrD0=x*ouyt<yq>6M4Hy
z+&-khdXEcTBHL+~RV3MX&r;nPDA#0jK;V~l{P?EG1WCfSyQ>Q==IpL>94fZj+{c1#
z(r&YcrC#hmOj?-awrxq2GM{ts-CqE4HVn(=-N<^q_mJ7?*W-RaB!@B=%b!dIrLdEh
zIX$D9{jKLuaA~{*G`kD-foVs_e|RQ;i&BJ->Htu(;yhQ)ao*ZjC#~T2_ZTqCZISq9
zA{aM2MtQbY_jMRE*68!%IB>_n9Eyb|lShwei_-9^tN8>7Q6`#`OCZK?k@#EoJ@@VM
zgG~AM;+pK26O`nqjK_QtHxTCFT5N`pYH)Xb+240tBCKtyz)FHeN0RhoQlCI!s%*jA
za0#=~=ZsIf3ceF-E6`nukpYM_mr*jg`PYhp(1zrd<KaC@tBh?Fa^<uOG{NLaut?E#
zdd4_C;ehjx)wX$Ze0{3>GxD*P0gp6?LHB$HX=ES4I}ja)%LF8bgk4gYs)(xEOc+?2
z@gCIo4~F2!^)=FKL!dEukLgKnc5t$$tLj~{I-an}9unl7RbJun)oa{rYIjwXMgRt~
z(1<-(r_t*^gODB`d@g+3KiqufeF$G5i+LA)2dY@#VUITKQQ(HB&!?d0KElQ+s!8Sd
zP|PG@TQpkS1;3v(hq1ZwNxfP;xNL<*!P9lpH$1HKvZ254b6fNKe!wX-4P*VH4#GKP
z(ih(Xt6sLuQ5q|6;%_{|&{CW&=XW1YGUxZG)Ekc?STYrO8U-h64{!iW5q^fewk%aS
zVByQc9tvS+v@Y_;F==BxsI70wkR4nv8ww1hpl9QdAzd$vjNjud-nW<~tZZi<>WpVd
zh#$^5o%(gB78O&Qu`p9p!;*l_M)QY|a}wb0K>Sx26B$a<xa-z~iWc{b;~F-))hF3-
z+3BO{-OYB&-({p6nHBQG1N@is<zstiN6v<Zfd|;f)Lm++fNmX=2&`nM!x)P^x~IW8
z(CP@cv15cgKt2R~1KXDS?%dG>A1x(zO;2Z?uBiG+yI&WS{eK9<LAAla_E)N|F?224
zOZM;#qGUF%KiW`eVw;EKG}}juEmj}R^Oy+28}g<thEuoE``Tq6ZGDKjSNm_qly2K(
zYvW}Dho_+iBY0rThr$l1DLB(<^}eY;%6noJwuEL4P>m1T-W(-Dl(!kuav$P?=!;)v
zfU2*%({2s&G@0(9ZfhxO-1g$qZs6`eZ(OAiZltG*I*!7O4pJ$PxQBk{A(;YEeJOe-
zUS{$DT)J>~inL7(4hag#P@~!eBL^0TX||vLSRu*!o+ArSc8hgvf8ai{#70$??^4<H
zi<=$yg>suM4H|;&!bjQj8SfB*5!11Z@!zRjIc4xV;rn_raH@T*(;8};NDCj1jqlp}
zBB>V4?}m!5bnXXww%@o|a;H7TgwNdbH785qDjO3=*gp({5q*^s7@q9RRf(%F?$lba
zN1;n1F{Mm@89Fick_ZRUXX#g=G5EkG1*381?98X!PHC(i=rCN5DlKD)Jk#VmMhgk}
z3zBk^!a`B4AftMD^gl3G@kv3A;=f~0>fzA1R>bu#M=Uxp?iz&{Zn_Wpj<%pLJ==JR
zg(p?uXyupw!2hdn74mmjdny!1`wj*Ga7g+8@<IIfVXd`=lk-2CR+|5QR(q|f<CMjL
z;`3T7{~O#s3N!lJb)|7<oyFm?K7&lD^Y@K0Pqg6?20AgCFw)OQ%1{_6#6gS3R@gI%
zQIXf|^89iF0#jr`lPnMjWCP$!AEl=M4mWIi=)G3uGkNqF6gaUxIB<g?-G;Rm6etaF
z7hr00v^WaEB+$&rC?H_MDNS7r%_<><zik<yJGvn|(O4v}CZi*A`_Mgb7ysX_>{rT9
zvKkB0VTO*!N7kYByp<YSLHYF1r`Dk6o<3~+L?G<`o>2I?j#3?;;LWAW#FgK}DuLuS
z>3g8A%$A$|q>tGkfN(6jM`=L836M@Q>Qz)xcdvU39X#KT*4sF<Gpq;$qzwZq!q%T>
z&6>2>v;yMhnY2$J>^)L36z=>18<@=iUsnzJ^m&&Rtu`ylTEN#g1EqQ)Z#aX$Y-H&o
zFfWqc4%S|E%m5>Tx?j48ZSel|q%@^FascV|`hu3O?j1hEc(;8!vt<OVv%Xy(TtH3D
zknf!=K93u7fuiHPJFsQUl)V~He3j<P$&w{0;f;YGIyb3oobeJFY3y>>H_q5tYC|C`
zXM=wRGlwX)hY0KJjS)l64xO?o_+L2pA%XV+#)1Q#Z5IxC$p+DAV}$N;5WRtTHOVj)
z29=atENGmAgi=IIEe4O7>A@y+7Nv+;<mh<&#Q|;5y9$U@E19Zw$sP;M-JtlmV4Xqn
z5~#@#mL|RC&QAEwwan(5b+Ra5aFRMt*e-0yl4IM7N|~KkV@^$FOq26EBR;4I;iCl>
zJsQ)<BBszmtZ5EqV9f?XDBKrC5JG^JDo<P3HrN*|85srC_Kd`;2}zq1kqoG#Y6;3!
zodS8WLE+CE6?o=@{zOKGa+&=(zqP&`3e9;VK&#^6S%yi1y6&Cmc6pK$M(0ThyLM*M
z`Jyl3Vq~qwUE#tm$TIff3-;$wER_(>sixvB_D|9@ln!q+u|L%<LpkC!$W+!jB5ha#
z=+q@gss;%r83VZLfCz5~QMMKcmvo+Z{^2b|A}AR{_s9{WC2Xx+N4HMxJNe$TZ9k{8
z;~vBhaB6!4yO{$LB?K})4)*^R=pzAT=p+YsjtpIfwcS%n#diI&wq={4`?%r)U7A6D
ze2)m^L9(XJl@)yuN($YSp66I|6RlP%)5n9*ILZH5!fX8@v!ISMdvP(;JH1|px`{%%
zxh>xBp*Zj@%{;N1t2Ly^%p_Yat$q~Dz+tX-DiJc7DVxc5KycifR<Gbv?QPxgb?v5^
zX<j`n7=m(HR+dhPYDdRZGB%nxclJX1C1?U194WPjNu>0rDp=RPlA%gxE!5D|eX+dG
z&a3d-8(hZbvOy+?98UZZ1wCg{32NU%l2GL-Izd5#-i#ZiyGCPBj)jfCuB=h%2v63G
z&CvwOXxXdsa#*#@(6oe}4|sRQRJ1N}$g>g#R%qV;A=P&pS_&PV-G%6QvtVm!2}v$&
zx{8R5l~uHg4@(s>DHCgIt&Yx2(a7j1dOlCn3`t38$k*BubaPu9?c+@~^)PxHiL0hU
zT8+cerY;a3q7KU#T5j^pBETD{ho4>WGu>4gjyQX7XjDC=X$8Fa*(%P&;Q?bL{98>n
zm&(bhaWkB9$+7Cm+}~8f#|xMJI~a@nbFzPD$B<?x2i`T*bVXnqNtMIdK!wmB5D1Sf
zuRCxbYNx$y+LxehJrVWAnPCuPOF(P4U$SuA{@nhi#tQ#e+a{MnUroFh4%bpZMru*>
zh#l@nHMH+L@wC8kLW#MBKGS%oht*WGvqCOkTGFQP$yP3U8Zs^~;!3UI#!5kbdZo~l
z);Xp0#yACeF@`FzA-67KYAUk6gWbT2R7g#>q=T6vTT%IOr~xD)<50M5oYs^hF_V;%
z8|wBwhA?YWTb2l+a;DQ+51Ly$kPh4F+;$GyYYz}z{pp>dWwNhJHde2<9Skv<_BLV0
zXg?b0_GnKg?#kmp?Lfum<bA=gUPwj;v8vaumxpdAF|?4YzCzj53VeiBJ=;2!WSjsN
zH^};Q+0)6pEK}N1%R&W7Q0f$@yFc3-;CNQbCR{zQY^Vvx>~iXBAHMm%ipQ(h{`%SZ
zN6zrV^=&B!IIOMjamN`ZY5@YQ*q$L|qC(;G9%AT|?6-gKu$@l=>H*(W&|G~2+7Hb8
z*yG5{XdK7eizLi(2#A0dFmI5J0boA12}oj^pgF&0C?2ewQsrfbwyMbrl9148^erwt
z*rwGF0z4BcpN{G|10-9`dKaW`?MU(OKM7lpuZcz`!hE}qB7F`g?#kHnD1yIE-^DJ{
zvAeGTUq-{^n1s7e;eyjk-TQKADB96Mdr#LS`qT{G14njf9aH-nc-jnVbr*zNX{~^9
zXB##cDZF;WmlgYZ|5Z+-{+3hrnKq@FzuqSwXaE50e=`QMF|hwfH8uS&s;TO(T_Fd8
z?`iGbe3*Z-5ahN`Io-ku(uQqqYdM?qvXZjKU&7OpK0e#Ei`v(&oizby=5>YUc}^_)
z)am<ih8-9@7_gP9e1UnOd#tQQ@D6+eA66XAB{1c3Dmpm@QOJg(Xrq`Fz{6#r8N}gV
z_jjOS^n&!AU_O(aQI7nSq6qZB5ki8vqbgM-HDu+&lw^sb!d<###z~gwSA}5JAEnfU
zGa{<#vga!)N-FH6gZu57%>=JNcKbx|hc%3DfUBxN%|uNl*Q5H-mxRyf8z4RDUg`T~
z79M;ei4~Mdn{uS@c&*fwIo3od$G~$w5@Z-Q3kNyqQQmq4p4ogaMuRDh^^Fu>;g{Na
zf3?}3`T01Tz)BlQ`Z6>nLUk<Ul!vVz7x)fx!MzP5<Uz!a_I80s&_7KO^XCVT8VCjU
z0pD-#9uWhN06IRpQ-Q}wK0K_s26Zq3T<Tcw$IsSiAWlZ&c@j!k;MulinK)dXT996*
zv*kTdP$1(8Wkz5s*@*MP>bJg)5k7$<@!1eNJ?w!hFw`HFUm%f;#EJzL<!{ladtxE-
z6s45CrM;%Y3mYX8uqvwq3CY!fJeH1=Z>B=f98tOemptJo3;MAVo!2iWybR6~x0Fs;
zDIRwp&+Ag0i6o~aav15BBxz8ZR95n<+iB`y$LGmCihbR6WL@N##RHfgw_c)H1#%lW
zZh1zWv6a#?0|iC=>12$NiH2}6wvLVLt0ivD>rtzl_bh&-b*a$hn#~tplCFP_s?WN&
zeN6w%QL9XJIT5w`S%x;Ts0NwaLtFZS6N6#%8F7{F0<b9qq2?_py`uCH%ixbiB=M(x
z=?sKBBJFp0rGCj(ua-UUGL0{Z#X(zK!6<;aOn;^}I>%s4|F*s=7%$RnX?-?|?qhVG
z=f<|u&Erl!(QmGtUzr%G?9{U1el)ljg!w$xR#~8rIU^60+;(xj$S`w$!A_R&bQHfr
z!I12nF77PcRW>YY|5>^Y`KtShIAI>B79{D+e_1(~P2cI31)*WWn0kQ2!bUmy1CO&r
zQx-d&y%DhqDgxWW^Ja%n_r0(F<yuGk`F4#L3vY7vR=0T=WZRooG~;X5W-&w7i7)jw
zOC)AKQ_d1h1|v&04@`d}ohzQBpih#(^U70O4A>eNE_^j_9?-TiFfDe5o!ql*v7F84
ztO6(ekoD`Wvi_UtJV8)g=B*y{+1G52ocsL+X?(d&kD&db^Cw$XJ%BERSOu_N0^K&u
zleFkPu1~s;gFK@LRVdO1hE&Qa`np2r^#?6R5atKyUnwH?Z;Ajbzroc1n<5hbZjk@G
z6yap@&mV5<{~|@G>BJqdq4><!wi)7yldxshZThG~meUxUxlW|cCzh9JR?`5ZLpUBR
zxu(zb-ns}91Vc1G&bd}R1p4^!&G7zmO|)&jj7D(`l8UGF-iP{g>owO4SA%;hmXj5u
zjK4>$W*P*PWQOs``nTsKn?|H2N!GVU#ojJBLLkdj4s&GD6)$B>#8%ce$Ghi5D`Fd;
zf+vfaaWpWLkqEuSCA+Hf=40XTqV#*VQ7I|{**Ug3T0p0GDreW`i+0zcr6eck%_-$6
z)|$Pz{KSIzIfAdT1UOM|ce}oGpI*q7FWS~C?;R>*=g5>YS8>!KwGGH794EB*kp#IZ
z+%jz9`4<O&FR`;<e~5jri*>myJeM6B<`?S&I^)YKW#6@vB_9p=APw?;V3vBx?^|6f
zj~o+gz4`%r(73obhMa-fMTlQAy*t5(!b)%FkH$drHW06RrG@rvL9@A$7AP}B4{&B7
zKUW4UP=gK$6hQ*btaPY4g_upxHz_l|^(U#!AtdoAOaomA+Ey4RqOr!3H)KRT+m`4)
z+}I8=UUwp4=6FnMh3X0S6$RpB&seAe4Zuioa_(dy)3j@s?lOA0NHX?ef5Uxbe>5!1
ziLXa{=fRnhLgko~*;zDk;=&{BcSD``<Wz_c2Zz@7A58+&o8})OVu|8a0i6oE-~8if
zq)I{J$KoHlh(__1jF9yQC-F5k3y$>xtGg2%-2hdpf>|57zg0FiW~|P>uIVUalXA1v
z-&(cpOwBD*o>mqvT~D`}wd5O7q80aA^T3Zjy5|8T#;C&1>?tw)CeITcTuwZ|1HNi2
zq$>V=h@emkR|b>qn;lTv_VE6N*yX>y+@vQb%Ups+yzAE{AshWPP*78pMo4Nr+*p*b
zT?+W+FaM^VTQCBu1^+PUZBKG>lLT|nOeV3wC;NgXgkn}nDH~}Kh5q)S{(k3+%Dq?>
zJfS62i<bn(Sy7}55PT$Ql;d=doCdqeJtrjzY5ms1FTqwsQTt|m2(hM=K7!L?>+;#(
z9b1Ry)`K9bbI{j}uI)X%xG2XHoQA$JX%(9!zNX*C^V-cDW;UOEmy~<b5Vwbch`p%}
zYZ#ZwdhcC$xa5uTYtbRsohLV(K>i5ez~B$74<4m7`u#wIr@K&<lKBn%FVQCa6|L%C
zMATn&Awc)vN6G&mo@N^tYiA2*b4L>c<NtkW#qr<Ec3I6vZc`lL`$n%`hHouZF{)Kb
zj#s3ErA;0SOIUiiT(ELDC%D+Ewz(5-y0=%O_BRJ*h+{#=-<L|=cxJnJm~$9=ZoP;>
zr}#yU1xn--w^w}{S{pkLJ^UIcw#1)9wV6$9`T2XEyg{atryz?PCzPQmNO|asnTn{~
zshINuvE`-Dei^K4Mos{@VC4v%q%d?TGl5onFxu^#$sVwZ>FBU?!I{`HOjQ-;E(QL#
z&dvoKs`QWJCzsr!Q8xFbXb>heY^g{~WXNbxE}3;_j4^ISid>>%+``h<XflN)vYV{S
zvLq`SBorx+<Wf&VF|Ns;gLG!cU!MPX=J8<W`#FBUci!`R-}ijqW79J#QxPQp=p1P-
ztud-wIW45YEYA8)#?OOHb$bn6<1NhR#qE0xUL<c0LKmE<q*)Yrrajc>QyO=j@-k_T
zX}C8SBH467=O4NAg=#x_vBHFPJNRD*^XR`vXQv8?o?+T{SLzK{nqofx?uDoe5~HZg
z)-j!rr$^>Ak!{EC)`a#H7t<*@9g`UUkdVV7O8svXw~inOjr|U$2uzQL?L#*BnK2kj
z*}=NoM_#wrD^iiUvKHQR!*!lw^|AM9DI2;z@eT!wxRdb=8ZO~oXvAKXYUB=+i<&u+
zUgn!z$NJlbNxkp7qX}cQR2L@|Ve|#tEcEzKf)j5Ltuc<JW!@H+_HPV?CT#|+t#?1{
z>NVR@Be2t<if8tkeGu}JIC7|qLJ|+@kx4#ah(1B!4oS5!HE`NQY{j8?>bat&V~Asi
z?10q2kBl3aKB;?^?XcU}BD=;ZN#N8+GsAtj$FqsI;?4Bc@jSm2PtBTTen~wl_j%-I
zn6o;?j->U>NU)(;v&zOyo%^+k!kjkZuUptFv(H(H^d`qZt8fi^x+(qRv%4AY+icyV
zPHs1xKs!t6@_1{AyJ2b@JMxmo_9*u^Ires4B;TfZ+hUu09ZL(OX*5l>13c>e8eyS+
z;{`u97Q5KEa+%-1f{QY0viB;r*58Yl%NTg?Ow{g-NoEbbC+hGN25VG5qgBk_QgGle
zowi~KMe|NdCyblBX~oTl9gxL$1;#~dOWz98v1g3XXShsVo@E{TjrLyqPS)|VFz5LV
zg%y;X7q&%$l!7PJfSUFrGaFm%8{&E+UOF^WYc~{m;GQ$cEV5pi$&d1GJ3R+#3N82!
z&7MHLjDLmfi>R37F6Rr2qr2RsVtPq8kI_?4FmrgzVS<?YjKv`5ADKRPQ;m-tR&
z=ETDk&UiUIk3UmoappIhxf?!w?HS&0@a@;z5f5&)G{Wk1XbYFaVfY@CbpUVybfPJ+
z*XiUCGy%VSF|}K;lMk8b_8lu)T9O5(_5h-8WL9PUKE*mjmz9bbm(9jVzRGcAF)`(0
zk7BvB`%eYa6QnOzq1cuPhgVIrZ$Ah{p4*QQjOCROE>D+#VVI<L4D*O-I4BZRk|f~I
zN5rz!Mq^UqBTK6C`b=eb!zY=ShYW6aBt<C|?mx20Ma?(*evzu+Fuj%5u%oHRxv|<J
zV!PPDO`}b3o;u?W$t&b;%Wd<>_S2I&l#c!RN{xJYel4Ob0c}zm^UgbhGB-`EJe<<~
z*1gj1UjA$4FZnM#seKzQ%1mz9;du!jThDj?qQ<5F@OoG9X$q~EqA8adpf2XGr?_$V
zv4aFg)WsmCdgUFpKN!D031~%U{^LzbPB0m!>N>=ucFk9J|7CYgrwk|g6hT1N>nX4*
zw2zi&M5E%%ezn7fi%3$PHecT!F2TsC+BIo1A4RpCX!*0|YRu=XZ=EibBvp^d#9;sc
z62L?$t|3WU-^r3WwwzR}vEe1_hnK{iR9*0H>NL+-Go$ny@)EH}KD=|n1|FS1OIJ2(
zia;b(?4_<35E)>(5tPah)Wg%Js_`U|8>7iZ54a@T>@SI){BtB~P*+BYc|SyZ{n2Z|
z=XSlP%5)}wNFoQP7NPpKUVconeB9T3v)}W@y-t4FGuD%rrxLZKx=$6VakH*!-}ZHR
zv<`9h)4}MwQG%_lL!$ZHrsT4_k-6C^$`h_1l4tPoYU1fk+!hk^&L(Ah#lBr0lIaM(
zVhmMpLswwoo!zmm-uW^?W17>pxxdr>Dn&g@j7vUxwBkx<Tmxa}E+~vr)>#uxU>J?S
zFiNcu#<ewZpG0$SFnBQ|Uw$ZSIPdiI9!4mlRe1eg;jVJaV|)BE^~u-LG-h6_rikd|
zwiu1%8_QkDbri(C<)-r&eimqK=iaCD#5B)CijehKYQl=pjF&ldo~ty4tN-J$C)l5q
zY@RVwm`cLsjiS1`)l}Zf9+y@ry5CZAu4DbDRyzmPq$#8Bs#Hg_S7GFYxZ@9yZGJr+
zeJ&3&uZH`?_zwiPlxvOdKkIcRREv2!oa=C8qGcFmw9TQV)QZcRlH(<daz|q<Sw08M
z$JFhbRH0_JXp`l+I%`Pityh)+;{!c6evQvbH~#=HU((kWrM$9_0*_yM9Ud>gUtUQA
zwHu{{(o_<}V!-Jl?nQ*eS#~Eb?*a&9fqO@NFo3>8Jr3x|<psEX#b4rrf`x!}JS;F-
zJYwJ<;ZjgGp*MVeAeN;7fF7X_{(3=*&6f+RLR(R-s0!)x1CXjBYS0xzX7K`m$dW4f
zBdB`utE!8y57}wale;!e;Zswld0@@NL;!#&o8}|1*IhW$Wvk^voYyAn;K9hh2bN*;
z2ceWfNdthzLoEZ>F&1PORxZH3xQK2pfnX8?)~L>T+hw?V<z~1#{3gucaYHv@{!WP5
zcMXFpA2(Q1X4^w-wP^e=kN2YLQp>_FseW~QgMyIbd&R?C6#Q@d+Oia0D8%##BX+_6
zqm{9Hzu_TBW7l5M3BFoDzO`g_V=tT`gJTQGa@+ehA@_X(r@s+SIAy~|Sjp`OA|SWp
zib+`fCpf)ca0J7a6R}*ZERR1x3grA+g~EBwI-Eju;-qj~!45*8E7(_oa4s;yA&P;V
z5ccIpkN_<=u0r6PbA=NELOBU+Gq4~4nt@#fz&T?B2c(B{0@&tnKmas<vkHK7bO{Gw
zqSyc{jWt08G}c@N0e!653tl)vI+hIqb)YMkzaVH0XA<_J4GyZl@O{u?3AZ*9dtC!3
z@m=C1!K<9r^cQ<V&bk1uuN1eW53dqHQK(Ab$OA8URsw)6;FlmjIN$)^3IP8C08&v!

literal 0
HcmV?d00001

diff --git a/sbin/spark-config.sh b/sbin/spark-config.sh
index 147b506dd5ca3..5c87da5815b64 100755
--- a/sbin/spark-config.sh
+++ b/sbin/spark-config.sh
@@ -36,4 +36,4 @@ export SPARK_HOME=${SPARK_PREFIX}
 export SPARK_CONF_DIR="$SPARK_HOME/conf"
 # Add the PySpark classes to the PYTHONPATH:
 export PYTHONPATH=$SPARK_HOME/python:$PYTHONPATH
-export PYTHONPATH=$SPARK_HOME/python/lib/py4j-0.8.1-src.zip:$PYTHONPATH
+export PYTHONPATH=$SPARK_HOME/python/lib/py4j-0.8.2.1-src.zip:$PYTHONPATH
diff --git a/sbin/spark-executor b/sbin/spark-executor
index 336549f29c9ce..3621321a9bc8d 100755
--- a/sbin/spark-executor
+++ b/sbin/spark-executor
@@ -20,7 +20,7 @@
 FWDIR="$(cd `dirname $0`/..; pwd)"
 
 export PYTHONPATH=$FWDIR/python:$PYTHONPATH
-export PYTHONPATH=$FWDIR/python/lib/py4j-0.8.1-src.zip:$PYTHONPATH
+export PYTHONPATH=$FWDIR/python/lib/py4j-0.8.2.1-src.zip:$PYTHONPATH
 
 echo "Running spark-executor with framework dir = $FWDIR"
 exec $FWDIR/bin/spark-class org.apache.spark.executor.MesosExecutorBackend

From f96cd4eced0a5d6d9c18f9c9228b295a58098387 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Sat, 2 Aug 2014 15:58:24 -0700
Subject: [PATCH 35/69] tried to restart callback server

---
 python/pyspark/java_gateway.py      | 5 ++++-
 python/pyspark/streaming/context.py | 8 ++++++++
 2 files changed, 12 insertions(+), 1 deletion(-)

diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index 671c0d426677a..f7f4a82ede3a0 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -76,7 +76,10 @@ def run(self):
         EchoOutputThread(proc.stdout).start()
 
     # Connect to the gateway
-    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=True)
+    # If start_callback_server is True, it looks like callback server is not killed
+    # process is hang up and test case does not move forward.
+    #gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=True)
+    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=False)
 
     # Import the classes used by PySpark
     java_import(gateway.jvm, "org.apache.spark.SparkConf")
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index a4900191d1730..04737243f3192 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -15,6 +15,8 @@
 # limitations under the License.
 #
 
+import time
+
 from pyspark.conf import SparkConf
 from pyspark.files import SparkFiles
 from pyspark.java_gateway import launch_gateway
@@ -60,6 +62,12 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
         @param duration: A L{Duration} Duration for SparkStreaming
 
         """
+
+        # launch call back server
+        if not gateway:
+            gateway = launch_gateway()
+#        gateway.restart_callback_server()
+
         # Create the Python Sparkcontext
         self._sc = SparkContext(master=master, appName=appName, sparkHome=sparkHome,
                         pyFiles=pyFiles, environment=environment, batchSize=batchSize,

From 1679808cfc45aba0a74edb6ebf9caa12ada664b9 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Sat, 2 Aug 2014 20:05:15 -0700
Subject: [PATCH 36/69] Kill py4j callback server properly

---
 python/pyspark/streaming/context.py | 22 ++++++++++++++++------
 1 file changed, 16 insertions(+), 6 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 04737243f3192..5952e81a4bef3 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -15,7 +15,8 @@
 # limitations under the License.
 #
 
-import time
+import sys
+from signal import signal, SIGTERM, SIGINT
 
 from pyspark.conf import SparkConf
 from pyspark.files import SparkFiles
@@ -63,15 +64,14 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
 
         """
 
-        # launch call back server
-        if not gateway:
-            gateway = launch_gateway()
-#        gateway.restart_callback_server()
-
         # Create the Python Sparkcontext
         self._sc = SparkContext(master=master, appName=appName, sparkHome=sparkHome,
                         pyFiles=pyFiles, environment=environment, batchSize=batchSize,
                         serializer=serializer, conf=conf, gateway=gateway)
+
+        # Start py4j callback server
+        SparkContext._gateway.restart_callback_server()
+        self._clean_up_trigger()
         self._jvm = self._sc._jvm
         self._jssc = self._initialize_context(self._sc._jsc, duration._jduration)
 
@@ -79,6 +79,16 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
     def _initialize_context(self, jspark_context, jduration):
         return self._jvm.JavaStreamingContext(jspark_context, jduration)
 
+    def _clean_up_trigger(self):
+        """Kill py4j callback server properly using signal lib"""
+
+        def clean_up_handler(*args):
+            SparkContext._gateway.shutdown()
+            sys.exit(0)
+
+        for sig in (SIGINT, SIGTERM):
+            signal(sig, clean_up_handler)
+
     def start(self):
         """
         Start the execution of the streams.

From 0f83eaab0afb5a57c0ca2225142222a323ff3325 Mon Sep 17 00:00:00 2001
From: Ken Takagiwa <ken@kens-mbp.gateway.sonic.net>
Date: Sat, 2 Aug 2014 20:07:15 -0700
Subject: [PATCH 37/69] delete py4j 0.8.1

---
 python/lib/py4j-0.8.1-src.zip | Bin 37673 -> 0 bytes
 1 file changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 python/lib/py4j-0.8.1-src.zip

diff --git a/python/lib/py4j-0.8.1-src.zip b/python/lib/py4j-0.8.1-src.zip
deleted file mode 100644
index 68d7267c733da88cfdc5d9b97e24327013ec766d..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 37673
zcmb4qbC4$el5X4POxy0Bwr$(CZQHiHr)}G|ZQC~Qd}sIE-S6Dp*u52z74=W$`-^-l
zpC>6R0Sp2K@Yj_XK`8i-hkw6;0$>5yx-pvnQc{Ej03I<ImVf;tPOi`ZfFLKp0095E
z$^N&mL;v%2M<WMEhyPGwYxrL(LHYBm5CD_hMEuPylR?ve^anu$0AT)IiMgJ$o{p8C
zt<GOMX>8s8aWeY%BiX;?Uru(Zyls=uir{@*eKQ;4n<xOe=~YTIcZ9TNUEN&D?6|0)
zs0Nl9xS)&6eCed}xou;K2bz9arhb|ojeaqGKhCfX0|N$Zp)8wc>hBsYZ5Fr%AIF0c
zLv;>JzL<<oN=6X0CNEqsVgYb>?r#FI?^HVGuOB%ldBdMeFJq7`J0ULw-FJWxCu*-u
z5l#tNJ~ts=BrkW9DxP+PS*^`%Tvb-7WMlL*j3#d`Qhk~`DX)%>8fW{m1G|;f6_~{x
zFD7ahx@U@_gt(N+NCd~i6n9kTn&xKkVH`zAs{bB8-cYJ`Bbj0szST$#Qj4$@k0td>
zfWCJp7VWvgb^{r@_a3Va9eF4-sZwiI!0;Ob+V$}Q6Z><8q-Cw>!QY$?)xVHVj(qx3
z<2lEJ0HlhGnGP#ABLkCBCr2g%A&Z9lHz+<7`bkVoN(vb#{LJF<AeAc3?65*TY=9BO
zT<_e-uWFNeyi`m9AgS~@)*VNI#e<p6P4N{56X`}uG6Z6gyy%~bcEW<ldR}jnBu|hS
z0`>&1?^_VcbQKrXPsn6LkpMzPg?kLy0l29AxtT>D*;|vL1&vY(7-dyKgyb5)t_ugr
zx0AtWw&<NR7XhX;ut%v4>()9;zyc``+4RM7Y2e*DzdI8N#q6c;0{u#b?MrhS>%g2g
zy~3PSv!zcdK{uc+`aI(0C^F-oyG#o3-wGz}z}ZvwTgDcMsKlWH&5-iR$d7t<NLV}^
ztlU*XI$b-lW$smgELvmBl*+q`4U28I!nf8pO^V<<<qIb`NbTQ?jYTC4m_ostbB<hS
z^=ob!iX7fxbp?oJ0V%kgYydgu9{e&{Astt@i6bdU5v$rwR=*eAqtw5t6C}MJT4IN$
z5R7D(Cv4axmP2PZMu%w9CCiN7Re6RWGzHK*9cqq1+XT$ul-n_^DlI$O+83J`aM6AZ
z^!Q9E5r58wdJ~i^XdM@1y9t~4@TL`zh73si<u<HqwsE{k5euik%WP_|z_0%{<tE&q
z5Uj&Ax5>H+Jl#AO>>&u~rMk|k<<qPB?%|vCKU<q9&1%t-UC<p5_<q{m!;N0F0blQn
z*}mF+kqwT9Z|CAZdGZiD%XA6OII^sJuMPaBvJX7U6c;e<+c8Gsy4jn02s`)*DvUJh
zFnzC%aif9|7s`b}ji93Oa*y~14|S9%H~A`{a>z^6eHzh?asDd-hdgj05H~~a+6Bz3
zF2UwkoMzNJXgp>2`=nVA>WMt7JSswl<L<R=bs*z5Vk+d1W1@MV;aGi4fzdfEgLd=f
z&t{=~g#PaT0Ghur;y>dQ+TSrkN5{<C%uz?@e}IR-^!*#=OjD-_tj#R%86p7yIOqWY
z;Qn3TKQPBc&(X+5&+Tux)5P5(|CjtL?r@$vuMf?BzoKBCg7+lygT~gOX60v7(4&qo
zULu>Za23H%A!&x!@cDxBj!s}cvc2hVPh9z{YC_7@%{3@vg=tP$nHZZG+pG|K@LVC1
zrnY=-BD(Q#u5%0|Cl{Gj&d1KCN{Q|yuuR||d55UJzw<Pz`xK75q6LZ=O7^=BaWd=J
z1)BYs2(yw&xurL3lG=DBfH0_g(9-R(oQ_fx?JN;EVTI~2ny>_%MM_0JYH>ItHnka8
zPX2H|hA4TRi`W$U!Acd*YbxL^Sz|r03_=+SqKv|-qnZhjmAQJX@~IaBQzi3l3?JP5
znJ^w5C`Oxqs2Y!kviGwDcrg*-=Up%er}MESQ1F7D!I`HR0DA8EF!TFagM82cT|~V1
zFXhhZVB`sOM`~TsPmU#gYewzC$Y6Xer;)e(MSSg@ZSoO?<>KsjOz8SL*ptL8;uw^h
z>4)q!7u|L6HgVc5zV%;urTyKSb+4&G*!IKv9%uA61l&_UQ*pRs)IofR#!8RrdB9MM
zdNRZCXdtv>co;~Bq*tqO2NzsYu_aM!c{lBLKrFytY8TC6-<omXnx7^gFJrNg&vVu<
zn}R=kWvyz}S-wv?>$kH!S!->igKcuzLSbf(CSI^wy0SgfT5@HMEkCgp4|c(^HJ2WH
z^wuxou9J*^_-KC%%s$mH_~5j6ErF$xSc>z0Ay}SG0CDK=azQ^nAr4Dz4%wC*pW?b8
zxD*RGKV^b`jD|x^cAR_RG441zb1T)=5bp*q(!4${>x^bt*gJ6%nJhPVKZF>%N_{zd
z+wle4ydNAry*2Rsh`nd{LR|!#`2-BX?cm|MeBQR@hn`8rVqvERWxz#GZ3Zpq#XZ^6
z7}3pnH;hAlq0IWln-R5mcm8qiXEsTxM1%$F9au*6IdT#KPZ|+)%+BZx+?~Tg4y8rq
z4ZdmgFvIJ`+9n7g9ysuW4#DqSRhYDs%CXU520_vjcPPEeqUdpLCFEPOQebJnC~Nok
z9`RT}jh;xo5ho;$C)dyNFv;CBQ>(axH2i?D+94z?yrWtn$+r*qA7q1?!-CjSN3JLY
zF9;xPsPVuRI5)2Nt5+8n1u=MN0wtLsR0Q4#)3ngB&xjc`T=cN~Tlkj1nP?);{)O<R
z;E63J;b<2{uzDj=RvIy>ESI8Iyq*yR?!(cIN<U056?H-APYjXttJp}w_3QCC?Xi*P
z&z|bw>mC4!)?-0~e~?>2ygsMG^b<>fqH_n@hI>NK<Uk=&G4s;;0C65UoXHe`9k75B
zTObn7?*Gp5DTSAug@CNHy*cR(swtZk`7%5xSJ!kwfWe_`i(Ro`Jxw<Xe@AwtSr{jl
z@H!PfLJFKu@U*a{!XWO7bnnT01LI;YuGI2hWza@68KO;k9{?1*;Y6dq<0a(xI^7!C
zrj>s;5{55clW!5S<FP;SKYWG!4#!g;`1GMEExztB%0`delY4o_d*F@9M;sU`oMvsi
ztOqA6@hmcN%<xeaE}#zi9(R~5!LOb16$4jHL^P?00LH__u*Vh^Pcvu?pRE^UKY$UJ
zN!HI>FI@o}&`FcOdr$&3n;MA`@rL5O+r<@JrfQE2pp=A_<4J2<-OX<kV9cfZT@H1^
zJFm3UZ!^zY5=UqN@WI#X{~7n|XQU_k7cOB;94;hI{OAZg;!MaaBxk_~sC(2KgI@L&
z1&qfy*3lL^7B;f6lv%<X0Lp^!0bSFKRH2d-Pgv?XR%y`;6d5out}@;lRASZ7iQ(3;
zD(d~yt=uJR-=U;t*uCVBz}ry9O)#kT9ZrN4T{wQ;PSyy#wwqAvjL0;B6odiIR1;o+
zd)sILz-a!^j2{`GcKD@M%b+(5=Q~14N8MyBY!lkC`-6m5yRLi#cL4+pec^0voE3c=
zJO~aQ1{Y4rMDOZIO4Ta@bTw72hW_PyXFs62$81-n`iwk)0cXU)DlxtWGQj2hLAO>B
zV1s6sW0SXr;sS5m@P(^`n-IW?pH^a;2xj%jmBnVWNYcl~Fnt!z+IgMDwQ4{FZ)=B-
zh-@>Be$<5}^V1A8uv0fp<vz7RzoJ+gbfVV2c;zypCOPyE)JOy~$g+P#;4i$+(i`gY
z12q0bRDFp}@IP~#(3S29r7E`j1e@7-2?-axuM5&s2DIobq8F^q+u%=o;QDDzSo_*8
zX8E}*z%1#5?uV;)tBI6_i@J#{?`Bug!8rjg(u_{aymwTmCWA0lmRLn`RW!F8wE1?E
zo<&50@^w7?q52+f0r7pCUoh5bU5Z&N+O77u_1I4f!7-43e;bIyL}k;J)I7T375-*X
zBaSqv(o4Pq%)&e%?nFmNpr0O&?;x<1F5vz^_s)N&ML*GbzmvV2jr2$gv;q&&oW~D&
z=Q8ru>L}o(pNCQIXgnc7t=ArTka56`_@PuqMn;o&n;lyDTQS!D8?iBh&~5aM_*guQ
z?p|ACD-6mfIl29y>z)%-WtIOG8dcM1Dtq2Cpv-c74~p_R;f6-0(oLEw(7?!AHWMxM
zphyzT+ysu3PKf=8Ue_l$ZgfFUeP%OIk6a;S*<WNnr`F9lc7DgBwpF8Mn6<ih`q`oD
z*3@;On*ofDw(Z@GEo%=a&fnM<elI+S8A{}f3=LZ4BVU<a)9{Ig-z8QR3qsi4`>|FZ
z@rg&)oNcZ3_4_8^QzL30d1O;lpwP?5u*-(~4H_*-Z<u^f4bq_-GKZY`-f3Pj<#3ol
z(iXv@dt$a_et|v3myA^rlD|$6e<khUMU}?vK>zSMXP1p9D93bPx4RD9I`Kl}%)!kS
zpKBx*9zdlR*^8t*t0rpxU{HCJl<<wv79L|~%&6My&=GvcC6uJq!m2Pk3DJ*7-KLG-
zXOoO3pZa{$$$K;tPb>}V!r~{6kIVi~zDIFk`*{YXYQ5sIX`avIed2Rw;IvSk5fhZR
zLgzDt^7TulXNtLUm`q*kl=p?zJNTcKXsv1_DrW{kAPr6Wp@#WXhpQ8>dGyBuVYXpR
z7VA2yROV;#X;Bklu?M!$RGPa@EJ;=D4y3eXWQd?D#-r6$MOIg!i-f9N3B-=1&EE}8
z>YN=hTGLS~J}-B<aoXKVQFb_4q_xZ<v1>RW{bRfJAeWe=uJ+eJJt#(U9@6NKrZ#4b
z?FG<W$duDx*JUJxCB^5CNsb~=Yxo@Gz$j+LoDw&tk3amyGgn595gKO5+x8L;s<g32
zDPZ3p7HF7u3LTqQH0;)H&5V(Jep_N)8CyB+>f!{JOPtMfFq?RPgup{jv+gA<aSYo6
zP4^2p4))PSmoj(=g379X*HQpxa|0`(uZ|NMp9bq$A)!(xABY}0)cXtWn@|k0W2D^%
z@>ryYNt=75GxT9LbwVnRlSG{ZFT`Q@;%0CV#NMP<r(_mN!)uDHE6c90Srd3vEh+5x
zC5s6REs;zC=t)F784#Lyw#Id;xfoXOpcN*c#C~YDO(Z246qJK<z<NTE&(>RsepfGX
zqWk%{T%p5da90{CEs@-&T5h5=rua2YY@KiEJu6+;u)*nQ${||NvRVG}xXD{j{1XSz
zuXR+ui^h4&&(Jr$t#&4;7-!FFLJne=^6x8MKSonTxBfPNW~!26!EZ8gj@s%i=fppB
zli^f3rq$1VeRth5=De;-Io~%M#A-evN)@bAq1l3;7GEN9b{TEFt{f3S@D6){^pwMl
zwT6<v0j(859Q-JnKkWV<G#YDfXlT_0CYu<mt_t}itO=)0?l5lRKKvn>5Fxn7zlOoP
zC7?ih7IXEXzD%MGmeXRN*rX=5-u<1_bXTrXq+0C13m*K!%asZ#7%mffu0>3%tQG3Z
z2`$Lpp^B(!P6*|%LD8ZFjuW^;aWwoX<BK1<e++xGG`xk8?V}yD_gm%m8NXu@L3#+p
zo{zeSc<RV@dnRod1z~v^<}s!v%n#bA`gU0_L=_zTX54cygSvbP{)uBQ%*KBtYSSZ_
z9@+*+!7(?Ai66B}Ehb`aNmm222Hv8!y>Ug8hiRqL-BQsK_KA=BNqsxahf{eOv}4Gf
zMtAAlRYuMpuu;3$V{y)Y(-=(L9zNGS=OUU8XBe=JQ=4M$WMwpyX%Cswh&N|lAc|0=
zuL}z;CtSvy9fdTLgmdXW##vmyA`l+ZB&ko0V$h#p2yZm-&=#r72?I-GF;qD>Pq1^x
z@obd<28SlrqEO6nby_G@Mx2$N;Y=oWk(MXNp(qh6xrIbaE-2D$C|em)DBaj}>wTbm
zfygQ;fQ${JwS9(dx$nNWyA?WXuQ^a-l#O~(7)YVk2a?S~!X9*9{g<8ww`NbzZ{`!V
z#)^h)r$mg%6EQ3Bd?g~6kt;@Zy|&;3u0avk$JiIX&}ul*QlXB(Nbw(zF$LolVG-55
z*}vzY;#iYmS3Yi$Ay)|u5$_GWi8OM-i+W2Go7FPj=vh(t%7vk6gjgW?6tO#}PlV4Q
zxwPekqwYUL^~Jo#uWo`VyA30XUu6Te9KMU;c$T7%(MS6uUq9%{m&9=9_RA0#wH3Qw
zlW0U=t#$EyYB7vB108dV&3EeoC-ToGY&t_<I&D!_*3qLsK+c8;2SLYgIUsZ^J+KOw
z6|^K>p-jeZBG1#Ia}o70H5Db6$*PlGHFsf#t=wN)57Y@vNVjz3w(5Mz`dm^Tm~~cr
zQaBm8Z-;^?I97+AD}Zo?59h)HZp_NwuT@rw$QENGLYNpY53`~eXdKtku1#w;`?MTP
z$#H4AGn1df#<LvRlcMjDt7&2hH7-ETt_l(^E$+b3)^~r&l(H#68BI~Cx+D9utJv5H
z=eY@A+pPlk-C@HHyNYR7P1jGD1!lT#fX2#C%1t9>-NUJ{n=K+<XfQtxNbMa%@+lKG
zmpHE@RZybsLoMwiHqVdXdFzY14Vg|D{RwXx7tvW!2*RA>Q2<A!fJ(qL;XhyndoG^W
z<uJ1C^)b}rHb!^|F!xsDnzU5o8~fYgQ?|>&{5rK3a}0aPWRNmz4Xa}12R~=p1Ptpx
z(mEVT6M6bj4>!CGfnrr6(g_&AU)Tj_<RQ|}cIl=SgDN=7_R}y0B>>L^>j&z}RX9YZ
zZ2<x=!plSEr(@WD+$%(}>uP$m?2PlIzKVSTkkUu5ppdD$)`aUT8yhYbVHMdg5#nHS
zYQEeeaK6t4=>qnLd=%DHX2=DYIW<aCn^^BVVGSUA6=v;|GDmo2gsD6((DBBmAC^=-
zzAfsB$kNkHS6{%BqF=vXn#liV-6MQNr!olGW=#ea+2tKbr0IOgv~fjgQ-^qTv&-HT
z&5#NponWcvVr+d^YmrH)+~?Nxwp|s-PMXH4VVj2E)&ss<e-6!?RJl?6dGI3zP+)J#
zv{L>)lV7-yE!}N+CEi^aw2v}d2zX566G|H-ml-yXhZ|`WHj<%)XiUa5g`*Ow_;qyy
zZ>lp)j}Y{LtiKY`C#rGM(R@mn7!5_xt+v;UVpLcu5M-JRR>lKPbubHmD=085aN?QM
z;Hj%S)5dc$(b?InGHjzpZx()34b1mg<c=+oE;m(@c|W;wE!{4;f2&1vmxWxI>38#I
zM1%$9bQxPlgUrw&&&B+CdGF1ExoKh0p~ew)mr62_NBbBO6WQ?)<~*;`Nk}fVI`Vbw
zINlDhHy(H2hULBoPt4$Z6Nz=h%?X7Mx<Sge=fX0`c~jTKa$U4UF6Ddhv${2ztLTdE
zZ|8Sw8juJBtFL_J3rD@9M@M3;z4$L->_lNuIZQ^jx)oVKAl7-St=eN+=jP?l(t><?
zs0|uA=@EnIv7YH}jrf4oyUH$k=SQxHJ%2YaN>b$E!DeBKg0i9Nk3=slPx1~?BvY&F
z1WyN`XJYwV`(H&PzYKR`nzx>I!`7|P@it0R2^vS?hX<(TN1Q`3n^25lC_d#~<4@B$
zSI-(X+TB{_6#Dr2oFovW0+IbIWy<a6zn2Z;FVaaulim0n>(N<^&9IJB#JZKZ{mJ^m
zd!d>KN<x&Nx?WIsy+u2PV1zaKV*Pf?S9<6<j<`P@b(boi>a&I$!c#+s;u5+qFD}Y>
z^V?yg8e9U{9_cqNl$>c!F%h%&eJIG$*-J)*k#-M4U<KQz`35FB+|}Z0@;WtUt&eQN
zi44Uv+Fy@6xqc(Sc3Jw@V)Qt&Ng}BqxVGg;Y^T-M^h#)_#}wBMhTPqCJ4On`i{!>r
z$6|mUS_H;RwdvlXEd3@9+K>5AI;eKP&$@H4Qrc_KoOo7sT4C1C+OEB1bMji>LforR
zimsfQ{|5h$;+1a%5x*J*`Pe-e002K0007>9QM@wHv$WLLGqCtu^(x2jSoSaZ*Xos;
zmCZUc!q=5fZwoG!UX?D#Bvb<f?XcZ_T?3?f^W+Q|5cO;mlGp+nMYQZg_qAvoGco0q
z1UQONF?=l%&UG~W@AiH2O677oLlB2OLX3RAz8P)INA^wW{9Dqg7ymjHQ(T5FJp3?w
zN8e+jA-*-!-hrR_i1wRmLkz;2=%8}^KSk8ATo*{Kf7tffrZypF7cow-+Chg2(=m+k
z;}Au<6G;WQUX^H69(A}{mJBmyQ26OH>-es7Pt4yTzw$@i;}M9*>cvRbx>SN9qYZ2j
zH)|VQ(jF5ndK14!P!8wI`L|~G*>aK&ouGF0USY{<>}if?_O$o!DPd+E18BiWv`kKu
z!$y_%$*RlmgsYS*eShu^aQ*beYB>%VmBTD_72a@+v-?f6FPy)d@Kc=45`qdqL<}Mz
za1+6JwHgDWib*m$q<`jZ1Enb4YQgi0_(oy&*Kue$d6ojZf{Ee=Ogs?`=L9eY%dbo7
zBaiRe&w7xOesTqGNr2o-xC`zczlam(>h%bm%LzLe!EC^YL>3n}|AYahrbd?OnZZF&
zc2<GwDUy@P)%X5c5UHsdo#EnQQ+r1K<Ll|*{M#Sc-ElDqv#vmM`L&6-K0n|@@_|dq
z_`I+Y(SBqhZ&e5M(gb3&8KcTX@_G)DwN4*z#n`t!b7^0HkyX1~->yN^5!JKA0*v-N
z10xEcWoaYEP=*ZFd8*TD!4wf?Hp<Nit5`X1`iL0hfefNf%rKoj$GLWTYgB05I7t7<
z+gYS47|)t(u{V1*s%~C(YhAyr5{7JfI>S+8)1(q2V(rHV6cW_W2Gabk@wmI*rU^(l
zAupZ(i4~uPvl*CQ^D77iOQFSu&VZGrXNT(7I~OQ!U;&DvMsD>_BUxWv1kl>tstR5T
zJ6~m@r%L`emW9Uip0ujl_D9jaS<$Z^xMZcOu}GzIVao&LS!zF1-Vg2wgAx!Sd`4NP
zO#q6_a|+Qk6bB<Ii+qr=1VAggRdOk{_g~pqY=|55kBP*A(g+AVhk#I6!pO;`N#oSh
zP)C^Dq1ey^)|Hb<xtl9KkZJI3Do0sF`^vgDqLrHfZdUwn5e7b=4{SHTgjzr|jE%{P
zG|yKZ1vC|UZrT{-3!(bR2{IChO{nT7t<q$fTPdl{2}143qp_2@S6TNa5sC@&D`Jn;
z%YeGqI>!))bnR+y<I}?J?PDsWF`YPUSHqR;3AOz0%srR8sH_}v#lum=DPKjqG>ukB
zB|G!@K1R}zEPUf=X-dq=r5@I_0XdUz$!k|7^=%d5O5-MBO_eU1qXS1$UXYD)xBVp(
z?7<9`SX3-HhUIU5L|Ubb*?AkP$D;znMKUE3mQ-V{WsDN|D!7Cfv}G-QKIU@nKc>7`
z9Ir25H75g~2>;lF+o<`Sx)Dx{sU{_>qRgs9a?aY>7kC37c685R^{c=^4(I(&*bzf^
zPUet9BKslTS!oGSsQ4f_Fge?vcJ14?g*?RT8v;oLqO9Q{Re(zPt+Epib2gsUOjK0g
ziIQ9ii>)b>7&njKh0v=Wu@<Uu508o+&&mE2T7BJ^pyvW$EyA3D>=DN)32$~+=~~Bc
z36Qu{GEHKvYSx}lA7pZoF*Ns36U@_(j4=fU)hlj4hy2zy8A;H@l%CUt2R53tFp-Id
zt>H--zc|9TuOBeIc0;O1hUV!LTdho?W48&9Xo4ZHvTlX|GxBTH)>Ns#u#$S*J0C(U
zcgDL04kE|;*y@XU`xU9%x>4d!rOmRkTg8I6+O^R@1It$tD;}tCk#jQ|=yJ!h*Fg=!
zs$HJeaH?EbRcv}u>R=>QnFvc_j*Y+}6OGQ^nZ?BWaFYtqi?ssj<7d2cGT#pZjF46+
zGDLpzC<yk~m!((S#Y;MUj1w*buq&drmzJGC)q_vYLn8YlZLVgI#_SQ`A>dA4pB(KV
zB5=lxV8fC*4@6U?HA}2yDTPjvg$P(|2CP)7l`S|W^h)zsH+^EN9Pb@i0snof*GDL?
z>*LA?67uqQ)mkB?{W6cV#bLyEy+mpwN>eIN3@L~Ry7A?0)CDP66Id|u^KB6wE~wI<
zH?fmKdCKslI;|h<15e(4g~?5>pFu;CjE#v*P3>36v9n5JTl}8xV$F-By*Fbj1+Wlj
z@}0R~4#)Np7uQCs$D8BrcdgRe0rn10FUcZ4IygV9roW7b!B;J1LA9I=fzL-jlbO40
ze&}?fls@l<wFI6nDK=Xq`HLvIOCyHOM<NcOr}pFehjWsE71EsiECT6^<b?;+Y8@Wr
z@zquDak<*vjgiU1L<9i^+3->9qzUq$F}Tb~IyTcGn$+Ji1=$PGizK|o?exZF(qif3
zyJ(x_Uk!)Zqn3O@{|_?#tFshOePi(PhfL4O0sc_wzjwg@t%d!MPLQRUgX7<b^uKFA
zt7|!Au%dW9SIcIB+eZA1ymVfw-&$p~yRS_nQE1P)GUSZZKlp)8h$e{i{hl-s0t&I$
zq_z<<DLEwioL!z@PKXZ@p4T7^1OizH_|!wL?z_bSn;LwpQT|98IRXVvXbTQp$4|3n
zsR0E_1>6Cc+!!f}f;SE{H8cze7<Wun6GgR*Pv&b~0_cja&q6Q~&ZSOgkK8(N3*5o0
zcjEf&Zl4z18WvGm@I%<eyDOL#b78Gf3<7F?=F7Qe3Eg#HKwg)4W%&kB{kdU0#x}!U
zYp$)nMf|1!7P+IxTG)!C#V|Voug7mF;zQn-mR_$4GD67+@e4;&J!M!Yx-w&bwH1uN
zMNqjVJTwZoQ@PwIpBMsCsyQfoXUL@#5fq+GmLnf6$EV%$1p1`y%qoLvaf!FR{pM5#
zpL@8bo0&9a0OnE5)9&KEs@`{?SKDJNjv3x-TU=d|4a=`ur`vzt;^x*Jj9b%(J!7Kh
z0^`HU&I#1`7}@sz^v#ey%Rd6XgEd3aWWj^}@N0gWlr&+K9R47{j(v^7>H#ONw&FT#
zMeUfGi3T*(d>YuhFO9$Sf<KSO_8>0MWX~akjMs@>Hw<_OU>F$i;Yx0gtC$asrT~gF
z8iKnQ$0}jsB&W2r%~6@%4_}<%o)Q0URYl-{#_Uio-2{DmJKy&yLW|Z;!C0k3`cPoz
z3dPF_;{=KePels9IN|yC^qBWd({!#$JEP(m8?ob=_1u~?DW<isgvn{;&xwh&Nm4FH
z#5*McTr~fJdqXN|#3UM+74?BMjA?%ex!Zy;d<d{&#Yr>kI@`Pj0|US6uAyiZ0ZCH=
zqCQnr4St!5V;~P^DBM|tJojAC@9^+oc9XZ$Ys>S2;OrMXv<gnnMVJJr%kHsGrw189
zbnc{(OGkRG&tFCCbWGLQOYE3=8HQdwfxfKr#bScll@wfsz6t93lA-lRw#V8fC<knM
z>55th#B~b*?b@VBl^}scBLEj|5TUIgik5t#;*MjF-(2}fcts=VZrLK#_|4_3=$6Sn
zM_)VEt*10L9R0X{4lOTWS2IAu_&|n-Gn=vyc)IaGshbJF>_Yu#U@SM}<FM`C%q*BD
zDPGQ5K<39`uOEVZIFL=rGNgpBxnliRMW$F69QjM+inQ>7RQEGp<}vF&2@OfZ4Dal<
z)%Q>4pwB{(&(CwVIw*GC3R3q>Cn|I(Qc?-$^Gj~IlF?~PZ1cJFCW<CgtPpHB##Bn!
z<=YxoJnh<O$7|<ya{57S<`hLEgBuZ%<aKn1j%{3!xVd$J{DZ_dFmdEw%KX1tlzuGH
zSPIZFbet-#G<VARbOjVOIjxdRBZC*Xg+ostk_X*z7RFMz4~>)*q|{@FYcE&ql44-u
zsV=ON+rt+#V7AhS)t+@OKI&5{(lN}Z{Pwf4U?5Z#)9+LY4$d{@b(8Qp3M!0<$Y77V
zvy!tmHxDcBH&#YWNXH;t!i6ml6_bKBwp2}FD6OTlA2OA#WC$xI*XLnw^uM&GiSY8I
z9Jd>?hQwA;Dx$<{WmfG42T_Hs3o15xXyD}r)XBlb_m<?K2tky#-7}~VS3eJ!dutr7
zV|9Zu5d5YrmPu-DU9}oOF=tbDXXLFf=<1Bd^x=;}{@T~Iv7tk=nFi+&U^ve)hNQ%5
zt0_b10RV(Yp3&~L1-;f>F#ZK$-DDWVg*`zF<}$P7QZr{tugRX-e!dn0f7K+7QbT!w
z69VU?TSRPDd8;w(eeSRGCF&sSRzR+fkt%s-y@laGt+jAGeR$CHo9+2{@K8`hCh)O5
zwW-mR>gWvNQ`sFV!I^$cj68VJcO_aSu<#H>bt9wZQ9hTlSbifd5!TGSRZo>)6oxKu
zeIKoUBXnYJK}*Pm6HE@4`pQ@iBIyXLt$I+aiZ^AF&9S+7u(R4%;)1Os6{AoGyLjl=
zHfDb)q>78^kzI`t-*auXamZuGO?l1PlYNKjt%{!UQRw2<vv&6K)kt3~wkirm{iDF1
zdWBR|_?$uP5FDQ~14XA>SHc8wYh?q)Xb!OhAWjafH}9SCVUvJmOoHCeDTl^Gt{ZT5
zSEa2_ZC7UZw=R=f$M<*gDZYRVomLum;UF@>e#914f5Qb+F4sW(&IFzvo7-g_!=RT4
zHw1R(xxMAs7)~2YpO4T0o9Y2sZBc{<rWuA6G&F=ZIbpn4vOur`qm$Vi#>Td)aU&&T
zYC1;8sh6!=-I~rP_**=M+p{|H5V0D&$s?&74<?$+g_wiv?i4Ia!nfCCN}y<l;rzAG
zB7{4(X&(9EjT0mI8Xj)Xc>FUi7rX(^LEtAtzELl-7p`Gxpf0F!bjByExO$M}!(P~T
zkOY!8D>cj$*W|@$zSU>pie#WK(7!V(&jP08FCYMbIS>E<oWC=wzMG?wj)SAUnYGFP
zhEszS$F0|C5jxH(Ro``6LxY4za%p!YFj#~T8$ivU<Ix6$)mQ1s<cU?HAH`myzf@D=
z3rDU9{o%$JFHB8Z4pb+!rv>%rG;NObJKcFa&KdZOrSJ<TD9WhB$?x(QlR-FH^C|dO
zs{(dXs~x2SquZDcLBXiS)O0TMurK(meQyxYqR$DBt=AU-)YJt?=*k3Ifv84NT7|HB
zKBhMyD<4X`!aY%Oa>!7{$s|TQAlY4Rxe$hj`GV)HD8(o9;r#LBb~0P4AiLv@IFu*Q
zo%;y7-NE6C?}PCMC0PrcezGgB(yi9q(NhfWZBqx%<8Y#tTU~*48-kb*YeTOAy*CRP
z*LgI283+WGy7o-a640p|@NeY(8b4K<KDLU<<frN%KQ)ucdX31v-Vm=2M!10GxDCn4
zmAV{esGXfUcuO3ct&celG`KyzH)k`6s&vd(qUPna1*CjLC71@mp)JLjZG4fRUou4$
z;R46$=m*xCwbl`wG{nMoL4?1rivo{sm!Qe?l{dc2jNn?;o$3R-IXAo01YhF6w75mE
za@{6>2P^BF(aP4_>(<?47<QeSnY%LqrBE#48V$PPdrvu)xN(Ju`37fUHhOwz;c3Yu
ze!hi%dHE_EW}(BqkNgD;8`KSj22B@V=c_5fmJV(pQ!ruNU*Bd5w8dBbT{Rj+*iD&#
zihzDQ+S<=mmr3|x?AF=EHOQOp4Uk1qbRx?s10j^cb#^6FavkdO#`5>iaBs~{-0RO+
z;UEkE0QTQMLn|jsM>9uLdm}x=|HWY8qRP7UIxB+LvP#WW08tOBy@um#ke?GaliAq<
zUj>R93Sh6OK?pf96w%>=Pq%<voe_&vx=^?k=nC2>n*$p|dYsqxvoKVuU*w3tWG+#A
z^}C^siOcZ)mvK^S+!<`E@z{p1ujlD2L@Ie2vbaf7DT=JPtG2k2sM3w1F)t`fPU?(T
zUsWSY65tsTXUGJlo@=Qgl={6s4pVbwIz#hAdSO)+CSV9N%ZYVxi!yg9i@IIE!_5-h
zPvEvj4H|gse8nST25RM6eYmW7jV4{kXv>XSBT5H<4-xBfLbJy+SU2-#WxfvwTYj0~
z-@y--saPJ_DZP=V0i5zLV|VfZi#cdH{x?w~H|ilj3nfE$9H!5%9>uPe)c2-~_&2IL
zO&w3koLTzoP&kc($MalJw=9yAh^?p^n{?vG$0h7p@o`BZ-B{Ro!ja=8M?#+W>BOQ9
z?47xP4$hOieOGCd+%oc=x~h-M{1VP*<*q<YGMp*;#hdRy8}R<;#I}mRL9Gh`B1-Xy
z-!h?s7h~}<NPkPa0H<sZDPh7FVj)YI<?v0s736j!)}#msV%qPXEmY+(4+o%KRW6j5
z*@iaur6~p?Yqz*VK5>XR5rw0ZoSa2jqq}Kg#qkO<YMBGOB`S;a=^;_gD$sxog9KuR
zTiyz*10?oJKZvwU4sPXZvI@xL_vyt#y4*_&aw?3x#{@@8@=$Ao=+?Y^O2&O9D&l@z
zmwM~dM5$ZTF9<=6*3oq<OHu=GixPe^A#@eVroXQ|#uQ9wI|};D6ef!o+%80?7ZIu%
z2RIW6Iy32Gu!C68q8mx{k1v(P-m{S%Ol+;#1!-AnUV}QpUj?n#AyQ!U0}0OX!|gYt
zi)@e8QgIjyk;p1hvN5F&bZo*l-<iCh18;g}MON;u$<|qWWsL^!pu&TtvM0K1D+W3M
zlKviZ^Q+nM9*pZMl{CKHb}2EC$gqy5HR*4NHXeV;Qq<u!dw9Dyr+2Ijengg7mbv)7
zo78;E$N{UIGux=<VC}$^@CE#!d`IAl$E;F+ObcAGiqb@=$(0!c7Y{DF3Z33{b3X64
z<(&e(oZlSgig)$dGv&8UaH2|H>Mec;@7;Oeu>n`*fB59nr_1Y}cod1A_>`_P{Y33k
z`rRiJ_$vw;Gw%91%%;Cgr@<;8!@=sK9HYT}PZ?GH^<R=T!2`cqpg%tS0sjB^^gog{
zJ$w6q8QS}Avb89sb?Y@=1g~e6icE0K(Z&`cx6nXEAZwaJd?@K8sN6*`usu_+(<_Xz
zZI>mMNC8u~UJh=DqlpW(Y9qBFSpbC^B0E8ETE4bpxYH&MtNxcU`A4(}O8dz`cVM{P
z=*Sfe0yNS7zKNtz0sd18rBVQKF$9uYS)wR^p$?ESU{HU%Q-mi9gKUZ%w!RUD{={-T
z#9N>On7l>}&Sb`z*EzCedM_zBLJEl9m1RXJL$R!jsqIadCOyZfPOH@_qR!zJDV#EV
zry|ZC1?;lK5BBcj=YZe9Z>%>qu>Goi;i5qbxi=v}kl+-2mb@#KlmR<7)r(rRQ<rI_
ztx_SWI%tqz*huVZ(O+q4>HZ3B+F!JyNH|ofP<tbp&C$swV*C-|g~1GWcX#~4$al22
zqs^o9QOC$W{9W5o!vo!qBm47)CsM@+R~k(Zoux6RHtD;?)BU-}QS^C%596IRwI>*g
z->TP@SQp0E7oNlbS%`5UOutzBD<AF3oLg0@v|-Z%`R$g_N{$DTdsKdKQXcp1KVpEK
z&A_iwkm+X*URW9$mxnpUnZjW1IH%FyRsFW%-dnME8_y#aDMMmYawX`aUo%%)&o^py
z$07~Z@oVJJ8U;jZztm<F6<2vW4<0x$hl5J}F}PlWHJA&+SOF0LF@Lc?P~|DHD1Yoj
zQ=%+U=7&I*BUfQ6%c6N4EE<L_wTCC~PKcwc@uN{W(yR;47!3;})M4=UC<$Za3jdBq
zUP`qHfEt9~ty^K}GFyOE&{?~rRm^F}4R*x})eBchy;FPI9_q6G>I39d2=IK0{T{<8
zDg0A4lCFG~B=2_e5E7F8^qWW%Ck3H5+1QRsv8(%RlIQsJ=)Uw$da`c+;`P}`0{M_-
zRE{!N#q<l(H1*UAx$VVXhn`{dSoIU%iETWFoB*C8(F@m5$^TLuWXrbFc+lry$%zeQ
za+z~ZL|9#nooTLb*a@|G2OW2}{z-Fv4MN%VrwG-8ie0yiq__Z@U}E|!v*K?p?7@V`
z|KwPhQHA`JCjK#}e}-(M0RaGr{!W&Etpw=&-<E=rtDcpur4ju<r)|+bg5~~_e`za7
z$+lbf)52^#qHb9J%4SEsNz643krYbK!}}2;eR-xQ>nQ*2RX`>*;fE02!I2FH33v2p
zWKP<KkS+EqP8n$pmv<9a(+u=;ULzdQx%E2Wm>rAss?m)JOg_uim*G4cYdP*R*48z#
zhGq{xVa!@?Y;U^oz;v~C83Nl=={eygh8|<xrJ4%(F_Wpx#$X5#!RwAcuqps*cJ>6Z
zoZtmFf1RWxKc4K#@G|aACz1+1`APxJ`l<qnOoM2T!Q^K$0(hN7HaE<gV|4{<$gD*<
zmeW1mt6E8Yfn6t}X_H9Pt;wuH%bTGi@ZVz&45i;s6MxJo^v8@C|AiU<-Fp8t-hTs5
zRxwf*e~cG={e{{#8l*Q@D*^2{3k${pyVfqJ!e*DoW1E#k`?gIP564_GBXnIZf*V?*
z4W)1hTmVu10Xe=1%*i|{UTT72{(B7LNzr^-2TM2zs3jig;P%us`a!A*`Aw4WC03#I
zhGuP@iu@2;6_dQCai+<43G8lGU6V5QMQFV{QCo7$+cr8vwV7nzZgXkRpgAqm$12$V
z$aSWj{)WrTEZu|t%H0P@%s)oXJL+a$bEZWRNGYn=44cN7Q9|y~idX8MT781@@AeV%
z*4Y&OW1G-F=>g$?VV{5f%>D;MCB@1}^z$MNUcZxraS{z8tSOSC04c-!gLgiV)LF)d
zZ4$L(8naZsK3RV$ddSZBX>LutA6`QH`*I;bg@FEmZBNEq6^x})kr=uXJcbKyiiNZX
zx0HRPx(SYt^l$1e-4n+G^?ANZIN>W>iVYyG=8{G-pt1>Utf7QDEtt(6rI^^%AMcUz
zBStwY6hhjc(^nA2BP<~(nK#L|<HizBmK8|v!}BTcM`(*?6m1DUv+#@he6{Qpi(fx9
z?o_WW-zNJiUp39%gO_O&%~RI_H8;TzTGpik;u*+Ub9Il(-HD>ZO>>||vF9d&XI0@h
zp9%<bx}xr^plX;(nRJ+COdGMVj*AvO&1Tn(q+$5(S?^NMVs2CTIfr0QGR#f**uf;<
zo*GCK*_NU%>jU>QTMs#h*yqPoYB$5P=yyQ2+|x{JUuN*f@4x>^b?@&)pnvWAApSoU
zQDZY}JxeopBm4hN_O__9Y4Im}^Lf_6ZwpzWN?kz#^Xn0B;)ZGKUE+$uH+<b-PpXuR
zM{n!)CiPi=Tr>Q963{=F?rwkI47pgfJgPvY1*VH*V>1Zv$Vjk7q{2GpqMRsHlt7|0
zqT%CpzMPQdk)tO}Bncw_6EM$NQYPUGW!wJ*MlA&#49rGGGb4urZkV&pRKNG<*u*j5
z&46+MzYyn}1K6unfNWYG#^e!mAerOI!FYWoX2<a{fXrmhV>{in2b7$3&Tz&e6@K_Z
z*lVjb<Q9kO|1+%3?1CEGe_6S()$X>|^X&A+Rc5P7)R$J1wsKUA)X}H`(ApfvB4`f9
zAb(*IFW!Aq`>8fiJx(a3p~=U^SC#a5DW6UqgHRPiCaq`N+0CEk_n@5!f-sj&V+M4B
ztOhz&gubwIa;1{hk54tGqh##*l3lkgvW}a$eUGye?%M5(h^P}R=$AMH$`pnk=SZe-
z?+;HvwZ_}ud}w}a5x$v5zFg!E{c~6gsSuPyBNyAUGgrK39^34CQZlkT%mIVVP!>hG
z$Em%wH+)xjb{5gcK^|35J+2vE9HmwM?CE+GYQ9s8Qdo+8(rC_gHOa8}`QW`5Pp@H#
zP2PRk-t}lORw3}_>VVl0uRWoYd?`tYyGmKl!zC;eUV|?^!b&OX0ra>&sFDlPFDyxA
zFV@?h8|$2S!FP(cV)o3cCnt|J@55A9^dtW2<;#Q&O`H5U(?`VNEIpQM>(!1MNPU>}
zt-{5z<d3LGvat>j-w|^ZEq?trBPKgJObW|HKvPh#f+T^<V3$25ROZ{y>ssho>k1GT
z@3m>%qrE7jMyxBgug{nGbcuznF75$7i$f*8AO}|qc$db0%YYj{kc(gHfS(@;SZ5-d
zCSz_UB}ej=efQUldi`J>Y$YSOHnYZ_!w{;u4i`slc}SlMZ@zxwGU{IMcmfU^xvm2u
zOXH@x;HZ1}GxwSBG-+SSdQQo`P=M`NV0lclUSt~&6h7_udyC16D?<pI1?#{j;wVit
z_fJ(3?E3)zhik1-PVrMr@NDY;ajkT?|9aKU!RYV3h7Xu_xxeIJ*!5CHDrQd@q4QlO
zF%`IJplRsB7@iV82=sbFdWBY<b5^iisoW1Jat-&?njy{Sw>f429h&%2tYMyQZo4LK
zwRWeqK=ZnjFjP=4aRH<!BGlWp$4vKAHTJPcT!vH`caKQ!1Q_wqG%cEiq+mf7jZl>$
z2JmtD#sL&t2-%dp5uQw*P@5nPVSu>kCNSM{=>+WETt7MCzGga^!YNQ=bUf4guX4uc
z!=+UlC+=x!YLf6-wk1X|rzCa{?`9*7T4YbDPOh+Hic{=WYjK6idEql;A8RRaqVBHt
zeV2Zn;1BN~TTi?ZsP>(slk{HVSi@?2P!0I;tY0*Hl5+xz9Ew%Xy?}36x%EM@bDvAK
zh3s4>9cqRTiz7M%D>B6Z&C{i7vNXYJB>6$Ka_Np;9+ihe$+upEQ2nT!+}wSxP&_gM
zFN~k=$bksbf8y2z$iQa64WF!N|5X@nABrYDTIf-ZRMfBfkXbT_A)!1Nutif%iZ)>e
z)ALQrEVbJSY8NOmGDyQfH+)bj_tXr>M3Mt*{=N0eqLB-0BF3v;bnHC05zQ!jp`r3{
zg0!mT5{P&$RYb&WF+B(9CwA@m6uCUeE7>-s5!RO%TZb#s<Z+ESD&oR2PLtp%aZNR@
zYg%&X2sLAxiQOGbr||~Ci4BV<0Yb6DWj?Jknyi7uU*bhzxnprh+K2|SC3KLrdq=TV
zRdaWGz`xdu{>&+=Rt7RRs%0sytxZ{+tU9Bk4~HF+#9t_%Ou|T2#&4;+Z(enH7~fkY
z`^!On96kGbcC%pML8=`hVAFu^+puXdS50wV<JEjCIf*IxbcgZ>nI_E;eMoW+PBss-
zQPQ9oUq_3Htu|=KranKjv(Y{Mim3CqPcKO<JjpgTug7^nSKVwyqUIWUcCXQS%1Eea
zSD+7#&m$6huQ}C$kV`Es6Krf^QootjxSjr1`%vsgqql)<^(SJ&)6FW9$eH1sy3l~j
zCaCv&H+iFr@6mWl?sXIhM+(O#)EP<cW8Ksn?^(zFz-05#JBAhmVTO~8xP5fd)Z$u{
zC~@oUym&HoEBq{6H@H4;c73yA(>V>}hQ5sf{F?22{L_#(WB684_wFpdoo+f8q<kw+
z4PE(?!-C1_ccaP+yq9)EgXfv6NJ{_um#_}j<wd;okK0}$001EVGi>?4T=+i(DVHi%
z77M%xU)efz3-DW`TC#|VyuHfg5M91YG6c(=hW4w@^_b2qo!NUnF3v2iM9=aXLMT?;
zS|s;x6ATO+T&dit{AKhs=#ZYATxr}6@h3Ywc<%Xi>Ub;uY9qAANU*f5yYY};piBk+
zKY=l%3JZ1}<R_Dgo<UjAnAku_80Pp%PKn1f`pMjL<J2a2#a#OtIkS59Lt=1*<@(Gu
z$g+Cq=9_r^4xzN`K*fimWXPAx0#~W3tt#!9fwh&zHA;w!k!(p=L5=$)eJ7)k8VA*8
zLj4P=$!aJYnLNMM3(+Ts%^wdqrIpm=S|?5HRnp1A`3sA;-hjvLqIyLqr|BB^iGbY6
z`UzRrbDhC9_?i*Srvw8utRMi&mt1?1RzW)tOXP|IjVvrXt`TGCirSbLlQ+<aq|y)^
zlC>lEN6LSrq0oWsaVu*>tD=!XI?(ISrSsV?4FV@A?Bgk-eH3dJH|n-USnQF&Y%L*(
zcac$vb`V9dy-h$uW-GYV&~@3cS98NH+WI90y^dM@RBkGh>LeZD?9ewNw%zk&62l7W
z=~^<78Q#x6Fy)6Tl5HH}rI5g{Srbl0X=Nh2BU#u219z5!^}5N0aALtBt0d{*Ls-Px
zk1GT%2@f@Ijjzpbd|qe5g4;c3`E}16;#ZV!H{)@&u1+8&egw*x(NkyH<V-8R32|e&
zCy^#c4$Frb-(}Ng4Q2%|8E?3Za+Y17pPob{;aTl=l)k}K7C>&{!65i+>tVqd<-<x~
zlb-&HwBrj~lvwh@_te}zCczoOdvDbQs4B`C)*eH`DQtbmivOq~*f;K1l707xr}on1
zM&*pdyS>^?!%d$zWuR?++$<E)b9bnaW~uqX%1yHIH#<_RQY8nGq%VP}nK-<RY2zM_
zCfRP2Q=rJN7c>kDAIOd|vvkKO6Xfe07C=dt#eNQckzcL3v&!-n!Md|$IhR~yJ}(G`
zwG|iU36`A*m(JMcKT1$ima?GBs~~wpZpToi8F1drhnlZ`OnbCg4z8UPFBdq?sPLIj
zHsungo^vh=ngx3>W4L45XfQ#>&6-}IW$aH{S7MJ^#a6avEo)D-bG*uIjp}J+?H&bL
zdcNfrA$gUPI|&ey+F~?_DVjCrOzJ&tk9~j9ez`1PUkyBFcOMU2b{p`t=&e7WA6qX^
zUM;~}FX0qj5R6Je?9It=VkT_*;B3%XqO#ldm-F<LZjTjrYMQ$>0Oz^-umA;F7rkQt
zMb-bd8UL>vrwIS_`Ty@-(+AIIK_j_E4FqZcfP)4A0F-}f`p;XY{{)Z<wi$)L<lor-
z@lT%gkB!wsFAJA-;rJ7mPpHU_<Jbw=9~=p*Ayf3vV@O$KwK$Y=Q^uX#c!JEtszf~i
zIfm9#AJ3H{-LrV)!)ac6F8YWkRsXoks;ayZu|1s-q{7XTx3Ps;@>#&YLv5a(o}Z_~
zPt9ra+Cu9((2Uqi^NTCGV#3#B^yO7<n8ovP=Y|>GQ<5GjvP4Wy54gvL7%3x!60fwX
z&Iz7*hCDp3=jbJDj`PCL-W#IPRyV!=?E9HHO~Woc6TIziswpm-k*`bMn<mK!sY!*)
zUpSR6-a7({iVO>Vk=?Ne6cq_2qB|*ui`A-zdWN?&1C>HqBhR!9LIH74)q~UNJOd2x
z%NI1J3IjX}O6KuA=U3}=eH3?g_B$$VqaW%$VDxN7w5nF*Cp<_Wm?`7WK9yXH(Q7Q0
z%M*zuQYVAr)r>LV)rlVcjJMZ*%ztR2I4V~s($tT!kPd&vDuM1SRa`86F(Q6Ch;g%X
z0q<1ii3l&JUY^&_qgZ%!ha^iXlO;wd_)?O@5u98sTfD5JBFUSJ(n6Dnd(I!9AJ46-
zNsd~0=0!0?QF0ah^)|bx;aeKc6ZVjcQqL8%!h&m%bA<$^jz%{BA^nj5-XMP7_R)sB
zS(H?AhSY9!Hc`i!W%7+L-dua`NU~KTqilB~tOanZcv@Xy6GMA2f^(-3KY}h+*W4V!
zDJyhb{`&FG_<KrdHHj$t@Oo=k8)RB>f}nQfj7HXBi4=#j_zsg>0-(M*1vv8{n^G7U
z+|ot{unYN7;{|!^lF<9TlQm0Pi4GG;1z(ifX+MS*Ii5pzvDmS5dwt!*>;7o+hN6}G
zvl)Nk?dXu_^K)zTW^#6NUC!Ro-kzzWD|k6eMdw@K1L^BpNyMkKqXnb4xcd9<nCE-7
z<HPOYbI{G+&FQw9XPvlfmN+_QtINyF@x#ELtHT`}78e^A{+Gz;$%Cb<UBKXXoy+Sz
z3lGsUPqsG6FuKh)T#QID`f;GpjX=nFOqF#Fa8gP8HHU?q)0>=0)OYDA&!M;@H?PaH
zt!gM3XUk?xOvC{lvWyqo8YFEp7IA7;@k12>WW6LQJgr1tUSukGSz)SSJq*d`B|ApO
znL(nXY=AGo2gI(3TN?su53gS^E?kOP8V$kX7yeE8OgBQ`yccsTso9uis(rmryz2nW
zAmcc~kH)Id>pgBKM(xE_PVWpQCwRGL_dGQ@9_Pl2(C)LeBUGUiol%}q!)!ky&^pSF
z{ee%xLb(<oAAUN7xohbVp5B|REbOe`M8_f~{U<Rm>}*^D&SF(I+8#RJn|$+(iBh@7
z$J_UCAB1IMZ75<i*}U3Ec^0sRGzWb@fjk$d4iRro(F28W=R4f<!cLHgs&v!Dh=khi
zws988Kq~;;?oy{zfX>6%YjvD{>Td(D#7sqK-uPIt!m*A%;}H~(4mU{hwrsh;ro@cF
zEHC*(iNg6EUY}|w`uq4F08|0Ys{84t?eL>>!1x_f^1gk78@rntBv0025;=K$y{aH^
z9(r?9jtQx|P=~ECJnlO}T8uW7n}c(sDn)kh#|R~#<IYzMj28L?{2#*3p-T{`N!n%G
zwr$(CZQHhO+wQV$n_aeTPtW4RyO=Y7As2a1#EmC%Jzp6f83@?+>0>tFdh9;`?H92F
z*yNS}dT8$=445{XD_K<&XdhlmgVd1F$=Xg3GfhmxbC~9HIsT>kvl%5MXqQV6Q0tx}
zfQBH#?0VcR5r~>^V7jjJt*xb9!zV!BrZ)i5*e;{I+Q;b+nGJe}&m9uEf21nd=cg|k
z*$4V!rN-*Y-Z!}LoFy3&hPXg6UN<1GC`PN7G;F{Ymj9S-j3#JE<%m^*3aL(Dga;1O
zTB4njgox(UkQEYEg_a{q?yNxQVNrnsWlfAlm=-6MlaVJqT7_g~<3g2^PK^lT>(~4=
zfCbKPua5sCuwUp2-NQQ;SAa$NF%~!wbU*v{lX6rRoke0nx@<AZv76oz_#IJx*>TD#
zycIe_w*s!qj<*Uc0=|j`N(KrAcQ)ivvxUvNSqv3JE#18Dzz0L&DNA)>!pDV+5<I25
z@-K;#O+l+T<w=NeiH%ko2S&lQPt_Dl&}&Hy5QU24oqo`gYZf!HtA5Q%eGruObOch!
zfQCAT_;PcFB1q99pPEF>VP0(ZNJ6;8-aW+XkK?Y31XK3`pThI0b4}<2-I~YBD+7s>
zgNkH`=0dybf^b-fT8(xP7%ffRjC!<o!VhRu`2Md{O1zao%GI>lGX97!7VtZeNd<XZ
z#|-*HHcPfP4#X;qgd>P36Jcwh_o7fxD~K562?X;;Jq@%1TD+x3JsmBS7bt)quw@--
zM^H(km-Tu$_muMv23$<~epjGS9g;L!5>y4Le~AcN*6^n<jvs>5CwON9Z9QLtfGJoY
z|28Oh&_xN%lw${($SXfZ)CNrn^<?X_mxBYq2%Lf0ZrVujIDFcM(iOKwRZ#&~f=g<y
z0V;1^)aHsVdMHU&hkF+7#DfZMi)3vIXvZi3YapD7U!}Y+gI@Va6<z_W7=L5V&uX!A
z(4%=E8M}2ljnRxo;{BAG4LiEgBvGLjZ41=fU~&m+aWX;)pw^GB2(6in18rUs){1jV
zatN)4R=C1Kpe6rUDE^bv3)&O0SL)uNomvVtpjy5MN=<??<YIOC!a54R_~IK14Kc}Z
zLryhu&N{P!64GEd+_ai=*7pKN&2vx#=ClKAvUD0&PS7#W1R~g_<zpFd8W>5^Bcwzx
z(Vrz6^`O|SdTXq&4x*pZBXD;Vu%eW2_oMJk6nnXFdwHMZEPX$Al5MYID_e(n<UL><
zbnOW?48JtItAJfeO0^}$K!C?LB2MhQ9<V0G)}cWTM3Sa<o!jpz_-m)yWb~vQh871K
z%;K{(b^q&%$P<^zr_Nm=!if!__7SV}_iok5U4htM^6I~0qnSibbgG*tO8i7T(<z;3
z&uJSVGH27oCc}(^mbpqbc>!f1&S0Ps0<00*?WoBpWjLvThPm6v(54hYG}KF-1*F1s
zJ;^L%tPsn=Ku1g666IzK-`O&p0^4=M-zNt)6@rL2p-O17%p8K(m{3#f6B0OlpQ`Bu
z&zt1M?Apun2~7g^UbytpMmw9Ex)?gYupxm<=DM|nM1IvVZ}_A{y%h%Qx)gip3OTpX
z@>F+StE6n8Iuihy5F?v9z^4*fU6;GF)l^;wqlk?Z0rSeK=f3%kpyE)FjcE7kQ56nT
zj2-O&H#~!s=|xjIGa8ZFVpR3ZtbUrNr5Qn(0${r;l>EwKQ?;y;wxK_njiCeUs<a1e
zrO`Gmwxa1gL0Y4k0>VYsg3cNxvHNalWKrS<VHLfkBQ?~}p?`@`Hy;vCmSAv&P!~}?
zz|eqFm7BmQtl^tU03zzfY^Y#Wfmcg=MGh3Q?I!Qk=h@&;)!Gv{np4Zg;2jeOP{C?Y
z{;EWDjvHQ{rK@t82d9)t=-=q!8k2_iLiypF%3@h{oND`Mmh!p6lD*7^H7N%`z|*9Z
z4lclnA9f(h<V^cbxCf1FZ@|EC#AjWBJrnNsvY-}^R8`r2aEI8<yXe=sNF_+U4v&qA
z%CO-=&~^}_#rIS63EsM^<xb}5PIrcQU4keg1BrmsEj<<?>3-4Q@MG2eqJKfr2<`s+
z=5$6Jd9fG?{0`PO7(sqO=`7%r1>qFeVN+LyFNRh|?=dqD;=`lfKfP1Xt)tyk35vkf
z=LA^RVNt35(3V$Yul_{Mu$K2sfBk5tuyDhW4k8I{<j_(1;Pido!xviv198#VZ;;OC
zRcKfXfBX2%R&;WGSXyDO032-Smc11ra#tmlckxZ{(p-ms)kBCug4Gw74>~r3gPv_(
zN`^KuW=GO+1=O-Fa;NKB0ctKap>jA~vqowAk^)5L`Y0ai%&tmU0(4+Jqq;X{_#OgC
zX<R_PS<TIhPl{gShlv-TIESQNz~j*%G1#68B&x6YXWH^oz1b*j39xqsjOwg38QwMX
zHoi>U*(&>QV@9w_ajyYBs|J8|IeQl0wmjnUWqZgcVO=!KPZ_82moVJR2$^EE(4PDw
z(iVOti!IZu=GP}%dWA2r=~vD{7)do-hcV({)NBDd>C_g4^>`YlF#S>|MZDd^v_qT&
z&2aw6G?J^?0JX#qLXH3*1|WhMSey0J5U6X|3JYopfKTO+|A11V$k#hPl|rS@1~xGK
z6oIMIT~KK!@zV*eO_7Cg+3G~ePkFLU2-rxb8xzjRNrr5)Qu;<DJ<Q`-XHhG1u@Q}D
zo#RUCF^l2ywsj8-Vuocqo9(rY>-@nvT%afcLX=aB9?3eO><sOZK$aGKuaQH760``x
zt57-*SvJ8eci;wB5J(!RUWIZxv}Rr=LBs%QuDuWGu4zPpP}68AjRx}DVyl{vt6m@i
zJbcNP$*|HqQVpYt$+jTyP>Kny7pqo6i!D{-QWj)%vC_e!=!2(1*qfe4tNFK7BjbKK
zGoT)Ruq>bxPf|CkIT?CkmAuK$&`v3WMy&MArD2MSP8@_9<GTA{%ee<^Rof{;;=o;|
zo78m?#GI^=PLTVpZuSsL^5>rjZ7eI}$O?Q>qt6mt_ZvhL8nRru_@cH4nro9A4=ku(
zphB3rjH!Tp39B0v#grYVhupOTh#d0ypo~G37&d4`pFiAGr*x^KxD))&t8#5tDV|HG
zus?#ICNF7HPblr#3n|)V$>CLPJngWWAY7F7!ol@YWb(WBfuX|Bn;^<ExdrYot+IQ6
z%>=w(!&Xu|gX5R8O^R(c#_>5&n8bz?LfD$-??9P}q-2}I5WM-WPQotHD$wfJn;nSE
zC}DsX(<2brv6w_GZKgMxBxgt_2Gs~4Ux(2TC)4zow(eH(dImK;-k$iEz4PIPXllO&
zkAEtfqpX!(cmczf?!z0^91s#6Q+~kMlE0?DX<p@@_@aLdsC5+pB2NHUO+?o}!nMb5
zn@}@~^g2)}A`qk&`mE*>pHcQN$m%@OvEyKud)7g0;qszCDk<<wE@idfYT(ZPI*!pq
z!}=}}2m=~Gc@msAc2yIth9olJ|JAkixc|}=eX?9lCh;n?lEyvIfZPv5Tj;MKr0Zgn
ze};u-Wryd%I}d*+T(*<x3gmwIpaYf$J1*b7?^W$>8?dSele@{*dd@4Aqs~bQD;3t^
zQ7he!$5DsYRr#DN^(yFw?v6{wSbi9@)0}|W5#t5nb;T>Z`8tbY19G6o7*!F{)ldS)
zd!z9!ce3`+n*o8wKIc(xV0J$;Pnk{53ettbMhdU1fB>Vx1s_okc<tfrT{?=!e!5`=
zUw2dBz~^BUFBJKy_<SJh7XZY8;a?A{Fp}+XjPqM(tz9t$yMH?fcQ?0svT0*Jr;?KG
zbma)yo?1X*xsFtsr?3Mb?F30ZR0$)gReIu?9BhL#UdO`f3LVq>uF9&;8O~6DVf0=d
zb>pX6IEz=<mF*hVXV#FJcuH<ipz`S4pjv2X=;p>URH=3lPSA}Iu4>j^qVggx++fM(
z=4~3Zafv@#g-=lJcgfD0@!uxb4B|HQv;*F55c`>uiBGac)RDZ-T<lCgW^mT1utSK>
zCYNAK9$L~M)|-z4DO(@T&eB8oh_V&kas39{gZWcOS2x{$5ur+FU{=%Yi*2Oc$*VAl
zl^l+X)!N;n5q?5-OD`P^S5BP`oyc}k4`ZiY&fpn%Jz^tvifL6rdNXZO1Kk0|BHF!j
zglKfC8R<@)K}tZJ5|Tg-*d|q_tTImqWo*`5C6yIvH6%%O62Y=8=qZSYfPn?`0dHNn
z;ZJaVDntd}yqXm#EX_G^EyrcI;JZ-{r6*&V;O(~5w|vO43S1)t)9jc!Mt%mz;5_UO
zNpUDryM#8WdkiaONZ=I(+42a0i8FVQP*yh2P#y<Vo_X*axmsKpzNlybRMPfX(}})x
zni+#F=<6A*cs=ljW@xq%Ge2y;5$crQ2K6`OEWne7NvBVOmw5)!`^yfj@ajn5MeRpz
z6HnYeY3Xsl;!m%h{+?#`!phxQ&FSDqh2wWz+A*@2*SN5LyY?9K(Ehz=XM1khg7U^|
zPbF|PNS%sD-0zke)Wj&H2H0EggXi^X1RTn64NvUxTWm|ZZ%i>89Gvg^O=2*qq5Eb{
z*N)rB#yvd78!HVtbWf18b@Y?qUSP0YdH3~Gae9}QX7mM|yfN-EBIt_9NC=u?OjSQK
z{=BdxPGtJEbu5=3g&m6Px|Nf=x=BjSj`)>OwcV|@4}^-HIxG=Gw^Q<9MDjWw-x#?)
z#U=N3tn==C*GL0C)jS{nuiB`sun(eIzUdZL^eWg3=V-0z!ruZmthRYM_OpZs`KdQW
zgGtm<2L|Ip8*<?_P|k|Kr*CR?3&C|JT>aoo?vBWxM+fDPM_t7Wcjd(Hhb&>P5bnO*
z)n0CQ@woCFHl~d;F=bLVXrS~($Xr6Ph*$m$p;Vq?*(AUcBQ1OaMPt*?%gtIRzo@J2
zQRvnhhiW2eLzBP0F?YX6z#F{t4p(kB4nvq=R>n(S6=i{33Jr<-t|*nrNQScPmkfiS
zL&56!TNifpaXLjEJqd~>y!KQ+@_tiMD|0Eq1rr&_Hd=Cpo<tlNK|K5pukdOMBaM3A
z^(N+ape*NCZV5R>v0hp}+nS}sh7Dtw8u}QBo98Su<!bske6bp|k}yU%Npq@frSm|8
zKD*j!8yV(2Zm7hzKjC3$^MolSWr__Q(TGMo3KpMkZi`5*gXbBvZq#s19V^`=<Z3gF
zRW4`M*&{@13oX3vn@b@Lv4>}{&FSd!TF<290P4w~-Q9hW(dXDO3CC?zCd)|rD00yG
zDo55RluMve=grt#;K+0HX2nh^l|Tww`*J_~#?oBK;)*es0RZjzEDSHf_q%q8$Z5<B
zuwnna=_?+G^)0I;;Q3p_)dmd*?FGhjFlWExY{L;9)g4l}z6E=QOe+l)ErSf89XRYg
zP0D=0FU#AU{+i;slWtZ%4}+d}G+m6lv<v_~Hk_blnXGnsibD_|By(1l7ll%TqpH}@
z8_I*mOcYrFByC-iyb@0$f5Xo}HeV;k)5?o7EB+7}WeT>6KW>%F(Jxe1CT@Qmp{ZAd
z53Sd0v8)OKd30DcW?m=VR4aSWyLxbQ3cN~8$JFtfjCfMm5lfuH?5K_CuM=2Iy%yRQ
zq|tW?u;PUC%wUYyc5JQF_W0|ZmvS{euzRJZ2eRbC<15+5-+LYF$Li5>7aGiqg^q$n
z9hbn&BsVg^iAfH+iQxWj#$9C2TG3K5h_ZM6xXT(K25dFj+S2l9NohX`IbEE`a;h%_
z;DL>?g5}oBk$-@+3~b1!8Ls-K1!u4MUb0YJN?gH=L`cHi6P<QzttJAFC;nk5NTy#A
z%fF|avhTmFuAV5SR*vxuI(ceviF8WL2GLTWi0cK8U1O?OrNGpHuBB5RJ)M8Ssi1{I
z)i%aC$6-Cp!UWmAi9x5?4^x{$Ak<zn=By7!O5~A_mY7~BHKR)p12TZ}R#?7+FVg?D
zig+Vf6?7iq|1cBk`!4nH*2M(gsW?lT+AA@$9}=|YHYHCMtY|o)nJokUQ#!Ot@HtU}
zzo5toONzn_-&_xL5*TzLQqAgn#PZ5xWP1(feSka;A8^olH()Ocl|ta_X*YyDZG2L(
zsRw|X>q`tCHpLJ7TzkoEDS&ukhU$OGZ8WRP^FGfowKhsH3loDTN=+hmeM>)o1uES-
ztAJJa`EyeZc@2VGTP0`~w4f#{l9#4wNbY86fQ+HnTu6;nv1BAlZZF{JLDi(yg+%G4
zl1Ch=E4)#7;eGW2E+cOW!`m9@5zyUW<J1wj&Y^RP5CG1`e2O`wb69YEj~lO?;K+vm
z?F!mID+%b+fW>$9nNtEln>Bhf=6nAhEAB^|<UX-&c{(>(Udh2H-LXN14qTFYh&i0-
z7P!4}88ZJ{6bi|iqhmS9R}ttBH4t>`>2ptGpl+&trS$B#>^P!Vjy}sKnv3M&)Oe7!
zX*mfos>Yr(3rO@jqYUEatZ{&WE>Nzg3J!<AzH)Jpb*0*-1(~JWv;%!y(*PO?vf41`
zEeHO$)Ii!_x;Vw0q=m{8CHDE!QH2df`orKd6%|h^L&9E}R37mPGiRL>h1;MdI%`XW
zfkV_}v8$jlb0Mf|i4#-yHY|6~7d+>QRg<;0L>6=7L*Qqngib2y3MwORQH^ou%HLU7
zdlVlZ{ZPW5Jo#59U%U(?6l!ao?@Lk=`qa`7{jol7yD1p3$LmG9ccw5D+=LNuiN53Y
z$5YB=2tCxGw9V3erXS+1dLKLU$Ei4F%!uTu)MG16XTjyYE!y*W-?^llwr8H3K-A;O
z_DRYNu78(cL9t4A7Y85y&mZinM4G24s9ad_UHu%A;(Yq>!hV+DcHTcfIU4s~E-YNU
za&&<i<-b*@Y!7nPpJX-A>!cE+Rxq6NokG<W-d`_gA6W>n6<TOzG-5f3pWG<CAs_aG
zG&o&toYo^Z)p-L!W%*qvplJ~P+Gx&B?UA!4t*R`9+>Z6K9k#~E(SNtMV^<D<tnS}v
zETgez2IUQKwBU}mnL6I&w5^LL9}skN^#57KapLIe+|%duXOxSne!(9v*(sEH>4xEm
zadwB@Le<WvNsoJM=*I5@nsJngu(V=0MFdTN+R)6s>bA<nMGtdtEw$C11HY@(m*%vU
zzLOi!QHki~Z>Fp22*ogXGgW0lQ~f59f+a<Cl>2uRdeW3Xhs-i=TQ;geB~7Anu`($r
zBTE!vjlNoE#AZO8PJC)kKaZ@yKFw|p&Oe8oqZu~J@HQ!fS^~it*CT%D9S0eqN{j$!
zWBho&>@Zn)ttbh)*2!FMeOIVcJI-s>?N-@pkM*S{XpWWOcay&-`UV7I0trL#hBCcJ
zR+Q*s8;^M{$KN+sx@37+e)cKxUzRb31|!K)((XoIUzfNF^A;0E`2Tv~5{leQ>Q(TJ
zll>-{Jv*5@u;FOvb4hu9kJzK0N*Y5<TYNXUNm?}!QwF2;86^i7uRPTPtpuWQ%*74?
zGb(#j(UPo5YH5Di7>frS%P$B(!_<c!4++n6GFVmD;(6uE@o$}U?=s!EnrJr$8(F$S
zXAi=GLl1YB#JhMEj;fX#0vc{<Rr<+OQrM<$MKka9qQS>94z3h=V)H7Xc9sl*S`!r+
zZAAjXjZ|6*;1^?p1aH(Hn~yLkI*P)-BG4wl(Z2H<f_Q|_d^I6&|GI=R0?lhFz4=m}
zSL4>nE>NRFgl_$^om0yqzA{XeE-$v4JST*UmiXsSgUeHJVr$r9t1L<s0-$LNr;UTG
z0ZPYJ=j2DTOg$g-V<_~1P(u!FU62bhI+B^jkk%<%+uv7L0BV_L^n(t@4Y)o|R<odV
zkm|bBWP!!Wy)nWVN4jZ-ZBS+~l|bFD)`i%fKF2{GkODs`SPBQJIBvIZHjlrz632*@
z<~<-$lPc)bg(D@}MjKgBmQ<NL$tRh#H*yCIP*}j&vp6~!^%0ux4zO^S3d4n$;H;DJ
zm1YQoUSZox%S0oxtX#)N>N9W>XPD$nh7_J9p>b5J*({=nx<ZCs2{L9|o)n!W@*q>q
z;ggC}T4kOA_s*)N&T2Gt;Ss3&Q3sRSV{kC<GQUlE&3h5XX(xuL6)DA&;26?tCy?85
zP>A&)d&nyXc{=27qN(IB@6v8Q)@ncAaKgqw^W|cSj7bDL?oI~N0?uc0nz)do;{awp
zoYMh|l;4&ks&K#UGwX|3@I8w5;24jQUyv~-GlDbE*52GuYW7)5nk&&iz~!-(p$tD3
zd1%m@wu9=5)vuDHm88mKM{tS;V;fKjr|kG#652j#vOvlU16`q4E^AlFUNVJQw1^<e
z($*G##u&-D8bq|1Pgu%3;+4af!4w*~I?JgeO`C0mq=cLh^5#>*zc=S8{-JEuB=2<u
z9>U%Ws`<;4ULH_+^ousg)WNerud;gNl}7q0#{*f4$1;C*B&v3pL#m}2xS)3<nBR4j
z;^b&f=Qt*hW`o12i2gTGO><vUeMhShQ9Fy8UIV$-$oF5Zn;x4iiT{*$+9c2@aGLKT
zj03D-f?ZNmm6%$x4oOZ7JlSq$kRY<KTQL;U@Obj50#)bb;fE}v;onxLO5H!zS~NzU
z4BjcU!<Yp*s$N?y2>bVJ2Cy8E`A7<yl;mx&ZB;uQ)|eb6XP26-cq71mk<6z^Dn)j4
z@yu4!v?_UD?z4Ph_E=%9#@Hvt*{9Rn7>*jAz!>ac?@wP3W*{G*?_K*V79K5v+1ntX
zitOVyj#mGwnm<&|m}AY`+DnPX$6+z6(ErVB{nR;dpVSuk`pLo>1jgo-FiU>GgM4l5
zEH0CE6UeOO{jY0GRs9hx00i0<+gsx+%+T`2YFjf?R}pHeBtxyA$L87o5Z{@x9WoX-
zxx;}o-^IG=9!x~2L5AGcFIkHZdAvIOtI<)mH84eY%TlZLzO#<OI9u|(cvWJjWjP2T
zebHe@zqEY1;=hKyJK}9uDe;7aFe`jQ0>^w#kTXXW^>@t}_Oo%Dkh|JL+;!5>2Bo#|
zKv2n7lB8bAHYVQ6PcFkkP9{(hy;><lHJwH`3cNIXRh<%#6w30==87P;^#zlF=jBDq
z+H8dTLY6liU14>ktjeF<@%tbg7v01is+k>7{RHYi-9+jcLb+KtNorxy94@NB#Ht5s
z0{1l(-ZP{*%G3Ju0Rg4Pr<v;M@<CulUa8S1p5v-{-$8(4J`RxW#93wq=124HH8XLV
z?3BfaH8GtgkEdJ4#aha#%K%elJ^h9w#bLJ$7fRSyVG`7*^-OM(`G@w>>rL;yl4~uY
zP9JYp9xPa7DsG!}62?>M!@Ij=S2L5!KU=m-X4Bpt9njz}S*#2=`Uae%+d3C-in1P2
zG)Ya{atyyKD8s&SAC@a@r<QPM(I*M^N4YG>a1ui3QGrZ$(}>)g{GIw&j~;pvDI1Te
z2eXS(4Z55y-3*k@pE*K6nBH-8eMV+IuGO1)NK<4Uzg54_;SDajLqrU^iIfPjm8+lX
z_&Y<Vdoqomt|CVt=FXRYTvc6apna?tRV<L2^Ge1HaIEVUqJ29?z@rwk=F>cXG|83`
z%Mj`$FRTJ`6>^3aR#p=8>ATOf<5W2F#=EXez|0!mnS-*iC5t1gLs_Tc3~)sd+mFT9
zEZrXCgLj!{51K$ibB%>`4P%Y7&qnx<0y^1RwQOaX>51!Ql8uz*Qe9Lj!@ZBw*J&TF
zITAu<MW5!~))|8Tni1b>uXo7MeCpsKgxMu>6y&)UZnzGs_cb{YFlV*Zh|^MK^Cw+z
zAhTQdW~|O!Is|WMemiZh!G1*5*G{#eeaNJ}@$;R)vi4N|ql^YtjWwd&yv+}<p1+-S
zO{0zSSRMu#OiELN8Fu%AHiqr7BcHr6G-&m5XfrITrIuDp)X$Y4&g!ZASUnAyad9!}
z15vC>6V73qGPgyYksG=@c^{i#@95^%w;WLG34}6k_cmIVU`1H;Biz~U18!9wm=wl=
z&jo#ie&TRRGF;K7J7y+vlbfCd&4QimGV-7<p;#sfEO$M_;Hi>V<<KnM<?ygFdBjdY
zEW1*oxbP*E%GnT00VhtGYh~D7xEHrc(onA|hsDUcqU{%keTQct#7qd$L?ty_PdA8)
z-J~+bdnoRDLs}jju~~;Z4hh<uEFDvvvDYYku+g;&*#f(olmZA%x&QX43Hcmv*`DOx
zj_miLKbGQrjiIpQnMSdPA33SRM}Pz+USaVW0he7k<%J;u=HH>GxI!QU3~-dTrJ(3(
zRbjMbvuld%;y^l25&@^Iu7Xo$;D}fSrzh{uAI5z_4frx|Gz>u?ui=jCd;Kv_o3Wmx
zqFVNIjJ{p~)V;4}7hNcv))n*T(H@%O`!W6g<T@r$$!czM`3t%O)*8o>X{l+Zv?Pc9
zj(pY#J7!<_3Z=VQom34+I6|M|lLAcco_=IzNlOpi-1@l1y{+PH`%mcL`Zjh3uFOOj
zrs1n*54P1hM2JUEt6*^D8G0m25l0xvI8pe5SM3sSBmj<r3{0I+`-W>(Lzd6EF1T3a
zTtH<r2cLcJZ%*OLQ2A6;Jazv|KU(1Rmm%7<5_+ZNheeWZ@Hy;sv_$RCz_w_`GW+;N
z2Z{m8{3HaNzaN7I9cJaR!({{e{JzfnSp%Re1V7;<uJ|;Sw$wrk{c)K++rR{Hq#|cg
z<iB+ZcE>@5H<9W%AU6S92;HRB-9CT=r*qX5d;48_FwK=14Ry||dzk296C;0=I-&53
zv{HdA_T^vSy?tCP_useDp}DlW`w6a&l4ni~sESSJ4RtwaTh2mXEcN+jA|@FTP!vF}
zBs|l2F_Hmt$JkgcaU#^t@5AlF-V8e^42Tk2H6~M1wihXkRpO>^uW%3O(Takk7h<gp
zHHe_Q9RX^CQSsF3FvbU#^oSIR+C-wFJYnbGQ@3~lT2nPfALq%wn-ScHT!m5^mf#)%
zU=U#A7nrfhN?Wqfli^V2!Yj?A{7$}Wd@y*#2^q*uL{b+&w9*~PAmRLE8LdTALs^(A
zx9@Yxb|a{LsHDKoUBz*uV9uY)*Xppu3<Y@3;Dmo>RM+_(DesgiHmdvsT6|fn0`YH!
zEaHl;)-&pe#-C2+v@E2KiskNigBypAbKJahXg!t~1|kZPA+yRuC}|a-Ro>QF2rv(9
z{R);M+Kr4I7KcxF-eo8x*d0AJktMb1X$EGwRUBz##T$N$gerLqhSRkwPTNP~5ZiyS
z?ZYUdHh{@7RAZ|O3eny-Qg@|K-CSSy6r{-fiI4M-siO}cE4P=6cP*$n&Al@=UHH1!
z(Qzry$~M;{$2;<nZEUWMc4N_V0argJz3*1cl<K(zlWM2}ddWhYVLBI^kfgLJ?>-LF
zh+6E_mNUCv#}kvh$rvq+It3ALJ(}Fbd5D;yBGjG6Wh!oj&*BJOp71Or>TsC#em%8m
zaL7-7hX7xeLP8x!zNDuWOdHrH8BmWyr<F@Xg;86po$wN)UmZH+?8tL9D`lnpUNw0k
z>)m=caIQ&izY`5{*Q!cQI5?~_io5(NnWhkck2fdqS3=42#Rt%>HU%f&Q$*d8rz;C;
zZCpvqVt9|5cvnp75IevUIo#qjn84JLnLZ=YH3U;%7B3^pbxskua)bM`I84mu!fnpn
z)i#U2EpyYuOWDIcZueo_#FV)_(t4{4*W$`(+%ehJ)4u=5STonB5*r-H;jVhLPr&Dr
zI-7onOk)!;O$XM#E}Y{vdv;r0`w@bhcE`*B{3=2F7rL~sToLA7uFs>)`(&=k#kaby
zzl0-RN}q{%(WfOwZR+<FE`o+TA+yyajTH_MAnhzviamF4oTs+iDg@2cu3##3oBQ^u
z$SiV%;^EPA(@*8Wbg`vphbE!op8+=xb{wtrX%g;YN#x{YKLic*@?15y6n7<NYrzG#
zQ>4Q!|2UeAL`!R#E1X2yZ?DNm-H9ujC9xPL7Q2Mc4$zex3EujdZZK#DMn~_?P6H79
zeL2-<H?cTBy>s2{J!S;l1GcR<Cx;#m?_?olh+dz?V(srRA&I=&iz|RgmjXzfdr+C<
z7s5IEMxXVY!i;}Wyp;ZXZbkA@U$pS6<%6Bbmsr<4b>!voZ0C`R^Z&)Bm>;+z<E3gk
z5iNZ<(rpfrFLF?IUrD&p>aMqQ7UPkeVKaECcp88wh9TE{I+&)y!CLo$kUkyj(v`k0
zc0(rqlCdt!T`7dKq1#bO7~-_a%E(4;#9giS5AG0cIq;jEZ8#K{|2CInsKvYYMZ$7B
z^og{$`oF6eU##-pU4yuQB<5ayQ_ffb7Lic1+43Z!lZ~8&JY^eTAJ4{B-LFj>y?2u)
z+ht~RdqXP@!KAP^Hq-s7KsH7jegC_Hsp?W~`yeUvyqm3#j4JF1^xbmSW!VX`T0fdA
zHX!Y0<Jo*omGaUk*t5oa8xTKjQ8y|~deKa=dz5=BpG&(`8p#ngfU(jerV@%HETxU|
zRnm3t$x0(RrB&n%)vjq(^RET&M9S63#NOGvNquPhX*<Dj6z%I@UXQmc+n5sjs!emM
zHmpYL@JxU1%5kQ=q~WnI8Mjw*8%}=ESX-}Tsm1q9ey3f_wo^UZ6icp`j6NH-vaDB(
zq@GTDe^U*M;9n9lC+MJwkYl@7>2;H0`R=L5?cRVbR$srRGViUOeff#htLLO-I3+8l
zQ-(9-M<piaxb5O1Rl%jkYw-R1JP24)EfXkD*Z5_1yX>ng5=YfJl(USe=#DH>XV+-;
zPRiD?rq^#QwD%ni&&NW2>0;7dT>VdcFSZc>j?qO_t~csYsKG>K1~%^<@9VQLL<8Hi
zSnXx^t$Q;6(MzbMNprKFVe@qqjk6W6ID+%#S4?_ZyQ<{^90)fHO|4C6@zR;PxPHyn
z{VJ5Y-Z=K{5vpTg_1XQ#u^zWFox^no;vSlMBaC|Ygv~iVUsHS54Xj*USaEjs<B^Sr
zFRV_fwDuzt`{3VAI@oP}>J|cdglmf6aer-5H#%Ft728acnJxGB_uV5s-(ZDTYOr;v
z$@%i8oqA*Z^?)|V2Kp)o)cxA@d$v@g-hcGSa%88e8Cw3ZNvWKA2wjK`5AJzgIdX@d
z%oeK^BwACa<nQv#LD**vqS4J`hg^KcaqK8HN!|p(B6bAoufYB{-S+w|egs?rV~H2{
zmdsE)Rd9k|2Phw~qoe>>?TX;9gbM+2jJiooU`T~=LEkrWE}?p+*pr*IbjU8Es%F!C
z%HgyH0t6I>_PS&e<+xRvTum$%=wV)_Lasux!@MucF$%dcoA}eW?vtb-W_If+lTdtu
z61g`;_jEK>bx~b6q~vHir2!TiXt-nyH8*4ygu=qPZA)jZNbSLD*+vOl0!whLWLy9Y
z=4&w{UF?NBynaF~0M0z=M~3>M4MsLe0*%x?F`5u+c*&3l^=K*!Cj5NWR?*<+sWrQ8
zmV*B|9PFtp9p3~uzg|{k9Pjd!H1Xc6g%r9ZQ?vvh2^CB0$rXi~E>Eu9wpM2nU(`rA
z)wQ*Hz-^S|=mzIXq7o{tRbgv#s!WgTtGsK_K^Pb9IWmI_>hTXpgdS@jQAeU}0cGZb
zjBgrKQ6ecbuxGJs6S$!`we3Z$?_>^EXw}OM_<Z)edC+QBVc2EJE%B7MPWuXHU_x`E
zEn%e{^sf)lUMNGRC^$BkOy5b&24GpQ9yH(!L(;yhmMQXIUQk9+?NaYA;S|Y+D#L?{
zZX^Suu6IC9w()EOty|K@!<??#(s|eTLQ#JIM`5S$!}C%mcscsnKP%VdqM)mz#%f9g
zNR&_~GoJ=C@B)$KJU|5k3Y7~hvCWJEFY}ak1*YU4EJ!Mmzaak)srv7nwga<roZdg2
zit%5<`v2y%9h~f4?2YYh{!g;{e*kS;u&nJjIUc(FK<PgPS4XW$Z0o!3Y|$KWNM+X=
zd|Q{mvjoaa|Ed*-3r<M(i2i=gB%qK=Ic?J31QkV&dpeqN&`-45TDKaSOeNFYCntzZ
zIH5B&np6{*QBDl&A%JS$fyA@uMUkd`xL^-kH%f0L(Y&mB_`hf&pKAy(OF(`VlNjeW
z>Z76Tvn1OHGjEwztL}l*%#Ks-o6H!ETE0!WjkQTm)<l?Qn@IX#h4oj-qIJdaF!quY
zWQzH~HNrwt>N6wV7J(j8TGD373o<~HY$H!<N`ir#bU_$FsWh|Du4=mfeei71<~+(Q
z8<sy{(O`lz0&h?OmSrXkK^?|CWQ3gv8u=kB`a)Dqv`aE?RWY9eNlYj`76xkojZl<I
zLX`~e%TzH(Xn>n|ZrKWKj@)Z2@*}HML?X)!l|VcTD!~NztK`7^JhHdw2J59Qt;-Or
zk^M>lvVMO>J_ghcnI0T#men|MSAh4OwE)YIlo9K{c&d@r%gM>pP)olFK)FqVo)k<<
z5cPJF9N=M*pvC4f8%d7v*s)5#=6K{m64?wfH$eyYYc$crFtLy@5Jk5{x?wtzgpf8W
zBK6~)YFLC>7I<IO{_+C*00FW!ww-X0EgTdEkQ#TSKQ8{ebu-83_C@ly2$V!117Z#^
zOv(CMM?z!EJjO}xmHzK5nj(KYM1pO-=&?Lt6#OPH1-V~ko9qz{;H^b9{|Mg~xF6_T
znrY8X&$(w?kNeJygV^ju^itFAte^k;<%WIzsoZBz!{xL7Gg-Z>i@(2#CO;zk?7Vtn
z)iIoT^6QQV$oS6LLCa>oCwn@8wR!6bK5Tfs12dM_;e^GNoY}1`#%^m_)6P{H{O8Te
z47bi_mo;(xn!R1E^lOzndxqy-o6sJ<t+DHRm#ZVL5b$<rW`E9g8%+z{&fHcdyEi}D
zX8;&b=h}@3J!mT{2JD~b$NpA2vEsl@?2A%R2JCHJ7@eL*k(cl6%^d-H-2+TAc2cQI
z+X2h1NbW22jICC$WXaneJpjY<8yS8(ft+m1dz`<kw)QpnmA0_AV4!R3t)o3Z`aPFH
zLue>`XR^`4!EW~38`TS?dXWK><6W-y^g7Mux$CRh3$hKrAXZr&$vZYGXO^%zJHV)h
zL++tp)P+|KP#SySg96j7TN5TE75+iUJI|jtE>ZH{0pKB&ItSCcrk1^@mCgV%aK18=
z=1TzwE?^ptdah5^zc9Ra6_E}mDHE6RcJ|(P-Zbcn)5b=-W2CZ23}BW$(L%4u6hZ$~
z#5dkL0eL2Oe*AKs-PVAqt#zoj18l$W%}2!wl|TT%lDd1-)WT+=`*wDR{eXCt0;Le-
zYsF1SJMa#h!fQ>V|M2Z0@m<j7LW$Tj#bA&6je$;ar(o5hZnXqT;@(A1hvV)l8~;Js
zXWeZacId_dTSZg2VRT7XX#S<@Luc40Lr+&lWE0(RCLVyKG(j+SySuD_As~xGcq~DU
z%R?meiA4w!T6nO`I+ckZnm{X6KG-!OoHP5Eb%dL3QNt81IYBBp8=zParUN#JrP&=K
z9wV-7h!ouC^sw)tT$vp*!kU1Vb*z+fFZ<OimZu`Db97<{AkiWMd$>RlQgN3d@wn9a
zH<iKuqC#l5-((=xx44i@HldQ}Tbd{&yRNcsp0xXXNV|v#=wkMa*S9+OGw_jqgM&2!
zdYgRdFjzOp{SoZHCmN8%U9>$3%yc?#GI&Il_iU7?V<#>ZofVuSB(t+8l1KOPI6DAo
zr(K_TB(=hq0t0>7pX3}(ij+cR21GdpNIO-gKiJ$onNTO`T*VA3(^!QdT~U*0EzUxF
zt!D!CB<aT@K=A>9poG)fg&lhrl0O`p8JY5-X|_{$5z4YzL+PPX_C=RT#^|KkHJ8+X
z5>+JdPGkrdS>oW29E2#RJ?9b56hN=BTWnmNOjd-!_c~I%9BhM5F3Wz^!4ra4hlG_-
zc+@R|m7)VH;bhRplIW%2d$d<|<TRDcnINQ;sRr^59U3mtqtOe@wZJso!n=`RgNADe
zJUl{h;WUXV5hVQTe0QjvdIBdGS602PgzuRQU>E^RpkIXWX-MoIP$z%TPQDO(b08iw
zjA%63s_|Js2;HME88_9LHqwZO&?w}SKzBj$U8nXQa-vR2-Pwjoav*L_Nr8YTn5z@I
zgykR-1Apk-45o`R<BJE+V+m|DuzNd?#Z+%!+ol8h{utdKr;bU(`<;15KqTpeb+;6+
zOEskf)-!hWEfssY!tS~!XHZ<;Pmy9<2)YItxA_1xE|pHTM#|`tf<&f-N{f*S?P+`{
zRxGX2ZykGCuhph#XD856Gb2S}fsFbQC^-_Jt8eE~t?GfO0C@{8UE%HebK`nSSLf}h
zIc%b70y4}`7?CPti}$#>NPFC{nGNBk2UjAZtZW}vx?eK7KL>t&)2WZr$SL#!ab-En
z?eLWkG6<{y?gNZ~?QT_FUgZfyeR64hIgy1QuSj7Q8Ey(!!&i`WJm$;00qmfZ_m-3M
zsG~*C<n+}tDDEWIw~Z_GeM6|#m!(iS`of$~6eE|RZ>oG%NUK|v3(JRLYQ9-X#H^7Z
z==zCZ$|@OO#CV{D<os&1u#)pU?FQ3`6#bg<5-c&QhBV-;weViUi&`89QFQZk&yI@H
z$?kYgfkDg3P1yER$?~6R5!5h3YKS*<_l!u%bEmM#j{3qAj%7}Pj7k>C1w&l6IWM*p
zcD-ftDp<7n2$P&S7)nA<`QR9E#AxQ{IU+D)ssD}&{j-#`eM~q&WC*&MejAL3Ib(3n
zaGlsZ6(opXOnvmDj4M?@FbGT>3*+GMij^ZS68I+~UGn7lHqC}n`wEb)OH}(7-pd+?
zvP|=;a(NB1P;)j*YzXYLN%lJ`zMBI-Bw^f{sd1IgAz1PZ;1VG*kf6;eA>>7eApGqc
z+=rLD6Zc!W>PK0LO$)UaVyqP|zFgv>o=Kf?9>`33n}U_Se{xTfGg^35QPm|SQoIrj
z%rNR}*fXmi2o&1^LL5}I40E88=$f#FjVCam=lh%!Vi*Uw*$!PCTY5)?Q76JTFqr%C
z&4ANfA{Hx@mhewYc;a{|0vM;i3<2vC9SGWdMSFvhP@0zT&FG`v|4?+Wczx61iK_e&
zTOgCCJQ*5$wpp9*&uRSaYiIH5@zZq3Q1^uL)v;F2^7Q3>XJM#}4~oCMZ)n;!RSkO!
z?oc!-L`7N8AchZfZ*pKZ>DRj5WvgFF!Lo{oT26KRa*S*UPt*q!rPpZ1sm5D;m{hs?
zYCg_5zuu_MrVR97BUa$T+@9$?dYnM-0yd8+5T!*{P>mZL7T9dBjsAQvt3*mUgVb;J
z8Dn(P#4JpiJE|k^+(L_8GJh&zompqz_V$bT^Gi^=XD!9kDPd)M?{#C~7ad6g9OH||
zBe;lo+s?pU0O)++dBEIgsLW?Q8#6&A@6<@ltdvty37y4ys82}D$*v%1DQ={!n4~V(
z6T$LO&f`eRT4ZDzt-<S!xw70sl2|QKH{rfQgei`QwqH+8-IP<;`r9IMm7s`oQ>X-L
zsqAA~Q$=fvp=jmUYJ^h+JEc!7&5Pn3$I!nvinz^X>exapA-RC85LsF!sPXBE{Fcom
zpMYznytM>_vYSu3b3S*r>ij&vQO_WwHM<qq6p<7gmfMIk-cA=pBm3I{5wz(Jm7vbT
z#Kts>Tt^r8xPLTo*4n_Os;v-}mjwuY%MpUx@w@*tu#WPI=vKWn3Lo)Y5aH*s;9H@m
zHbwx<WbvV)m&sVS^X`NtFcd*b)|pB@s|GxX--V9s=#upI6L+`<R&bkejL&P3^Xc<(
z{1{D-8xfT&hD8Ns6(5AxY&^Ah&|C^Oy~N^v89M!o?ODhl=(Erh&)@g;K-_p*gx<Jz
z{DVLB1q@|pRR!-w5(eMkF85TuHyJ3>{P{Q16zv1hf0ei1apftd&}U4b7nw#CwIdn)
zf&RO*mCeh-5dUu)@yC#GeA*e5^FLVL+&UsQ#(RP;m}+#Y3Cz9{lt)FI99b_<N=hb?
zjMM=z&7VIw5FPk0mkio`r24?(Bu<;b1}X0b9+WX4XqC7!6HB#2x<9kR@Q0K15r(5$
zljuRUE{(oP)E{rAkMSeHhe-(*s%9g>nUJzlGBLjdP?eI9=iYWyuy};d37qVXj{2%H
z7J8*eom0~>m^mqL)o^5QR(cvr!~+w@v#NpM_2$<$8JfL5%Y7&nyS+B-Fq9yg0>eA@
z9lz;!=gz4loe<}zeNXJ=WmMqoy7}pUr-k2yeYBqt)p$+Q<RFjcI1yllYZ#Wd`cpvo
z8;TlARMzQ!q2R(N$jmL1g=LO!@|^|YV7TbH(gtJ7+_7)e7m1|+eDxqiwX2x;{Y28x
z=nj@R)|8|>Q<%~9*xA)LQ$3i~fmFUK9va1MR9CrNx=imIk5KmboZ{3(ym*7Cc*N)@
zngbN^VB{Ugn*!9t#r#>Lg@tl;nrRc*G+;Dea_+<@Bp<)n$~6vBn`YeasiQ(}&C#k2
zbN<l}<j=W9Rc;Nxs%-u6JkV!b!X?l5%p*2K$)_14j*5ndZSe^N#*G1c`^Mi>X+de-
zJYma=!mPnt56%m1!QkFb`Z(5gz^NXw#3-nSu03WShe`-@{v?=lo3j0ILSF$5bcWQh
zMC-_if=@Qe!>Fm^Q<S1i_uyd!b3+n)p0z2V)D%-ouGtv}=^u_E=K`x^h_2O;%ON34
z00{kqzbA2#U<fBdp)$Q!?+Zw~eeC{+&N{cvGwA+r#t-KnoneZ%kNfJ+L$!@{{XtTy
zq_r97xaF_U#BSZf6VfjTr>Io87NqI#3hk=u!q285>F6)J+ul=gT@^}DTEk&L_0k0(
z%gCWgoSR_cV;}VYsZ({#XR90jRZ;%_yJd^<9~AIEooZuh>|$we=ls9u)oYzgdu&d)
z-<v+6biccH*VvLSd^o`-0k+GX(sXgeE@+z05tY_skH7aZ_IQ#$qQ9@im17c*QHLa(
zGz!3?HjyP1QD2cMW*;#<K0isahnfhwH%+gH?DW5pw7GU|o1C%co)j8Hi>f%K10cO~
zhaeHf)QKkj{W}lTaD77xGED?=>nul>R7z<hSKD0L2GQqN6|;cY^g$`Kr4Dasf9kWt
zZIaAsV%}w@*G*>3jAkDhuwA%vi$(5Wv;=pw@fy_sd|a*E?AVnz%{gO`ZkYEykZ4CJ
z(5zjt`%x0%m9T_*BGG5w&OOq|huk(9bVMb`94i7SqxoT&5bYcOHTOvxHOzz5S8^dS
zFZ8X_lz)r~CY5`)0!2G(N_?}YE2=!Z#9O*E53h_rpGe@lq)<HPQa!9$<@d*vIXsRs
z_rh6*`JokTlh^_{3@YcDN>WD~GiT`Yhb-$jv7QN+cH(=7(Rw}qtkjSbSu{^4dQ1nZ
zVNJdkZ^ufjQAILmoK~OmgmWuLCB86jRz@S&BkXOHf85;I0MsstxkQBzR<VkII)l{d
zj9h}Nj+#CUHORMl&+i`^WatG$527PofMDi&uoy+sFm_;-3*w7y^dJrGH}W+ik_`Cq
zA|ygGA(0vIEyC!g=|qXNLIchKmIO=(His-Cc=V-5-S3`b$}2bqs?TC-=7$AFJU>4y
zub(h5wi}8G0me^XkAG9D2VNb)*A>2ti8W?}G#E8xKwo-BDI&`oY9?^8VLs$pAcVpu
zKBPiaXUHSHcB0x4^<-SWDpWkTmt{mm5J05VMkvlR6=EO_Wq)Bjx4+^N1Rp@;H+&@D
z#uHg&ZpN!r8ukc#i2{sWrp8d#kcgPZ<P>5E=a<=%0R@DNE??p?%)`)u`w-jF<e4mw
zCL{pSFs`ulMtGZc#Fd7N5#nQG{t3j#sO>gU%-Pp5X;NXNrBR}3y!cQ!_=T|66RA?a
zxJGu~MLdma$&q1W>Cj56(QT<wwOyU129ekl(D?asivUzh3LAB*h3pnNkoM%8M(N|2
z2Rhr|_%{|C<jF5I1e!+^TS1rv3Un?Q;dS*CG)nD}%B{YDrHG6`h*9Lg2=Z?s+GqDs
zpaLLnRFB%XuKC65jY&b^8w9fudLv!@Mv|o=yKLUt#@7v0cxOXN!WUJ!t<E(xq^Js1
zS}@By{(VjwX2jMCS(!+UQT3vt``UFD0JwF7o*e<>C~lS#I!yQ?7vN;e#oq|m6{iha
zt2aL)HHpLe%2p(N+lTr+z1Pc|Hs2T5TWxm$%he=vJSGo)fReK*)j#TjfYW2W{hb6q
z88L!!^VHU>-yf)AZ)y>@LCUavV}eJB*beKCk#04S(iV16l4p%Uh<@9I7z3Eu#tX0E
z<+r2$Z^io<ui^#Id_GsMkkM=B0F4VMB*N`8hwxqa8`dw#$b<%niZ7i~U=E+g2rf<>
zcvy@EiLoS>o4)oAdrg|O90J~LGSHbo@>Z3V<wEqub!mcb8+X9KRkK>-0-`-kI@3We
zlgVm)sPCq7D>`!!(c-c%VmfWCf)q=wrvGlFwYzG&24k7DIRR*ozT8B|wh?cI^{cfi
z;x?<6z0QxbnHvN-S*sS|W~ka!8RUhGWa9<y#_HYa{c8sF2*!o$#wCN)=LRT;ZiDJZ
z%t7o4X-m`qqesQTs`DiyaS&948+nj17~D+!A*8H$%Ydly3HBr)SZ>%GX~w8=$)t7B
zvRf(^mq*8`LajE+`o~V!^wth?OGwg>L})TPVYwWae2K_-=1G+r5JW&&g+uW`t;NVw
zc4(6h{Hvs*rl>9O2^!SSl1|nen?PsciSNg{L|uOTtL4wj!Ub5bqxg<DGaQ>cf46bU
zGb87bh1(q{wF`&?!7splSloJe)3^ps0niFSQthgL)*1kkLGn$vkuR?_iLD@446?W<
zs;W@vLaYrPBH7F>CN0sunb^Y4R*&HWheIov|F@EzkOa8pT#=;CH|HQQj%MvFh162(
zOsfbJZhe1bWFP-$;r;x4f5ZM~WB(k%j0XD`G?3rx*Sh0zPHH@xWHo+5ydS$8Pr>as
zrZbgLe;iik`$?T=f~V9=m7f4_a9k_cJsjOwc&PYEi^Qz6?iE%Ea4;1^{<~HHfr_Z_
z1Ee)CWkaR1W1=TNY(T}{%fR?8QERFpF;bj-OneBOg(<Apg=CteRIcu|g%;THrw6UD
zR3%UVRtexU2Ka0eC{nGad4rOgaWFaX;}~=Kd_}AsrhX8TLa*oaFSHk(Udjptj!o^P
ztI&32G#Lvf@G><+Vs>QS3Q_=+J1d5gj?l+ec`kU;F>X()Iu7g%0N0+{)#n{-Jf=^d
z`YeTz(%cxa6gkp3im#^?2zNcJqL%JtVgLHu7_&$naPeajhI<uLbc#8O9^teuq3IyX
zD+!Cff;w9EPTJzfz`n~9$zHQiO^vef2TQPDv2!A<F+QmQu0pn1LXMWhyp8JI<AiNs
zHwXkAp##}!L{hnsQ>ld1WwDt!(~lsE`X?%UQo$X!la<PNzZtbB0KoINsmf79f}KK9
zlQLp4KX(B7IHV)EHMQAdTG;)iULaY8e10=Ep*d;?jXi}`x|hm5YQ=gYO{iU99ogG8
zbCVe>H9&P!%h>SR-@h)zDV&&jyl|5|q%8GNBgh)DAHnruP7A%@&VTxD9Pq@pj)56p
zz}V;=hZ-bzAPT^ZDJkr^BQA$_e&q4Juebsf%Um2M@8aBAR-Z{D<BmtxH+SVtzuA<6
zfVwLtl%1F|3;<Sx8XWN~`3RMtJ~|UXIvUe*C##WjY8Id_)_pnwXbK$PY|zH1Fe&UD
zPM201my@Gb-f^a-mmQIGz!2djF)(jF@u!w_FLUL_e-3~PYA^M*k++|VfqLCRZT?{D
z^=0IoBQA+_q>LEYR$8()sA<dDTH(%}Qf^CMXORg=v=!2Rvx&^DXA=O5ZAEo(Rc8TW
z0LTn9qW`Nc0FXag3)||E@Y@>sqvMRVZ6|#l3u(RNoh`K;!j+!8BA7~(k(Z>3E4T4{
z47ln1$ZWX<U}QYUwu6Ch8Q>zaM@$sgqqnvR?T99;Hr;X3tqt|$Fwf`sR5jVnF`s1t
zBbG<2BPq5YSoU83*`Q`Pvr$6_S+%4dr=a%Mm6igpuJy12^<R};c{o&iA0K63uDG%{
zcHNLIF<0TmRMKl?m=Z48*J(`DkfpL!WVytU_ol*JBD=9gUGi26qr#Lm!Ye`-A=`V#
zpmT=QJ<oHVXZ|?P=kq<^@9%u)_dCnyv+q_FiaGIyaY@IC$ovXXRog(j(@MBMO`gtb
zM5&6uLMYD<JTk&@FGsNWDE^dcD!8j&lI>9LXpomUNeXTv+pS4a6m`ot3+}3EQGSpI
z?<kL`Z)QE0EA5%>+<LdPy?E9?WIwie*U@(prC2OBfS5j+(BD#S(|}I>6|syzv((?Y
zpx@NE%-N2+NdBP4ZD%gr>soBFOD|DY#NY^Lmy&h2hg74RDV|S}*XK5=Oy{}22I>|f
zRfGvozGO3rnkD!KpZ7)7Xu<j%`g+eTVva`kyN6i4bTMnMmd(t-dyq8w9xE2JG+N1Y
z36{O6n^*cYJfFaJs<+|1+_~(X(?}w@F@Ef&al_5b>LCYlz3f(MFrSSCrqyY2pL<bv
zu0QH{>kJ`h;a=Ru0JFEQ{TVhY)aTI+iLoy=x)P{L0ydVmL;b)f^}5`K&C<UhbNev%
z!=c3pg*Pcmevb;$TOa(*oKo#e9xS>>*7+A!Pq~1%x&t04TRG`JUD$+(En;1YCO6Eu
z#{OK1PI<@^N5Z51rQ8zGBMW`{FJ^YQxeSJko5*ET9khk&daeki&$q|$>ZK>SW~CL{
z-x%bmsjBD|sS@;^Gh&<c+iR2`btpw!|8+C5;l$NF$FA>AO9~>4+Q^?eZ6bZM*GeLx
zEj)*mb7bex?a~5sU6xUk(#Pu8Z^(w;MeMD&U>j>2K28j4`Ir&!_o~BH>x-1{s}Wlc
z-KHFwX;UO|fG~``!ehHEd~MXI=Di}n3c2UAY{~oI^Shba#9~bxc--z^@PZdLiTB=*
ztQZg^AnQr~p%~>l$>tF63EVB^+f^Nb3CE)1MLDMK#rYu9ahZRGp~c!cH1y<HBgqaf
zCQdJ|wGZ+-m@aY_6uO+W6DE{tDd<pR6f{#>cXYZ?k8`R`SyPj0hfnlNCl-$FvD1mi
zOFc8H(lMygex7QW7a%P0o1i>pu!Rzo`i>~8&qvISd6QI#sF5IEs1~gYy~<0uHh$L_
z{RQJ0B>B;oAI}j5%M(JzJ#_!MjuSy;N`7hdzg%mvJ7T)*<`EiA#qpFn!qRLkp-z`;
z?yP!$V=SROE9AUqFn>n7x-@pKgZn67QCITc`ng!vL|nC(mO?eDxIX!6QAf1jLAb4W
zOtT7Ev~7XNf^}S$_$sL+pptC(cw72_AfS#*+j-ZPK<Ay$`T$FxwUtkDd<B}eGbkR~
z*{vRDXD6v6xm#5kp{%x>6S~5ZRUUGpi6*77z+gYE!8_ux-uAw0=-+q_c;BKiCRKGu
z&7^?LH0*b@g&dLd94{vG^V<N7lvqSB=jc;7dBP#+a*ZXMV{p-^%M3-_VLlZXe6XjN
z5WXj|#))D!z2qqH1V2?@a#G*;-r*J)=1(s4;R9LM!%;cL_8k14pR$DGj2`ms50uE#
z6h*o78W6ov^BR%rEovV7W;;*w_Kf!ERce}y6kD{F#0_DN{84|9t<^R<Q;q3l*snu}
z6-5cmQh&H>*9JNu%}y(P%(J8f`i451@6Q{Sv3dens-GNuawTnoqv;g$LjUdip=@qQ
z#bZp)tj-?_->Y_f<PxtMa36KgoD!KDW@pLS`6a|_Z1KN_(JjQ5%R(2EYVXM89IS*t
z*jsXm$6m{yJFM19?LUWO=L!(7H77g)b7A?=g>gRhfPYu)<Raol(mSpBD<6f;H@8v5
z3DeSPX_IpeR`29V`D3Wp;XalPa_Li~9QEyv&yi<1v`(c+R!6rCpEdP*Dp#EmkS;D4
zHJg8L*<ub~(Q;w;{vPN2sm>WppU9hMBWE(ZMk?dU4S9>7snida<p$Za6E5{S{X92&
zK7GN-NRDSU4<X@9(^C;Toi<Y`cc_}q;~Ki~QtuFiho5yhK`4XoS%nw+P+;=lo(Ytv
zm(0aa=Jmous-zT|jIyO?1_w}f+@{^ynW<U!VvB&pAJaDYcDmr#jVKu;FeukI7GQ}^
z-*&(j^=ZFoD%dI*3l`Y+r;bk;N9R^hTo5R|H7L5n*w%moz`^V=+C%QL^2YFHK!7lu
zi>4b&j|~{<u#C%LP{0*gF|57!SAAX}V%n%@xSqffGpd~lu18EG$YNeSd3wYU1+=ZO
z>A^SeB^th^wD&pj!(cx4Fqi}+_*p3SO7O1szRm=&h(AC=)-B&W<#duu8$40L87dWm
zoWKgny3X{v{RhCZi90GiO<(H(HH!nYY?Ii?0=16&ezItVfSTuk87$->44Yc%{1^w+
z83oMI@e71wGoO?nqktMUfGP5oAQUU*V6biYKE+1KdN2jMDuiMS0egUH6Y+Y+szX)X
z!Az!V8=1fw@83TYTFs%V=wN)D`bPZqvHQ=7pvvB0A^{Bu(Ym(jkM$Ay1+r1#7|ejv
zf-tPq9U^xO<Z2VCW5!xQrC7lP@&{H4)`MU9*WaoH-%@*|!vdWZ=zpR>%U)^z|FH9I
zRDJ{p>$HXn?s;qR=5Ex0WK09}ttT*Yt=DS2kawWA%EH(72E9iOM)e3-MWwe-hC9|<
zq0@7`ary^F$6j4U2Tuk8&`l<SjER6w`oN$s)<8j1z;6Z00vLeO=B0u#PIed!m>>h&
F{{fuiDn0-J


From 48f7746d810c22068db5b5a7b1dbb17fa47ca665 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sat, 2 Aug 2014 20:40:36 -0700
Subject: [PATCH 38/69] Removed the waste line

---
 python/pyspark/java_gateway.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index f7f4a82ede3a0..cea7d0975e5d1 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -76,10 +76,7 @@ def run(self):
         EchoOutputThread(proc.stdout).start()
 
     # Connect to the gateway
-    # If start_callback_server is True, it looks like callback server is not killed
-    # process is hang up and test case does not move forward.
-    #gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=True)
-    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False, start_callback_server=False)
+    gateway = JavaGateway(GatewayClient(port=gateway_port), auto_convert=False)
 
     # Import the classes used by PySpark
     java_import(gateway.jvm, "org.apache.spark.SparkConf")

From d2127d67d87c580a6f787973dcb4dea671243ae4 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 3 Aug 2014 19:25:13 -0700
Subject: [PATCH 39/69] implemented reduce and count function in Dstream

---
 .../python/streaming/network_wordcount.py     |  2 ++
 python/pyspark/streaming/dstream.py           | 27 ++++++++++++-------
 2 files changed, 19 insertions(+), 10 deletions(-)

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index 2bbb36a6b787e..f6fba4488e238 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -19,5 +19,7 @@
     reduced_lines = mapped_lines.reduceByKey(add)
 
     reduced_lines.pyprint()
+    count_lines = mapped_lines.count()
+    count_lines.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 0ba2b4b38a281..e6cd2eb9a49af 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -22,25 +22,23 @@ def count(self):
         """
 
         """
-        pass
-        #TODO: make sure count implementation, thiis different from what pyspark does
-        #return self._mapPartitions(lambda i: [sum(1 for _ in i)]).map(lambda x: (None, 1))
+        # TODO: make sure count implementation, this different from what pyspark does
+        return self._mapPartitions(lambda i: [sum(1 for _ in i)])._sum()
 
     def _sum(self):
         """
         """
-        pass
-        #return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
+        return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
     def print_(self):
         """
-        Since print is reserved name for python, we cannot make a print method function.
+        Since print is reserved name for python, we cannot define a print method function.
         This function prints serialized data in RDD in DStream because Scala and Java cannot
-        deserialized pickled python object. Please use DStream.pyprint() instead to print result.
+        deserialized pickled python object. Please use DStream.pyprint() instead to print results.
 
         Call DStream.print().
         """
-        #hack to call print function in DStream
+        # a hack to call print function in DStream
         getattr(self._jdstream, "print")()
 
     def filter(self, f):
@@ -79,17 +77,23 @@ def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """
         return PipelinedDStream(self, f, preservesPartitioning)
 
+    def reduce(self, func):
+        """
+
+        """
+        return self.map(lambda x: (None, x)).reduceByKey(func, 1).map(lambda x: x[1])
+
     def reduceByKey(self, func, numPartitions=None):
         """
         Merge the value for each key using an associative reduce function.
 
         This will also perform the merging locally on each mapper before
-        sending resuls to reducer, similarly to a "combiner" in MapReduce.
+        sending results to reducer, similarly to a "combiner" in MapReduce.
 
         Output will be hash-partitioned with C{numPartitions} partitions, or
         the default parallelism level if C{numPartitions} is not specified.
         """
-        return self.combineByKey(lambda x:x, func, func, numPartitions)
+        return self.combineByKey(lambda x: x, func, func, numPartitions)
 
     def combineByKey(self, createCombiner, mergeValue, mergeCombiners,
                       numPartitions = None):
@@ -99,6 +103,7 @@ def combineByKey(self, createCombiner, mergeValue, mergeCombiners,
         """
         if numPartitions is None:
             numPartitions = self._defaultReducePartitions()
+
         def combineLocally(iterator):
             combiners = {}
             for x in iterator:
@@ -116,6 +121,7 @@ def combineLocally(iterator):
             return combiners.iteritems()
         locally_combined = self._mapPartitions(combineLocally)
         shuffled = locally_combined.partitionBy(numPartitions)
+
         def _mergeCombiners(iterator):
             combiners = {}
             for (k, v) in iterator:
@@ -124,6 +130,7 @@ def _mergeCombiners(iterator):
                 else:
                     combiners[k] = mergeCombiners(combiners[k], v)
             return combiners.iteritems()
+
         return shuffled._mapPartitions(_mergeCombiners)
 
     def partitionBy(self, numPartitions, partitionFunc=None):

From 31e42607a84f10cfa4c9e48f95ffa6280df68e7f Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 3 Aug 2014 21:51:11 -0700
Subject: [PATCH 40/69] clean up examples

---
 .../main/python/streaming/network_wordcount.py    | 10 ++++------
 examples/src/main/python/streaming/wordcount.py   | 15 ++++-----------
 2 files changed, 8 insertions(+), 17 deletions(-)

diff --git a/examples/src/main/python/streaming/network_wordcount.py b/examples/src/main/python/streaming/network_wordcount.py
index f6fba4488e238..9b7af07803b4d 100644
--- a/examples/src/main/python/streaming/network_wordcount.py
+++ b/examples/src/main/python/streaming/network_wordcount.py
@@ -14,12 +14,10 @@
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
-    fm_lines = lines.flatMap(lambda x: x.split(" "))
-    mapped_lines = fm_lines.map(lambda x: (x, 1))
-    reduced_lines = mapped_lines.reduceByKey(add)
+    words = lines.flatMap(lambda line: line.split(" "))
+    mapped_words = words.map(lambda word: (word, 1))
+    count = mapped_words.reduceByKey(add)
 
-    reduced_lines.pyprint()
-    count_lines = mapped_lines.count()
-    count_lines.pyprint()
+    count.pyprint()
     ssc.start()
     ssc.awaitTermination()
diff --git a/examples/src/main/python/streaming/wordcount.py b/examples/src/main/python/streaming/wordcount.py
index ee52c4e178142..2426345711086 100644
--- a/examples/src/main/python/streaming/wordcount.py
+++ b/examples/src/main/python/streaming/wordcount.py
@@ -11,21 +11,14 @@
         exit(-1)
     conf = SparkConf()
     conf.setAppName("PythonStreamingWordCount")
-    conf.set("spark.default.parallelism", 1)
 
-# still has a bug
-#    ssc = StreamingContext(appName="PythonStreamingWordCount", duration=Seconds(1))
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
     lines = ssc.textFileStream(sys.argv[1])
-    fm_lines = lines.flatMap(lambda x: x.split(" "))
-    filtered_lines = fm_lines.filter(lambda line: "Spark" in line)
-    mapped_lines = fm_lines.map(lambda x: (x, 1))
-    reduced_lines = mapped_lines.reduceByKey(add)
+    words = lines.flatMap(lambda line: line.split(" "))
+    mapped_words = words.map(lambda x: (x, 1))
+    count = mapped_words.reduceByKey(add)
     
-    fm_lines.pyprint()
-    filtered_lines.pyprint()
-    mapped_lines.pyprint()
-    reduced_lines.pyprint()
+    count.pyprint()
     ssc.start()
     ssc.awaitTermination()

From c40c0eff4847d876e2b68d99befc8242df41db32 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 3 Aug 2014 22:05:28 -0700
Subject: [PATCH 41/69] added stop in StreamingContext

---
 python/pyspark/streaming/context.py | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 5952e81a4bef3..01201f66421f8 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -121,3 +121,15 @@ def textFileStream(self, directory):
         file system. FIle names starting with . are ignored.
         """
         return DStream(self._jssc.textFileStream(directory), self, UTF8Deserializer())
+
+    def stop(self, stopSparkContext=True):
+        """
+        Stop the execution of the streams immediately (does not wait for all received data
+        to be processed).
+        """
+        
+        try:
+            self._jssc.stop(stopSparkContext)
+        finally:
+            # Stop Callback server
+            SparkContext._gateway.shutdown()

From a613b852668f88069555b7039d4e3c9f536bab93 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 3 Aug 2014 23:27:56 -0700
Subject: [PATCH 42/69] clean up dstream.py

---
 python/pyspark/streaming/dstream.py | 11 +----------
 1 file changed, 1 insertion(+), 10 deletions(-)

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index e6cd2eb9a49af..7233ae5249e6d 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -20,9 +20,7 @@ def __init__(self, jdstream, ssc, jrdd_deserializer):
 
     def count(self):
         """
-
         """
-        # TODO: make sure count implementation, this different from what pyspark does
         return self._mapPartitions(lambda i: [sum(1 for _ in i)])._sum()
 
     def _sum(self):
@@ -79,7 +77,6 @@ def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
 
     def reduce(self, func):
         """
-
         """
         return self.map(lambda x: (None, x)).reduceByKey(func, 1).map(lambda x: x[1])
 
@@ -107,12 +104,6 @@ def combineByKey(self, createCombiner, mergeValue, mergeCombiners,
         def combineLocally(iterator):
             combiners = {}
             for x in iterator:
-
-                #TODO for count operation make sure count implementation
-                # This is different from what pyspark does
-                #if isinstance(x, int):
-                #    x = ("", x)
-
                 (k, v) = x
                 if k not in combiners:
                     combiners[k] = createCombiner(v)
@@ -142,6 +133,7 @@ def partitionBy(self, numPartitions, partitionFunc=None):
 
         if partitionFunc is None:
             partitionFunc = lambda x: 0 if x is None else hash(x)
+
         # Transferring O(n) objects to Java is too expensive.  Instead, we'll
         # form the hash buckets in Python, transferring O(numPartitions) objects
         # to Java.  Each object is a (splitNumber, [objects]) pair.
@@ -215,7 +207,6 @@ def takeAndPrint(rdd, time):
 
         self.foreachRDD(takeAndPrint)
 
-
     #def transform(self, func):
     #    from utils import RDDFunction
     #    wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)

From fb08559258681d8f2a0e56f0aa8d5df027bb7a90 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 3 Aug 2014 23:47:14 -0700
Subject: [PATCH 43/69] initial commit for testcase

---
 python/pyspark/streaming_tests.py | 58 +++++++++++++++++++++++++++++++
 1 file changed, 58 insertions(+)
 create mode 100644 python/pyspark/streaming_tests.py

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
new file mode 100644
index 0000000000000..95c5489a5695b
--- /dev/null
+++ b/python/pyspark/streaming_tests.py
@@ -0,0 +1,58 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+"""
+Unit tests for PySpark; additional tests are implemented as doctests in
+individual modules.
+
+This file will merged to tests.py. But for now, this file is separated to
+focus to streaming test case
+
+"""
+from fileinput import input
+from glob import glob
+import os
+import re
+import shutil
+import subprocess
+import sys
+import tempfile
+import time
+import unittest
+import zipfile
+
+from pyspark.streaming.context import StreamingContext
+from pyspark.streaming.duration import *
+
+
+SPARK_HOME = os.environ["SPARK_HOME"]
+
+
+class PySparkStreamingTestCase(unittest.TestCase):
+
+    def setUp(self):
+        self._old_sys_path = list(sys.path)
+        class_name = self.__class__.__name__
+        self.ssc = StreamingContext(appName=class_name, duration=Seconds(1))
+
+    def tearDown(self):
+        self.ssc.stop()
+        sys.path = self._old_sys_path
+
+
+if __name__ == "__main__":
+    unittest.main()

From 28aa56dbc6f7d07c86aa5c9095c6cd9c43d99e8f Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 4 Aug 2014 09:47:48 -0700
Subject: [PATCH 44/69] WIP

---
 .../main/python/streaming/test_oprations.py   | 24 +++++++++++++++++++
 python/pyspark/streaming/dstream.py           |  1 -
 .../streaming/api/python/PythonDStream.scala  |  3 ++-
 3 files changed, 26 insertions(+), 2 deletions(-)
 create mode 100644 examples/src/main/python/streaming/test_oprations.py

diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
new file mode 100644
index 0000000000000..cb338ced5f228
--- /dev/null
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -0,0 +1,24 @@
+import sys
+from operator import add
+
+from pyspark.conf import SparkConf
+from pyspark.streaming.context import StreamingContext
+from pyspark.streaming.duration import *
+
+if __name__ == "__main__":
+    if len(sys.argv) != 3:
+        print >> sys.stderr, "Usage: wordcount <hostname> <port>"
+        exit(-1)
+    conf = SparkConf()
+    conf.setAppName("PythonStreamingNetworkWordCount")
+    ssc = StreamingContext(conf=conf, duration=Seconds(1))
+
+    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
+    words = lines.flatMap(lambda line: line.split(" "))
+    mapped_words = words.map(lambda word: (word, 1))
+    count = mapped_words.reduceByKey(add)
+
+    count.pyprint()
+    ssc.start()
+#    ssc.awaitTermination()
+    ssc.stop()
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 7233ae5249e6d..c5452b952cac4 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -120,7 +120,6 @@ def _mergeCombiners(iterator):
                     combiners[k] = v
                 else:
                     combiners[k] = mergeCombiners(combiners[k], v)
-            return combiners.iteritems()
 
         return shuffled._mapPartitions(_mergeCombiners)
 
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 751b7504f1cea..59ac8ffa7924b 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -124,4 +124,5 @@ class PythonTransformedDStream(
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
-*/
\ No newline at end of file
+*/
+

From ba5112dd4a636cf25e5fb28cfecf8417a72bd423 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 4 Aug 2014 09:57:16 -0700
Subject: [PATCH 45/69] update comment

---
 python/pyspark/streaming/dstream.py | 28 ++++++++++++++++++++++++----
 1 file changed, 24 insertions(+), 4 deletions(-)

diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 7233ae5249e6d..f4655d11b9b10 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -1,3 +1,20 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
 from collections import defaultdict
 from itertools import chain, ifilter, imap
 import operator
@@ -20,11 +37,13 @@ def __init__(self, jdstream, ssc, jrdd_deserializer):
 
     def count(self):
         """
+        Return a new DStream which contains the number of elements in this DStream.
         """
         return self._mapPartitions(lambda i: [sum(1 for _ in i)])._sum()
 
     def _sum(self):
         """
+        Add up the elements in this DStream.
         """
         return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
@@ -41,7 +60,7 @@ def print_(self):
 
     def filter(self, f):
         """
-        Return DStream containing only the elements that satisfy predicate.
+        Return a new DStream containing only the elements that satisfy predicate.
         """
         def func(iterator): return ifilter(f, iterator)
         return self._mapPartitions(func)
@@ -56,7 +75,7 @@ def func(s, iterator): return chain.from_iterable(imap(f, iterator))
 
     def map(self, f):
         """
-        Return DStream by applying a function to each element of DStream.
+        Return a new DStream by applying a function to each element of DStream.
         """
         def func(iterator): return imap(f, iterator)
         return self._mapPartitions(func)
@@ -71,12 +90,14 @@ def func(s, iterator): return f(iterator)
     def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """
         Return a new DStream by applying a function to each partition of this DStream,
-        While tracking the index of the original partition.
+        while tracking the index of the original partition.
         """
         return PipelinedDStream(self, f, preservesPartitioning)
 
     def reduce(self, func):
         """
+        Return a new DStream by reducing the elements of this DStream using the specified
+        commutative and associative binary operator.
         """
         return self.map(lambda x: (None, x)).reduceByKey(func, 1).map(lambda x: x[1])
 
@@ -268,4 +289,3 @@ def _jdstream(self):
 
     def _is_pipelinable(self):
         return not (self.is_cached)
-

From 56fae45acb729608f255192ccea7d6406fe4f825 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 4 Aug 2014 16:07:48 -0700
Subject: [PATCH 46/69] WIP

---
 .../main/python/streaming/test_oprations.py   |  5 +--
 python/pyspark/streaming/context.py           |  5 +++
 python/pyspark/streaming/dstream.py           |  4 ++-
 python/pyspark/streaming/utils.py             |  1 -
 .../streaming/api/python/PythonDStream.scala  | 32 +++++++++++++++++--
 5 files changed, 41 insertions(+), 6 deletions(-)

diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
index cb338ced5f228..084902b6a2f0d 100644
--- a/examples/src/main/python/streaming/test_oprations.py
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -15,10 +15,11 @@
 
     lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
     words = lines.flatMap(lambda line: line.split(" "))
+#    ssc.checkpoint("checkpoint")
     mapped_words = words.map(lambda word: (word, 1))
     count = mapped_words.reduceByKey(add)
 
     count.pyprint()
     ssc.start()
-#    ssc.awaitTermination()
-    ssc.stop()
+    ssc.awaitTermination()
+#    ssc.stop()
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 01201f66421f8..dfaa5cfbbae27 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -133,3 +133,8 @@ def stop(self, stopSparkContext=True):
         finally:
             # Stop Callback server
             SparkContext._gateway.shutdown()
+
+    def checkpoint(self, directory):
+        """
+        """
+        self._jssc.checkpoint(directory)
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 37f625e2806e9..3026254f8fab6 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -172,7 +172,8 @@ def add_shuffle_key(split, iterator):
         with _JavaStackTrace(self.ctx) as st:
             partitioner = self.ctx._jvm.PythonPartitioner(numPartitions,
                                                       id(partitionFunc))
-            jdstream = self.ctx._jvm.PairwiseDStream(keyed._jdstream.dstream(), partitioner).asJavaDStream()
+            jdstream = self.ctx._jvm.PythonPairwiseDStream(keyed._jdstream.dstream(),
+                                                           partitioner).asJavaDStream()
         dstream = DStream(jdstream, self._ssc, BatchedSerializer(outputSerializer))
         # This is required so that id(partitionFunc) remains unique, even if
         # partitionFunc is a lambda:
@@ -233,6 +234,7 @@ def takeAndPrint(rdd, time):
     #    jdstream = self.ctx._jvm.PythonTransformedDStream(self._jdstream.dstream(), wrapped_func).toJavaDStream
     #    return DStream(jdstream, self._ssc, ...)  ## DO NOT KNOW HOW 
 
+
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
         if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():
diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
index c60ecd1ed607a..aa5e19adbd927 100644
--- a/python/pyspark/streaming/utils.py
+++ b/python/pyspark/streaming/utils.py
@@ -37,7 +37,6 @@ class Java:
         implements = ['org.apache.spark.streaming.api.python.PythonRDDFunction']
 
 
-
 def msDurationToString(ms):
     """
     Returns a human-readable string representing a duration such as "35ms"
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 59ac8ffa7924b..861def33671f1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -25,7 +25,7 @@ import org.apache.spark._
 import org.apache.spark.rdd.RDD
 import org.apache.spark.api.python._
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.streaming.{Duration, Time}
+import org.apache.spark.streaming.{StreamingContext, Duration, Time}
 import org.apache.spark.streaming.dstream._
 import org.apache.spark.streaming.api.java._
 
@@ -64,7 +64,7 @@ class PythonDStream[T: ClassTag](
 }
 
 
-private class PairwiseDStream(prev:DStream[Array[Byte]], partitioner: Partitioner) extends
+private class PythonPairwiseDStream(prev:DStream[Array[Byte]], partitioner: Partitioner) extends
 DStream[Array[Byte]](prev.ssc){
   override def dependencies = List(prev)
 
@@ -105,6 +105,7 @@ class PythonForeachDStream(
 
   this.register()
 }
+
 /*
 This does not work. Ignore this for now. -TD
 class PythonTransformedDStream(
@@ -126,3 +127,30 @@ class PythonTransformedDStream(
 }
 */
 
+/**
+ * This is a input stream just for the unitest. This is equivalent to a checkpointable,
+ * replayable, reliable message queue like Kafka. It requires a sequence as input, and
+ * returns the i_th element at the i_th batch unde manual clock.
+ */
+class PythonTestInputStream(ssc_ : StreamingContext, filename: String, numPartitions: Int)
+  extends InputDStream[Array[Byte]](ssc_) {
+
+  def start() {}
+
+  def stop() {}
+
+  def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    logInfo("Computing RDD for time " + validTime)
+    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
+    //val selectedInput = if (index < input.size) input(index) else Seq[T]()
+
+    // lets us test cases where RDDs are not created
+    //if (filename == null)
+    //  return None
+
+    //val rdd = ssc.sc.makeRDD(selectedInput, numPartitions)
+    val rdd = PythonRDD.readRDDFromFile(ssc.sc, filename, numPartitions).rdd
+    logInfo("Created RDD " + rdd.id + " with " + filename)
+    Some(rdd)
+  }
+}
\ No newline at end of file

From f671cdb57475cac5a0418898c42a02df91c83ed5 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Tue, 5 Aug 2014 00:09:38 -0700
Subject: [PATCH 47/69] WIP: added PythonTestInputStream

---
 .../main/python/streaming/test_oprations.py   | 14 +++--------
 python/pyspark/streaming/context.py           | 25 +++++++++++++++++++
 python/pyspark/streaming/dstream.py           |  1 +
 .../api/java/JavaStreamingContext.scala       |  3 +++
 .../streaming/api/python/PythonDStream.scala  | 13 ++++++----
 5 files changed, 41 insertions(+), 15 deletions(-)

diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
index 084902b6a2f0d..3338a766b9cc3 100644
--- a/examples/src/main/python/streaming/test_oprations.py
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -6,20 +6,14 @@
 from pyspark.streaming.duration import *
 
 if __name__ == "__main__":
-    if len(sys.argv) != 3:
-        print >> sys.stderr, "Usage: wordcount <hostname> <port>"
-        exit(-1)
     conf = SparkConf()
     conf.setAppName("PythonStreamingNetworkWordCount")
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
 
-    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
-    words = lines.flatMap(lambda line: line.split(" "))
-#    ssc.checkpoint("checkpoint")
-    mapped_words = words.map(lambda word: (word, 1))
-    count = mapped_words.reduceByKey(add)
+    test_input = ssc._testInputStream([1,1,1,1])
+    mapped = test_input.map(lambda x: (x, 1))
+    mapped.pyprint()
 
-    count.pyprint()
     ssc.start()
-    ssc.awaitTermination()
+#    ssc.awaitTermination()
 #    ssc.stop()
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index dfaa5cfbbae27..d544eab9b8fc7 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -17,6 +17,7 @@
 
 import sys
 from signal import signal, SIGTERM, SIGINT
+from tempfile import NamedTemporaryFile
 
 from pyspark.conf import SparkConf
 from pyspark.files import SparkFiles
@@ -138,3 +139,27 @@ def checkpoint(self, directory):
         """
         """
         self._jssc.checkpoint(directory)
+
+    def _testInputStream(self, test_input, numSlices=None):
+
+        numSlices = numSlices or self._sc.defaultParallelism
+        # Calling the Java parallelize() method with an ArrayList is too slow,
+        # because it sends O(n) Py4J commands.  As an alternative, serialized
+        # objects are written to a file and loaded through textFile().
+        tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
+        # Make sure we distribute data evenly if it's smaller than self.batchSize
+        if "__len__" not in dir(test_input):
+            c = list(test_input)    # Make it a list so we can compute its length
+        batchSize = min(len(test_input) // numSlices, self._sc._batchSize)
+        if batchSize > 1:
+            serializer = BatchedSerializer(self._sc._unbatched_serializer,
+                                           batchSize)
+        else:
+            serializer = self._sc._unbatched_serializer
+        serializer.dump_stream(test_input, tempFile)
+        tempFile.close()
+        print tempFile.name
+        jinput_stream = self._jvm.PythonTestInputStream(self._jssc,
+                                                        tempFile.name,
+                                                        numSlices).asJavaDStream()
+        return DStream(jinput_stream, self, UTF8Deserializer())
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 3026254f8fab6..77c9a22239c69 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -141,6 +141,7 @@ def _mergeCombiners(iterator):
                     combiners[k] = v
                 else:
                     combiners[k] = mergeCombiners(combiners[k], v)
+            return combiners.iteritems()
 
         return shuffled._mapPartitions(_mergeCombiners)
 
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaStreamingContext.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaStreamingContext.scala
index 18605cac7006c..b51d5ff0be9fc 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaStreamingContext.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaStreamingContext.scala
@@ -546,6 +546,9 @@ class JavaStreamingContext(val ssc: StreamingContext) {
  * JavaStreamingContext object contains a number of utility functions.
  */
 object JavaStreamingContext {
+  implicit def fromStreamingContext(ssc: StreamingContext): JavaStreamingContext = new JavaStreamingContext(ssc)
+
+  implicit def toStreamingContext(jssc: JavaStreamingContext): StreamingContext = jssc.ssc
 
   /**
    * Either recreate a StreamingContext from checkpoint data or create a new StreamingContext.
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 861def33671f1..96440b15d0285 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -23,6 +23,7 @@ import scala.reflect.ClassTag
 
 import org.apache.spark._
 import org.apache.spark.rdd.RDD
+import org.apache.spark.api.java._
 import org.apache.spark.api.python._
 import org.apache.spark.broadcast.Broadcast
 import org.apache.spark.streaming.{StreamingContext, Duration, Time}
@@ -130,10 +131,10 @@ class PythonTransformedDStream(
 /**
  * This is a input stream just for the unitest. This is equivalent to a checkpointable,
  * replayable, reliable message queue like Kafka. It requires a sequence as input, and
- * returns the i_th element at the i_th batch unde manual clock.
+ * returns the i_th element at the i_th batch under manual clock.
  */
-class PythonTestInputStream(ssc_ : StreamingContext, filename: String, numPartitions: Int)
-  extends InputDStream[Array[Byte]](ssc_) {
+class PythonTestInputStream(ssc_ : JavaStreamingContext, filename: String, numPartitions: Int)
+  extends InputDStream[Array[Byte]](JavaStreamingContext.toStreamingContext(ssc_)){
 
   def start() {}
 
@@ -141,7 +142,7 @@ class PythonTestInputStream(ssc_ : StreamingContext, filename: String, numPartit
 
   def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
     logInfo("Computing RDD for time " + validTime)
-    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
+    //val index = ((validTime - zeroTime) / slideDuration - 1).toInt
     //val selectedInput = if (index < input.size) input(index) else Seq[T]()
 
     // lets us test cases where RDDs are not created
@@ -149,8 +150,10 @@ class PythonTestInputStream(ssc_ : StreamingContext, filename: String, numPartit
     //  return None
 
     //val rdd = ssc.sc.makeRDD(selectedInput, numPartitions)
-    val rdd = PythonRDD.readRDDFromFile(ssc.sc, filename, numPartitions).rdd
+    val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), filename, numPartitions).rdd
     logInfo("Created RDD " + rdd.id + " with " + filename)
     Some(rdd)
   }
+
+  val asJavaDStream  = JavaDStream.fromDStream(this)
 }
\ No newline at end of file

From a120d071f8b8e07b6c57386d8ffede8890f827dc Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Wed, 6 Aug 2014 19:11:17 -0700
Subject: [PATCH 48/69] WIP

---
 .../scala/org/apache/spark/api/python/PythonRDD.scala  |  2 ++
 examples/src/main/python/streaming/test_oprations.py   | 10 +++++++---
 python/pyspark/streaming/context.py                    |  6 +++++-
 3 files changed, 14 insertions(+), 4 deletions(-)

diff --git a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
index b4ce4b88ca65d..668e318e7a545 100644
--- a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
+++ b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
@@ -306,6 +306,8 @@ private[spark] object PythonRDD extends Logging {
     } catch {
       case eof: EOFException => {}
     }
+    println("RDDDD ==================")
+    println(objs)
     JavaRDD.fromRDD(sc.sc.parallelize(objs, parallelism))
   }
 
diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
index 3338a766b9cc3..5ee0bd4b31253 100644
--- a/examples/src/main/python/streaming/test_oprations.py
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -9,11 +9,15 @@
     conf = SparkConf()
     conf.setAppName("PythonStreamingNetworkWordCount")
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
+    ssc.checkpoint("/tmp/spark_ckp")
 
-    test_input = ssc._testInputStream([1,1,1,1])
-    mapped = test_input.map(lambda x: (x, 1))
-    mapped.pyprint()
+    test_input = ssc._testInputStream([[1],[1],[1]])
+#    ssc.checkpoint("/tmp/spark_ckp")
+    fm_test = test_input.flatMap(lambda x: x.split(" "))
+    mapped_test = fm_test.map(lambda x: (x, 1))
 
+
+    mapped_test.print_()
     ssc.start()
 #    ssc.awaitTermination()
 #    ssc.stop()
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index d544eab9b8fc7..882db547faa39 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -146,7 +146,10 @@ def _testInputStream(self, test_input, numSlices=None):
         # Calling the Java parallelize() method with an ArrayList is too slow,
         # because it sends O(n) Py4J commands.  As an alternative, serialized
         # objects are written to a file and loaded through textFile().
-        tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
+
+        #tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
+        tempFile = open("/tmp/spark_rdd", "wb")
+
         # Make sure we distribute data evenly if it's smaller than self.batchSize
         if "__len__" not in dir(test_input):
             c = list(test_input)    # Make it a list so we can compute its length
@@ -157,6 +160,7 @@ def _testInputStream(self, test_input, numSlices=None):
         else:
             serializer = self._sc._unbatched_serializer
         serializer.dump_stream(test_input, tempFile)
+        tempFile.flush()
         tempFile.close()
         print tempFile.name
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc,

From 90ae568e4fe63338d60b92fe105090a67bb15f9b Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Sun, 10 Aug 2014 18:43:09 -0700
Subject: [PATCH 49/69] WIP added test case

---
 .../apache/spark/api/python/PythonRDD.scala   |  2 -
 .../main/python/streaming/test_oprations.py   | 25 +++++---
 python/pyspark/streaming/context.py           | 16 +++--
 python/pyspark/streaming/dstream.py           | 22 +++++--
 python/pyspark/streaming_tests.py             | 62 +++++++++++++++++--
 python/pyspark/worker.py                      |  2 +-
 .../streaming/api/java/JavaDStreamLike.scala  |  9 +++
 .../streaming/api/python/PythonDStream.scala  | 19 +++---
 .../spark/streaming/dstream/DStream.scala     | 17 +++++
 9 files changed, 134 insertions(+), 40 deletions(-)

diff --git a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
index 668e318e7a545..b4ce4b88ca65d 100644
--- a/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
+++ b/core/src/main/scala/org/apache/spark/api/python/PythonRDD.scala
@@ -306,8 +306,6 @@ private[spark] object PythonRDD extends Logging {
     } catch {
       case eof: EOFException => {}
     }
-    println("RDDDD ==================")
-    println(objs)
     JavaRDD.fromRDD(sc.sc.parallelize(objs, parallelism))
   }
 
diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
index 5ee0bd4b31253..24ebe23d63166 100644
--- a/examples/src/main/python/streaming/test_oprations.py
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -9,15 +9,22 @@
     conf = SparkConf()
     conf.setAppName("PythonStreamingNetworkWordCount")
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
-    ssc.checkpoint("/tmp/spark_ckp")
 
-    test_input = ssc._testInputStream([[1],[1],[1]])
-#    ssc.checkpoint("/tmp/spark_ckp")
-    fm_test = test_input.flatMap(lambda x: x.split(" "))
-    mapped_test = fm_test.map(lambda x: (x, 1))
+    test_input = ssc._testInputStream([1,2,3])
+    class buff:
+        pass
+   
+    fm_test = test_input.map(lambda x: (x, 1))
+    fm_test.test_output(buff)
 
-
-    mapped_test.print_()
     ssc.start()
-#    ssc.awaitTermination()
-#    ssc.stop()
+    while True:
+        ssc.awaitTermination(50)
+        try:
+            buff.result
+            break
+        except AttributeError:
+            pass
+
+    ssc.stop()
+    print buff.result
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 882db547faa39..0d7665d645be8 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -100,10 +100,10 @@ def awaitTermination(self, timeout=None):
         """
         Wait for the execution to stop.
         """
-        if timeout:
-            self._jssc.awaitTermination(timeout)
-        else:
+        if timeout is None:
             self._jssc.awaitTermination()
+        else:
+            self._jssc.awaitTermination(timeout)
 
     # start from simple one. storageLevel is not passed for now.
     def socketTextStream(self, hostname, port):
@@ -137,6 +137,7 @@ def stop(self, stopSparkContext=True):
 
     def checkpoint(self, directory):
         """
+        Not tested
         """
         self._jssc.checkpoint(directory)
 
@@ -147,8 +148,7 @@ def _testInputStream(self, test_input, numSlices=None):
         # because it sends O(n) Py4J commands.  As an alternative, serialized
         # objects are written to a file and loaded through textFile().
 
-        #tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
-        tempFile = open("/tmp/spark_rdd", "wb")
+        tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
 
         # Make sure we distribute data evenly if it's smaller than self.batchSize
         if "__len__" not in dir(test_input):
@@ -160,10 +160,8 @@ def _testInputStream(self, test_input, numSlices=None):
         else:
             serializer = self._sc._unbatched_serializer
         serializer.dump_stream(test_input, tempFile)
-        tempFile.flush()
-        tempFile.close()
-        print tempFile.name
+
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc,
                                                         tempFile.name,
                                                         numSlices).asJavaDStream()
-        return DStream(jinput_stream, self, UTF8Deserializer())
+        return DStream(jinput_stream, self, PickleSerializer())
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 77c9a22239c69..47196196466db 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -47,7 +47,7 @@ def _sum(self):
         """
         return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
-    def print_(self):
+    def print_(self, label=None):
         """
         Since print is reserved name for python, we cannot define a print method function.
         This function prints serialized data in RDD in DStream because Scala and Java cannot
@@ -56,7 +56,7 @@ def print_(self):
         Call DStream.print().
         """
         # a hack to call print function in DStream
-        getattr(self._jdstream, "print")()
+        getattr(self._jdstream, "print")(label)
 
     def filter(self, f):
         """
@@ -217,6 +217,7 @@ def pyprint(self):
 
         """
         def takeAndPrint(rdd, time):
+            print "take and print ==================="
             taken = rdd.take(11)
             print "-------------------------------------------"
             print "Time: %s" % (str(time))
@@ -229,11 +230,24 @@ def takeAndPrint(rdd, time):
 
         self.foreachRDD(takeAndPrint)
 
-    #def transform(self, func):
+    #def transform(self, func): - TD
     #    from utils import RDDFunction
     #    wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)
     #    jdstream = self.ctx._jvm.PythonTransformedDStream(self._jdstream.dstream(), wrapped_func).toJavaDStream
-    #    return DStream(jdstream, self._ssc, ...)  ## DO NOT KNOW HOW 
+    #    return DStream(jdstream, self._ssc, ...)  ## DO NOT KNOW HOW
+
+    def _test_output(self, buff):
+        """
+        This function is only for test cases.
+        Store data from the DStream in a buffer to verify the result in the test case.
+        """
+        def get_output(rdd, time):
+            taken = rdd.take(11)
+            buff.result = taken
+        self.foreachRDD(get_output)
+
+    def output(self):
+        self._jdstream.outputToFile()
 
 
 class PipelinedDStream(DStream):
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 95c5489a5695b..0660be10b027b 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -19,12 +19,13 @@
 Unit tests for PySpark; additional tests are implemented as doctests in
 individual modules.
 
-This file will merged to tests.py. But for now, this file is separated to
-focus to streaming test case
+This file will be merged into tests.py. For now, it is kept separate in order
+to focus on the streaming test cases.
 
 """
 from fileinput import input
 from glob import glob
+from itertools import chain
 import os
 import re
 import shutil
@@ -41,18 +42,69 @@
 
 SPARK_HOME = os.environ["SPARK_HOME"]
 
+class buff:
+    """
+    Buffer for storing the output from the stream
+    """
+    result = None
 
 class PySparkStreamingTestCase(unittest.TestCase):
-
     def setUp(self):
-        self._old_sys_path = list(sys.path)
+        print "set up"
         class_name = self.__class__.__name__
         self.ssc = StreamingContext(appName=class_name, duration=Seconds(1))
 
     def tearDown(self):
+        print "tear donw"
         self.ssc.stop()
-        sys.path = self._old_sys_path
+        time.sleep(10)
+
+class TestBasicOperationsSuite(PySparkStreamingTestCase):
+    def setUp(self):
+        PySparkStreamingTestCase.setUp(self)
+        buff.result = None
+        self.timeout = 10 # seconds
+
+    def tearDown(self):
+        PySparkStreamingTestCase.tearDown(self)
+
+    def test_map(self):
+        test_input = [range(1,5), range(5,9), range(9, 13)]
+        def test_func(dstream):
+            return dstream.map(lambda x: str(x))
+        expected = map(str, test_input)
+        output = self.run_stream(test_input, test_func)
+        self.assertEqual(output, expected)
+
+    def test_flatMap(self):
+        test_input = [range(1,5), range(5,9), range(9, 13)]
+        def test_func(dstream):
+            return dstream.flatMap(lambda x: (x, x * 2))
+        # There may be a better way to build the expected flatMap output
+        excepted = map(lambda x: list(chain.from_iterable((map(lambda y:[y, y*2], x)))), 
+                       test_input)
+        output = self.run_stream(test_input, test_func)
+
+    def run_stream(self, test_input, test_func):
+        # Generate input stream with user-defined input
+        test_input_stream = self.ssc._testInputStream(test_input)
+        # Apply the test function to the stream
+        test_stream = test_func(test_input_stream)
+        # Add a job to get the output from the stream
+        test_stream._test_output(buff)
+        self.ssc.start()
 
+        start_time = time.time()
+        while True:
+            current_time = time.time()
+            # check time out
+            if (current_time - start_time) > self.timeout:
+                self.ssc.stop()
+                break
+            self.ssc.awaitTermination(50)
+            if buff.result is not None:
+                break
+        return buff.result
 
 if __name__ == "__main__":
     unittest.main()
diff --git a/python/pyspark/worker.py b/python/pyspark/worker.py
index f43210c6c0301..7ca3252270d5a 100644
--- a/python/pyspark/worker.py
+++ b/python/pyspark/worker.py
@@ -58,7 +58,7 @@ def main(infile, outfile):
 
         # fetch names of includes (*.zip and *.egg files) and construct PYTHONPATH
         sys.path.append(spark_files_dir) # *.py files that were added will be copied here
-        num_python_includes =  read_int(infile)
+        num_python_includes = read_int(infile)
         for _ in range(num_python_includes):
             filename = utf8_deserializer.loads(infile)
             sys.path.append(os.path.join(spark_files_dir, filename))
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
index a6184de4e83c1..7a002bbe74ca9 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
@@ -54,6 +54,15 @@ trait JavaDStreamLike[T, This <: JavaDStreamLike[T, This, R], R <: JavaRDDLike[T
     dstream.print()
   }
 
+  def print(label: String = null): Unit = {
+    dstream.print(label)
+  }
+
+  def outputToFile(): Unit = {
+    dstream.outputToFile()
+  }
+
+
   /**
    * Return a new DStream in which each RDD has a single element generated by counting each RDD
    * of this DStream.
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 96440b15d0285..94c644fa81d45 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -17,9 +17,14 @@
 
 package org.apache.spark.streaming.api.python
 
+import java.io._
+import java.io.{ObjectInputStream, IOException}
 import java.util.{List => JList, ArrayList => JArrayList, Map => JMap, Collections}
 
+import scala.collection.mutable.ArrayBuffer
 import scala.reflect.ClassTag
+import scala.collection.JavaConversions._
+
 
 import org.apache.spark._
 import org.apache.spark.rdd.RDD
@@ -51,6 +56,8 @@ class PythonDStream[T: ClassTag](
   override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
     parent.getOrCompute(validTime) match{
       case Some(rdd) =>
+        logInfo("RDD ID in python DStream     ===========")
+        logInfo("RDD id " + rdd.id)
         val pythonRDD = new PythonRDD(rdd, command, envVars, pythonIncludes, preservePartitoning, pythonExec, broadcastVars, accumulator)
         Some(pythonRDD.asJavaRDD.rdd)
       case None => None
@@ -77,7 +84,7 @@ DStream[Array[Byte]](prev.ssc){
         val pairwiseRDD = new PairwiseRDD(rdd)
         /*
          * Since python operation is executed by Scala after StreamingContext.start.
-         * What PairwiseDStream does is equivalent to following python code in pySpark.
+         * What PythonPairwiseDStream does is equivalent to python code in pySpark.
          *
          * with _JavaStackTrace(self.context) as st:
          *    pairRDD = self.ctx._jvm.PairwiseRDD(keyed._jrdd.rdd()).asJavaPairRDD()
@@ -142,18 +149,10 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, filename: String, numPa
 
   def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
     logInfo("Computing RDD for time " + validTime)
-    //val index = ((validTime - zeroTime) / slideDuration - 1).toInt
-    //val selectedInput = if (index < input.size) input(index) else Seq[T]()
-
-    // lets us test cases where RDDs are not created
-    //if (filename == null)
-    //  return None
-
-    //val rdd = ssc.sc.makeRDD(selectedInput, numPartitions)
     val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), filename, numPartitions).rdd
     logInfo("Created RDD " + rdd.id + " with " + filename)
     Some(rdd)
   }
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
-}
\ No newline at end of file
+}
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index d8dbdf59e7ff1..bafff80adc54b 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -623,6 +623,23 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
+
+  def print(label: String = null) {
+    def foreachFunc = (rdd: RDD[T], time: Time) => {
+      val first11 = rdd.take(11)
+      println ("-------------------------------------------")
+      println ("Time: " + time)
+      println ("-------------------------------------------")
+      if(label != null){
+        println (label)
+      }
+      first11.take(10).foreach(println)
+      if (first11.size > 10) println("...")
+      println()
+    }
+    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
+  }
+
   /**
    * Return a new DStream in which each RDD contains all the elements in seen in a
    * sliding window of time over this DStream. The new DStream generates RDDs with

From 2cfd3a0bf14beb50b7c4f2fc7ddcd5d3bdfd8c38 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 03:21:22 -0700
Subject: [PATCH 50/69] added basic operation test cases

---
 .../main/python/streaming/test_oprations.py   | 19 ++--
 python/pyspark/streaming/context.py           | 43 +++++----
 python/pyspark/streaming/dstream.py           |  8 +-
 python/pyspark/streaming_tests.py             | 95 +++++++++++++++----
 .../streaming/api/python/PythonDStream.scala  | 27 +++++-
 5 files changed, 135 insertions(+), 57 deletions(-)

diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
index 24ebe23d63166..70a62058286e9 100644
--- a/examples/src/main/python/streaming/test_oprations.py
+++ b/examples/src/main/python/streaming/test_oprations.py
@@ -9,22 +9,23 @@
     conf = SparkConf()
     conf.setAppName("PythonStreamingNetworkWordCount")
     ssc = StreamingContext(conf=conf, duration=Seconds(1))
-
-    test_input = ssc._testInputStream([1,2,3])
-    class buff:
+    class Buff:
+        result = list()
         pass
+    Buff.result = list()
+
+    test_input = ssc._testInputStream([range(1,4), range(4,7), range(7,10)])
    
     fm_test = test_input.map(lambda x: (x, 1))
-    fm_test.test_output(buff)
+    fm_test.pyprint()
+    fm_test._test_output(Buff.result)
 
     ssc.start()
     while True:
         ssc.awaitTermination(50)
-        try:
-            buff.result
+        if len(Buff.result) == 3:
             break
-        except AttributeError:
-            pass
 
     ssc.stop()
-    print buff.result
+    print Buff.result
+
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 0d7665d645be8..be142fd4f327b 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -123,14 +123,14 @@ def textFileStream(self, directory):
         """
         return DStream(self._jssc.textFileStream(directory), self, UTF8Deserializer())
 
-    def stop(self, stopSparkContext=True):
+    def stop(self, stopSparkContext=True, stopGraceFully=False):
         """
         Stop the execution of the streams immediately (does not wait for all received data
         to be processed).
         """
         
         try:
-            self._jssc.stop(stopSparkContext)
+            self._jssc.stop(stopSparkContext, stopGraceFully)
         finally:
             # Stop Callback server
             SparkContext._gateway.shutdown()
@@ -141,27 +141,34 @@ def checkpoint(self, directory):
         """
         self._jssc.checkpoint(directory)
 
-    def _testInputStream(self, test_input, numSlices=None):
-
+    def _testInputStream(self, test_inputs, numSlices=None):
+        """
+        Generate multiple files to make "stream" in Scala side for test.
+        Scala chooses one of the files and generates RDD using PythonRDD.readRDDFromFile.
+        """
         numSlices = numSlices or self._sc.defaultParallelism
         # Calling the Java parallelize() method with an ArrayList is too slow,
         # because it sends O(n) Py4J commands.  As an alternative, serialized
         # objects are written to a file and loaded through textFile().
 
-        tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
-
-        # Make sure we distribute data evenly if it's smaller than self.batchSize
-        if "__len__" not in dir(test_input):
-            c = list(test_input)    # Make it a list so we can compute its length
-        batchSize = min(len(test_input) // numSlices, self._sc._batchSize)
-        if batchSize > 1:
-            serializer = BatchedSerializer(self._sc._unbatched_serializer,
-                                           batchSize)
-        else:
-            serializer = self._sc._unbatched_serializer
-        serializer.dump_stream(test_input, tempFile)
-
+        tempFiles = list()
+        for test_input in test_inputs:
+            tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
+
+            # Make sure we distribute data evenly if it's smaller than self.batchSize
+            if "__len__" not in dir(test_input):
+                c = list(test_input)    # Make it a list so we can compute its length
+            batchSize = min(len(test_input) // numSlices, self._sc._batchSize)
+            if batchSize > 1:
+                serializer = BatchedSerializer(self._sc._unbatched_serializer,
+                                               batchSize)
+            else:
+                serializer = self._sc._unbatched_serializer
+            serializer.dump_stream(test_input, tempFile)
+            tempFiles.append(tempFile.name)
+
+        jtempFiles = ListConverter().convert(tempFiles, SparkContext._gateway._gateway_client)
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc,
-                                                        tempFile.name,
+                                                        jtempFiles,
                                                         numSlices).asJavaDStream()
         return DStream(jinput_stream, self, PickleSerializer())
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 47196196466db..0f0a1847535ce 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -217,7 +217,6 @@ def pyprint(self):
 
         """
         def takeAndPrint(rdd, time):
-            print "take and print ==================="
             taken = rdd.take(11)
             print "-------------------------------------------"
             print "Time: %s" % (str(time))
@@ -242,13 +241,10 @@ def _test_output(self, buff):
         Store data in dstream to buffer to valify the result in tesecase
         """
         def get_output(rdd, time):
-            taken = rdd.take(11)
-            buff.result = taken
+            taken = rdd.collect()
+            buff.append(taken)
         self.foreachRDD(get_output)
 
-    def output(self):
-        self._jdstream.outputToFile()
-
 
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 0660be10b027b..d2e638a7d2acc 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -35,76 +35,133 @@
 import time
 import unittest
 import zipfile
+import operator
 
+from pyspark.context import SparkContext
 from pyspark.streaming.context import StreamingContext
 from pyspark.streaming.duration import *
 
 
 SPARK_HOME = os.environ["SPARK_HOME"]
 
-class buff:
+class StreamOutput:
     """
-    Buffer for store the output from stream
+    a class to store the output from stream
     """
-    result = None
+    result = list()
 
 class PySparkStreamingTestCase(unittest.TestCase):
     def setUp(self):
-        print "set up"
         class_name = self.__class__.__name__
         self.ssc = StreamingContext(appName=class_name, duration=Seconds(1))
 
     def tearDown(self):
-        print "tear donw"
-        self.ssc.stop()
-        time.sleep(10)
+        # Do not call StreamingContext.stop directly because we do not wait to shutdown
+        # call back server and py4j client
+        self.ssc._jssc.stop()
+        self.ssc._sc.stop()
+        # Why does it long time to terminaete StremaingContext and SparkContext?
+        # Should we change the sleep time if this depends on machine spec?
+        time.sleep(5)
+
+    @classmethod
+    def tearDownClass(cls):
+        time.sleep(5)
+        SparkContext._gateway._shutdown_callback_server()
 
 class TestBasicOperationsSuite(PySparkStreamingTestCase):
+    """
+    Input and output of this TestBasicOperationsSuite is the equivalent to 
+    Scala TestBasicOperationsSuite.
+    """
     def setUp(self):
         PySparkStreamingTestCase.setUp(self)
-        buff.result = None
+        StreamOutput.result = list()
         self.timeout = 10 # seconds
 
     def tearDown(self):
         PySparkStreamingTestCase.tearDown(self)
 
+    @classmethod
+    def tearDownClass(cls):
+        PySparkStreamingTestCase.tearDownClass()
+
     def test_map(self):
+        """Basic operation test for DStream.map"""
         test_input = [range(1,5), range(5,9), range(9, 13)]
         def test_func(dstream):
             return dstream.map(lambda x: str(x))
-        expected = map(str, test_input)
-        output = self.run_stream(test_input, test_func)
-        self.assertEqual(output, expected)
+        expected_output = map(lambda x: map(lambda y: str(y), x), test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
 
     def test_flatMap(self):
+        """Basic operation test for DStream.faltMap"""
         test_input = [range(1,5), range(5,9), range(9, 13)]
         def test_func(dstream):
             return dstream.flatMap(lambda x: (x, x * 2))
-        # Maybe there be good way to create flatmap
-        excepted = map(lambda x: list(chain.from_iterable((map(lambda y:[y, y*2], x)))), 
+        expected_output = map(lambda x: list(chain.from_iterable((map(lambda y: [y, y * 2], x)))), 
                        test_input)
-        output = self.run_stream(test_input, test_func)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_filter(self):
+        """Basic operation test for DStream.filter"""
+        test_input = [range(1,5), range(5,9), range(9, 13)]
+        def test_func(dstream):
+            return dstream.filter(lambda x: x % 2 == 0)
+        expected_output = map(lambda x: filter(lambda y: y % 2 == 0, x), test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_count(self):
+        """Basic operation test for DStream.count"""
+        test_input = [[], [1], range(1, 3), range(1,4), range(1,5)]
+        def test_func(dstream):
+            return dstream.count()
+        expected_output = map(lambda x: [len(x)], test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+        
+    def test_reduce(self):
+        """Basic operation test for DStream.reduce"""
+        test_input = [range(1,5), range(5,9), range(9, 13)]
+        def test_func(dstream):
+            return dstream.reduce(operator.add)
+        expected_output = map(lambda x: [reduce(operator.add, x)], test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_reduceByKey(self):
+        """Basic operation test for DStream.reduceByKey"""
+        test_input = [["a", "a", "b"], ["", ""], []]
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
+        expected_output = [[("a", 2), ("b", 1)],[("", 2)], []]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
 
-    def run_stream(self, test_input, test_func):
+    def _run_stream(self, test_input, test_func, expected_output):
+        """Start stream and return the output"""
         # Generate input stream with user-defined input
         test_input_stream = self.ssc._testInputStream(test_input)
         # Applyed test function to stream
         test_stream = test_func(test_input_stream)
         # Add job to get outpuf from stream
-        test_stream._test_output(buff)
+        test_stream._test_output(StreamOutput.result)
         self.ssc.start()
 
         start_time = time.time()
+        # loop until get the result from stream
         while True:
             current_time = time.time()
             # check time out
             if (current_time - start_time) > self.timeout:
-                self.ssc.stop()
                 break
             self.ssc.awaitTermination(50)
-            if buff.result is not None:
+            if len(expected_output) == len(StreamOutput.result):
                 break
-        return buff.result
+        return StreamOutput.result
 
 if __name__ == "__main__":
     unittest.main()
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 94c644fa81d45..21809d8d3b97a 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -56,8 +56,6 @@ class PythonDStream[T: ClassTag](
   override def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
     parent.getOrCompute(validTime) match{
       case Some(rdd) =>
-        logInfo("RDD ID in python DStream     ===========")
-        logInfo("RDD id " + rdd.id)
         val pythonRDD = new PythonRDD(rdd, command, envVars, pythonIncludes, preservePartitoning, pythonExec, broadcastVars, accumulator)
         Some(pythonRDD.asJavaRDD.rdd)
       case None => None
@@ -140,7 +138,7 @@ class PythonTransformedDStream(
  * replayable, reliable message queue like Kafka. It requires a sequence as input, and
  * returns the i_th element at the i_th batch under manual clock.
  */
-class PythonTestInputStream(ssc_ : JavaStreamingContext, filename: String, numPartitions: Int)
+class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[String], numPartitions: Int)
   extends InputDStream[Array[Byte]](JavaStreamingContext.toStreamingContext(ssc_)){
 
   def start() {}
@@ -149,8 +147,27 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, filename: String, numPa
 
   def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
     logInfo("Computing RDD for time " + validTime)
-    val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), filename, numPartitions).rdd
-    logInfo("Created RDD " + rdd.id + " with " + filename)
+    inputFiles.foreach(logInfo(_))
+    // make a temporary file
+    // make empty RDD
+    val prefix = "spark"
+    val suffix = ".tmp"
+    val tempFile = File.createTempFile(prefix, suffix)
+    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
+    logInfo("Index: " + index)
+
+    val selectedInputFile: String = {
+      if (inputFiles.isEmpty){
+        tempFile.getAbsolutePath
+      }else if (index < inputFiles.size()) {
+        inputFiles.get(index)
+      } else {
+        tempFile.getAbsolutePath
+      }
+    }
+
+    val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), selectedInputFile, numPartitions).rdd
+    logInfo("Created RDD " + rdd.id + " with " + selectedInputFile)
     Some(rdd)
   }
 

From db0a30355e9e861bd775dee48daa292ff4139c68 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 03:22:23 -0700
Subject: [PATCH 51/69] delete waste file

---
 .../main/python/streaming/test_oprations.py   | 31 -------------------
 1 file changed, 31 deletions(-)
 delete mode 100644 examples/src/main/python/streaming/test_oprations.py

diff --git a/examples/src/main/python/streaming/test_oprations.py b/examples/src/main/python/streaming/test_oprations.py
deleted file mode 100644
index 70a62058286e9..0000000000000
--- a/examples/src/main/python/streaming/test_oprations.py
+++ /dev/null
@@ -1,31 +0,0 @@
-import sys
-from operator import add
-
-from pyspark.conf import SparkConf
-from pyspark.streaming.context import StreamingContext
-from pyspark.streaming.duration import *
-
-if __name__ == "__main__":
-    conf = SparkConf()
-    conf.setAppName("PythonStreamingNetworkWordCount")
-    ssc = StreamingContext(conf=conf, duration=Seconds(1))
-    class Buff:
-        result = list()
-        pass
-    Buff.result = list()
-
-    test_input = ssc._testInputStream([range(1,4), range(4,7), range(7,10)])
-   
-    fm_test = test_input.map(lambda x: (x, 1))
-    fm_test.pyprint()
-    fm_test._test_output(Buff.result)
-
-    ssc.start()
-    while True:
-        ssc.awaitTermination(50)
-        if len(Buff.result) == 3:
-            break
-
-    ssc.stop()
-    print Buff.result
-

From 3334169e73141abfe1cb486d76fc983be7b1df92 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 03:41:24 -0700
Subject: [PATCH 52/69] fixed PEP-008 violation

---
 python/pyspark/streaming/context.py |  5 ----
 python/pyspark/streaming/dstream.py | 19 +++++++++------
 python/pyspark/streaming_tests.py   | 37 +++++++++++++++--------------
 3 files changed, 31 insertions(+), 30 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index be142fd4f327b..088a4965b6b13 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -19,12 +19,7 @@
 from signal import signal, SIGTERM, SIGINT
 from tempfile import NamedTemporaryFile
 
-from pyspark.conf import SparkConf
-from pyspark.files import SparkFiles
-from pyspark.java_gateway import launch_gateway
 from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
-from pyspark.storagelevel import *
-from pyspark.rdd import RDD
 from pyspark.context import SparkContext
 from pyspark.streaming.dstream import DStream
 
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 0f0a1847535ce..746f323628c1c 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -49,7 +49,7 @@ def _sum(self):
 
     def print_(self, label=None):
         """
-        Since print is reserved name for python, we cannot define a print method function.
+        Since print is reserved name for python, we cannot define a "print" method function.
         This function prints serialized data in RDD in DStream because Scala and Java cannot
         deserialized pickled python object. Please use DStream.pyprint() instead to print results.
 
@@ -159,8 +159,8 @@ def partitionBy(self, numPartitions, partitionFunc=None):
         # form the hash buckets in Python, transferring O(numPartitions) objects
         # to Java.  Each object is a (splitNumber, [objects]) pair.
         outputSerializer = self.ctx._unbatched_serializer
-        def add_shuffle_key(split, iterator):
 
+        def add_shuffle_key(split, iterator):
             buckets = defaultdict(list)
 
             for (k, v) in iterator:
@@ -205,6 +205,11 @@ def getNumPartitions(self):
 
     def foreachRDD(self, func):
         """
+        Apply userdefined function to all RDD in a DStream.
+        This python implementation could be expensive because it uses callback server
+        in order to apply function to RDD in DStream.
+        This is an output operator, so this DStream will be registered as an output
+        stream and there materialized.
         """
         from utils import RDDFunction
         wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)
@@ -214,7 +219,6 @@ def pyprint(self):
         """
         Print the first ten elements of each RDD generated in this DStream. This is an output
         operator, so this DStream will be registered as an output stream and there materialized.
-
         """
         def takeAndPrint(rdd, time):
             taken = rdd.take(11)
@@ -235,14 +239,15 @@ def takeAndPrint(rdd, time):
     #    jdstream = self.ctx._jvm.PythonTransformedDStream(self._jdstream.dstream(), wrapped_func).toJavaDStream
     #    return DStream(jdstream, self._ssc, ...)  ## DO NOT KNOW HOW
 
-    def _test_output(self, buff):
+    def _test_output(self, result):
         """
-        This function is only for testcase.
-        Store data in dstream to buffer to valify the result in tesecase
+        This function is only for test case.
+        Store data in a DStream to result to verify the result in tese case
         """
         def get_output(rdd, time):
             taken = rdd.collect()
-            buff.append(taken)
+            result.append(taken)
+
         self.foreachRDD(get_output)
 
 
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index d2e638a7d2acc..ef9b87756fcef 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -23,18 +23,10 @@
 to focusing to streaming test case
 
 """
-from fileinput import input
-from glob import glob
 from itertools import chain
 import os
-import re
-import shutil
-import subprocess
-import sys
-import tempfile
 import time
 import unittest
-import zipfile
 import operator
 
 from pyspark.context import SparkContext
@@ -44,12 +36,14 @@
 
 SPARK_HOME = os.environ["SPARK_HOME"]
 
+
 class StreamOutput:
     """
     a class to store the output from stream
     """
     result = list()
 
+
 class PySparkStreamingTestCase(unittest.TestCase):
     def setUp(self):
         class_name = self.__class__.__name__
@@ -69,6 +63,7 @@ def tearDownClass(cls):
         time.sleep(5)
         SparkContext._gateway._shutdown_callback_server()
 
+
 class TestBasicOperationsSuite(PySparkStreamingTestCase):
     """
     Input and output of this TestBasicOperationsSuite is the equivalent to 
@@ -77,7 +72,7 @@ class TestBasicOperationsSuite(PySparkStreamingTestCase):
     def setUp(self):
         PySparkStreamingTestCase.setUp(self)
         StreamOutput.result = list()
-        self.timeout = 10 # seconds
+        self.timeout = 10  # seconds
 
     def tearDown(self):
         PySparkStreamingTestCase.tearDown(self)
@@ -88,7 +83,8 @@ def tearDownClass(cls):
 
     def test_map(self):
         """Basic operation test for DStream.map"""
-        test_input = [range(1,5), range(5,9), range(9, 13)]
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+
         def test_func(dstream):
             return dstream.map(lambda x: str(x))
         expected_output = map(lambda x: map(lambda y: str(y), x), test_input)
@@ -97,17 +93,19 @@ def test_func(dstream):
 
     def test_flatMap(self):
         """Basic operation test for DStream.faltMap"""
-        test_input = [range(1,5), range(5,9), range(9, 13)]
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+
         def test_func(dstream):
             return dstream.flatMap(lambda x: (x, x * 2))
         expected_output = map(lambda x: list(chain.from_iterable((map(lambda y: [y, y * 2], x)))), 
-                       test_input)
+                              test_input)
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
     def test_filter(self):
         """Basic operation test for DStream.filter"""
-        test_input = [range(1,5), range(5,9), range(9, 13)]
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+
         def test_func(dstream):
             return dstream.filter(lambda x: x % 2 == 0)
         expected_output = map(lambda x: filter(lambda y: y % 2 == 0, x), test_input)
@@ -116,7 +114,8 @@ def test_func(dstream):
 
     def test_count(self):
         """Basic operation test for DStream.count"""
-        test_input = [[], [1], range(1, 3), range(1,4), range(1,5)]
+        test_input = [[], [1], range(1, 3), range(1, 4), range(1, 5)]
+
         def test_func(dstream):
             return dstream.count()
         expected_output = map(lambda x: [len(x)], test_input)
@@ -125,7 +124,8 @@ def test_func(dstream):
         
     def test_reduce(self):
         """Basic operation test for DStream.reduce"""
-        test_input = [range(1,5), range(5,9), range(9, 13)]
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+
         def test_func(dstream):
             return dstream.reduce(operator.add)
         expected_output = map(lambda x: [reduce(operator.add, x)], test_input)
@@ -135,9 +135,10 @@ def test_func(dstream):
     def test_reduceByKey(self):
         """Basic operation test for DStream.reduceByKey"""
         test_input = [["a", "a", "b"], ["", ""], []]
+
         def test_func(dstream):
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
-        expected_output = [[("a", 2), ("b", 1)],[("", 2)], []]
+        expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
@@ -145,9 +146,9 @@ def _run_stream(self, test_input, test_func, expected_output):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
         test_input_stream = self.ssc._testInputStream(test_input)
-        # Applyed test function to stream
+        # Applied test function to stream
         test_stream = test_func(test_input_stream)
-        # Add job to get outpuf from stream
+        # Add job to get output from stream
         test_stream._test_output(StreamOutput.result)
         self.ssc.start()
 

From e8c7bfc556da45d33f9ffecf8c6b802fe7a7e49c Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 04:31:59 -0700
Subject: [PATCH 53/69] remove export PYSPARK_PYTHON in spark submit

---
 bin/spark-submit | 16 ----------------
 1 file changed, 16 deletions(-)

diff --git a/bin/spark-submit b/bin/spark-submit
index a297714c67da0..9e7cecedd0325 100755
--- a/bin/spark-submit
+++ b/bin/spark-submit
@@ -37,22 +37,6 @@ done
 
 DEPLOY_MODE=${DEPLOY_MODE:-"client"}
 
-
-# This is a hack to make DStream.pyprint work. 
-# This will be removed after pyprint is moved to PythonDStream.
-# Problem is that print function is in (Scala)DStream. 
-# Whenever python code is executed, we call PythonDStream which passes
-# pythonExec(which python Spark should execute). pythonExec is used to call python.
-# Since pyprint is located in DStream, Spark does not know which python should use. 
-# In that case, get python path from PYSPARK_PYTHON, environmental variable. 
-
-# Figure out which Python executable to use
-if [[ -z "$PYSPARK_PYTHON" ]]; then
-  PYSPARK_PYTHON="python"
-fi
-export PYSPARK_PYTHON
-
-
 if [ -n "$DRIVER_MEMORY" ] && [ $DEPLOY_MODE == "client" ]; then
   export SPARK_DRIVER_MEMORY=$DRIVER_MEMORY
 fi

From bdde697368cee7c06fcbcf4f2102fedf3a58536f Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 04:42:08 -0700
Subject: [PATCH 54/69] removed unnecessary changes

---
 .../org/apache/spark/streaming/dstream/DStream.scala      | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index bafff80adc54b..46ef05d9c37a1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -17,14 +17,11 @@
 
 package org.apache.spark.streaming.dstream
 
-
-import java.io._
+import java.io.{IOException, ObjectInputStream, ObjectOutputStream}
 
 import scala.deprecated
 import scala.collection.mutable.HashMap
 import scala.reflect.ClassTag
-import java.io.{IOException, ObjectInputStream, ObjectOutputStream}
-import scala.util.control.Breaks._
 
 import org.apache.spark.{Logging, SparkException}
 import org.apache.spark.rdd.{BlockRDD, RDD}
@@ -34,7 +31,6 @@ import org.apache.spark.streaming.StreamingContext._
 import org.apache.spark.streaming.scheduler.Job
 import org.apache.spark.util.MetadataCleaner
 import org.apache.spark.streaming.Duration
-import org.apache.spark.api.python.PythonRDD
 
 /**
  * A Discretized Stream (DStream), the basic abstraction in Spark Streaming, is a continuous
@@ -562,11 +558,9 @@ abstract class DStream[T: ClassTag] (
     // DStreams can't be serialized with closures, we can't proactively check 
     // it for serializability and so we pass the optional false to SparkContext.clean
 
-    // serialized python
     val cleanedF = context.sparkContext.clean(transformFunc, false)
     val realTransformFunc =  (rdds: Seq[RDD[_]], time: Time) => {
       assert(rdds.length == 1)
-      // if transformfunc is fine, it is okay
       cleanedF(rdds.head.asInstanceOf[RDD[T]], time)
     }
     new TransformedDStream[U](Seq(this), realTransformFunc)

From a65f3021fc8aa5f82889a18a728eed3c901996d0 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 05:32:28 -0700
Subject: [PATCH 55/69] edited the comment to add more precise description

---
 python/pyspark/streaming_tests.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index ef9b87756fcef..ec45acec94dbf 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -50,8 +50,8 @@ def setUp(self):
         self.ssc = StreamingContext(appName=class_name, duration=Seconds(1))
 
     def tearDown(self):
-        # Do not call StreamingContext.stop directly because we do not wait to shutdown
-        # call back server and py4j client
+        # Do not call pyspark.streaming.context.StreamingContext.stop directly because
+        # we do not wait to shutdowncall back server and py4j client
         self.ssc._jssc.stop()
         self.ssc._sc.stop()
         # Why does it long time to terminaete StremaingContext and SparkContext?
@@ -146,7 +146,7 @@ def _run_stream(self, test_input, test_func, expected_output):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
         test_input_stream = self.ssc._testInputStream(test_input)
-        # Applied test function to stream
+        # Apply test function to stream
         test_stream = test_func(test_input_stream)
         # Add job to get output from stream
         test_stream._test_output(StreamOutput.result)
@@ -160,6 +160,7 @@ def _run_stream(self, test_input, test_func, expected_output):
             if (current_time - start_time) > self.timeout:
                 break
             self.ssc.awaitTermination(50)
+            # check if the output is the same length of expexted output
             if len(expected_output) == len(StreamOutput.result):
                 break
         return StreamOutput.result

From 90a6484066ec2c157db6650d470e0b66cf42b342 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 11 Aug 2014 16:34:12 -0700
Subject: [PATCH 56/69] added mapValues and flatMapValues; WIP for glom and
 mapPartitions test

---
 python/pyspark/streaming/context.py |  2 +
 python/pyspark/streaming/dstream.py | 69 ++++++++++++++++++++++-------
 python/pyspark/streaming_tests.py   | 48 +++++++++++++++++++-
 3 files changed, 101 insertions(+), 18 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 088a4965b6b13..eee298badcbad 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -140,6 +140,8 @@ def _testInputStream(self, test_inputs, numSlices=None):
         """
         Generate multiple files to make "stream" in Scala side for test.
         Scala chooses one of the files and generates RDD using PythonRDD.readRDDFromFile.
+
+        QueStream maybe good way to implement this function
         """
         numSlices = numSlices or self._sc.defaultParallelism
         # Calling the Java parallelize() method with an ArrayList is too slow,
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 746f323628c1c..5a6cf57ef1d9f 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -35,25 +35,31 @@ def __init__(self, jdstream, ssc, jrdd_deserializer):
         self.ctx = ssc._sc
         self._jrdd_deserializer = jrdd_deserializer
 
+    def context(self):
+        """
+        Return the StreamingContext associated with this DStream
+        """
+        return self._ssc
+
     def count(self):
         """
         Return a new DStream which contains the number of elements in this DStream.
         """
-        return self._mapPartitions(lambda i: [sum(1 for _ in i)])._sum()
+        return self.mapPartitions(lambda i: [sum(1 for _ in i)])._sum()
 
     def _sum(self):
         """
         Add up the elements in this DStream.
         """
-        return self._mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
+        return self.mapPartitions(lambda x: [sum(x)]).reduce(operator.add)
 
     def print_(self, label=None):
         """
         Since print is reserved name for python, we cannot define a "print" method function.
         This function prints serialized data in RDD in DStream because Scala and Java cannot
-        deserialized pickled python object. Please use DStream.pyprint() instead to print results.
+        deserialized pickled python object. Please use DStream.pyprint() to print results.
 
-        Call DStream.print().
+        Call DStream.print() and this function will print byte array in the DStream
         """
         # a hack to call print function in DStream
         getattr(self._jdstream, "print")(label)
@@ -63,29 +69,32 @@ def filter(self, f):
         Return a new DStream containing only the elements that satisfy predicate.
         """
         def func(iterator): return ifilter(f, iterator)
-        return self._mapPartitions(func)
+        return self.mapPartitions(func)
 
     def flatMap(self, f, preservesPartitioning=False):
         """
         Pass each value in the key-value pair DStream through flatMap function
         without changing the keys: this also retains the original RDD's partition.
         """
-        def func(s, iterator): return chain.from_iterable(imap(f, iterator))
+        def func(s, iterator):
+            return chain.from_iterable(imap(f, iterator))
         return self._mapPartitionsWithIndex(func, preservesPartitioning)
 
-    def map(self, f):
+    def map(self, f, preservesPartitioning=False):
         """
         Return a new DStream by applying a function to each element of DStream.
         """
-        def func(iterator): return imap(f, iterator)
-        return self._mapPartitions(func)
+        def func(iterator):
+            return imap(f, iterator)
+        return self.mapPartitions(func, preservesPartitioning)
 
-    def _mapPartitions(self, f):
+    def mapPartitions(self, f, preservesPartitioning=False):
         """
         Return a new DStream by applying a function to each partition of this DStream.
         """
-        def func(s, iterator): return f(iterator)
-        return self._mapPartitionsWithIndex(func)
+        def func(s, iterator):
+            return f(iterator)
+        return self._mapPartitionsWithIndex(func, preservesPartitioning)
 
     def _mapPartitionsWithIndex(self, f, preservesPartitioning=False):
         """
@@ -131,7 +140,7 @@ def combineLocally(iterator):
                 else:
                     combiners[k] = mergeValue(combiners[k], v)
             return combiners.iteritems()
-        locally_combined = self._mapPartitions(combineLocally)
+        locally_combined = self.mapPartitions(combineLocally)
         shuffled = locally_combined.partitionBy(numPartitions)
 
         def _mergeCombiners(iterator):
@@ -143,7 +152,7 @@ def _mergeCombiners(iterator):
                     combiners[k] = mergeCombiners(combiners[k], v)
             return combiners.iteritems()
 
-        return shuffled._mapPartitions(_mergeCombiners)
+        return shuffled.mapPartitions(_mergeCombiners)
 
     def partitionBy(self, numPartitions, partitionFunc=None):
         """
@@ -233,6 +242,34 @@ def takeAndPrint(rdd, time):
 
         self.foreachRDD(takeAndPrint)
 
+    def mapValues(self, f):
+        """
+        Pass each value in the key-value pair RDD through a map function
+        without changing the keys; this also retains the original RDD's
+        partitioning.
+        """
+        map_values_fn = lambda (k, v): (k, f(v))
+        return self.map(map_values_fn, preservesPartitioning=True)
+
+    def flatMapValues(self, f):
+        """
+        Pass each value in the key-value pair RDD through a flatMap function
+        without changing the keys; this also retains the original RDD's
+        partitioning.
+        """
+        flat_map_fn = lambda (k, v): ((k, x) for x in f(v))
+        return self.flatMap(flat_map_fn, preservesPartitioning=True)
+
+    def glom(self):
+        """
+        Return a new DStream in which RDD is generated by applying glom() to RDD of
+        this DStream. Applying glom() to an RDD coalesces all elements within each partition into
+        an list.
+        """
+        def func(iterator):
+            yield list(iterator)
+        return self.mapPartitions(func)
+
     #def transform(self, func): - TD
     #    from utils import RDDFunction
     #    wrapped_func = RDDFunction(self.ctx, self._jrdd_deserializer, func)
@@ -242,7 +279,7 @@ def takeAndPrint(rdd, time):
     def _test_output(self, result):
         """
         This function is only for test case.
-        Store data in a DStream to result to verify the result in tese case
+        Store data in a DStream to result to verify the result in test case
         """
         def get_output(rdd, time):
             taken = rdd.collect()
@@ -305,4 +342,4 @@ def _jdstream(self):
         return self._jdstream_val
 
     def _is_pipelinable(self):
-        return not (self.is_cached)
+        return not self.is_cached
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index ec45acec94dbf..25ea350ca425f 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -142,10 +142,54 @@ def test_func(dstream):
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def _run_stream(self, test_input, test_func, expected_output):
+    def test_mapValues(self):
+        """Basic operation test for DStream.mapValues"""
+        test_input = [["a", "a", "b"], ["", ""], []]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).mapValues(lambda x: x + 10)
+        expected_output = [[("a", 12), ("b", 11)], [("", 12)], []]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_flatMapValues(self):
+        """Basic operation test for DStream.flatMapValues"""
+        test_input = [["a", "a", "b"], ["", ""], []]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).flatMapValues(lambda x: (x, x + 10))
+        expected_output = [[("a", 2), ("a", 12), ("b", 1), ("b", 11)], [("", 2), ("", 12)], []]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_glom(self):
+        """Basic operation test for DStream.glom"""
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+        numSlices = 2
+
+        def test_func(dstream):
+            dstream.pyprint()
+            return dstream.glom()
+        expected_output = [[[1,2], [3,4]],[[5,6], [7,8]],[[9,10], [11,12]]]
+        output = self._run_stream(test_input, test_func, expected_output, numSlices)
+        self.assertEqual(expected_output, output)
+
+    def test_mapPartitions(self):
+        """Basic operation test for DStream.mapPartitions"""
+        test_input = [range(1, 5), range(5, 9), range(9, 13)]
+        numSlices = 2
+
+        def test_func(dstream):
+            dstream.pyprint()
+            return dstream.mapPartitions(lambda x: reduce(operator.add, x))
+        expected_output = [[3, 7],[11, 15],[19, 23]]
+        output = self._run_stream(test_input, test_func, expected_output, numSlices)
+        self.assertEqual(expected_output, output)
+
+    def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
-        test_input_stream = self.ssc._testInputStream(test_input)
+        test_input_stream = self.ssc._testInputStream(test_input, numSlices)
         # Apply test function to stream
         test_stream = test_func(test_input_stream)
         # Add job to get output from stream

From 0704b86a9963c1d62b1934ce2fb47094b3fb03d3 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Wed, 13 Aug 2014 21:04:26 -0700
Subject: [PATCH 57/69] WIP: solved partitioned and None is not recognized

---
 python/pyspark/streaming/context.py           | 20 ++++++++++-
 python/pyspark/streaming/dstream.py           | 16 +++++++++
 python/pyspark/streaming_tests.py             | 23 ++++++------
 .../streaming/api/python/PythonDStream.scala  | 35 ++++++++++++++++++-
 4 files changed, 82 insertions(+), 12 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index eee298badcbad..32b52f74e16f0 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -154,7 +154,7 @@ def _testInputStream(self, test_inputs, numSlices=None):
 
             # Make sure we distribute data evenly if it's smaller than self.batchSize
             if "__len__" not in dir(test_input):
-                c = list(test_input)    # Make it a list so we can compute its length
+                test_input = list(test_input)    # Make it a list so we can compute its length
             batchSize = min(len(test_input) // numSlices, self._sc._batchSize)
             if batchSize > 1:
                 serializer = BatchedSerializer(self._sc._unbatched_serializer,
@@ -162,6 +162,7 @@ def _testInputStream(self, test_inputs, numSlices=None):
             else:
                 serializer = self._sc._unbatched_serializer
             serializer.dump_stream(test_input, tempFile)
+            tempFile.close()
             tempFiles.append(tempFile.name)
 
         jtempFiles = ListConverter().convert(tempFiles, SparkContext._gateway._gateway_client)
@@ -169,3 +170,20 @@ def _testInputStream(self, test_inputs, numSlices=None):
                                                         jtempFiles,
                                                         numSlices).asJavaDStream()
         return DStream(jinput_stream, self, PickleSerializer())
+
+    
+    def _testInputStream2(self, test_inputs, numSlices=None):
+        """
+        This is inpired by QueStream implementation. Give list of RDD and generate DStream
+        which contain the RDD.
+        """
+        test_rdds = list()
+        for test_input in test_inputs:
+            test_rdd = self._sc.parallelize(test_input, numSlices)
+            print test_rdd.glom().collect()
+            test_rdds.append(test_rdd._jrdd)
+
+        jtest_rdds = ListConverter().convert(test_rdds, SparkContext._gateway._gateway_client)
+        jinput_stream = self._jvm.PythonTestInputStream2(self._jssc, jtest_rdds).asJavaDStream()
+
+        return DStream(jinput_stream, self, BatchedSerializer(PickleSerializer()))
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 5a6cf57ef1d9f..101bfdbca0102 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -233,6 +233,8 @@ def takeAndPrint(rdd, time):
             taken = rdd.take(11)
             print "-------------------------------------------"
             print "Time: %s" % (str(time))
+            print rdd.glom().collect()
+            print "-------------------------------------------"
             print "-------------------------------------------"
             for record in taken[:10]:
                 print record
@@ -288,6 +290,20 @@ def get_output(rdd, time):
         self.foreachRDD(get_output)
 
 
+# TODO: implement groupByKey
+# TODO: impelment union
+# TODO: implement cache
+# TODO: implement persist
+# TODO: implement repertitions
+# TODO: implement saveAsTextFile
+# TODO: implement cogroup
+# TODO: implement join
+# TODO: implement countByValue
+# TODO: implement leftOuterJoin
+# TODO: implemtnt rightOuterJoin
+
+
+
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
         if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 25ea350ca425f..e346bc227fe46 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -71,8 +71,9 @@ class TestBasicOperationsSuite(PySparkStreamingTestCase):
     """
     def setUp(self):
         PySparkStreamingTestCase.setUp(self)
-        StreamOutput.result = list()
         self.timeout = 10  # seconds
+        self.numInputPartitions = 2
+        self.result = list()
 
     def tearDown(self):
         PySparkStreamingTestCase.tearDown(self)
@@ -137,6 +138,8 @@ def test_reduceByKey(self):
         test_input = [["a", "a", "b"], ["", ""], []]
 
         def test_func(dstream):
+            print "reduceByKey"
+            dstream.map(lambda x: (x, 1)).pyprint()
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
         expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
         output = self._run_stream(test_input, test_func, expected_output)
@@ -168,9 +171,8 @@ def test_glom(self):
         numSlices = 2
 
         def test_func(dstream):
-            dstream.pyprint()
             return dstream.glom()
-        expected_output = [[[1,2], [3,4]],[[5,6], [7,8]],[[9,10], [11,12]]]
+        expected_output = [[[1,2], [3,4]], [[5,6], [7,8]], [[9,10], [11,12]]]
         output = self._run_stream(test_input, test_func, expected_output, numSlices)
         self.assertEqual(expected_output, output)
 
@@ -180,20 +182,21 @@ def test_mapPartitions(self):
         numSlices = 2
 
         def test_func(dstream):
-            dstream.pyprint()
-            return dstream.mapPartitions(lambda x: reduce(operator.add, x))
-        expected_output = [[3, 7],[11, 15],[19, 23]]
+            def f(iterator): yield sum(iterator)
+            return dstream.mapPartitions(f)
+        expected_output = [[3, 7], [11, 15], [19, 23]]
         output = self._run_stream(test_input, test_func, expected_output, numSlices)
         self.assertEqual(expected_output, output)
 
     def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
-        test_input_stream = self.ssc._testInputStream(test_input, numSlices)
+        numSlices = numSlices or self.numInputPartitions
+        test_input_stream = self.ssc._testInputStream2(test_input, numSlices)
         # Apply test function to stream
         test_stream = test_func(test_input_stream)
         # Add job to get output from stream
-        test_stream._test_output(StreamOutput.result)
+        test_stream._test_output(self.result)
         self.ssc.start()
 
         start_time = time.time()
@@ -205,9 +208,9 @@ def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
                 break
             self.ssc.awaitTermination(50)
             # check if the output is the same length of expexted output
-            if len(expected_output) == len(StreamOutput.result):
+            if len(expected_output) == len(self.result):
                 break
-        return StreamOutput.result
+        return self.result
 
 if __name__ == "__main__":
     unittest.main()
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 21809d8d3b97a..20e0b0d177d0f 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -165,7 +165,7 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[
         tempFile.getAbsolutePath
       }
     }
-
+    println("PythonTestInputStreaming numPartitons" + numPartitions )
     val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), selectedInputFile, numPartitions).rdd
     logInfo("Created RDD " + rdd.id + " with " + selectedInputFile)
     Some(rdd)
@@ -173,3 +173,36 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
+
+/**
+ * This is a input stream just for the unitest. This is equivalent to a checkpointable,
+ * replayable, reliable message queue like Kafka. It requires a sequence as input, and
+ * returns the i_th element at the i_th batch under manual clock.
+ * This implementation is close to QueStream
+ */
+
+class PythonTestInputStream2(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[JavaRDD[Array[Byte]]])
+  extends InputDStream[Array[Byte]](JavaStreamingContext.toStreamingContext(ssc_)) {
+
+  def start() {}
+
+  def stop() {}
+
+  def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
+    val emptyRDD = ssc.sparkContext.emptyRDD[Array[Byte]]
+    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
+    val selectedRDD = {
+      if (inputRDDs.isEmpty) {
+        emptyRDD
+      } else if (index < inputRDDs.size()) {
+        inputRDDs.get(index).rdd
+      } else {
+        emptyRDD
+      }
+    }
+
+    Some(selectedRDD)
+  }
+
+  val asJavaDStream  = JavaDStream.fromDStream(this)
+}
\ No newline at end of file

From 080541a6d77cb85f788c297670cca24fbbc9f9b5 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Thu, 14 Aug 2014 02:19:46 -0700
Subject: [PATCH 58/69] broke something

---
 python/pyspark/rdd.py                         |  3 ++-
 python/pyspark/streaming/context.py           | 10 ++++++----
 python/pyspark/streaming/dstream.py           | 20 +++++++++++++++++++
 python/pyspark/streaming_tests.py             |  2 ++
 python/pyspark/worker.py                      | 11 ++++++++++
 .../streaming/api/python/PythonDStream.scala  |  1 -
 6 files changed, 41 insertions(+), 6 deletions(-)

diff --git a/python/pyspark/rdd.py b/python/pyspark/rdd.py
index f64f48e3a4c9c..942382b40d28f 100644
--- a/python/pyspark/rdd.py
+++ b/python/pyspark/rdd.py
@@ -283,7 +283,8 @@ def mapPartitions(self, f, preservesPartitioning=False):
         >>> rdd.mapPartitions(f).collect()
         [3, 7]
         """
-        def func(s, iterator): return f(iterator)
+        def func(s, iterator): 
+            return f(iterator)
         return self.mapPartitionsWithIndex(func)
 
     def mapPartitionsWithIndex(self, f, preservesPartitioning=False):
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 32b52f74e16f0..809158aedbc96 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -169,8 +169,7 @@ def _testInputStream(self, test_inputs, numSlices=None):
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc,
                                                         jtempFiles,
                                                         numSlices).asJavaDStream()
-        return DStream(jinput_stream, self, PickleSerializer())
-
+        return DStream(jinput_stream, self, BatchedSerializer(PickleSerializer()))
     
     def _testInputStream2(self, test_inputs, numSlices=None):
         """
@@ -178,12 +177,15 @@ def _testInputStream2(self, test_inputs, numSlices=None):
         which contain the RDD.
         """
         test_rdds = list()
+        test_rdd_deserializers = list()
         for test_input in test_inputs:
             test_rdd = self._sc.parallelize(test_input, numSlices)
-            print test_rdd.glom().collect()
             test_rdds.append(test_rdd._jrdd)
+            test_rdd_deserializers.append(test_rdd._jrdd_deserializer)
 
         jtest_rdds = ListConverter().convert(test_rdds, SparkContext._gateway._gateway_client)
         jinput_stream = self._jvm.PythonTestInputStream2(self._jssc, jtest_rdds).asJavaDStream()
 
-        return DStream(jinput_stream, self, BatchedSerializer(PickleSerializer()))
+        dstream = DStream(jinput_stream, self, test_rdd_deserializers[0])
+        dstream._test_switch_dserializer(test_rdd_deserializers)
+        return dstream
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 101bfdbca0102..0a93a46d2b2a2 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -17,6 +17,7 @@
 
 from collections import defaultdict
 from itertools import chain, ifilter, imap
+import time
 import operator
 
 from pyspark.serializers import NoOpSerializer,\
@@ -289,6 +290,25 @@ def get_output(rdd, time):
 
         self.foreachRDD(get_output)
 
+    def _test_switch_dserializer(self, serializer_que):
+        """
+        Deserializer is dynamically changed based on numSlice and the number of
+        input. This function choose deserializer. Currently this is just FIFO.
+        """
+        
+        jrdd_deserializer = self._jrdd_deserializer
+
+        def switch(rdd, jtime):
+            try:
+                print serializer_que
+                jrdd_deserializer = serializer_que.pop(0)
+                print jrdd_deserializer
+            except Exception as e:
+                print e
+
+        self.foreachRDD(switch)
+
+
 
 # TODO: implement groupByKey
 # TODO: impelment union
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index e346bc227fe46..e23b86e8f040e 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -118,6 +118,8 @@ def test_count(self):
         test_input = [[], [1], range(1, 3), range(1, 4), range(1, 5)]
 
         def test_func(dstream):
+            print "count"
+            dstream.count().pyprint()
             return dstream.count()
         expected_output = map(lambda x: [len(x)], test_input)
         output = self._run_stream(test_input, test_func, expected_output)
diff --git a/python/pyspark/worker.py b/python/pyspark/worker.py
index 7ca3252270d5a..8ee2f0b3a260f 100644
--- a/python/pyspark/worker.py
+++ b/python/pyspark/worker.py
@@ -23,6 +23,7 @@
 import time
 import socket
 import traceback
+import itertools
 # CloudPickler needs to be imported so that depicklers are registered using the
 # copy_reg module.
 from pyspark.accumulators import _accumulatorRegistry
@@ -74,6 +75,16 @@ def main(infile, outfile):
         (func, deserializer, serializer) = command
         init_time = time.time()
         iterator = deserializer.load_stream(infile)
+        print "deserializer in worker: %s" % str(deserializer)
+        iterator, walk = itertools.tee(iterator)
+        if isinstance(walk, int):
+            print "this is int"
+            print walk
+        else:
+            try:
+                print list(walk)
+            except:
+                print list(walk)
         serializer.dump_stream(func(split_index, iterator), outfile)
     except Exception as e:
         # Write the error to stderr in addition to trying to pass it back to
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 20e0b0d177d0f..e8788d4579dea 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -165,7 +165,6 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[
         tempFile.getAbsolutePath
       }
     }
-    println("PythonTestInputStreaming numPartitons" + numPartitions )
     val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), selectedInputFile, numPartitions).rdd
     logInfo("Created RDD " + rdd.id + " with " + selectedInputFile)
     Some(rdd)

From 2112638167e258609551df6e6036f33e08ff82e3 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Thu, 14 Aug 2014 18:07:10 -0700
Subject: [PATCH 59/69] all tests pass if numSlice is 2 and the number of
 each input is over 4

---
 python/pyspark/streaming/context.py           |  5 +++-
 python/pyspark/streaming_tests.py             | 28 +++++++++----------
 .../streaming/api/python/PythonDStream.scala  | 18 ++++++++++++
 3 files changed, 36 insertions(+), 15 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 809158aedbc96..123fa67f837e3 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -187,5 +187,8 @@ def _testInputStream2(self, test_inputs, numSlices=None):
         jinput_stream = self._jvm.PythonTestInputStream2(self._jssc, jtest_rdds).asJavaDStream()
 
         dstream = DStream(jinput_stream, self, test_rdd_deserializers[0])
-        dstream._test_switch_dserializer(test_rdd_deserializers)
         return dstream
+
+    def _testInputStream3(self):
+        jinput_stream = self._jvm.PythonTestInputStream3(self._jssc).asJavaDStream()
+        return DStream(jinput_stream, self, UTF8Deserializer())
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index e23b86e8f040e..19cce3f185833 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -37,13 +37,6 @@
 SPARK_HOME = os.environ["SPARK_HOME"]
 
 
-class StreamOutput:
-    """
-    a class to store the output from stream
-    """
-    result = list()
-
-
 class PySparkStreamingTestCase(unittest.TestCase):
     def setUp(self):
         class_name = self.__class__.__name__
@@ -115,7 +108,8 @@ def test_func(dstream):
 
     def test_count(self):
         """Basic operation test for DStream.count"""
-        test_input = [[], [1], range(1, 3), range(1, 4), range(1, 5)]
+        #test_input = [[], [1], range(1, 3), range(1, 4), range(1, 5)]
+        test_input = [range(1, 5), range(1,10), range(1,20)]
 
         def test_func(dstream):
             print "count"
@@ -137,33 +131,39 @@ def test_func(dstream):
 
     def test_reduceByKey(self):
         """Basic operation test for DStream.reduceByKey"""
-        test_input = [["a", "a", "b"], ["", ""], []]
+        #test_input = [["a", "a", "b"], ["", ""], []]
+        test_input = [["a", "a", "b", "b"], ["", "", "", ""], []]
 
         def test_func(dstream):
             print "reduceByKey"
             dstream.map(lambda x: (x, 1)).pyprint()
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
-        expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
+        #expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
+        expected_output = [[("a", 2), ("b", 2)], [("", 4)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
     def test_mapValues(self):
         """Basic operation test for DStream.mapValues"""
-        test_input = [["a", "a", "b"], ["", ""], []]
+        #test_input = [["a", "a", "b"], ["", ""], []]
+        test_input = [["a", "a", "b", "b"], ["", "", "", ""], []]
 
         def test_func(dstream):
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).mapValues(lambda x: x + 10)
-        expected_output = [[("a", 12), ("b", 11)], [("", 12)], []]
+        #expected_output = [[("a", 12), ("b", 11)], [("", 12)], []]
+        expected_output = [[("a", 12), ("b", 12)], [("", 14)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
     def test_flatMapValues(self):
         """Basic operation test for DStream.flatMapValues"""
-        test_input = [["a", "a", "b"], ["", ""], []]
+        #test_input = [["a", "a", "b"], ["", ""], []]
+        test_input = [["a", "a", "b", "b"], ["", "", "",""], []]
 
         def test_func(dstream):
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).flatMapValues(lambda x: (x, x + 10))
-        expected_output = [[("a", 2), ("a", 12), ("b", 1), ("b", 11)], [("", 2), ("", 12)], []]
+        #expected_output = [[("a", 2), ("a", 12), ("b", 1), ("b", 11)], [("", 2), ("", 12)], []]
+        expected_output = [[("a", 2), ("a", 12), ("b", 2), ("b", 12)], [("", 4), ("", 14)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index e8788d4579dea..7e46516a8a050 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -204,4 +204,22 @@ class PythonTestInputStream2(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[
   }
 
   val asJavaDStream  = JavaDStream.fromDStream(this)
+}
+
+
+class PythonTestInputStream3(ssc_ : JavaStreamingContext)
+  extends InputDStream[Any](JavaStreamingContext.toStreamingContext(ssc_)) {
+
+  def start() {}
+
+  def stop() {}
+
+  def compute(validTime: Time): Option[RDD[Any]] = {
+    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
+    val selectedInput = ArrayBuffer(1, 2, 3).toSeq
+    val rdd :RDD[Any] = ssc.sc.makeRDD(selectedInput, 2)
+    Some(rdd)
+  }
+
+  val asJavaDStream = JavaDStream.fromDStream(this)
 }
\ No newline at end of file

From 536def42b9c8b0b81499e5e06d22b813f18d0bdd Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Thu, 14 Aug 2014 23:42:34 -0700
Subject: [PATCH 60/69] basic function test cases pass

---
 python/pyspark/streaming_tests.py             | 209 +++++++++++++-----
 python/pyspark/worker.py                      |  11 -
 .../streaming/api/python/PythonDStream.scala  |  58 +----
 3 files changed, 160 insertions(+), 118 deletions(-)

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 19cce3f185833..6d85a7faae859 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -24,7 +24,6 @@
 
 """
 from itertools import chain
-import os
 import time
 import unittest
 import operator
@@ -34,9 +33,6 @@
 from pyspark.streaming.duration import *
 
 
-SPARK_HOME = os.environ["SPARK_HOME"]
-
-
 class PySparkStreamingTestCase(unittest.TestCase):
     def setUp(self):
         class_name = self.__class__.__name__
@@ -49,7 +45,7 @@ def tearDown(self):
         self.ssc._sc.stop()
         # Why does it long time to terminaete StremaingContext and SparkContext?
         # Should we change the sleep time if this depends on machine spec?
-        time.sleep(5)
+        time.sleep(8)
 
     @classmethod
     def tearDownClass(cls):
@@ -59,8 +55,17 @@ def tearDownClass(cls):
 
 class TestBasicOperationsSuite(PySparkStreamingTestCase):
     """
-    Input and output of this TestBasicOperationsSuite is the equivalent to 
-    Scala TestBasicOperationsSuite.
+    2 tests for each function for batach deserializer and unbatch deserilizer because
+    we cannot change the deserializer after streaming process starts.
+    Default numInputPartitions is 2.
+    If the number of input element is over 3, that DStream use batach deserializer.
+    If not, that DStream use unbatch deserializer.
+
+    Most of the operation uses UTF8 deserializer to get value from Scala.
+    I am wondering if these test are enough or not.
+    All tests input should have list of lists. This represents stream.
+    Every batch interval, the first object of list are chosen to make DStream.
+    Please see the BasicTestSuits in Scala or QueStream which is close to this implementation.
     """
     def setUp(self):
         PySparkStreamingTestCase.setUp(self)
@@ -75,8 +80,8 @@ def tearDown(self):
     def tearDownClass(cls):
         PySparkStreamingTestCase.tearDownClass()
 
-    def test_map(self):
-        """Basic operation test for DStream.map"""
+    def test_map_batch(self):
+        """Basic operation test for DStream.map with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
 
         def test_func(dstream):
@@ -85,8 +90,18 @@ def test_func(dstream):
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_flatMap(self):
-        """Basic operation test for DStream.faltMap"""
+    def test_map_unbatach(self):
+        """Basic operation test for DStream.map with unbatch deserializer"""
+        test_input = [range(1, 4), range(4, 7), range(7, 10)]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: str(x))
+        expected_output = map(lambda x: map(lambda y: str(y), x), test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_flatMap_batch(self):
+        """Basic operation test for DStream.faltMap with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
 
         def test_func(dstream):
@@ -96,8 +111,19 @@ def test_func(dstream):
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_filter(self):
-        """Basic operation test for DStream.filter"""
+    def test_flatMap_unbatch(self):
+        """Basic operation test for DStream.faltMap with unbatch deserializer"""
+        test_input = [range(1, 4), range(4, 7), range(7, 10)]
+
+        def test_func(dstream):
+            return dstream.flatMap(lambda x: (x, x * 2))
+        expected_output = map(lambda x: list(chain.from_iterable((map(lambda y: [y, y * 2], x)))),
+                              test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_filter_batch(self):
+        """Basic operation test for DStream.filter with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
 
         def test_func(dstream):
@@ -106,21 +132,38 @@ def test_func(dstream):
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_count(self):
-        """Basic operation test for DStream.count"""
-        #test_input = [[], [1], range(1, 3), range(1, 4), range(1, 5)]
-        test_input = [range(1, 5), range(1,10), range(1,20)]
+    def test_filter_unbatch(self):
+        """Basic operation test for DStream.filter with unbatch deserializer"""
+        test_input = [range(1, 4), range(4, 7), range(7, 10)]
+
+        def test_func(dstream):
+            return dstream.filter(lambda x: x % 2 == 0)
+        expected_output = map(lambda x: filter(lambda y: y % 2 == 0, x), test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_count_batch(self):
+        """Basic operation test for DStream.count with batch deserializer"""
+        test_input = [range(1, 5), range(1, 10), range(1, 20)]
 
         def test_func(dstream):
-            print "count"
-            dstream.count().pyprint()
             return dstream.count()
         expected_output = map(lambda x: [len(x)], test_input)
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
-        
-    def test_reduce(self):
-        """Basic operation test for DStream.reduce"""
+
+    def test_count_unbatch(self):
+        """Basic operation test for DStream.count with unbatch deserializer"""
+        test_input = [[], [1], range(1, 3), range(1, 4)]
+
+        def test_func(dstream):
+            return dstream.count()
+        expected_output = map(lambda x: [len(x)], test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_reduce_batch(self):
+        """Basic operation test for DStream.reduce with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
 
         def test_func(dstream):
@@ -129,67 +172,132 @@ def test_func(dstream):
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_reduceByKey(self):
-        """Basic operation test for DStream.reduceByKey"""
-        #test_input = [["a", "a", "b"], ["", ""], []]
-        test_input = [["a", "a", "b", "b"], ["", "", "", ""], []]
+    def test_reduce_unbatch(self):
+        """Basic operation test for DStream.reduce with unbatch deserializer"""
+        test_input = [[1], range(1, 3), range(1, 4)]
+
+        def test_func(dstream):
+            return dstream.reduce(operator.add)
+        expected_output = map(lambda x: [reduce(operator.add, x)], test_input)
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_reduceByKey_batch(self):
+        """Basic operation test for DStream.reduceByKey with batch deserializer"""
+        test_input = [["a", "a", "b", "b"], ["", "", "", ""]]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
+        expected_output = [[("a", 2), ("b", 2)], [("", 4)]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_reduceByKey_unbatch(self):
+        """Basic operation test for DStream.reduceByKey with unbatch deserilizer"""
+        test_input = [["a", "a", "b"], ["", ""], []]
 
         def test_func(dstream):
-            print "reduceByKey"
-            dstream.map(lambda x: (x, 1)).pyprint()
             return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add)
-        #expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
-        expected_output = [[("a", 2), ("b", 2)], [("", 4)], []]
+        expected_output = [[("a", 2), ("b", 1)], [("", 2)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_mapValues(self):
-        """Basic operation test for DStream.mapValues"""
-        #test_input = [["a", "a", "b"], ["", ""], []]
-        test_input = [["a", "a", "b", "b"], ["", "", "", ""], []]
+    def test_mapValues_batch(self):
+        """Basic operation test for DStream.mapValues with batch deserializer"""
+        test_input = [["a", "a", "b", "b"], ["", "", "", ""]]
 
         def test_func(dstream):
-            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).mapValues(lambda x: x + 10)
-        #expected_output = [[("a", 12), ("b", 11)], [("", 12)], []]
-        expected_output = [[("a", 12), ("b", 12)], [("", 14)], []]
+            return dstream.map(lambda x: (x, 1))\
+                          .reduceByKey(operator.add)\
+                          .mapValues(lambda x: x + 10)
+        expected_output = [[("a", 12), ("b", 12)], [("", 14)]]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_flatMapValues(self):
-        """Basic operation test for DStream.flatMapValues"""
-        #test_input = [["a", "a", "b"], ["", ""], []]
-        test_input = [["a", "a", "b", "b"], ["", "", "",""], []]
+    def test_mapValues_unbatch(self):
+        """Basic operation test for DStream.mapValues with unbatch deserializer"""
+        test_input = [["a", "a", "b"], ["", ""], []]
 
         def test_func(dstream):
-            return dstream.map(lambda x: (x, 1)).reduceByKey(operator.add).flatMapValues(lambda x: (x, x + 10))
-        #expected_output = [[("a", 2), ("a", 12), ("b", 1), ("b", 11)], [("", 2), ("", 12)], []]
-        expected_output = [[("a", 2), ("a", 12), ("b", 2), ("b", 12)], [("", 4), ("", 14)], []]
+            return dstream.map(lambda x: (x, 1))\
+                          .reduceByKey(operator.add)\
+                          .mapValues(lambda x: x + 10)
+        expected_output = [[("a", 12), ("b", 11)], [("", 12)], []]
         output = self._run_stream(test_input, test_func, expected_output)
         self.assertEqual(expected_output, output)
 
-    def test_glom(self):
-        """Basic operation test for DStream.glom"""
+    def test_flatMapValues_batch(self):
+        """Basic operation test for DStream.flatMapValues with batch deserializer"""
+        test_input = [["a", "a", "b", "b"], ["", "", "", ""]]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1))\
+                          .reduceByKey(operator.add)\
+                          .flatMapValues(lambda x: (x, x + 10))
+        expected_output = [[("a", 2), ("a", 12), ("b", 2), ("b", 12)], [("", 4), ("", 14)]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_flatMapValues_unbatch(self):
+        """Basic operation test for DStream.flatMapValues with unbatch deserializer"""
+        test_input = [["a", "a", "b"], ["", ""], []]
+
+        def test_func(dstream):
+            return dstream.map(lambda x: (x, 1))\
+                          .reduceByKey(operator.add)\
+                          .flatMapValues(lambda x: (x, x + 10))
+        expected_output = [[("a", 2), ("a", 12), ("b", 1), ("b", 11)], [("", 2), ("", 12)], []]
+        output = self._run_stream(test_input, test_func, expected_output)
+        self.assertEqual(expected_output, output)
+
+    def test_glom_batch(self):
+        """Basic operation test for DStream.glom with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
         numSlices = 2
 
         def test_func(dstream):
             return dstream.glom()
-        expected_output = [[[1,2], [3,4]], [[5,6], [7,8]], [[9,10], [11,12]]]
+        expected_output = [[[1, 2], [3, 4]], [[5, 6], [7, 8]], [[9, 10], [11, 12]]]
+        output = self._run_stream(test_input, test_func, expected_output, numSlices)
+        self.assertEqual(expected_output, output)
+
+    def test_glom_unbatach(self):
+        """Basic operation test for DStream.glom with unbatch deserialiser"""
+        test_input = [range(1, 4), range(4, 7), range(7, 10)]
+        numSlices = 2
+
+        def test_func(dstream):
+            return dstream.glom()
+        expected_output = [[[1], [2, 3]], [[4], [5, 6]], [[7], [8, 9]]]
         output = self._run_stream(test_input, test_func, expected_output, numSlices)
         self.assertEqual(expected_output, output)
 
-    def test_mapPartitions(self):
-        """Basic operation test for DStream.mapPartitions"""
+    def test_mapPartitions_batch(self):
+        """Basic operation test for DStream.mapPartitions with batch deserializer"""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
         numSlices = 2
 
         def test_func(dstream):
-            def f(iterator): yield sum(iterator)
+            def f(iterator):
+                yield sum(iterator)
             return dstream.mapPartitions(f)
         expected_output = [[3, 7], [11, 15], [19, 23]]
         output = self._run_stream(test_input, test_func, expected_output, numSlices)
         self.assertEqual(expected_output, output)
 
+    def test_mapPartitions_unbatch(self):
+        """Basic operation test for DStream.mapPartitions with unbatch deserializer"""
+        test_input = [range(1, 4), range(4, 7), range(7, 10)]
+        numSlices = 2
+
+        def test_func(dstream):
+            def f(iterator):
+                yield sum(iterator)
+            return dstream.mapPartitions(f)
+        expected_output = [[1, 5], [4, 11], [7, 17]]
+        output = self._run_stream(test_input, test_func, expected_output, numSlices)
+        self.assertEqual(expected_output, output)
+
     def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
@@ -212,6 +320,7 @@ def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
             # check if the output is the same length of expexted output
             if len(expected_output) == len(self.result):
                 break
+
         return self.result
 
 if __name__ == "__main__":
diff --git a/python/pyspark/worker.py b/python/pyspark/worker.py
index 8ee2f0b3a260f..7ca3252270d5a 100644
--- a/python/pyspark/worker.py
+++ b/python/pyspark/worker.py
@@ -23,7 +23,6 @@
 import time
 import socket
 import traceback
-import itertools
 # CloudPickler needs to be imported so that depicklers are registered using the
 # copy_reg module.
 from pyspark.accumulators import _accumulatorRegistry
@@ -75,16 +74,6 @@ def main(infile, outfile):
         (func, deserializer, serializer) = command
         init_time = time.time()
         iterator = deserializer.load_stream(infile)
-        print "deserializer in worker: %s" % str(deserializer)
-        iterator, walk = itertools.tee(iterator)
-        if isinstance(walk, int):
-            print "this is int"
-            print walk
-        else:
-            try:
-                print list(walk)
-            except:
-                print list(walk)
         serializer.dump_stream(func(split_index, iterator), outfile)
     except Exception as e:
         # Write the error to stderr in addition to trying to pass it back to
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 7e46516a8a050..9f1e1f4d3cca7 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -133,45 +133,6 @@ class PythonTransformedDStream(
 }
 */
 
-/**
- * This is a input stream just for the unitest. This is equivalent to a checkpointable,
- * replayable, reliable message queue like Kafka. It requires a sequence as input, and
- * returns the i_th element at the i_th batch under manual clock.
- */
-class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[String], numPartitions: Int)
-  extends InputDStream[Array[Byte]](JavaStreamingContext.toStreamingContext(ssc_)){
-
-  def start() {}
-
-  def stop() {}
-
-  def compute(validTime: Time): Option[RDD[Array[Byte]]] = {
-    logInfo("Computing RDD for time " + validTime)
-    inputFiles.foreach(logInfo(_))
-    // make a temporary file
-    // make empty RDD
-    val prefix = "spark"
-    val suffix = ".tmp"
-    val tempFile = File.createTempFile(prefix, suffix)
-    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
-    logInfo("Index: " + index)
-
-    val selectedInputFile: String = {
-      if (inputFiles.isEmpty){
-        tempFile.getAbsolutePath
-      }else if (index < inputFiles.size()) {
-        inputFiles.get(index)
-      } else {
-        tempFile.getAbsolutePath
-      }
-    }
-    val rdd = PythonRDD.readRDDFromFile(JavaSparkContext.fromSparkContext(ssc_.sparkContext), selectedInputFile, numPartitions).rdd
-    logInfo("Created RDD " + rdd.id + " with " + selectedInputFile)
-    Some(rdd)
-  }
-
-  val asJavaDStream  = JavaDStream.fromDStream(this)
-}
 
 /**
  * This is a input stream just for the unitest. This is equivalent to a checkpointable,
@@ -180,7 +141,7 @@ class PythonTestInputStream(ssc_ : JavaStreamingContext, inputFiles: JArrayList[
  * This implementation is close to QueStream
  */
 
-class PythonTestInputStream2(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[JavaRDD[Array[Byte]]])
+class PythonTestInputStream(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[JavaRDD[Array[Byte]]])
   extends InputDStream[Array[Byte]](JavaStreamingContext.toStreamingContext(ssc_)) {
 
   def start() {}
@@ -206,20 +167,3 @@ class PythonTestInputStream2(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[
   val asJavaDStream  = JavaDStream.fromDStream(this)
 }
 
-
-class PythonTestInputStream3(ssc_ : JavaStreamingContext)
-  extends InputDStream[Any](JavaStreamingContext.toStreamingContext(ssc_)) {
-
-  def start() {}
-
-  def stop() {}
-
-  def compute(validTime: Time): Option[RDD[Any]] = {
-    val index = ((validTime - zeroTime) / slideDuration - 1).toInt
-    val selectedInput = ArrayBuffer(1, 2, 3).toSeq
-    val rdd :RDD[Any] = ssc.sc.makeRDD(selectedInput, 2)
-    Some(rdd)
-  }
-
-  val asJavaDStream = JavaDStream.fromDStream(this)
-}
\ No newline at end of file

From a14c7e1a59370949a5f1eab16e448cc0012fa65e Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Thu, 14 Aug 2014 23:46:45 -0700
Subject: [PATCH 61/69] modified streaming test case to add comment

---
 python/pyspark/streaming_tests.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 6d85a7faae859..02996ccce9a3e 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -18,6 +18,9 @@
 """
 Unit tests for PySpark; additional tests are implemented as doctests in
 individual modules.
+Other option is separate this test case with other tests.
+This makes sense becuase streaming tests takes long time due to waiting time
+for stoping callback server.
 
 This file will merged to tests.py. But for now, this file is separated due
 to focusing to streaming test case
@@ -45,7 +48,7 @@ def tearDown(self):
         self.ssc._sc.stop()
         # Why does it long time to terminaete StremaingContext and SparkContext?
         # Should we change the sleep time if this depends on machine spec?
-        time.sleep(8)
+        time.sleep(10)
 
     @classmethod
     def tearDownClass(cls):
@@ -302,7 +305,7 @@ def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
         numSlices = numSlices or self.numInputPartitions
-        test_input_stream = self.ssc._testInputStream2(test_input, numSlices)
+        test_input_stream = self.ssc._testInputStream(test_input, numSlices)
         # Apply test function to stream
         test_stream = test_func(test_input_stream)
         # Add job to get output from stream

From e3033fcdd24258eb3836c0c07e5c959c3dfde7d2 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Fri, 15 Aug 2014 11:28:39 -0700
Subject: [PATCH 62/69] remove wasteful duplicated code

---
 python/pyspark/streaming/context.py | 43 +----------------
 python/pyspark/streaming/dstream.py | 75 +++++++++++++++++++++--------
 2 files changed, 56 insertions(+), 62 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 123fa67f837e3..60bcf86783e95 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -130,48 +130,7 @@ def stop(self, stopSparkContext=True, stopGraceFully=False):
             # Stop Callback server
             SparkContext._gateway.shutdown()
 
-    def checkpoint(self, directory):
-        """
-        Not tested
-        """
-        self._jssc.checkpoint(directory)
-
     def _testInputStream(self, test_inputs, numSlices=None):
-        """
-        Generate multiple files to make "stream" in Scala side for test.
-        Scala chooses one of the files and generates RDD using PythonRDD.readRDDFromFile.
-
-        QueStream maybe good way to implement this function
-        """
-        numSlices = numSlices or self._sc.defaultParallelism
-        # Calling the Java parallelize() method with an ArrayList is too slow,
-        # because it sends O(n) Py4J commands.  As an alternative, serialized
-        # objects are written to a file and loaded through textFile().
-
-        tempFiles = list()
-        for test_input in test_inputs:
-            tempFile = NamedTemporaryFile(delete=False, dir=self._sc._temp_dir)
-
-            # Make sure we distribute data evenly if it's smaller than self.batchSize
-            if "__len__" not in dir(test_input):
-                test_input = list(test_input)    # Make it a list so we can compute its length
-            batchSize = min(len(test_input) // numSlices, self._sc._batchSize)
-            if batchSize > 1:
-                serializer = BatchedSerializer(self._sc._unbatched_serializer,
-                                               batchSize)
-            else:
-                serializer = self._sc._unbatched_serializer
-            serializer.dump_stream(test_input, tempFile)
-            tempFile.close()
-            tempFiles.append(tempFile.name)
-
-        jtempFiles = ListConverter().convert(tempFiles, SparkContext._gateway._gateway_client)
-        jinput_stream = self._jvm.PythonTestInputStream(self._jssc,
-                                                        jtempFiles,
-                                                        numSlices).asJavaDStream()
-        return DStream(jinput_stream, self, BatchedSerializer(PickleSerializer()))
-    
-    def _testInputStream2(self, test_inputs, numSlices=None):
         """
         This is inpired by QueStream implementation. Give list of RDD and generate DStream
         which contain the RDD.
@@ -184,7 +143,7 @@ def _testInputStream2(self, test_inputs, numSlices=None):
             test_rdd_deserializers.append(test_rdd._jrdd_deserializer)
 
         jtest_rdds = ListConverter().convert(test_rdds, SparkContext._gateway._gateway_client)
-        jinput_stream = self._jvm.PythonTestInputStream2(self._jssc, jtest_rdds).asJavaDStream()
+        jinput_stream = self._jvm.PythonTestInputStream(self._jssc, jtest_rdds).asJavaDStream()
 
         dstream = DStream(jinput_stream, self, test_rdd_deserializers[0])
         return dstream
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 0a93a46d2b2a2..ea418822759c4 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -17,12 +17,13 @@
 
 from collections import defaultdict
 from itertools import chain, ifilter, imap
-import time
 import operator
 
 from pyspark.serializers import NoOpSerializer,\
     BatchedSerializer, CloudPickleSerializer, pack_long
 from pyspark.rdd import _JavaStackTrace
+from pyspark.storagelevel import StorageLevel
+from pyspark.resultiterable import ResultIterable
 
 from py4j.java_collections import ListConverter, MapConverter
 
@@ -35,6 +36,8 @@ def __init__(self, jdstream, ssc, jrdd_deserializer):
         self._ssc = ssc
         self.ctx = ssc._sc
         self._jrdd_deserializer = jrdd_deserializer
+        self.is_cached = False
+        self.is_checkpointed = False
 
     def context(self):
         """
@@ -234,8 +237,6 @@ def takeAndPrint(rdd, time):
             taken = rdd.take(11)
             print "-------------------------------------------"
             print "Time: %s" % (str(time))
-            print rdd.glom().collect()
-            print "-------------------------------------------"
             print "-------------------------------------------"
             for record in taken[:10]:
                 print record
@@ -290,32 +291,65 @@ def get_output(rdd, time):
 
         self.foreachRDD(get_output)
 
-    def _test_switch_dserializer(self, serializer_que):
+    def cache(self):
+        """
+        Persist this DStream with the default storage level (C{MEMORY_ONLY_SER}).
+        """
+        self.is_cached = True
+        self.persist(StorageLevel.MEMORY_ONLY_SER)
+        return self
+
+    def persist(self, storageLevel):
+        """
+        Set this DStream's storage level to persist its values across operations
+        after the first time it is computed. This can only be used to assign
+        a new storage level if the DStream does not have a storage level set yet.
+        """
+        self.is_cached = True
+        javaStorageLevel = self.ctx._getJavaStorageLevel(storageLevel)
+        self._jdstream.persist(javaStorageLevel)
+        return self
+
+    def checkpoint(self, interval):
         """
-        Deserializer is dynamically changed based on numSlice and the number of
-        input. This function choose deserializer. Currently this is just FIFO.
+        Mark this DStream for checkpointing. It will be saved to a file inside the
+        checkpoint directory set with L{SparkContext.setCheckpointDir()}
+
+        I am not sure this part in DStream
+        and
+        all references to its parent RDDs will be removed. This function must
+        be called before any job has been executed on this RDD. It is strongly
+        recommended that this RDD is persisted in memory, otherwise saving it
+        on a file will require recomputation.
+
+        interval must be pysprak.streaming.duration
         """
-        
-        jrdd_deserializer = self._jrdd_deserializer
+        self.is_checkpointed = True
+        self._jdstream.checkpoint(interval)
+        return self
+
+    def groupByKey(self, numPartitions=None):
+        def createCombiner(x):
+            return [x]
 
-        def switch(rdd, jtime):
-            try:
-                print serializer_que
-                jrdd_deserializer = serializer_que.pop(0)
-                print jrdd_deserializer
-            except Exception as e:
-                print e
+        def mergeValue(xs, x):
+            xs.append(x)
+            return xs
 
-        self.foreachRDD(switch)
+        def mergeCombiners(a, b):
+            a.extend(b)
+            return a
 
+        return self.combineByKey(createCombiner, mergeValue, mergeCombiners,
+                                 numPartitions).mapValues(lambda x: ResultIterable(x))
 
 
 # TODO: implement groupByKey
+# TODO: implement saveAsTextFile
+
+# Following operation has dependency to transform
 # TODO: impelment union
-# TODO: implement cache
-# TODO: implement persist
 # TODO: implement repertitions
-# TODO: implement saveAsTextFile
 # TODO: implement cogroup
 # TODO: implement join
 # TODO: implement countByValue
@@ -342,6 +376,7 @@ def pipeline_func(split, iterator):
             self._prev_jdstream = prev._prev_jdstream  # maintain the pipeline
             self._prev_jrdd_deserializer = prev._prev_jrdd_deserializer
         self.is_cached = False
+        self.is_checkpointed = False
         self._ssc = prev._ssc
         self.ctx = prev.ctx
         self.prev = prev
@@ -378,4 +413,4 @@ def _jdstream(self):
         return self._jdstream_val
 
     def _is_pipelinable(self):
-        return not self.is_cached
+        return not (self.is_cached or self.is_checkpointed)

From 89ae38a0d6bc299ebb9aa81c7510812874ce7879 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Fri, 15 Aug 2014 17:10:56 -0700
Subject: [PATCH 63/69] added saveAsTextFiles and saveAsPickledFiles

---
 python/pyspark/streaming/context.py           | 17 +++++----
 python/pyspark/streaming/dstream.py           | 35 ++++++++++++++++---
 python/pyspark/streaming/utils.py             |  6 ++++
 python/pyspark/streaming_tests.py             | 32 +++++++++++++++++
 .../streaming/api/python/PythonDStream.scala  |  2 +-
 5 files changed, 78 insertions(+), 14 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 60bcf86783e95..691f9b06ad4e9 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -114,7 +114,7 @@ def textFileStream(self, directory):
         Create an input stream that monitors a Hadoop-compatible file system
         for new files and reads them as text files. Files must be wrriten to the
         monitored directory by "moving" them from another location within the same
-        file system. FIle names starting with . are ignored.
+        file system. File names starting with . are ignored.
         """
         return DStream(self._jssc.textFileStream(directory), self, UTF8Deserializer())
 
@@ -132,8 +132,9 @@ def stop(self, stopSparkContext=True, stopGraceFully=False):
 
     def _testInputStream(self, test_inputs, numSlices=None):
         """
-        This is inpired by QueStream implementation. Give list of RDD and generate DStream
-        which contain the RDD.
+        This function is only for test.
+        This implementation is inpired by QueStream implementation. 
+        Give list of RDD to generate DStream which contains the RDD.
         """
         test_rdds = list()
         test_rdd_deserializers = list()
@@ -142,12 +143,10 @@ def _testInputStream(self, test_inputs, numSlices=None):
             test_rdds.append(test_rdd._jrdd)
             test_rdd_deserializers.append(test_rdd._jrdd_deserializer)
 
+#        if len(set(test_rdd_deserializers)) > 1:
+#            raise IOError("Deserializer should be one type to run test case. "
+#                          "See the SparkContext.parallelize to understand how to decide deserializer")
         jtest_rdds = ListConverter().convert(test_rdds, SparkContext._gateway._gateway_client)
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc, jtest_rdds).asJavaDStream()
 
-        dstream = DStream(jinput_stream, self, test_rdd_deserializers[0])
-        return dstream
-
-    def _testInputStream3(self):
-        jinput_stream = self._jvm.PythonTestInputStream3(self._jssc).asJavaDStream()
-        return DStream(jinput_stream, self, UTF8Deserializer())
+        return DStream(jinput_stream, self, test_rdd_deserializers[0])
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index ea418822759c4..679360dbca08d 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -24,6 +24,8 @@
 from pyspark.rdd import _JavaStackTrace
 from pyspark.storagelevel import StorageLevel
 from pyspark.resultiterable import ResultIterable
+from pyspark.streaming.utils import rddToFileName
+
 
 from py4j.java_collections import ListConverter, MapConverter
 
@@ -343,21 +345,46 @@ def mergeCombiners(a, b):
         return self.combineByKey(createCombiner, mergeValue, mergeCombiners,
                                  numPartitions).mapValues(lambda x: ResultIterable(x))
 
+    def countByValue(self):
+        def countPartition(iterator):
+            counts = defaultdict(int)
+            for obj in iterator:
+                counts[obj] += 1
+            yield counts
+
+        def mergeMaps(m1, m2):
+            for (k, v) in m2.iteritems():
+                m1[k] += v
+            return m1
+
+        return self.mapPartitions(countPartition).reduce(mergeMaps).flatMap(lambda x: x.items())
+
+    def saveAsTextFiles(self, prefix, suffix=None):
+
+        def saveAsTextFile(rdd, time):
+            path = rddToFileName(prefix, suffix, time)
+            rdd.saveAsTextFile(path)
+
+        return self.foreachRDD(saveAsTextFile)
+
+    def saveAsPickledFiles(self, prefix, suffix=None):
+
+        def saveAsTextFile(rdd, time):
+            path = rddToFileName(prefix, suffix, time)
+            rdd.saveAsPickleFile(path)
+
+        return self.foreachRDD(saveAsTextFile)
 
-# TODO: implement groupByKey
-# TODO: implement saveAsTextFile
 
 # Following operation has dependency to transform
 # TODO: impelment union
 # TODO: implement repertitions
 # TODO: implement cogroup
 # TODO: implement join
-# TODO: implement countByValue
 # TODO: implement leftOuterJoin
 # TODO: implemtnt rightOuterJoin
 
 
-
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
         if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():
diff --git a/python/pyspark/streaming/utils.py b/python/pyspark/streaming/utils.py
index aa5e19adbd927..9178577743e0b 100644
--- a/python/pyspark/streaming/utils.py
+++ b/python/pyspark/streaming/utils.py
@@ -53,3 +53,9 @@ def msDurationToString(ms):
         return "%.1f m" % (float(ms) / minute)
     else:
         return "%.2f h" % (float(ms) / hour)
+
+def rddToFileName(prefix, suffix, time):
+    if suffix is not None:
+        return prefix + "-" + str(time) + "." + suffix
+    else:
+        return prefix + "-" + str(time)
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 02996ccce9a3e..2bb01ed3a0642 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -301,6 +301,38 @@ def f(iterator):
         output = self._run_stream(test_input, test_func, expected_output, numSlices)
         self.assertEqual(expected_output, output)
 
+    def test_countByValue_batch(self):
+        """Basic operation test for DStream.countByValue with batch deserializer"""
+        test_input = [range(1, 5) + range(1,5), range(5, 7) + range(5, 9), ["a"] * 2 + ["b"] + [""] ]
+
+        def test_func(dstream):
+            return dstream.countByValue()
+        expected_output = [[(1, 2), (2, 2), (3, 2), (4, 2)],
+                           [(5, 2), (6, 2), (7, 1), (8, 1)],
+                           [("a", 2), ("b", 1), ("", 1)]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
+    def test_countByValue_unbatch(self):
+        """Basic operation test for DStream.countByValue with unbatch deserializer"""
+        test_input = [range(1, 4), [1, 1, ""], ["a", "a", "b"]]
+
+        def test_func(dstream):
+            return dstream.countByValue()
+        expected_output = [[(1, 1), (2, 1), (3, 1)],
+                           [(1, 2), ("", 1)],
+                           [("a", 2), ("b", 1)]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
+    def _sort_result_based_on_key(self, outputs):
+        for output in outputs:
+            output.sort(key=lambda x: x[0])
+
     def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
         """Start stream and return the output"""
         # Generate input stream with user-defined input
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
index 9f1e1f4d3cca7..38b9004ab7439 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/python/PythonDStream.scala
@@ -138,7 +138,7 @@ class PythonTransformedDStream(
  * This is a input stream just for the unitest. This is equivalent to a checkpointable,
  * replayable, reliable message queue like Kafka. It requires a sequence as input, and
  * returns the i_th element at the i_th batch under manual clock.
- * This implementation is close to QueStream
+ * This implementation is inspired by QueStream
  */
 
 class PythonTestInputStream(ssc_ : JavaStreamingContext, inputRDDs: JArrayList[JavaRDD[Array[Byte]]])

From ea9c8731b3d997ead7015d721c66231064e19ff9 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Fri, 15 Aug 2014 22:30:58 -0700
Subject: [PATCH 64/69] added TODO comments

---
 python/pyspark/streaming/context.py |  3 ++-
 python/pyspark/streaming/dstream.py | 16 ++++++++++++++--
 2 files changed, 16 insertions(+), 3 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 691f9b06ad4e9..470ed270cdbfb 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -17,7 +17,6 @@
 
 import sys
 from signal import signal, SIGTERM, SIGINT
-from tempfile import NamedTemporaryFile
 
 from pyspark.serializers import PickleSerializer, BatchedSerializer, UTF8Deserializer
 from pyspark.context import SparkContext
@@ -79,6 +78,7 @@ def _clean_up_trigger(self):
         """Kill py4j callback server properly using signal lib"""
 
         def clean_up_handler(*args):
+            SparkContext._gateway._shutdown_callback_server()
             SparkContext._gateway.shutdown()
             sys.exit(0)
 
@@ -128,6 +128,7 @@ def stop(self, stopSparkContext=True, stopGraceFully=False):
             self._jssc.stop(stopSparkContext, stopGraceFully)
         finally:
             # Stop Callback server
+            SparkContext._gateway._shutdown_callback_server()
             SparkContext._gateway.shutdown()
 
     def _testInputStream(self, test_inputs, numSlices=None):
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index 679360dbca08d..ef0e2258e9922 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -376,15 +376,27 @@ def saveAsTextFile(rdd, time):
         return self.foreachRDD(saveAsTextFile)
 
 
+# TODO: implement updateStateByKey
+# TODO: implement slice
+
+# Window Operations
+# TODO: implement window
+# TODO: implement groupByKeyAndWindow
+# TODO: implement reduceByKeyAndWindow
+# TODO: implement countByValueAndWindow
+# TODO: implement countByWindow
+# TODO: implement reduceByWindow
+
 # Following operation has dependency to transform
-# TODO: impelment union
+# TODO: implement transform
+# TODO: implement transformWith
+# TODO: implement union
 # TODO: implement repertitions
 # TODO: implement cogroup
 # TODO: implement join
 # TODO: implement leftOuterJoin
 # TODO: implemtnt rightOuterJoin
 
-
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
         if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():

From d8b593b20351d32d4ac3948778bf2ebbab86879f Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 18 Aug 2014 00:30:17 -0700
Subject: [PATCH 65/69] add comments

---
 python/pyspark/java_gateway.py      |  5 ++---
 python/pyspark/streaming/context.py | 13 ++++++-----
 python/pyspark/streaming/dstream.py | 24 ++++++++++++++++++++
 python/pyspark/streaming_tests.py   | 34 ++++++++++++++++++++++-------
 4 files changed, 59 insertions(+), 17 deletions(-)

diff --git a/python/pyspark/java_gateway.py b/python/pyspark/java_gateway.py
index cea7d0975e5d1..8f9a747f9590b 100644
--- a/python/pyspark/java_gateway.py
+++ b/python/pyspark/java_gateway.py
@@ -82,15 +82,14 @@ def run(self):
     java_import(gateway.jvm, "org.apache.spark.SparkConf")
     java_import(gateway.jvm, "org.apache.spark.api.java.*")
     java_import(gateway.jvm, "org.apache.spark.api.python.*")
-    java_import(gateway.jvm, "org.apache.spark.streaming.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.*")  # do we need this?
     java_import(gateway.jvm, "org.apache.spark.streaming.api.java.*")
     java_import(gateway.jvm, "org.apache.spark.streaming.api.python.*")
-    java_import(gateway.jvm, "org.apache.spark.streaming.dstream.*")
+    java_import(gateway.jvm, "org.apache.spark.streaming.dstream.*")  # do we need this?
     java_import(gateway.jvm, "org.apache.spark.mllib.api.python.*")
     java_import(gateway.jvm, "org.apache.spark.sql.SQLContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.HiveContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.LocalHiveContext")
     java_import(gateway.jvm, "org.apache.spark.sql.hive.TestHiveContext")
     java_import(gateway.jvm, "scala.Tuple2")
-
     return gateway
diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index 470ed270cdbfb..e380626aa080b 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -64,7 +64,9 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
                         pyFiles=pyFiles, environment=environment, batchSize=batchSize,
                         serializer=serializer, conf=conf, gateway=gateway)
 
-        # Start py4j callback server
+        # Start py4j callback server.
+        # Callback sever is need only by SparkStreming; therefore the callback sever
+        # is started in StreamingContext.
         SparkContext._gateway.restart_callback_server()
         self._clean_up_trigger()
         self._jvm = self._sc._jvm
@@ -78,6 +80,8 @@ def _clean_up_trigger(self):
         """Kill py4j callback server properly using signal lib"""
 
         def clean_up_handler(*args):
+            # Make sure to stop the callback server.
+            # How to terminate the callback server properly still needs improvement.
             SparkContext._gateway._shutdown_callback_server()
             SparkContext._gateway.shutdown()
             sys.exit(0)
@@ -100,7 +104,7 @@ def awaitTermination(self, timeout=None):
         else:
             self._jssc.awaitTermination(timeout)
 
-    # start from simple one. storageLevel is not passed for now.
+    #TODO: add storageLevel
     def socketTextStream(self, hostname, port):
         """
         Create an input from TCP source hostname:port. Data is received using
@@ -134,7 +138,7 @@ def stop(self, stopSparkContext=True, stopGraceFully=False):
     def _testInputStream(self, test_inputs, numSlices=None):
         """
         This function is only for test.
-        This implementation is inpired by QueStream implementation. 
+        This implementation is inspired by QueStream implementation.
         Give list of RDD to generate DStream which contains the RDD.
         """
         test_rdds = list()
@@ -144,9 +148,6 @@ def _testInputStream(self, test_inputs, numSlices=None):
             test_rdds.append(test_rdd._jrdd)
             test_rdd_deserializers.append(test_rdd._jrdd_deserializer)
 
-#        if len(set(test_rdd_deserializers)) > 1:
-#            raise IOError("Deserializer should be one type to run test case. "
-#                          "See the SparkContext.parallelize to understand how to decide deserializer")
         jtest_rdds = ListConverter().convert(test_rdds, SparkContext._gateway._gateway_client)
         jinput_stream = self._jvm.PythonTestInputStream(self._jssc, jtest_rdds).asJavaDStream()
 
diff --git a/python/pyspark/streaming/dstream.py b/python/pyspark/streaming/dstream.py
index ef0e2258e9922..8ed50d3dd2531 100644
--- a/python/pyspark/streaming/dstream.py
+++ b/python/pyspark/streaming/dstream.py
@@ -331,6 +331,17 @@ def checkpoint(self, interval):
         return self
 
     def groupByKey(self, numPartitions=None):
+        """
+        Return a new DStream in which the values for each key in this DStream
+        are grouped into a single sequence.
+        Hash-partitions each RDD of the resulting DStream into numPartitions
+        partitions.
+
+        Note: If you are grouping in order to perform an aggregation (such as a
+        sum or average) over each key, using reduceByKey will provide much
+        better performance.
+
+        """
         def createCombiner(x):
             return [x]
 
@@ -346,6 +357,10 @@ def mergeCombiners(a, b):
                                  numPartitions).mapValues(lambda x: ResultIterable(x))
 
     def countByValue(self):
+        """
+        Return a new DStream containing the count of each unique value in this
+        DStream as (value, count) pairs.
+        """
         def countPartition(iterator):
             counts = defaultdict(int)
             for obj in iterator:
@@ -360,6 +375,9 @@ def mergeMaps(m1, m2):
         return self.mapPartitions(countPartition).reduce(mergeMaps).flatMap(lambda x: x.items())
 
     def saveAsTextFiles(self, prefix, suffix=None):
+        """
+        Save this DStream as a text file, using string representations of elements.
+        """
 
         def saveAsTextFile(rdd, time):
             path = rddToFileName(prefix, suffix, time)
@@ -368,6 +386,11 @@ def saveAsTextFile(rdd, time):
         return self.foreachRDD(saveAsTextFile)
 
     def saveAsPickledFiles(self, prefix, suffix=None):
+        """
+        Save this DStream as a SequenceFile of serialized objects. The serializer
+        used is L{pyspark.serializers.PickleSerializer}, default batch size
+        is 10.
+        """
 
         def saveAsTextFile(rdd, time):
             path = rddToFileName(prefix, suffix, time)
@@ -397,6 +420,7 @@ def saveAsTextFile(rdd, time):
 # TODO: implement leftOuterJoin
 # TODO: implemtnt rightOuterJoin
 
+
 class PipelinedDStream(DStream):
     def __init__(self, prev, func, preservesPartitioning=False):
         if not isinstance(prev, PipelinedDStream) or not prev._is_pipelinable():
diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index 2bb01ed3a0642..ef308fdd6aa59 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -18,12 +18,11 @@
 """
 Unit tests for PySpark; additional tests are implemented as doctests in
 individual modules.
-Other option is separate this test case with other tests.
-This makes sense becuase streaming tests takes long time due to waiting time
-for stoping callback server.
 
-This file will merged to tests.py. But for now, this file is separated due
-to focusing to streaming test case
+This file will be merged into tests.py after all functions are ready.
+For now, it is kept separate in order to focus on the streaming test cases.
+
+The callback server is sometimes unstable, which causes errors in test cases.
 
 """
 from itertools import chain
@@ -43,10 +42,10 @@ def setUp(self):
 
     def tearDown(self):
         # Do not call pyspark.streaming.context.StreamingContext.stop directly because
-        # we do not wait to shutdowncall back server and py4j client
+        # we do not wait to shutdown call back server and py4j client
         self.ssc._jssc.stop()
         self.ssc._sc.stop()
-        # Why does it long time to terminaete StremaingContext and SparkContext?
+        # Why does terminating StreamingContext and SparkContext take so long?
         # Should we change the sleep time if this depends on machine spec?
         time.sleep(10)
 
@@ -68,7 +67,7 @@ class TestBasicOperationsSuite(PySparkStreamingTestCase):
     I am wondering if these test are enough or not.
     All tests input should have list of lists. This represents stream.
     Every batch interval, the first object of list are chosen to make DStream.
-    Please see the BasicTestSuits in Scala or QueStream which is close to this implementation.
+    Please see the BasicTestSuits in Scala which is close to this implementation.
     """
     def setUp(self):
         PySparkStreamingTestCase.setUp(self)
@@ -358,5 +357,24 @@ def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
 
         return self.result
 
+class TestSaveAsFilesSuite(PySparkStreamingTestCase):
+    def setUp(self):
+        PySparkStreamingTestCase.setUp(self)
+        self.timeout = 10  # seconds
+        self.numInputPartitions = 2
+        self.result = list()
+
+    def tearDown(self):
+        PySparkStreamingTestCase.tearDown(self)
+
+    @classmethod
+    def tearDownClass(cls):
+        PySparkStreamingTestCase.tearDownClass()
+
+
+
+
+
+
 if __name__ == "__main__":
     unittest.main()

From e7ebb08da3c59102cfad08ce4d687e56d02a0edf Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 18 Aug 2014 00:35:50 -0700
Subject: [PATCH 66/69] removed wasted print in DStream

---
 .../streaming/api/java/JavaDStreamLike.scala    |  9 ---------
 .../spark/streaming/dstream/DStream.scala       | 17 -----------------
 2 files changed, 26 deletions(-)

diff --git a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
index 7a002bbe74ca9..a6184de4e83c1 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/api/java/JavaDStreamLike.scala
@@ -54,15 +54,6 @@ trait JavaDStreamLike[T, This <: JavaDStreamLike[T, This, R], R <: JavaRDDLike[T
     dstream.print()
   }
 
-  def print(label: String = null): Unit = {
-    dstream.print(label)
-  }
-
-  def outputToFile(): Unit = {
-    dstream.outputToFile()
-  }
-
-
   /**
    * Return a new DStream in which each RDD has a single element generated by counting each RDD
    * of this DStream.
diff --git a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
index 46ef05d9c37a1..39ad591e8896e 100644
--- a/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
+++ b/streaming/src/main/scala/org/apache/spark/streaming/dstream/DStream.scala
@@ -617,23 +617,6 @@ abstract class DStream[T: ClassTag] (
     new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
   }
 
-
-  def print(label: String = null) {
-    def foreachFunc = (rdd: RDD[T], time: Time) => {
-      val first11 = rdd.take(11)
-      println ("-------------------------------------------")
-      println ("Time: " + time)
-      println ("-------------------------------------------")
-      if(label != null){
-        println (label)
-      }
-      first11.take(10).foreach(println)
-      if (first11.size > 10) println("...")
-      println()
-    }
-    new ForEachDStream(this, context.sparkContext.clean(foreachFunc)).register()
-  }
-
   /**
    * Return a new DStream in which each RDD contains all the elements in seen in a
    * sliding window of time over this DStream. The new DStream generates RDDs with

From 636090ac5323cdde6c72d48336b716693a80e010 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 18 Aug 2014 13:24:17 -0700
Subject: [PATCH 67/69] added sparkContext as input parameter in
 StreamingContext

---
 python/pyspark/streaming/context.py | 16 ++++++++++------
 1 file changed, 10 insertions(+), 6 deletions(-)

diff --git a/python/pyspark/streaming/context.py b/python/pyspark/streaming/context.py
index e380626aa080b..3f455a3e06072 100644
--- a/python/pyspark/streaming/context.py
+++ b/python/pyspark/streaming/context.py
@@ -34,7 +34,7 @@ class StreamingContext(object):
 
     def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
         environment=None, batchSize=1024, serializer=PickleSerializer(), conf=None,
-        gateway=None, duration=None):
+        gateway=None, sparkContext=None, duration=None):
         """
         Create a new StreamingContext. At least the master and app name and duration
         should be set, either through the named parameters here or through C{conf}.
@@ -55,14 +55,18 @@ def __init__(self, master=None, appName=None, sparkHome=None, pyFiles=None,
         @param conf: A L{SparkConf} object setting Spark properties.
         @param gateway: Use an existing gateway and JVM, otherwise a new JVM
                will be instatiated.
-        @param duration: A L{Duration} Duration for SparkStreaming
+        @param sparkContext: L{SparkContext} object.
+        @param duration: A L{Duration} object for SparkStreaming.
 
         """
 
-        # Create the Python Sparkcontext
-        self._sc = SparkContext(master=master, appName=appName, sparkHome=sparkHome,
-                        pyFiles=pyFiles, environment=environment, batchSize=batchSize,
-                        serializer=serializer, conf=conf, gateway=gateway)
+        if sparkContext is None:
+            # Create the Python Sparkcontext
+            self._sc = SparkContext(master=master, appName=appName, sparkHome=sparkHome,
+                            pyFiles=pyFiles, environment=environment, batchSize=batchSize,
+                            serializer=serializer, conf=conf, gateway=gateway)
+        else:
+            self._sc = sparkContext
 
         # Start py4j callback server.
         # Callback sever is need only by SparkStreming; therefore the callback sever

From a3d2379d79fdb8573963564f5c5be98558e495f2 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 18 Aug 2014 14:39:45 -0700
Subject: [PATCH 68/69] added groupByKey testcase

---
 python/pyspark/streaming_tests.py | 70 ++++++++++++++++++++++++-------
 1 file changed, 54 insertions(+), 16 deletions(-)

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index ef308fdd6aa59..c35d352c66ca5 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -275,7 +275,7 @@ def test_func(dstream):
         self.assertEqual(expected_output, output)
 
     def test_mapPartitions_batch(self):
-        """Basic operation test for DStream.mapPartitions with batch deserializer"""
+        """Basic operation test for DStream.mapPartitions with batch deserializer."""
         test_input = [range(1, 5), range(5, 9), range(9, 13)]
         numSlices = 2
 
@@ -288,7 +288,7 @@ def f(iterator):
         self.assertEqual(expected_output, output)
 
     def test_mapPartitions_unbatch(self):
-        """Basic operation test for DStream.mapPartitions with unbatch deserializer"""
+        """Basic operation test for DStream.mapPartitions with unbatch deserializer."""
         test_input = [range(1, 4), range(4, 7), range(7, 10)]
         numSlices = 2
 
@@ -301,8 +301,8 @@ def f(iterator):
         self.assertEqual(expected_output, output)
 
     def test_countByValue_batch(self):
-        """Basic operation test for DStream.countByValue with batch deserializer"""
-        test_input = [range(1, 5) + range(1,5), range(5, 7) + range(5, 9), ["a"] * 2 + ["b"] + [""] ]
+        """Basic operation test for DStream.countByValue with batch deserializer."""
+        test_input = [range(1, 5) + range(1,5), range(5, 7) + range(5, 9), ["a", "a", "b", ""]]
 
         def test_func(dstream):
             return dstream.countByValue()
@@ -315,7 +315,7 @@ def test_func(dstream):
         self.assertEqual(expected_output, output)
 
     def test_countByValue_unbatch(self):
-        """Basic operation test for DStream.countByValue with unbatch deserializer"""
+        """Basic operation test for DStream.countByValue with unbatch deserializer."""
         test_input = [range(1, 4), [1, 1, ""], ["a", "a", "b"]]
 
         def test_func(dstream):
@@ -328,30 +328,72 @@ def test_func(dstream):
             self._sort_result_based_on_key(result)
         self.assertEqual(expected_output, output)
 
+    def test_groupByKey_batch(self):
+        """Basic operation test for DStream.groupByKey with batch deserializer."""
+        test_input = [range(1, 5), [1, 1, 1, 2, 2, 3], ["a", "a", "b", "", "", ""]]
+        def test_func(dstream):
+            return dstream.map(lambda x: (x,1)).groupByKey()
+        expected_output = [[(1, [1]), (2, [1]), (3, [1]), (4, [1])],
+                           [(1, [1, 1, 1]), (2, [1, 1]), (3, [1])],
+                           [("a", [1, 1]), ("b", [1]), ("", [1, 1, 1])]]
+        scattered_output = self._run_stream(test_input, test_func, expected_output)
+        output = self._convert_iter_value_to_list(scattered_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
+    def test_groupByKey_unbatch(self):
+        """Basic operation test for DStream.groupByKey with unbatch deserializer."""
+        test_input = [range(1, 4), [1, 1, ""], ["a", "a", "b"]]
+        def test_func(dstream):
+            return dstream.map(lambda x: (x,1)).groupByKey()
+        expected_output = [[(1, [1]), (2, [1]), (3, [1])],
+                           [(1, [1, 1]), ("", [1])],
+                           [("a", [1, 1]), ("b", [1])]]
+        scattered_output = self._run_stream(test_input, test_func, expected_output)
+        output = self._convert_iter_value_to_list(scattered_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
+    def _convert_iter_value_to_list(self, outputs):
+        """Return key value pair list. Value is converted to iterator to list."""
+        result = list()
+        for output in outputs:
+            result.append(map(lambda (x, y): (x, list(y)), output))
+        return result
+
     def _sort_result_based_on_key(self, outputs):
+        """Sort each list based on the first value of its elements."""
         for output in outputs:
             output.sort(key=lambda x: x[0])
 
     def _run_stream(self, test_input, test_func, expected_output, numSlices=None):
-        """Start stream and return the output"""
-        # Generate input stream with user-defined input
+        """
+        Start stream and return the output.
+        @param test_input: dataset for the test. This should be list of lists.
+        @param test_func: wrapped test_function. This function should return PythonDstream object.
+        @param expected_output: expected output for this testcase.
+        @param numSlices: the number of slices in the rdd in the dstream.
+        """
+        # Generate input stream with user-defined input.
         numSlices = numSlices or self.numInputPartitions
         test_input_stream = self.ssc._testInputStream(test_input, numSlices)
-        # Apply test function to stream
+        # Apply test function to stream.
         test_stream = test_func(test_input_stream)
-        # Add job to get output from stream
+        # Add job to get output from stream.
         test_stream._test_output(self.result)
         self.ssc.start()
 
         start_time = time.time()
-        # loop until get the result from stream
+        # Loop until the expected number of results is received from the stream.
         while True:
             current_time = time.time()
-            # check time out
+            # Check time out.
             if (current_time - start_time) > self.timeout:
                 break
             self.ssc.awaitTermination(50)
-            # check if the output is the same length of expexted output
+            # Check if the output is the same length as the expected output.
             if len(expected_output) == len(self.result):
                 break
 
@@ -372,9 +414,5 @@ def tearDownClass(cls):
         PySparkStreamingTestCase.tearDownClass()
 
 
-
-
-
-
 if __name__ == "__main__":
     unittest.main()

From 665bfdb48523ecb7aa5174341a74c55c2088a891 Mon Sep 17 00:00:00 2001
From: giwa <ugw.gi.world@gmail.com>
Date: Mon, 18 Aug 2014 15:12:31 -0700
Subject: [PATCH 69/69] added testcase for combineByKey

---
 python/pyspark/streaming_tests.py | 35 +++++++++++++++++++++++++++++--
 1 file changed, 33 insertions(+), 2 deletions(-)

diff --git a/python/pyspark/streaming_tests.py b/python/pyspark/streaming_tests.py
index c35d352c66ca5..7f6960faed1a0 100644
--- a/python/pyspark/streaming_tests.py
+++ b/python/pyspark/streaming_tests.py
@@ -332,7 +332,7 @@ def test_groupByKey_batch(self):
         """Basic operation test for DStream.groupByKey with batch deserializer."""
         test_input = [range(1, 5), [1, 1, 1, 2, 2, 3], ["a", "a", "b", "", "", ""]]
         def test_func(dstream):
-            return dstream.map(lambda x: (x,1)).groupByKey()
+            return dstream.map(lambda x: (x, 1)).groupByKey()
         expected_output = [[(1, [1]), (2, [1]), (3, [1]), (4, [1])],
                            [(1, [1, 1, 1]), (2, [1, 1]), (3, [1])],
                            [("a", [1, 1]), ("b", [1]), ("", [1, 1, 1])]]
@@ -345,8 +345,9 @@ def test_func(dstream):
     def test_groupByKey_unbatch(self):
         """Basic operation test for DStream.groupByKey with unbatch deserializer."""
         test_input = [range(1, 4), [1, 1, ""], ["a", "a", "b"]]
+
         def test_func(dstream):
-            return dstream.map(lambda x: (x,1)).groupByKey()
+            return dstream.map(lambda x: (x, 1)).groupByKey()
         expected_output = [[(1, [1]), (2, [1]), (3, [1])],
                            [(1, [1, 1]), ("", [1])],
                            [("a", [1, 1]), ("b", [1])]]
@@ -356,6 +357,36 @@ def test_func(dstream):
             self._sort_result_based_on_key(result)
         self.assertEqual(expected_output, output)
 
+    def test_combineByKey_batch(self):
+        """Basic operation test for DStream.combineByKey with batch deserializer."""
+        test_input = [range(1, 5), [1, 1, 1, 2, 2, 3], ["a", "a", "b", "", "", ""]]
+
+        def test_func(dstream):
+            def add(a, b): return a + str(b)
+            return dstream.map(lambda x: (x, 1)).combineByKey(str, add, add)
+        expected_output = [[(1, "1"), (2, "1"), (3, "1"), (4, "1")],
+                           [(1, "111"), (2, "11"), (3, "1")],
+                           [("a", "11"), ("b", "1"), ("", "111")]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
+    def test_combineByKey_unbatch(self):
+        """Basic operation test for DStream.combineByKey with unbatch deserializer."""
+        test_input = [range(1, 4), [1, 1, ""], ["a", "a", "b"]]
+
+        def test_func(dstream):
+            def add(a, b): return a + str(b)
+            return dstream.map(lambda x: (x, 1)).combineByKey(str, add, add)
+        expected_output = [[(1, "1"), (2, "1"), (3, "1")],
+                           [(1, "11"), ("", "1")],
+                           [("a", "11"), ("b", "1")]]
+        output = self._run_stream(test_input, test_func, expected_output)
+        for result in (output, expected_output):
+            self._sort_result_based_on_key(result)
+        self.assertEqual(expected_output, output)
+
     def _convert_iter_value_to_list(self, outputs):
         """Return key value pair list. Value is converted to iterator to list."""
         result = list()