danish-rehman · July 2, 2016 09:10
diff --git a/bot_stream.py b/bot_stream.py
 import random

 # Word banks for the sentence generator. All four tuples are indexed with the
 # same random position below, so they must stay the same length.
 nouns = ("puppy", "car", "rabbit", "girl", "monkey")
 verbs = ("runs", "hits", "jumps", "drives", "barfs")
 adv = ("crazily.", "dutifully.", "foolishly.", "merrily.", "occasionally.")
 adj = ("adorable", "clueless", "dirty", "odd", "stupid")

 # Emit one sentence per iteration. The loop has no exit condition, so the
 # script prints until the process is killed.
 while True:
      # One shared index picks the noun, verb, adverb and adjective together;
      # the bound comes from the tuple length rather than a hard-coded 5.
      num = random.randrange(len(nouns))
      # A single parenthesised argument is valid both as a Python 2 print
      # statement and as a Python 3 print() call, and emits the same text.
      print(' '.join((nouns[num], verbs[num], adv[num], adj[num])))
diff --git a/Cmd1.md b/Cmd1.md
diff --git a/Cmd2.md b/Cmd2.md
diff --git a/network_count.py b/network_count.py

 """
 Counts words in UTF8 encoded, '\n' delimited text received from the network every second.
 Usage: network_wordcount.py <hostname> <port>
   <hostname> and <port> describe the TCP server that Spark Streaming would connect to receive data.

 To run this on your local machine, you need to first run a Netcat server
    `$ nc -lk 9999`
 and then run the example
    `$ bin/spark-submit examples/src/main/python/streaming/network_wordcount.py localhost 9999`
 """
 from __future__ import print_function

 import sys

 from pyspark import SparkContext
 from pyspark.streaming import StreamingContext

 if __name__ == "__main__":
      # Exactly two user-supplied arguments are required: <hostname> <port>.
      if len(sys.argv) != 3:
          print("Usage: network_wordcount.py <hostname> <port>", file=sys.stderr)
          # sys.exit is always available; the bare exit() helper is only
          # injected by the site module and is meant for interactive sessions.
          sys.exit(-1)

      sc = SparkContext(appName="PythonStreamingNetworkWordCount")
      # Second argument is the batch interval (1, i.e. counts every second as
      # described in the module docstring).
      ssc = StreamingContext(sc, 1)

      # Receive text from the TCP server given on the command line.
      lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
      # Split each line on single spaces, pair every word with 1, then sum the
      # ones per word to obtain the per-batch counts.
      counts = lines.flatMap(lambda line: line.split(" "))\
                    .map(lambda word: (word, 1))\
                    .reduceByKey(lambda a, b: a+b)
      counts.pprint()

      # Start the streaming computation and block until it terminates.
      ssc.start()
      ssc.awaitTermination()
	import random

	# Word banks for the sentence generator. All four tuples are indexed with
	# the same random position below, so they must stay the same length.
	nouns = ("puppy", "car", "rabbit", "girl", "monkey")
	verbs = ("runs", "hits", "jumps", "drives", "barfs")
	adv = ("crazily.", "dutifully.", "foolishly.", "merrily.", "occasionally.")
	adj = ("adorable", "clueless", "dirty", "odd", "stupid")

	# Emit one sentence per iteration. The loop has no exit condition, so the
	# script prints until the process is killed.
	while True:
	    # The loop body must be indented under `while`; the flattened paste
	    # had lost that nesting. One shared index picks all four words, and
	    # the bound comes from the tuple length rather than a hard-coded 5.
	    num = random.randrange(len(nouns))
	    # A single parenthesised argument is valid both as a Python 2 print
	    # statement and as a Python 3 print() call, and emits the same text.
	    print(' '.join((nouns[num], verbs[num], adv[num], adj[num])))

	"""
	Counts words in UTF8 encoded, '\n' delimited text received from the network every second.
	Usage: network_wordcount.py <hostname> <port>
	<hostname> and <port> describe the TCP server that Spark Streaming would connect to receive data.

	To run this on your local machine, you need to first run a Netcat server
	`$ nc -lk 9999`
	and then run the example
	`$ bin/spark-submit examples/src/main/python/streaming/network_wordcount.py localhost 9999`
	"""
	from __future__ import print_function

	import sys

	from pyspark import SparkContext
	from pyspark.streaming import StreamingContext

	if __name__ == "__main__":
	    # Exactly two user-supplied arguments are required: <hostname> <port>.
	    if len(sys.argv) != 3:
	        print("Usage: network_wordcount.py <hostname> <port>", file=sys.stderr)
	        # sys.exit is always available; the bare exit() helper is only
	        # injected by the site module and is meant for interactive sessions.
	        sys.exit(-1)

	    sc = SparkContext(appName="PythonStreamingNetworkWordCount")
	    # Second argument is the batch interval (1, i.e. counts every second
	    # as described in the module docstring).
	    ssc = StreamingContext(sc, 1)

	    # Receive text from the TCP server given on the command line.
	    lines = ssc.socketTextStream(sys.argv[1], int(sys.argv[2]))
	    # Split each line on single spaces, pair every word with 1, then sum
	    # the ones per word to obtain the per-batch counts.
	    counts = lines.flatMap(lambda line: line.split(" "))\
	                  .map(lambda word: (word, 1))\
	                  .reduceByKey(lambda a, b: a+b)
	    counts.pprint()

	    # Start the streaming computation and block until it terminates.
	    ssc.start()
	    ssc.awaitTermination()