# 11.03.2020
import findspark
findspark.init('/home/bigdata/Documents/spark-3.0.0')
from pyspark import SparkContext, SparkConf
from pyspark.streaming import StreamingContext
# Streaming word count over a sliding window.
#
# Reads text lines from a TCP socket on localhost:5000, splits each line on
# single spaces, counts occurrences of each token over a sliding window, and
# writes every window's counts to text files under the "output/counter" prefix.
config = SparkConf().setAppName("output_operation_example")
sc = SparkContext(conf=config)
ssc = StreamingContext(sc, 1)  # batch interval: 1 second

# A checkpoint directory is set up front because the windowed count below is
# a stateful operation (see the Spark Streaming guide on checkpointing).
ssc.checkpoint("checkpoint")

lines = ssc.socketTextStream("localhost", 5000)
words = lines.flatMap(lambda line: line.split(" "))

# Window length 15 and slide interval 5 (same unit as the batch interval;
# both are multiples of it).
counter = words.countByValueAndWindow(15, 5)
counter.saveAsTextFiles("output/counter")

ssc.start()
try:
    # Block until the stream is terminated (externally, by an error, or by
    # Ctrl-C). Without this the script would call stop() right after start()
    # and shut down before any window had a chance to complete.
    ssc.awaitTermination()
finally:
    # Always release the streaming and Spark contexts, asking Spark to finish
    # processing already-received data first.
    ssc.stop(stopGraceFully=True, stopSparkContext=True)