!pip install -q findspark
import findspark
findspark.init('/home/bigdata/Documents/spark-3.0.0')
from pyspark import SparkContext, SparkConf
from pyspark.streaming import StreamingContext
# Windowed streaming job: read text lines from a local socket, flag every
# word that equals 'spark', and print the flags seen in a sliding window.
config = SparkConf().setAppName("Window Operation")
sc = SparkContext(conf=config)

# Batch interval of 1 second; the window/slide durations below must be
# multiples of it.
ssc = StreamingContext(sc, 1)
ssc.checkpoint("checkpoint")

# Source: newline-delimited text served on localhost:5000.
lines = ssc.socketTextStream("localhost", 5000)
words = lines.flatMap(lambda line: line.split(" "))

# One integer per word: 1 when the word is exactly 'spark', otherwise 0.
pairs = words.map(lambda word: 1 if word == 'spark' else 0)

# Every 5 seconds, print the flags collected over the last 15 seconds.
pairs.window(15, 5).pprint()

try:
    ssc.start()
    # start() returns immediately; without blocking here the context would
    # be stopped before a single window has had time to fill and print.
    ssc.awaitTermination()
finally:
    # Always release the streaming and Spark contexts, including on
    # KeyboardInterrupt or a failed batch.
    # NOTE: 'stopGraceFully' is the actual PySpark keyword spelling.
    ssc.stop(stopSparkContext=True, stopGraceFully=True)