//輸入源
/**
 * Spark Streaming word count over text files read from a watched directory.
 *
 * For every batch interval the incoming lines are split into words and the
 * number of occurrences of each word within that batch is printed.
 */
object WordCountHDFSSource {
  /**
   * Builds the streaming word-count job, starts it, and blocks until the
   * streaming context terminates.
   *
   * @param args command-line arguments (not used)
   */
  def main(args: Array[String]): Unit = {
    // Fall back to this development machine's Hadoop install only when no
    // hadoop.home.dir was supplied (e.g. via -Dhadoop.home.dir=...), so an
    // explicit setting is no longer overwritten.
    if (sys.props.get("hadoop.home.dir").isEmpty) {
      System.setProperty("hadoop.home.dir", "E:\\software\\bigdate\\hadoop-2.6.0-cdh5.15.0\\hadoop-2.6.0-cdh5.15.0")
    }

    val conf = new SparkConf()
      .setMaster("local[2]") // run locally with two worker threads
      .setAppName("WordCountStreaming")
    val sc = new SparkContext(conf)

    // Batch interval, in seconds.
    val batchSeconds = 5
    val streamingContext = new StreamingContext(sc, Seconds(batchSeconds))

    // Watch the local directory for input text.
    val sourceDS = streamingContext.textFileStream("E:\\sparkdata")

    // Split on runs of whitespace and drop empty tokens: a plain split(" ")
    // yields "" for blank lines, leading spaces and repeated spaces, which
    // would then be counted as a word.
    sourceDS
      .flatMap(line => line.split("\\s+").filter(_.nonEmpty))
      .map(word => (word, 1))
      .reduceByKey(_ + _)
      .print()

    streamingContext.start()
    streamingContext.awaitTermination()
  }
}