diff --git a/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PullBasedWordCount.scala b/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PullBasedWordCount.scala index e0d1ba5..89cf835 100644 --- a/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PullBasedWordCount.scala +++ b/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PullBasedWordCount.scala @@ -18,9 +18,8 @@ object PullBasedWordCount { // 1.获取输入流 val flumeStream = FlumeUtils.createPollingStream(ssc, "hadoop001", 8888) - // 2.词频统计 - flumeStream.map(line => new String(line.event.getBody.array()).trim) - .flatMap(_.split(" ")).map((_, 1)).reduceByKey(_ + _).print() + // 2.打印输入流中的数据 + flumeStream.map(line => new String(line.event.getBody.array()).trim).print() ssc.start() ssc.awaitTermination() diff --git a/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PushBasedWordCount.scala b/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PushBasedWordCount.scala index 6f5d6c0..cf3668f 100644 --- a/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PushBasedWordCount.scala +++ b/code/spark/spark-streaming-flume/src/main/scala/com/heibaiying/flume/PushBasedWordCount.scala @@ -19,9 +19,8 @@ object PushBasedWordCount { // 1.获取输入流 val flumeStream = FlumeUtils.createStream(ssc, "hadoop001", 8888) - // 2.词频统计 - flumeStream.map(line => new String(line.event.getBody.array()).trim) - .flatMap(_.split(" ")).map((_, 1)).reduceByKey(_ + _).print() + // 2.打印输入流的数据 + flumeStream.map(line => new String(line.event.getBody.array()).trim).print() ssc.start() ssc.awaitTermination() diff --git a/pictures/spark-flume-console.png b/pictures/spark-flume-console.png new file mode 100644 index 0000000..409f9fb Binary files /dev/null and b/pictures/spark-flume-console.png differ diff --git a/pictures/spark-flume-input.png b/pictures/spark-flume-input.png new file mode 100644 index 0000000..bef2384 Binary files /dev/null and b/pictures/spark-flume-input.png differ