Spark Streaming 主动从 Flume 拉取(poll)数据

来源:互联网 发布:ff14捏脸数据下载 编辑:程序博客网 时间:2024/05/18 13:10
import java.net.InetSocketAddress
import java.nio.charset.StandardCharsets

import org.apache.spark.SparkConf
import org.apache.spark.storage.StorageLevel
import org.apache.spark.streaming.flume.FlumeUtils
import org.apache.spark.streaming.{Seconds, StreamingContext}

/**
 * Streaming word count over events polled from Flume.
 *
 * Builds a polling Flume stream against a fixed address, splits each event
 * body on single spaces, and prints the per-batch count of every word.
 */
object FlumePollWordCount {

  /**
   * Entry point: configures the streaming context, wires up the word-count
   * pipeline, then starts the context and blocks until it terminates.
   *
   * @param args command-line arguments; not read by this program
   */
  def main(args: Array[String]): Unit = {
    val conf = new SparkConf().setAppName("FlumePollWordCount").setMaster("local[2]")
    // Batches are formed every 5 seconds.
    val ssc = new StreamingContext(conf, Seconds(5))

    // Pull data from Flume (this is the Flume-side address to poll).
    val address = Seq(new InetSocketAddress("172.16.0.11", 8888))
    val flumeStream = FlumeUtils.createPollingStream(ssc, address, StorageLevel.MEMORY_AND_DISK)

    // Decode each event body explicitly as UTF-8 rather than relying on the
    // JVM's platform default charset, then pair every token with a count of 1.
    // NOTE(review): `array()` exposes the whole backing array of the body
    // buffer — presumably the buffer wraps exactly the payload; confirm.
    val words = flumeStream
      .flatMap(x => new String(x.event.getBody().array(), StandardCharsets.UTF_8).split(" "))
      .map((_, 1))

    // Sum the counts per word within each batch and print a sample to stdout.
    val results = words.reduceByKey(_ + _)
    results.print()

    ssc.start()
    ssc.awaitTermination()
  }
}

原创粉丝点击