• Flink ADD Multi Source


    import java.util.Properties

    import org.apache.flink.api.common.serialization.SimpleStringSchema
    import org.apache.flink.streaming.api.scala.{StreamExecutionEnvironment, _}
    import org.apache.flink.streaming.connectors.kafka.FlinkKafkaConsumer011

    /**
     * Streaming word count over several Kafka topics.
     *
     * Three Kafka consumers (topics `hello`, `hello1`, `hello2`) are registered as
     * sources on a local Flink environment, merged into a single stream with
     * `union`, split into space-separated words and reduced to a running count
     * per word. Every updated `(word, count)` pair is written to standard output,
     * one per line.
     */
    object MultiDataStreamExample {

      /**
       * Builds the job graph and submits it under the name "word count".
       *
       * @param args command-line arguments (unused)
       */
      def main(args: Array[String]): Unit = {
        // Set up the execution environment.
        val env: StreamExecutionEnvironment = StreamExecutionEnvironment.createLocalEnvironment()

        // Configure the data sources: one Kafka consumer per topic, all sharing
        // the same deserializer and connection properties.
        val valueDeserializer: SimpleStringSchema = new SimpleStringSchema
        val kafkaProps = new Properties()
        // NOTE(review): "node-3" does not follow the "node01"/"node02" naming of the
        // other brokers and may be a typo for "node03" -- confirm against the cluster.
        kafkaProps.setProperty("bootstrap.servers", "node01:9092,node02:9092,node-3:9092")
        kafkaProps.setProperty("group.id", "test")

        val helloStream: FlinkKafkaConsumer011[String] =
          new FlinkKafkaConsumer011[String]("hello", valueDeserializer, kafkaProps)
        val hello1Stream: FlinkKafkaConsumer011[String] =
          new FlinkKafkaConsumer011[String]("hello1", valueDeserializer, kafkaProps)
        val hello2Stream: FlinkKafkaConsumer011[String] =
          new FlinkKafkaConsumer011[String]("hello2", valueDeserializer, kafkaProps)

        val s1: DataStream[String] = env.addSource(helloStream)
        val s2: DataStream[String] = env.addSource(hello1Stream)
        val s3: DataStream[String] = env.addSource(hello2Stream)

        // Merge the three sources into one stream.
        val allStream: DataStream[String] = s1.union(s2, s3)

        // Computation logic: split into words, pair each with 1, sum per word.
        // Empty tokens (from empty messages or repeated/leading spaces) are dropped
        // so that "" is never counted as a word.
        val flatMapDataStream: DataStream[String] =
          allStream.flatMap(line => line.split(" ").filter(_.nonEmpty))
        val mapDataStream: DataStream[(String, Int)] = flatMapDataStream.map((_, 1))
        val keyedStream: KeyedStream[(String, Int), String] = mapDataStream.keyBy(_._1)
        // The reduce function is kept free of side effects; results are emitted
        // only by the sink below.
        val reduceDataStream: DataStream[(String, Int)] =
          keyedStream.reduce((x, y) => (x._1, x._2 + y._2))

        // Output the results, one (word, count) pair per line.
        reduceDataStream.addSink(x => println(x))

        // Submit the job.
        env.execute("word count")
      }
    }
    个人网站:shuoyizui.com 公众号:写个框架玩 近期在公众号会发布一系列文章,主要是想完成一个简化的MapReduce框架的编写。实现MapReduce编程模型、任务远程提交、任务分配、任务执行等功能。涉及到了动态代理、反射、网络通信、序列化、消息队列、Netty、自定义类加载器、多线程、Shell等技术点。
  • 相关阅读:
    Oracle数据库管理
    Oracle——范式
    GUID
    java课上知识点整理—语句
    java课上知识点整理—java代码结构、标识符、数据类型、运算符
    使用css实现时间轴
    超简单的轮播实现
    第一个vue示例-高仿微信
    12. thymeleaf中资源相对路径的解决
    11. 将博客部署到tomcat上
  • 原文地址:https://www.cnblogs.com/maoxiangyi/p/10911898.html
Copyright © 2020-2023  润新知