Flink DataSet 的 union 操作:union 实例(Java 版本)

对两个数据集(DataSet)执行 union 时不会去重:两个输入中都存在的元素会在结果中各出现一次。

package union;

import org.apache.flink.api.java.DataSet;
import org.apache.flink.api.java.ExecutionEnvironment;
import org.apache.flink.api.java.tuple.Tuple2;

/**
 * Demonstrates {@code DataSet.union} in the Flink batch (DataSet) API.
 *
 * <p>Two small in-memory data sets with overlapping elements are unioned and the
 * result is printed. {@code union} does not deduplicate, so an element that is
 * present in both inputs shows up twice in the output.
 *
 * <p>Created 2020/6/17 12:33.
 *
 * @author you guess
 * @version 1.0
 */
public class UnionDataSetTest {

    /**
     * Builds two tuple data sets, unions them and prints the combined elements.
     *
     * @param args command-line arguments (unused)
     * @throws Exception if the Flink job fails while executing
     */
    public static void main(String[] args) throws Exception {
        ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();

        DataSet<Tuple2<Long, String>> source1 = env.fromElements(
                Tuple2.of(1L, "xiaoming"),
                Tuple2.of(2L, "xiaowang"));

        DataSet<Tuple2<Long, String>> source2 = env.fromElements(
                Tuple2.of(1L, "xiaoming"),
                Tuple2.of(2L, "xiaowang"),
                Tuple2.of(3L, "hhhhhh"));

        // union keeps duplicates; DataSet offers no separate unionAll method.
        // Chain distinct() after the union if deduplication is required.
        //
        // Expected output (element order is not guaranteed):
        //   (1,xiaoming)
        //   (1,xiaoming)
        //   (2,xiaowang)
        //   (2,xiaowang)
        //   (3,hhhhhh)
        source1.union(source2).print();

        // print() itself triggers execution of the batch job. Do not call
        // env.execute() afterwards: with no new sink defined since the last
        // execution it throws java.lang.RuntimeException. An explicit execute()
        // is only needed for DataStream programs or DataSet programs that end
        // in a lazy sink.
    }
}

Flink 版本 1.9.2,Java 版本 1.8

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章