滚动窗口
- 窗口之间时间不重叠,只有一个时间参数(窗口大小),即每隔多长时间滚动一次
- 滚动窗口又分为滚动事件时间窗口和滚动处理时间窗口
- 事件时间指数据本身携带的时间字段(事件发生的时间)
- 处理时间指算子处理该数据时所在机器的系统时间
TumblingProcess
package com.hehe.window;
import org.apache.flink.api.common.functions.FlatMapFunction;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.streaming.api.datastream.DataStreamSource;
import org.apache.flink.streaming.api.datastream.SingleOutputStreamOperator;
import org.apache.flink.streaming.api.environment.StreamExecutionEnvironment;
import org.apache.flink.streaming.api.windowing.assigners.TumblingProcessingTimeWindows;
import org.apache.flink.streaming.api.windowing.time.Time;
import org.apache.flink.util.Collector;
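// Counts each comma-separated token over 10-second tumbling processing-time windows;
// windows do not overlap, so counts are not accumulated from one window to the next.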
public class TumblingProcess {
public static void main(String[] args) {
StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
DataStreamSource<String> ds = env.socketTextStream("master", 8888);
SingleOutputStreamOperator<Tuple2<String, Integer>> sum = ds.flatMap(new FlatMapFunction<String, Tuple2<String, Integer>>() {
/*
 * Splits one input line on commas and emits a (token, 1) pair for every
 * resulting token, so that a downstream sum over field 1 yields per-token counts.
 */
@Override
public void flatMap(String s, Collector<Tuple2<String, Integer>> collector) {
    final String[] tokens = s.split(",");
    for (int i = 0; i < tokens.length; i++) {
        // Each occurrence contributes a count of one.
        Tuple2<String, Integer> pair = Tuple2.of(tokens[i], 1);
        collector.collect(pair);
    }
}
}).keyBy(0).window(TumblingProcessingTimeWindows.of(Time.seconds(10))).sum(1);
sum.print().setParallelism(1);
try {