summaryrefslogtreecommitdiff
path: root/src/main/java/com/zdjizhi/etl/connection/SketchProcessFunction.java
blob: b27958a6bce85ee0a5aff85f6c448792b511329d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
package com.zdjizhi.etl.connection;

import cn.hutool.core.convert.Convert;
import cn.hutool.core.date.DateUtil;
import cn.hutool.log.Log;
import cn.hutool.log.LogFactory;
import com.alibaba.fastjson.util.TypeUtils;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple5;
import org.apache.flink.streaming.api.functions.windowing.ProcessWindowFunction;
import org.apache.flink.streaming.api.windowing.windows.TimeWindow;
import org.apache.flink.util.Collector;

import java.util.LinkedHashMap;
import java.util.Map;

import static com.zdjizhi.common.FlowWriteConfig.LOG_AGGREGATE_DURATION;


/**
 * Flink window function that folds every sketch log of one key within a time window
 * into a single aggregated record.
 *
 * <p>The window key is a pair whose first field is written out as {@code src_ip} and whose
 * second field is written out as {@code dst_ip}. The emitted map contains, in insertion
 * order: {@code start_time}, {@code end_time}, {@code src_ip}, {@code dst_ip},
 * {@code sessions}, {@code packets} and {@code bytes}.
 *
 * @author 94976
 */
public class SketchProcessFunction extends ProcessWindowFunction<Map<String, Object>, Map<String, Object>, Tuple2<String, String>, TimeWindow> {

    private static final Log logger = LogFactory.get();

    /**
     * Aggregates the elements of the window and emits the aggregated record, if one could be built.
     *
     * <p>Failures while emitting are logged (with stack trace) and swallowed, so a failing
     * record does not propagate an exception out of this function.
     *
     * @param keys     window key; {@code f0} becomes {@code src_ip}, {@code f1} becomes {@code dst_ip}
     * @param context  window context (not used)
     * @param elements sketch logs collected for this key and window
     * @param out      collector receiving at most one aggregated record
     */
    @Override
    public void process(Tuple2<String, String> keys, Context context, Iterable<Map<String, Object>> elements, Collector<Map<String, Object>> out) {
        Map<String, Object> middleResult = getMiddleResult(keys, elements);
        if (middleResult == null) {
            // Aggregation failed and was already logged; nothing to emit.
            return;
        }
        try {
            out.collect(middleResult);
            // Pass the map itself so it is only rendered when debug logging is enabled.
            logger.debug("获取中间聚合结果:{}", middleResult);
        } catch (Exception e) {
            // Throwable goes first so the logger records the stack trace, not just e.toString().
            logger.error(e, "获取中间聚合结果失败,middleResult: {}", middleResult);
        }
    }

    /**
     * Builds the output record for one key from the aggregated values.
     *
     * @param keys     window key supplying {@code src_ip} ({@code f0}) and {@code dst_ip} ({@code f1})
     * @param elements sketch logs to aggregate
     * @return the aggregated record, or {@code null} if aggregation or record assembly failed
     */
    private Map<String, Object> getMiddleResult(Tuple2<String, String> keys, Iterable<Map<String, Object>> elements) {
        Tuple5<Long, Long, Long, Long, Long> values = connAggregate(elements);
        if (values == null) {
            return null;
        }
        try {
            Map<String, Object> result = new LinkedHashMap<>();
            result.put("start_time", values.f0);
            result.put("end_time", values.f1);
            result.put("src_ip", keys.f0);
            result.put("dst_ip", keys.f1);
            result.put("sessions", values.f2);
            result.put("packets", values.f3);
            result.put("bytes", values.f4);
            return result;
        } catch (Exception e) {
            logger.error(e, "加载中间结果集失败,keys: {} values: {}", keys, values);
            return null;
        }
    }

    /**
     * Sums sessions, packets and bytes over all valid sketch logs and determines the range of
     * their {@code sketch_start_time} values.
     *
     * <p>A log is valid when its {@code sketch_start_time} converts to a number greater than 0.
     * Invalid, {@code null} or unparsable logs are skipped individually instead of discarding
     * the whole window. A missing counter field contributes 0.
     *
     * <p>If no valid log is present, both time bounds fall back to the current time in seconds.
     * NOTE(review): {@code sketch_start_time} is presumably epoch seconds, since it is combined
     * with {@code DateUtil.currentSeconds()} — confirm, together with the unit of
     * {@code LOG_AGGREGATE_DURATION}.
     *
     * @param elements sketch logs to aggregate
     * @return tuple of (earliest start time, latest start time + {@code LOG_AGGREGATE_DURATION},
     *         sessions, packets, bytes), or {@code null} if iterating the elements failed
     */
    private Tuple5<Long, Long, Long, Long, Long> connAggregate(Iterable<Map<String, Object>> elements) {
        long sessions = 0L;
        long packets = 0L;
        long bytes = 0L;
        // Seed the bounds from the data, not from the wall clock: seeding endTime with "now"
        // made Math.max ignore every non-future timestamp in the window.
        long startTime = Long.MAX_VALUE;
        long endTime = Long.MIN_VALUE;
        boolean sawValidLog = false;
        try {
            for (Map<String, Object> sketchLog : elements) {
                if (sketchLog == null) {
                    continue;
                }
                try {
                    // The default of 0 marks a missing/unconvertible start time as invalid.
                    long connStartTime = Convert.toLong(sketchLog.get("sketch_start_time"), 0L);
                    if (connStartTime <= 0) {
                        continue;
                    }
                    // Parse all counters before adding any, so a bad record is never half-counted.
                    long logSessions = counterOf(sketchLog, "sketch_sessions");
                    long logPackets = counterOf(sketchLog, "sketch_packets");
                    long logBytes = counterOf(sketchLog, "sketch_bytes");

                    sessions += logSessions;
                    packets += logPackets;
                    bytes += logBytes;
                    startTime = Math.min(connStartTime, startTime);
                    endTime = Math.max(connStartTime, endTime);
                    sawValidLog = true;
                } catch (RuntimeException e) {
                    logger.warn(e, "跳过无法解析的sketch日志: {}", sketchLog);
                }
            }
            if (!sawValidLog) {
                // Keep the previous output for windows without any valid log: both bounds are "now".
                long now = DateUtil.currentSeconds();
                startTime = now;
                endTime = now;
            }
            return Tuple5.of(startTime, endTime + LOG_AGGREGATE_DURATION, sessions, packets, bytes);
        } catch (Exception e) {
            logger.error(e, "聚合中间结果集失败");
        }
        return null;
    }

    /**
     * Reads a numeric counter field from a sketch log.
     *
     * @param sketchLog the log to read from
     * @param field     name of the counter field
     * @return the field converted to {@code long}, or 0 when the conversion yields {@code null}
     */
    private static long counterOf(Map<String, Object> sketchLog, String field) {
        Long value = TypeUtils.castToLong(sketchLog.get(field));
        return value == null ? 0L : value;
    }
}