summaryrefslogtreecommitdiff
path: root/src/main/java/com/zdjizhi/etl/SketchProcessFunction.java
blob: 54d53b6256cb82167c7bf0bbbcf848534ccefa47 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
package com.zdjizhi.etl;

import cn.hutool.core.convert.Convert;
import cn.hutool.log.Log;
import cn.hutool.log.LogFactory;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple5;
import org.apache.flink.streaming.api.functions.windowing.ProcessWindowFunction;
import org.apache.flink.streaming.api.windowing.windows.TimeWindow;
import org.apache.flink.util.Collector;

import java.util.LinkedHashMap;
import java.util.Map;

import static com.zdjizhi.common.FlowWriteConfig.LOG_AGGREGATE_DURATION;


/**
 * Window function that collapses all sketch logs of one keyed window into a single
 * aggregated record.
 *
 * <p>The window key is a {@code Tuple2}; its two fields are emitted as {@code src_ip}
 * and {@code dst_ip}. The emitted record is an insertion-ordered map with the keys
 * {@code start_time}, {@code end_time}, {@code src_ip}, {@code dst_ip},
 * {@code sessions}, {@code packets} and {@code bytes}.
 *
 * <p>Failures are handled on a best-effort basis: they are logged and the window simply
 * produces no output instead of failing the job.
 *
 * @author 94976
 */
public class SketchProcessFunction extends ProcessWindowFunction<Map<String, Object>, Map<String, Object>, Tuple2<String, String>, TimeWindow> {

    private static final Log logger = LogFactory.get();

    /**
     * Aggregates the window's elements and emits at most one result record.
     *
     * @param keys     window key; {@code f0} is written as {@code src_ip}, {@code f1} as {@code dst_ip}
     * @param context  window context (not used)
     * @param elements sketch logs collected for this key and window
     * @param out      collector receiving the aggregated record
     */
    @Override
    public void process(Tuple2<String, String> keys, Context context, Iterable<Map<String, Object>> elements, Collector<Map<String, Object>> out) {
        Map<String, Object> middleResult = getMiddleResult(keys, elements);
        if (middleResult == null) {
            // Aggregation failed and was already logged; nothing to emit.
            return;
        }
        try {
            out.collect(middleResult);
            // Pass the map itself so it is only rendered when the message is formatted.
            logger.debug("获取中间聚合结果:{}", middleResult);
        } catch (Exception e) {
            // Hand the exception to the Throwable overload so the stack trace is kept.
            logger.error(e, "获取中间聚合结果失败,middleResult: {}", middleResult);
        }
    }

    /**
     * Builds the output record from the window key and the aggregated values.
     *
     * @param keys     window key providing {@code src_ip} / {@code dst_ip}
     * @param elements sketch logs to aggregate
     * @return the result record, or {@code null} when aggregation or assembly failed
     */
    private Map<String, Object> getMiddleResult(Tuple2<String, String> keys, Iterable<Map<String, Object>> elements) {

        Tuple5<Long, Long, Long, Long, Long> values = connAggregate(elements);
        if (values == null) {
            return null;
        }
        try {
            // LinkedHashMap keeps the field order stable in the emitted record.
            Map<String, Object> result = new LinkedHashMap<>();
            result.put("start_time", values.f0);
            result.put("end_time", values.f1);
            result.put("src_ip", keys.f0);
            result.put("dst_ip", keys.f1);
            result.put("sessions", values.f2);
            result.put("packets", values.f3);
            result.put("bytes", values.f4);
            return result;
        } catch (Exception e) {
            logger.error(e, "加载中间结果集失败,keys: {} values: {}", keys, values);
        }
        return null;
    }

    /**
     * Sums the session/packet/byte counters and tracks the earliest and latest
     * {@code sketch_start_time} across all elements.
     *
     * <p>The minimum and maximum are taken from the records themselves. The wall clock
     * (in seconds) is used only as a fallback when no record carries a usable start time,
     * e.g. for an empty input. A counter field that is missing or not convertible
     * contributes 0, and a missing start time is ignored, so one incomplete record does
     * not discard the whole window.
     *
     * @param elements sketch logs to aggregate
     * @return {@code (startTime, endTime + LOG_AGGREGATE_DURATION, sessions, packets, bytes)},
     *         or {@code null} if aggregation failed unexpectedly
     */
    private Tuple5<Long, Long, Long, Long, Long> connAggregate(Iterable<Map<String, Object>> elements) {
        long sessions = 0;
        long packets = 0;
        long bytes = 0;
        long startTime = Long.MAX_VALUE;
        long endTime = Long.MIN_VALUE;
        boolean sawStartTime = false;
        try {
            for (Map<String, Object> sketchLog : elements) {
                sessions += toLongOrZero(sketchLog.get("sketch_sessions"));
                packets += toLongOrZero(sketchLog.get("sketch_packets"));
                bytes += toLongOrZero(sketchLog.get("sketch_bytes"));

                // Keep the boxed value: unboxing a null here would throw.
                Long connStartTime = Convert.toLong(sketchLog.get("sketch_start_time"));
                if (connStartTime != null) {
                    startTime = Math.min(startTime, connStartTime);
                    endTime = Math.max(endTime, connStartTime);
                    sawStartTime = true;
                }
            }
            if (!sawStartTime) {
                // No timestamp in the data: fall back to the current time in seconds.
                long now = System.currentTimeMillis() / 1000;
                startTime = now;
                endTime = now;
            }
            return Tuple5.of(startTime, endTime + LOG_AGGREGATE_DURATION, sessions, packets, bytes);
        } catch (Exception e) {
            logger.error(e, "聚合中间结果集失败");
        }
        return null;
    }

    /**
     * Converts a raw field value to {@code long}, treating a {@code null} conversion
     * result as 0.
     */
    private static long toLongOrZero(Object value) {
        Long converted = Convert.toLong(value);
        return converted == null ? 0L : converted;
    }
}