diff options
| author | zhanghongqing <[email protected]> | 2022-07-07 14:07:27 +0800 |
|---|---|---|
| committer | zhanghongqing <[email protected]> | 2022-07-07 14:07:27 +0800 |
| commit | f552793230d0428cbc63714ee296c1ce4971a31b (patch) | |
| tree | 1bf3a26d957710b261f61a65559d393f55bf9382 /src/main/java/com/zdjizhi/etl/DnsProcessFunction.java | |
Initial commit
Diffstat (limited to 'src/main/java/com/zdjizhi/etl/DnsProcessFunction.java')
| -rw-r--r-- | src/main/java/com/zdjizhi/etl/DnsProcessFunction.java | 101 |
1 files changed, 101 insertions, 0 deletions
diff --git a/src/main/java/com/zdjizhi/etl/DnsProcessFunction.java b/src/main/java/com/zdjizhi/etl/DnsProcessFunction.java new file mode 100644 index 0000000..46d0814 --- /dev/null +++ b/src/main/java/com/zdjizhi/etl/DnsProcessFunction.java @@ -0,0 +1,101 @@ +package com.zdjizhi.etl; + +import cn.hutool.core.convert.Convert; +import cn.hutool.core.util.StrUtil; +import com.zdjizhi.enums.DnsType; +import org.apache.flink.streaming.api.functions.windowing.ProcessWindowFunction; +import org.apache.flink.streaming.api.windowing.windows.TimeWindow; +import org.apache.flink.util.Collector; +import org.slf4j.Logger; +import org.slf4j.LoggerFactory; + +import java.util.ArrayList; +import java.util.HashMap; +import java.util.List; +import java.util.Map; + +import static com.zdjizhi.common.FlowWriteConfig.LOG_AGGREGATE_DURATION; + + +/** + * @author 94976 + */ +public class DnsProcessFunction extends ProcessWindowFunction<Map<String, Object>, Map<String, Object>, String, TimeWindow> { + + private static final Logger logger = LoggerFactory.getLogger(DnsProcessFunction.class); + + @Override + public void process(String keys, Context context, Iterable<Map<String, Object>> elements, Collector<Map<String, Object>> out) { + + try { + getMiddleResult(out, elements); + } catch (Exception e) { + logger.error("获取中间聚合结果失败,middleResult: {}", e); + } + } + + /** + * 拆分dns_record + * 五种:a/aaaa/cname/mx/ns + * + * @param elements + * @return + */ + private void getMiddleResult(Collector<Map<String, Object>> out, Iterable<Map<String, Object>> elements) { + long startTime = System.currentTimeMillis() / 1000; + long endTime = System.currentTimeMillis() / 1000; + String dnsQname = ""; + try { + Map<String, Long> distinctA = new HashMap<>(); + Map<String, Long> distinctAAAA = new HashMap<>(); + Map<String, Long> distinctCname = new HashMap<>(); + Map<String, Long> distinctNs = new HashMap<>(); + Map<String, Long> distinctMx = new HashMap<>(); + for (Map<String, Object> log : elements) { + List<String> dnsA = splitDns(log, "dns_a"); + List<String> dnsAAAA = splitDns(log, "dns_aaaa"); + List<String> dnsCname = splitDns(log, "dns_cname"); + List<String> dnsNs = splitDns(log, "dns_ns"); + List<String> dnsMx = splitDns(log, "dns_mx"); + + dnsA.forEach(x -> distinctA.merge(x, 1L, Long::sum)); + dnsAAAA.forEach(x -> distinctAAAA.merge(x, 1L, Long::sum)); + dnsCname.forEach(x -> distinctCname.merge(x, 1L, Long::sum)); + dnsNs.forEach(x -> distinctNs.merge(x, 1L, Long::sum)); + dnsMx.forEach(x -> distinctMx.merge(x, 1L, Long::sum)); + + long connStartTimetime = Convert.toLong(log.get("capure_time_s")); + startTime = connStartTimetime < startTime ? connStartTimetime : startTime; + endTime = connStartTimetime > endTime ? connStartTimetime : endTime; + dnsQname = StrUtil.toString(log.get("dns_qname")); + } + getNewDns(startTime, endTime, dnsQname, distinctA, DnsType.a.toString(), out); + getNewDns(startTime, endTime, dnsQname, distinctAAAA, DnsType.aaaa.toString(), out); + getNewDns(startTime, endTime, dnsQname, distinctCname, DnsType.cname.toString(), out); + getNewDns(startTime, endTime, dnsQname, distinctNs, DnsType.ns.toString(), out); + getNewDns(startTime, endTime, dnsQname, distinctMx, DnsType.mx.toString(), out); + + } catch (Exception e) { + logger.error("聚合中间结果集失败 {}", e); + } + } + + + private static List<String> splitDns(Map<String, Object> log, String key) { + + return StrUtil.split(StrUtil.toString(log.get(key)), ","); + } + + private void getNewDns(long startTime, long endTime, String dnsQname, Map<String, Long> distinctMap, String type, Collector<Map<String, Object>> out) { + for (Map.Entry<String, Long> dns : distinctMap.entrySet()) { + Map<String, Object> newDns = new HashMap<>(); + newDns.put("start_time", startTime); + newDns.put("end_time", endTime + LOG_AGGREGATE_DURATION); + newDns.put("record_type", type); + newDns.put("qname", dnsQname); + newDns.put("record", dns.getKey()); + newDns.put("sessions", dns.getValue()); + out.collect(newDns); + } + } +} |
