diff --git a/pom.xml b/pom.xml
index 7cdc355..221db19 100644
--- a/pom.xml
+++ b/pom.xml
@@ -6,7 +6,7 @@
com.zdjizhi
knowledge-log
- 202207
+ 20220722
log-completion-schema
http://www.example.com
@@ -174,23 +174,6 @@
${scope.type}
-
-
- org.apache.zookeeper
- zookeeper
- 3.4.10
-
-
- slf4j-log4j12
- org.slf4j
-
-
- log4j-over-slf4j
- org.slf4j
-
-
-
-
cglib
cglib-nodep
@@ -204,12 +187,6 @@
compile
-
- org.apache.httpcomponents
- httpclient
- 4.5.2
-
-
com.jayway.jsonpath
json-path
diff --git a/properties/service_flow_config.properties b/properties/service_flow_config.properties
index 7fef174..bffc433 100644
--- a/properties/service_flow_config.properties
+++ b/properties/service_flow_config.properties
@@ -1,6 +1,6 @@
#--------------------------------\u5730\u5740\u914D\u7F6E------------------------------#
#\u7BA1\u7406kafka\u5730\u5740,\u591A\u53F0\u9017\u53F7\u8FDE\u63A5ip1:9094,ip2:9094
-source.kafka.servers=192.168.45.102:9094
+source.kafka.servers=192.168.44.85:9094,192.168.44.86:9094,192.168.44.87:9094
#\u7BA1\u7406\u8F93\u51FAkafka\u5730\u5740
sink.kafka.servers=
@@ -8,14 +8,14 @@ sink.kafka.servers=
tools.library=
#--------------------------------Kafka\u6D88\u8D39/\u751F\u4EA7\u914D\u7F6E------------------------------#
#\u8BFB\u53D6topic,\u5B58\u50A8\u8BE5spout id\u7684\u6D88\u8D39offset\u4FE1\u606F\uFF0C\u53EF\u901A\u8FC7\u8BE5\u62D3\u6251\u547D\u540D;\u5177\u4F53\u5B58\u50A8offset\u7684\u4F4D\u7F6E\uFF0C\u786E\u5B9A\u4E0B\u6B21\u8BFB\u53D6\u4E0D\u91CD\u590D\u7684\u6570\u636E\uFF1B
-group.id=KNOWLEDGE-GROUP
+group.id=KNOWLEDGE-GROUP3
#--------------------------------topology\u914D\u7F6E------------------------------#
#consumer \u5E76\u884C\u5EA6
-source.parallelism=12
+source.parallelism=1
#\u8F6C\u6362\u51FD\u6570\u5E76\u884C\u5EA6
-transform.parallelism=12
+transform.parallelism=1
#kafka producer \u5E76\u884C\u5EA6
-sink.parallelism=12
+sink.parallelism=1
#--------------------------------\u4E1A\u52A1\u914D\u7F6E------------------------------#
#1 connection\u65E5\u5FD7 \uFF0C2 dns\u65E5\u5FD7
@@ -24,7 +24,7 @@ log.type=1
#\u751F\u4EA7\u8005\u538B\u7F29\u6A21\u5F0F none or snappy
producer.kafka.compression.type=none
#kafka\u6570\u636E\u6E90topic
-source.kafka.topic.connection=CONNECTION-RECORD-LOG
+source.kafka.topic.connection=test12
source.kafka.topic.sketch=CONNECTION-SKETCH-RECORD-LOG
source.kafka.topic.dns=DNS-RECORD-LOG
#\u5199\u5165clickhouse\u672C\u5730\u8868
@@ -40,10 +40,10 @@ sink.arangodb.table.r.mx.domain2domain=R_MX_DOMAIN2DOMAIN
sink.arangodb.table.r.resolve.domain2ip=R_RESOLVE_DOMAIN2IP
sink.arangodb.table.r.nx.domain2domain=R_NX_DOMAIN2DOMAIN
-#\u4F7F\u7528flink\u5165\u5E93\u539F\u59CB\u65E5\u5FD7\uFF0C\u6216\u8005\u9009\u62E9\u5B89\u88C5gohangout\u5165\u5E93 0\uFF1A\u5426\uFF0C1\uFF1A\u662F
+#\u4F7F\u7528flink\u5165\u5E93\u539F\u59CB\u65E5\u5FD70\uFF1A\u5426\uFF0C1\uFF1A\u662F
sink.ck.raw.log.insert.open=1
#clickhouse\u914D\u7F6E\uFF0C\u591A\u4E2A\u9017\u53F7\u8FDE\u63A5 ip1:8123,ip2:8123
-ck.hosts=192.168.45.102:8123,192.168.45.102:8123
+ck.hosts=192.168.44.85:8123,192.168.44.86:8123,192.168.44.87:8123
ck.database=tsg_galaxy_v3
ck.username=default
ck.pin=galaxy2019
@@ -53,7 +53,7 @@ ck.socket.timeout=300000
#clickhouse\u5165\u5E93\u6279\u91CF\u5355\u4F4D\u6761
ck.batch=10
#clickhouse\u5165\u5E93\u524D\u79EF\u7D2F\u6279\u91CF\u65F6\u95F4\u5355\u4F4D\u6BEB\u79D2
-sink.ck.batch.delay.time=1000
+sink.ck.batch.delay.time=2000
#flink \u65E5\u5FD7\u5EF6\u8FDF\u8D85\u65F6\u65F6\u95F4
flink.watermark.max.delay.time=50
@@ -68,8 +68,8 @@ arangodb.port=8529
arangodb.user=root
arangodb.password=galaxy_2019
arangodb.db.name=knowledge
-arangodb.batch=100000
+arangodb.batch=10000
arangodb.ttl=3600
arangodb.thread.pool.number=10
#\u6279\u91CF\u7D2F\u8BA1\u65F6\u95F4\u5355\u4F4D\u6BEB\u79D2ms
-sink.arangodb.batch.delay.time=5
\ No newline at end of file
+sink.arangodb.batch.delay.time=1000
\ No newline at end of file
diff --git a/src/main/java/com/zdjizhi/enums/DnsType.java b/src/main/java/com/zdjizhi/enums/DnsType.java
index a5c5586..95776c8 100644
--- a/src/main/java/com/zdjizhi/enums/DnsType.java
+++ b/src/main/java/com/zdjizhi/enums/DnsType.java
@@ -9,11 +9,11 @@ import static com.zdjizhi.common.FlowWriteConfig.*;
**/
public enum DnsType {
//对应dns类型,编码,入库表
- A("a", "0x0001", R_RESOLVE_DOMAIN2IP),
- AAAA("aaaa", "0x001c", R_RESOLVE_DOMAIN2IP),
- CNAME("cname", "0x0005", R_CNAME_DOMAIN2DOMAIN),
- MX("mx", "0x000f", R_MX_DOMAIN2DOMAIN),
- NS("ns", "0x0002", R_NX_DOMAIN2DOMAIN);
+ A("a", "1", R_RESOLVE_DOMAIN2IP),
+ AAAA("aaaa", "28", R_RESOLVE_DOMAIN2IP),
+ CNAME("cname", "5", R_CNAME_DOMAIN2DOMAIN),
+ MX("mx", "15", R_MX_DOMAIN2DOMAIN),
+ NS("ns", "2", R_NX_DOMAIN2DOMAIN);
private String type;
private String code;
diff --git a/src/main/java/com/zdjizhi/etl/CountTriggerWithTimeout.java b/src/main/java/com/zdjizhi/etl/CountTriggerWithTimeout.java
index ba348bd..66b36a9 100644
--- a/src/main/java/com/zdjizhi/etl/CountTriggerWithTimeout.java
+++ b/src/main/java/com/zdjizhi/etl/CountTriggerWithTimeout.java
@@ -54,7 +54,6 @@ public class CountTriggerWithTimeout extends Trigger {
this.stateName = stateName;
}
-
private TriggerResult fireAndPurge(TimeWindow window, TriggerContext ctx) throws Exception {
clear(window, ctx);
return TriggerResult.FIRE_AND_PURGE;
@@ -90,7 +89,7 @@ public class CountTriggerWithTimeout extends Trigger {
if (time >= window.getEnd()) {
return TriggerResult.CONTINUE;
} else {
- logger.info("fire with process tiem: " + time);
+ logger.debug("fire with process tiem: " + time);
return fireAndPurge(window, ctx);
}
}
@@ -106,7 +105,7 @@ public class CountTriggerWithTimeout extends Trigger {
if (time >= window.getEnd()) {
return TriggerResult.CONTINUE;
} else {
- logger.info("fire with event tiem: " + time);
+ logger.debug("fire with event tiem: " + time);
return fireAndPurge(window, ctx);
}
}
diff --git a/src/main/java/com/zdjizhi/etl/LogFormat.java b/src/main/java/com/zdjizhi/etl/LogFormat.java
new file mode 100644
index 0000000..c0edaa8
--- /dev/null
+++ b/src/main/java/com/zdjizhi/etl/LogFormat.java
@@ -0,0 +1,19 @@
+package com.zdjizhi.etl;
+
+import com.zdjizhi.utils.json.TypeUtils;
+
+import java.util.Map;
+// Static helpers that rewrite the start-time entry of a log record (a Map) in place.
+public class LogFormat {
+ // Replaces "conn_start_time" with TypeUtils.coverMSToS(old value) and returns the same, mutated map. NOTE(review): presumably a milliseconds-to-seconds conversion, judging by the helper name -- confirm.
+ public static Map connTime(Map value) {
+ value.put("conn_start_time", TypeUtils.coverMSToS(value.get("conn_start_time")));
+ return value;
+ }
+ // Counterpart of connTime for the "sketch_start_time" key: the entry is replaced with
+ // TypeUtils.coverMSToS(old value) and the same (mutated) input map is returned.
+ public static Map sketchTime(Map value) {
+ value.put("sketch_start_time", TypeUtils.coverMSToS(value.get("sketch_start_time")));
+ return value;
+ }
+}
diff --git a/src/main/java/com/zdjizhi/etl/connection/ConnProcessFunction.java b/src/main/java/com/zdjizhi/etl/connection/ConnProcessFunction.java
index cec2425..6fa11d6 100644
--- a/src/main/java/com/zdjizhi/etl/connection/ConnProcessFunction.java
+++ b/src/main/java/com/zdjizhi/etl/connection/ConnProcessFunction.java
@@ -1,6 +1,7 @@
package com.zdjizhi.etl.connection;
import cn.hutool.core.convert.Convert;
+import cn.hutool.core.date.DateUtil;
import cn.hutool.log.Log;
import cn.hutool.log.LogFactory;
import org.apache.flink.api.java.tuple.Tuple2;
@@ -47,8 +48,8 @@ public class ConnProcessFunction extends ProcessWindowFunction