tsg kz版本

This commit is contained in:
wanglihui
2020-09-17 19:12:35 +08:00
parent 0d5e4e9be2
commit 4ed79bfe79
9 changed files with 281 additions and 142 deletions

View File

@@ -1,5 +1,5 @@
#spark任务配置
spark.sql.shuffle.partitions=5
spark.sql.shuffle.partitions=10
spark.executor.memory=4g
spark.app.name=test
spark.network.timeout=300s
@@ -7,13 +7,15 @@ repartitionNumber=36
spark.serializer=org.apache.spark.serializer.KryoSerializer
master=local[*]
#spark读取clickhouse配置
spark.read.clickhouse.url=jdbc:clickhouse://192.168.40.186:8123/tsg_galaxy_v3
spark.read.clickhouse.url=jdbc:clickhouse://192.168.44.12:8123/tsg_galaxy_v3
#spark.read.clickhouse.url=jdbc:clickhouse://192.168.40.186:8123/tsg_galaxy_v3
spark.read.clickhouse.driver=ru.yandex.clickhouse.ClickHouseDriver
spark.read.clickhouse.user=default
spark.read.clickhouse.password=111111
spark.read.clickhouse.numPartitions=144
spark.read.clickhouse.password=ceiec2019
#spark.read.clickhouse.password=111111
spark.read.clickhouse.numPartitions=5
spark.read.clickhouse.fetchsize=10000
spark.read.clickhouse.partitionColumn=common_recv_time
spark.read.clickhouse.partitionColumn=LAST_FOUND_TIME
clickhouse.socket.timeout=300000
#arangoDB配置
arangoDB.host=192.168.40.182
@@ -22,24 +24,20 @@ arangoDB.user=upsert
arangoDB.password=ceiec2018
#arangoDB.DB.name=insert_iplearn_index
arangoDB.DB.name=ip-learning-test-0
#arangoDB.DB.name=ip-learning-test
arangoDB.ttl=3600
thread.pool.number=5
thread.pool.number=10
#读取clickhouse时间范围方式：0=读取过去一小时，1=指定时间范围
clickhouse.time.limit.type=0
read.clickhouse.max.time=1571245220
read.clickhouse.min.time=1571245210
read.clickhouse.max.time=1600246160
read.clickhouse.min.time=1597197469
#读取arangoDB时间范围方式：0=正常读，1=指定时间范围
arango.time.limit.type=0
read.arango.max.time=1571245320
read.arango.min.time=1571245200
arangoDB.read.limit=
arangoDB.read.sepNum=10
update.arango.batch=10000
distinct.client.ip.num=10000
recent.count.hour=24
update.interval=10800
update.interval=3600