2020-06-28 18:27:48 +08:00
|
|
|
|
# Spark job configuration
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Standard Spark SQL property: number of partitions used when shuffling data for joins and aggregations.
spark.sql.shuffle.partitions=10
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# Standard Spark property: amount of memory per executor process (size string with unit suffix).
spark.executor.memory=4g
|
2020-06-28 18:27:48 +08:00
|
|
|
|
# Standard Spark property: name of the application.
# NOTE(review): "test" looks like a placeholder - confirm the intended name before deploying.
spark.app.name=test
|
|
|
|
|
|
# Standard Spark property: default timeout for all network interactions (here 300 seconds).
spark.network.timeout=300s
|
|
|
|
|
|
# Application-specific key (not a built-in Spark property).
# Presumably the partition count used when the job repartitions data - verify against the code that reads it.
repartitionNumber=36
|
|
|
|
|
|
# Standard Spark property: class used to serialize objects; Kryo is selected here.
spark.serializer=org.apache.spark.serializer.KryoSerializer
|
|
|
|
|
|
# Presumably the Spark master URL; "local[*]" is Spark's local mode using as many worker threads as logical cores.
# NOTE(review): confirm this is overridden for cluster deployments.
master=local[*]
|
|
|
|
|
|
# Configuration for reading ClickHouse from Spark
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# JDBC URL of the ClickHouse source: host 192.168.44.12, port 8123, database tsg_galaxy_v3.
spark.read.clickhouse.url=jdbc:clickhouse://192.168.44.12:8123/tsg_galaxy_v3
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# Fully qualified JDBC driver class used for the ClickHouse connection.
spark.read.clickhouse.driver=ru.yandex.clickhouse.ClickHouseDriver
|
|
|
|
|
|
# User name for the ClickHouse connection.
spark.read.clickhouse.user=default
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Password for the ClickHouse connection.
# NOTE(review): plaintext credential stored in this file - consider supplying it from an environment variable or secret store, and rotate it if this file has been shared.
spark.read.clickhouse.password=ceiec2019
|
|
|
|
|
|
# Presumably forwarded to Spark's JDBC reader as "numPartitions" (maximum number of parallel read partitions) - verify against the reading code.
spark.read.clickhouse.numPartitions=5
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# Presumably forwarded to Spark's JDBC reader as "fetchsize" (rows fetched per round trip) - verify against the reading code.
spark.read.clickhouse.fetchsize=10000
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Presumably the column Spark's JDBC reader uses to split the read into partitions - verify against the reading code.
spark.read.clickhouse.partitionColumn=LAST_FOUND_TIME
|
2020-06-28 18:27:48 +08:00
|
|
|
|
# Socket timeout for the ClickHouse connection.
# NOTE(review): unit is not stated here - presumably milliseconds (300000 ms = 5 minutes); confirm.
clickhouse.socket.timeout=300000
|
|
|
|
|
|
# ArangoDB configuration
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# Address of the ArangoDB server.
arangoDB.host=192.168.40.182
|
2020-06-28 18:27:48 +08:00
|
|
|
|
# TCP port of the ArangoDB server.
arangoDB.port=8529
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# User name for the ArangoDB connection.
arangoDB.user=upsert
|
|
|
|
|
|
# Password for the ArangoDB connection.
# NOTE(review): plaintext credential stored in this file - consider supplying it from an environment variable or secret store, and rotate it if this file has been shared.
arangoDB.password=ceiec2018
|
|
|
|
|
|
#arangoDB.DB.name=insert_iplearn_index
|
|
|
|
|
|
# Name of the ArangoDB database to use.
# NOTE(review): the name contains "test" - confirm this is the intended target for this environment.
arangoDB.DB.name=ip-learning-test-0
|
2020-09-17 19:12:35 +08:00
|
|
|
|
#arangoDB.DB.name=ip-learning-test
|
2020-06-28 18:27:48 +08:00
|
|
|
|
# Time-to-live setting for ArangoDB.
# NOTE(review): neither the unit nor what the TTL applies to is stated here - presumably seconds (3600 = 1 hour); confirm against the code that reads it.
arangoDB.ttl=3600
|
|
|
|
|
|
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Presumably the number of threads in the application's worker pool - verify against the code that reads it.
thread.pool.number=10
|
2020-08-06 16:13:59 +08:00
|
|
|
|
|
|
|
|
|
|
# How the ClickHouse read time range is chosen: 0 = read the past hour; 1 = use an explicitly specified time range
|
|
|
|
|
|
clickhouse.time.limit.type=0
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Upper bound of the explicit ClickHouse read window; the value looks like a Unix timestamp in seconds (approx. 2020-09-16 UTC).
# Presumably only used when clickhouse.time.limit.type=1 - verify.
read.clickhouse.max.time=1600246160
|
|
|
|
|
|
# Lower bound of the explicit ClickHouse read window; the value looks like a Unix timestamp in seconds (approx. 2020-08-12 UTC).
# Presumably only used when clickhouse.time.limit.type=1 - verify.
read.clickhouse.min.time=1597197469
|
2020-08-06 16:13:59 +08:00
|
|
|
|
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Presumably the number of segments the ArangoDB read is split into - verify against the code that reads it.
arangoDB.read.sepNum=10
|
2020-08-06 16:13:59 +08:00
|
|
|
|
# Presumably the number of documents sent per ArangoDB update batch - verify against the code that reads it.
update.arango.batch=10000
|
|
|
|
|
|
|
|
|
|
|
|
# NOTE(review): meaning not evident from this file - presumably a limit on the number of distinct client IPs kept; confirm against the code that reads it.
distinct.client.ip.num=10000
|
|
|
|
|
|
# Presumably the look-back window, in hours, for "recent" counts - verify against the code that reads it.
recent.count.hour=24
|
|
|
|
|
|
|
2020-09-17 19:12:35 +08:00
|
|
|
|
# Interval between updates.
# NOTE(review): unit is not stated here - presumably seconds (3600 = 1 hour); confirm.
update.interval=3600
|