|
@@ -53,7 +53,7 @@ public class AdHourStreamJob {
|
|
|
int parallelismKafka = Integer.parseInt(props.getProperty(ApplicationProperties.FLINK_PARALLELISM_KAFKA));
|
|
|
|
|
|
// Checkpoint configuration
|
|
|
- env.enableCheckpointing(2 * 60 * 1000L, CheckpointingMode.EXACTLY_ONCE);
|
|
|
+ env.enableCheckpointing(5 * 60 * 1000L, CheckpointingMode.EXACTLY_ONCE);
|
|
|
// Checkpoint timeout: a checkpoint that runs longer than this is marked as failed
|
|
|
env.getCheckpointConfig().setCheckpointTimeout(5 * 60 * 1000L);
|
|
|
// Minimum interval between checkpoint executions
|
|
@@ -92,7 +92,9 @@ public class AdHourStreamJob {
|
|
|
// Minute stream: write to the raw table
|
|
|
new KeyedBatchStream<>("adMinuteODSStream", adMinuteODSStream.keyBy(AdDataOfMinuteODS::getStatDay), 6000L, 2 * 60 * 1000L)
|
|
|
.toBatch()
|
|
|
+ .setParallelism(12)
|
|
|
.addSink(new TunnelBatchStreamSink<>(AdDataOfMinuteODS.class))
|
|
|
+ .setParallelism(12)
|
|
|
.name("sink_ad_minute_ods");
|
|
|
|
|
|
// Minute stream: computation
|
|
@@ -108,7 +110,9 @@ public class AdHourStreamJob {
|
|
|
.setParallelism(parallelismKafka);
|
|
|
new KeyedBatchStream<>("adMinuteDWDStream", adMinuteDWDStream.keyBy(AdStatOfMinuteDWD::getStatDay), 3000L, 60 * 1000L)
|
|
|
.toBatch()
|
|
|
+ .setParallelism(6)
|
|
|
.addSink(new TunnelBatchStreamSink<>(AdStatOfMinuteDWD.class))
|
|
|
+ .setParallelism(6)
|
|
|
.name("sink_ad_minute_dwd");
|
|
|
|
|
|
// Minute stream: write to CK (presumably ClickHouse; confirm)
|
|
@@ -126,7 +130,9 @@ public class AdHourStreamJob {
|
|
|
// Hour stream: write to the raw table
|
|
|
new KeyedBatchStream<>("adHourODSStream", adHourODSStream.keyBy(AdDataOfHourODS::getStatDay), 3000L, 3 * 60 * 1000L)
|
|
|
.toBatch()
|
|
|
+ .setParallelism(6)
|
|
|
.addSink(new TunnelBatchStreamSink<>(AdDataOfHourODS.class))
|
|
|
+ .setParallelism(6)
|
|
|
.name("sink_ad_hour_ods");
|
|
|
|
|
|
// Hour stream: computation
|
|
@@ -137,7 +143,9 @@ public class AdHourStreamJob {
|
|
|
// Hour stream: write to MaxCompute
|
|
|
new KeyedBatchStream<>("adHourDWDStream", adHourDWDStream.keyBy(AdStatOfHourDWD::getStatDay), 3000L, 3 * 60 * 1000L)
|
|
|
.toBatch()
|
|
|
+ .setParallelism(6)
|
|
|
.addSink(new TunnelBatchStreamSink<>(AdStatOfHourDWD.class))
|
|
|
+ .setParallelism(6)
|
|
|
.name("sink_ad_hour_dwd");
|
|
|
|
|
|
// Convert the minute stream into an hour stream, filling in empty hours along the way
|