#!/bin/bash
#
# rtdmp_merge_ck.sh
#
# Submits the mobvista.dmp.datasource.rtdmp.RTDmpMergeCK Spark job to YARN
# (cluster deploy mode) for the hour preceding ${ScheduleTime}.
#
# Inputs (not defined in this script):
#   ScheduleTime  reference timestamp in a format accepted by `date -d`.
#                 Expected from the environment or ../dmp_env.sh -- confirm.
#                 When empty, `date` resolves "-1 hour" against the current time.
#   JAR           application jar path, resolved relative to the parent
#                 directory. Presumably exported by ../dmp_env.sh -- confirm.
#
# Both ../dmp_env.sh and ../${JAR} are relative to the current working
# directory, so the script must be started from its own directory.
#
# Exit status: 0 when spark-submit succeeds, 255 on any failure.

source ../dmp_env.sh

# Without JAR the application path would collapse to "../" and spark-submit
# would fail with a misleading error, so stop early with a clear message.
if [[ -z "${JAR:-}" ]]; then
  printf '%s\n' "JAR is not set; cannot locate the application jar" >&2
  exit 255
fi

today=${ScheduleTime}

# Hour partition to process, formatted as YYYYMMDDHH, one hour before ${today}.
# Abort if `date` cannot parse the timestamp rather than submitting the job
# with an empty -date_time argument.
if ! date_time=$(date +"%Y%m%d%H" -d "-1 hour ${today}"); then
  printf '%s\n' "cannot derive date_time from ScheduleTime='${today}'" >&2
  exit 255
fi

# Target passed to the job via -host / -cluster / -database / -table.
host="ip-172-31-20-35.ec2.internal"
cluster="cluster_1st"
database="dwh"
table="audience_merge_v1"

# NOTE: spark.speculation is false, so the speculation.quantile and
# speculation.multiplier settings below only take effect if it is re-enabled.
if ! spark-submit --class mobvista.dmp.datasource.rtdmp.RTDmpMergeCK \
  --name "RTDmpMergeCK.wangjf.${date_time}" \
  --conf spark.sql.shuffle.partitions=1000 \
  --conf spark.default.parallelism=1000 \
  --conf spark.kryoserializer.buffer.max=256m \
  --conf spark.speculation=false \
  --conf spark.speculation.quantile=0.9 \
  --conf spark.speculation.multiplier=1.3 \
  --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
  --master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \
  "../${JAR}" -date_time "${date_time}" -host "${host}" -cluster "${cluster}" -database "${database}" -table "${table}"; then
  # Normalise every spark-submit failure to a single exit code for the caller.
  exit 255
fi