joypac_user_info.sh 1.02 KB
Newer Older
wang-jinfeng committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
#!/bin/sh
#
# Submits the Spark job mobvista.dmp.datasource.joypac.JoypacUserFeatureJob
# for the day before $ScheduleTime.
#
# Names used here but not defined in this file: check_await, JAR and
# ScheduleTime (presumably provided by ../dmp_env.sh or the scheduler --
# TODO confirm).
# ../dmp_env.sh and ../${JAR} are resolved against the current working
# directory, so the caller's working directory matters.
#
# Exit status: 255 when spark-submit fails.
#
# Only POSIX sh constructs are used in this file so that the failure check
# works no matter which shell /bin/sh points to: `[[ ... ]]` is not available
# in strict POSIX shells such as dash, where it would be reported as
# "not found" and the failure branch would silently never run.

# `.` is the portable spelling of `source`.
. ../dmp_env.sh

# Both stamps describe the same day (one day before ScheduleTime):
# compact form for the job's -date argument, slash form for S3 prefixes.
LOG_TIME=$(date -d "$ScheduleTime 1 days ago" +"%Y%m%d")
date_path=$(date -d "$ScheduleTime 1 days ago" +"%Y/%m/%d")

# Variable name (including its spelling) kept as in the original script.
INTPUT="s3://mob-emr-test/dataplatform/DataWareHouse/data/dwh/dm_user_info/${date_path}"

# NOTE(review): check_await is defined outside this file; presumably it blocks
# until the _SUCCESS marker exists. Its exit status is not inspected here.
check_await "${INTPUT}/_SUCCESS"

# NOTE(review): fixed one-minute pause before submitting; the reason is not
# visible in this file.
sleep 60

DICT_PATH="s3://mob-emr-test/dataplatform/data/joypac/dict_package/${date_path}"
OUTPUT_PATH="s3://mob-emr-test/dataplatform/data/joypac/user_info/${date_path}"

# Expansions are quoted so a value containing whitespace or glob characters
# is still passed to spark-submit as a single argument.
spark-submit --class mobvista.dmp.datasource.joypac.JoypacUserFeatureJob \
  --conf spark.yarn.executor.memoryOverhead=2048 \
  --conf spark.network.timeout=720s \
  --conf spark.default.parallelism=1000 \
  --conf spark.kryoserializer.buffer.max=512m \
  --conf spark.kryoserializer.buffer=64m \
  --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
  --master yarn \
  --deploy-mode cluster \
  --executor-memory 4g \
  --driver-memory 4g \
  --executor-cores 2 \
  --num-executors 100 \
  "../${JAR}" \
  -date "${LOG_TIME}" \
  -output "${OUTPUT_PATH}" \
  -dict_output "${DICT_PATH}" \
  -coalesce 200 || exit 255