#!/bin/sh
# # # # # # # # # # # # # # # # # # # # # #
# @author :fengliang
# @revision: 2017-12-12
# @desc : Extract the ADN location (address) information for the day
# # # # # # # # # # # # # # # # # # # # # #
# Daily job: runs the AddressInfoTotal Spark job over one day of ADN SDK
# request data and registers the result as a partition of
# mds_dmp_address_daily.
#
# Inputs:
#   ScheduleTime (env) or $1 - reference date; the day BEFORE it is processed.
#   MDS_ADN_SDK_REQUEST_DAILY, MDS_DMP_ADDRESS_DAILY, JAR - read below and not
#     defined in this file (presumably provided by dmp_env.sh - TODO confirm).
# Exit status:
#   255 on any detected failure, otherwise the status of the last command.

# `.` is the POSIX spelling of `source`; `source` is not available in every
# /bin/sh (e.g. dash), and this script declares #!/bin/sh.
. ../../dmp_env.sh

today=${ScheduleTime:-$1}

# Abort if the date cannot be computed: an empty date component would make the
# paths below point outside the intended daily directory, and OUTPUT_PATH is
# removed recursively further down.
dt=$(date +"%Y%m%d" -d "-1 day $today") || exit 255
date_path=$(date +"%Y/%m/%d" -d "-1 day $today") || exit 255

# The path roots come from the environment; refuse to continue if they are
# missing so the recursive delete never runs against a root-relative path.
if [ -z "${MDS_ADN_SDK_REQUEST_DAILY}" ] || [ -z "${MDS_DMP_ADDRESS_DAILY}" ]; then
  echo "MDS_ADN_SDK_REQUEST_DAILY and MDS_DMP_ADDRESS_DAILY must be set" >&2
  exit 255
fi

INPUT_PATH="${MDS_ADN_SDK_REQUEST_DAILY}/$date_path"
OUTPUT_PATH="${MDS_DMP_ADDRESS_DAILY}/$date_path/adn_request"

# NOTE(review): check_await is defined outside this file; presumably it waits
# for the upstream _SUCCESS marker to appear - confirm against dmp_env.sh.
check_await "${INPUT_PATH}/_SUCCESS"

# Clear any previous output for this day. The exit status is intentionally not
# checked (unchanged from the original flow), so a missing path is not fatal.
hadoop fs -rm -r "$OUTPUT_PATH"

if ! spark-submit --class mobvista.dmp.datasource.address.AddressInfoTotal \
  --conf spark.yarn.executor.memoryOverhead=1024 --conf spark.network.timeout=720s \
  --conf spark.sql.shuffle.partitions=200 \
  --master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 40 \
  "../../${JAR}" -input "${INPUT_PATH}" -output "${OUTPUT_PATH}" -dailyFormat "rcfile" -parallelism 200 -coalesce 20 \
  -indices "0,2,3,5,6"; then
  exit 255
fi

# Register the freshly written directory as the partition for this day.
if ! mount_partition "mds_dmp_address_daily" "dt='$dt', business='adn_request_sdk'" "$OUTPUT_PATH"; then
  exit 255
fi