#!/bin/sh

# # # # # # # # # # # # # # # # # # # # # #
# @author  : fengliang
# @revision: 2017-12-12
# @desc    : Extract ADN location (address) information for one day.
#
# Usage    : <this script> [date]
#   The reference date is taken from $ScheduleTime if set and non-empty,
#   otherwise from the first positional argument. The job processes the
#   day BEFORE that reference date.
#
# Notes    :
#   * Paths to dmp_env.sh and the job jar are relative ("../../"), so the
#     script depends on the current working directory at invocation time.
#   * check_await, mount_partition, JAR, MDS_ADN_SDK_REQUEST_DAILY and
#     MDS_DMP_ADDRESS_DAILY are not defined in this file; presumably they
#     are provided by dmp_env.sh -- verify there.
#   * Every failure path exits with status 255.
# # # # # # # # # # # # # # # # # # # # # #

# POSIX spelling of "source": works in bash and in strict /bin/sh (e.g. dash).
. ../../dmp_env.sh

today=${ScheduleTime:-$1}

# Partition key (YYYYMMDD) of the day before the reference date.
# Abort on an unparsable date: an empty value here would otherwise produce a
# truncated OUTPUT_PATH that is recursively deleted further down.
dt=$(date +"%Y%m%d" -d "-1 day $today")
if [ $? -ne 0 ] || [ -z "$dt" ]; then
  echo "cannot compute target date from '$today'" >&2
  exit 255
fi

# Same day formatted as a directory fragment (YYYY/MM/DD). Derived from $dt
# rather than from "now" a second time, so both values always agree.
date_path=$(date +"%Y/%m/%d" -d "$dt")
if [ $? -ne 0 ] || [ -z "$date_path" ]; then
  echo "cannot compute date path from '$dt'" >&2
  exit 255
fi

# Refuse to continue with empty base paths: OUTPUT_PATH is passed to
# "hadoop fs -rm -r" and must never collapse to a bare "/YYYY/MM/DD/..." path.
if [ -z "${MDS_ADN_SDK_REQUEST_DAILY}" ] || [ -z "${MDS_DMP_ADDRESS_DAILY}" ]; then
  echo "MDS_ADN_SDK_REQUEST_DAILY and MDS_DMP_ADDRESS_DAILY must be set" >&2
  exit 255
fi

INPUT_PATH="${MDS_ADN_SDK_REQUEST_DAILY}/$date_path"
OUTPUT_PATH="${MDS_DMP_ADDRESS_DAILY}/$date_path/adn_request"

# Called with the input's _SUCCESS marker path.
# NOTE(review): its exit status is not checked here (same as before);
# confirm how check_await reports a timeout.
check_await "${INPUT_PATH}/_SUCCESS"

# Remove output left by a previous run. The exit status is deliberately
# ignored: the path does not exist on a first run.
hadoop fs -rm -r "$OUTPUT_PATH"

spark-submit --class mobvista.dmp.datasource.address.AddressInfoTotal \
  --conf spark.yarn.executor.memoryOverhead=1024 --conf spark.network.timeout=720s \
  --conf spark.sql.shuffle.partitions=200 \
  --master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 40 \
  "../../${JAR}" -input "${INPUT_PATH}" -output "${OUTPUT_PATH}" -dailyFormat "rcfile" -parallelism 200 -coalesce 20 \
  -indices "0,2,3,5,6"
if [ $? -ne 0 ]; then
  exit 255
fi

# Register the freshly written directory as a partition of the
# mds_dmp_address_daily table.
mount_partition "mds_dmp_address_daily" "dt='$dt', business='adn_request_sdk'" "$OUTPUT_PATH"
if [ $? -ne 0 ]; then
  exit 255
fi