#!/usr/bin/env bash
# # # # # # # # # # # # # # # # # # # # # # #
# @file    :all_cross.sh
# @author  :liushuai
# @revision:2017-05-17 20:09
# @desc    :dmp - pure increment (newly added records) of 4 data sources
# # # # # # # # # # # # # # # # # # # # # # #
#
# Launches the NewAllMergeMR Hadoop job, feeding it the per-source install
# lists for one day plus the full install list of the previous day.
#
# Environment:
#   ScheduleTime - reference timestamp understood by `date -d`. When it is
#                  unset or empty, `date` falls back to the current time.
#   JAR          - job jar file name, resolved as ../${JAR}
#                  (presumably exported by ../prd_env.sh - TODO confirm).
#
# The relative paths (../prd_env.sh, ../${JAR}) are resolved against the
# current working directory, so run this script from its own directory.

# Day being processed (ScheduleTime - 2 days) and the day before it
# (ScheduleTime - 3 days), formatted as YYYY/MM/DD path fragments.
# Abort if `date` fails: an empty fragment would make the recursive delete
# below operate on the wrong S3 prefix.
date_path=$(date +%Y/%m/%d -d "-2 day ${ScheduleTime:-}") || {
  printf 'error: cannot compute date_path from ScheduleTime=%s\n' "${ScheduleTime:-}" >&2
  exit 1
}
old_date_path=$(date +%Y/%m/%d -d "-3 day ${ScheduleTime:-}") || {
  printf 'error: cannot compute old_date_path from ScheduleTime=%s\n' "${ScheduleTime:-}" >&2
  exit 1
}

# shellcheck source=/dev/null
source ../prd_env.sh || {
  printf 'error: failed to source ../prd_env.sh\n' >&2
  exit 1
}

: "${JAR:?JAR is not set (expected to be provided by ../prd_env.sh)}"

# The {a,b,...} list is inside double quotes, so bash passes it through
# literally; expanding it is left to the Hadoop side.
INPUT_PATH="s3://mob-emr-test/dataplatform/DataWareHouse/data/dwh/dm_install_list/${date_path}/{ga,3s,dsp_req,adn_install,adn_request_sdk}/"
INPUT_ALL="s3://mob-emr-test/dataplatform/DataWareHouse/data/dwh/dm_install_list/${old_date_path}/"
TEMP_OUTPUT="s3://mob-emr-test/liushuai/prd/${date_path}/tmp_all_merge"
OUTPUT="s3://mob-emr-test/liushuai/prd/${date_path}/new_all_merge/"

# Clear results of any previous run for the same day.
# `-rm -r` replaces the deprecated `-rmr`; `-f` keeps a first run (nothing to
# delete yet) from being reported as an error. `:?` is a last-line guard
# against deleting with an empty path.
hadoop fs -rm -r -f "${OUTPUT:?}" "${TEMP_OUTPUT:?}" || {
  printf 'error: failed to remove previous output: %s %s\n' "${OUTPUT}" "${TEMP_OUTPUT}" >&2
  exit 1
}

# Run the merge job; its exit status becomes the script's exit status.
# NOTE(review): the meaning of the trailing "100,10" argument is defined by
# NewAllMergeMR and is not visible from this script - confirm before changing.
hadoop jar "../${JAR}" mobvista.prd.datasource.newall.NewAllMergeMR \
  -Dmapreduce.fileoutputcommitter.algorithm.version=2 \
  -Dday="${date_path}" -DoldDay="${old_date_path}" \
  "${INPUT_PATH}" "${INPUT_ALL}" "${TEMP_OUTPUT}" "${OUTPUT}" "100,10"