1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
#!/bin/bash
# # # # # # # # # # # # # # # # # # # # # #
# @file : ga_interest_install.sh
# @author: houying
# @date : 16-10-24
# # # # # # # # # # # # # # # # # # # # # #
# Runs the InterestDeviceDistinctMR Hadoop job for the "ga" business on the
# day before $ScheduleTime, then calls mount_partition for dm_interest_tag.
#
# Not defined in this file: the helpers check_await, calculate_reduce_num and
# mount_partition, and the variables DM_INSTALL_LIST, APP_TAG_PATH,
# DM_INTEREST_PATH, JAR and ScheduleTime. Presumably the helpers and paths
# come from ../dmp_env.sh and ScheduleTime from the caller -- TODO confirm.
#
# Exit status: 1 when the environment file is unreadable, a base path is
# empty, the date cannot be computed, or the Hadoop job fails.

# The env file is resolved relative to the current working directory. Test
# readability up front rather than the status of `source`, which only reflects
# the last command executed inside the sourced file.
if [[ ! -r ../dmp_env.sh ]]; then
  echo "cannot read ../dmp_env.sh from $(pwd)" >&2
  exit 1
fi
source ../dmp_env.sh

# Every path below is built from these bases; abort instead of letting an
# empty base redirect the recursive delete further down to another location.
: "${DM_INSTALL_LIST:?DM_INSTALL_LIST is not set}"
: "${APP_TAG_PATH:?APP_TAG_PATH is not set}"
: "${DM_INTEREST_PATH:?DM_INTEREST_PATH is not set}"

# Target date: one day before ScheduleTime, formatted as YYYYMMDD.
LOG_TIME=$(date -d "$ScheduleTime 1 days ago" "+%Y%m%d") || {
  echo "cannot compute log date from ScheduleTime='$ScheduleTime'" >&2
  exit 1
}
year=${LOG_TIME:0:4}
month=${LOG_TIME:4:2}
day=${LOG_TIME:6:2}

INPUT_INSTALL_PATH="$DM_INSTALL_LIST/$year/$month/$day/ga"
INPUT_APP_TAG_PATH="$APP_TAG_PATH/$year/$month/$day"
OUTPUT_PATH="$DM_INTEREST_PATH/${year}/${month}/${day}/ga"

# Hand the app-tag _SUCCESS marker to check_await (presumably blocks until the
# marker exists -- verify against its definition).
check_await "$INPUT_APP_TAG_PATH/_SUCCESS"

REDUCE_NUM=$(calculate_reduce_num "$INPUT_INSTALL_PATH")

# Remove anything already at the output path before the job runs. -f keeps a
# not-yet-existing path from being reported as an error; as before, the exit
# status of the delete is not checked.
hadoop fs -rm -r -f "${OUTPUT_PATH}"

# A failed job ends the script with status 1. (The former `$? -ne 0` check
# after this command could never fire because of the `|| exit 1`, so it has
# been dropped.)
hadoop jar "../${JAR}" mobvista.dmp.common.InterestDeviceDistinctMR \
  "-Dmapreduce.job.reduces=${REDUCE_NUM}" \
  -Dmapreduce.map.memory.mb=4096 \
  -Dmapreduce.map.java.opts=-Xmx2458m \
  -Dmapreduce.reduce.memory.mb=4096 \
  -Dmapreduce.reduce.java.opts=-Xmx2458m \
  -Dmapreduce.fileoutputcommitter.algorithm.version=2 \
  "$INPUT_APP_TAG_PATH/part-r-00000" "$INPUT_INSTALL_PATH" "$OUTPUT_PATH" "ga interest tag job" || exit 1

# NOTE(review): the exit status of mount_partition is not checked, so the end
# message is printed even if it fails -- confirm whether that is intended.
mount_partition "dm_interest_tag" "year='$year', month='$month', day='$day', business='ga'" "$OUTPUT_PATH"
echo "[Ga Interest Tag End!]"