Commit 1d221fa6 by WangJinfeng

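update dmp spark-submit (drops the explicit `--master yarn` option from the spark-submit commands and retunes resource settings for a few jobs)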

parent a58447ad
...@@ -32,7 +32,7 @@ hadoop fs -rmr $store_output_path ...@@ -32,7 +32,7 @@ hadoop fs -rmr $store_output_path
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=20 \ --conf spark.sql.shuffle.partitions=20 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 4 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 4 \
../${JAR} \ ../${JAR} \
-date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20 -date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20
if [ $? -ne 0 ]; then if [ $? -ne 0 ]; then
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.tracking_3s.TrackingTagDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.tracking_3s.TrackingTagDaily \
--conf spark.sql.shuffle.partitions=5 \ --conf spark.sql.shuffle.partitions=5 \
--conf spark.default.parallelism=5 \ --conf spark.default.parallelism=5 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 3 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 3 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=8 \ --conf spark.default.parallelism=8 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 4 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 4
......
...@@ -40,7 +40,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -40,7 +40,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=20 \ --conf spark.default.parallelism=20 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 10 ../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 10
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -41,7 +41,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackDaily \ ...@@ -41,7 +41,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackDaily \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar \ --jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 3 --num-executors 100 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 3 --num-executors 100 \
../${JAR} -output ${OUTPUT_PATH} -coalesce 100 \ ../${JAR} -output ${OUTPUT_PATH} -coalesce 100 \
-today ${dt_today} -last_sunday ${dt_yesterday} -today ${dt_today} -last_sunday ${dt_yesterday}
......
...@@ -28,7 +28,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -28,7 +28,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.sql.shuffle.partitions=1000 \ --conf spark.sql.shuffle.partitions=1000 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 40 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 1000 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 1000
......
...@@ -28,7 +28,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackTagDaily \ ...@@ -28,7 +28,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackTagDaily \
--conf spark.sql.shuffle.partitions=10 \ --conf spark.sql.shuffle.partitions=10 \
--conf spark.default.parallelism=10 \ --conf spark.default.parallelism=10 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 5 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 5
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 5 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 5 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 40 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 40
......
...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackInstallList \ ...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.postback_3s.PostBackInstallList \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.network.timeout=720s \ --conf spark.network.timeout=720s \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--master yarn --deploy-mode cluster --name PostBackInstallList --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --name PostBackInstallList --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 20 \
../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 1000 -coalesce 400 ../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 1000 -coalesce 400
......
...@@ -39,9 +39,8 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -39,9 +39,8 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.sql.shuffle.partitions=1000 \ --conf spark.sql.shuffle.partitions=1000 \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 40 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 25 \ ../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 400
../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 200
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
exit 255 exit 255
......
...@@ -48,7 +48,7 @@ spark-submit --class mobvista.dmp.datasource.packagelist.MergeCampaignList \ ...@@ -48,7 +48,7 @@ spark-submit --class mobvista.dmp.datasource.packagelist.MergeCampaignList \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 4 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 4 \
../${JAR} -input_dmp_data_adn ${INPUT_DMP_DATA_ADN} -input_campaign_adn ${INPUT_CAMPAIGN_ADN} -coalesce 20 \ ../${JAR} -input_dmp_data_adn ${INPUT_DMP_DATA_ADN} -input_campaign_adn ${INPUT_CAMPAIGN_ADN} -coalesce 20 \
-output ${CAMPAIGN_TAG_OUTPUT} -today ${yester_year}-${yester_month}-${yester_day} || exit 1 -output ${CAMPAIGN_TAG_OUTPUT} -today ${yester_year}-${yester_month}-${yester_day} || exit 1
......
...@@ -22,7 +22,7 @@ hadoop fs -rm -r $OUTPUT_PATH ...@@ -22,7 +22,7 @@ hadoop fs -rm -r $OUTPUT_PATH
spark-submit --class mobvista.dmp.datasource.address.AddressInfoTotal \ spark-submit --class mobvista.dmp.datasource.address.AddressInfoTotal \
--conf spark.yarn.executor.memoryOverhead=1024 --conf spark.network.timeout=720s \ --conf spark.yarn.executor.memoryOverhead=1024 --conf spark.network.timeout=720s \
--conf spark.sql.shuffle.partitions=200 \ --conf spark.sql.shuffle.partitions=200 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 40 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 40 \
../../${JAR} -input ${INPUT_PATH} -output ${OUTPUT_PATH} -dailyFormat "rcfile" -parallelism 200 -coalesce 20 \ ../../${JAR} -input ${INPUT_PATH} -output ${OUTPUT_PATH} -dailyFormat "rcfile" -parallelism 200 -coalesce 20 \
-indices "0,2,3,5,6" -indices "0,2,3,5,6"
......
...@@ -25,15 +25,15 @@ OUTPUT_PATH="$DMP_ADN_REQUEST_DEVICE_IDS/$year/$month/$day/adn_request" ...@@ -25,15 +25,15 @@ OUTPUT_PATH="$DMP_ADN_REQUEST_DEVICE_IDS/$year/$month/$day/adn_request"
## REDUCE_NUM=$(calculate_reduce_num "$INPUT_ADN_DSP_PATH") ## REDUCE_NUM=$(calculate_reduce_num "$INPUT_ADN_DSP_PATH")
hadoop fs -rm -r ${OUTPUT_PATH}/* hadoop fs -rm -r ${OUTPUT_PATH}/*
export HADOOP_CLIENT_OPTS="-Xmx2096m $HADOOP_CLIENT_OPTS" export HADOOP_CLIENT_OPTS="-Xmx4096m $HADOOP_CLIENT_OPTS"
hadoop jar ../${JAR} mobvista.dmp.datasource.adn.mapreduce.AdnDeviceIdsMR \ hadoop jar ../${JAR} mobvista.dmp.datasource.adn.mapreduce.AdnDeviceIdsMR \
-Dmapreduce.job.reduces=1000 \ -Dmapreduce.job.reduces=2000 \
-Dmapred.child.java.opts=-Xmx4096m \ -Dmapred.child.java.opts=-Xmx8192m \
-Dmapreduce.map.memory.mb=8192 \ -Dmapreduce.map.memory.mb=10240 \
-Dmapreduce.map.java.opts=-Xmx4096m \ -Dmapreduce.map.java.opts=-Xmx8192m \
-Dmapreduce.reduce.memory.mb=8192 \ -Dmapreduce.reduce.memory.mb=10240 \
-Dmapreduce.reduce.java.opts=-Xmx4096m \ -Dmapreduce.reduce.java.opts=-Xmx8192m \
-Dtask.date="$year-$month-$day" \ -Dtask.date="$year-$month-$day" \
-Dmapreduce.fileoutputcommitter.algorithm.version=2 \ -Dmapreduce.fileoutputcommitter.algorithm.version=2 \
"$INPUT_ADN_DSP_PATH" "$OUTPUT_PATH" || exit 1 "$INPUT_ADN_DSP_PATH" "$OUTPUT_PATH" || exit 1
......
...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH ...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH
spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \ spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \
--conf spark.yarn.executor.memoryOverhead=3072 \ --conf spark.yarn.executor.memoryOverhead=3072 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \
../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region frankfurt || exit 1 ../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region frankfurt || exit 1
if [[ $? -ne 0 ]]; then if [[ $? -ne 0 ]]; then
......
...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH ...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH
spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \ spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \
--conf spark.yarn.executor.memoryOverhead=3072 \ --conf spark.yarn.executor.memoryOverhead=3072 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \
../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region seoul || exit 1 ../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region seoul || exit 1
if [[ $? -ne 0 ]]; then if [[ $? -ne 0 ]]; then
......
...@@ -23,7 +23,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH ...@@ -23,7 +23,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH
spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \ spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \
--conf spark.yarn.executor.memoryOverhead=3072 \ --conf spark.yarn.executor.memoryOverhead=3072 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 50 \ --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 50 \
../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 400 -region singapore || exit 1 ../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 400 -region singapore || exit 1
if [[ $? -ne 0 ]]; then if [[ $? -ne 0 ]]; then
......
...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH ...@@ -24,7 +24,7 @@ hadoop fs -rm -r $ETL_ADN_REQ_ORG_HOURS_PATH
spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \ spark-submit --class mobvista.dmp.datasource.adn.AdnOrgLogEtlHours \
--conf spark.yarn.executor.memoryOverhead=3072 \ --conf spark.yarn.executor.memoryOverhead=3072 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 4 --num-executors 20 \
../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region virginia || exit 1 ../../${JAR} -datetime "$yt$mt$dt$hhpath" -output $ETL_ADN_REQ_ORG_HOURS_PATH -coalesce 200 -region virginia || exit 1
if [[ $? -ne 0 ]]; then if [[ $? -ne 0 ]]; then
......
...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnClickDaily \ ...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnClickDaily \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.kryoserializer.buffer.max=512m \ --conf spark.kryoserializer.buffer.max=512m \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--master yarn --deploy-mode cluster \ --deploy-mode cluster \
--executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../.././DMP.jar \ ../.././DMP.jar \
-datetime ${LOG_TIME} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200 -datetime ${LOG_TIME} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200
......
...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnClickJoinInstallDaily \ ...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnClickJoinInstallDaily \
--conf spark.default.parallelism=2000 \ --conf spark.default.parallelism=2000 \
--conf spark.kryoserializer.buffer.max=512m \ --conf spark.kryoserializer.buffer.max=512m \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--master yarn --deploy-mode cluster \ --deploy-mode cluster \
--executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 50 \ --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 50 \
../.././DMP.jar \ ../.././DMP.jar \
-input_click ${INPUT_CLICK_PATH} -input_install ${INPUT_ADN_INSTALL_PATH} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200 -input_click ${INPUT_CLICK_PATH} -input_install ${INPUT_ADN_INSTALL_PATH} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200
......
...@@ -28,7 +28,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnInstallDaily \ ...@@ -28,7 +28,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnInstallDaily \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--conf spark.kryoserializer.buffer.max=512m \ --conf spark.kryoserializer.buffer.max=512m \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--master yarn --deploy-mode cluster \ --deploy-mode cluster \
--executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../.././DMP.jar \ ../.././DMP.jar \
-datetime ${LOG_TIME} -output ${TMP_OUTPUT_ADN_INSTALL_DAILY} -coalesce 20 -datetime ${LOG_TIME} -output ${TMP_OUTPUT_ADN_INSTALL_DAILY} -coalesce 20
......
...@@ -32,7 +32,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -32,7 +32,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=20 \ --conf spark.sql.shuffle.partitions=20 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 5 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 5 \
../../${JAR} \ ../../${JAR} \
-date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20 -date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnInstallTagDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnInstallTagDaily \
--conf spark.sql.shuffle.partitions=50 \ --conf spark.sql.shuffle.partitions=50 \
--conf spark.default.parallelism=10 \ --conf spark.default.parallelism=10 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 4 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 4 --num-executors 5 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 1 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 1
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=8 \ --conf spark.default.parallelism=8 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 4 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 4
......
...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.sql.shuffle.partitions=1000 \ --conf spark.sql.shuffle.partitions=1000 \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 20 \
../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 100 ../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 100
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 40 \
../../${JAR} \ ../../${JAR} \
-date ${date} -coalesce 200 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING} -date ${date} -coalesce 200 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING}
......
...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 10 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 10 \
../../${JAR} \ ../../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
' '
......
...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnPreClickDaily \ ...@@ -21,7 +21,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnPreClickDaily \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.kryoserializer.buffer.max=512m \ --conf spark.kryoserializer.buffer.max=512m \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--master yarn --deploy-mode cluster \ --deploy-mode cluster \
--executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../.././DMP.jar \ ../.././DMP.jar \
-datetime ${LOG_TIME} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200 -datetime ${LOG_TIME} -output ${OUTPUT_ADN_INSTALL_DAILY} -coalesce 200
......
...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_sdk.AdnRequestSdkEtlDai ...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_sdk.AdnRequestSdkEtlDai
--conf spark.storage.memoryFraction=0.4 \ --conf spark.storage.memoryFraction=0.4 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.serializer=org.apache.spark.serializer.KryoSerializer \ --conf spark.serializer=org.apache.spark.serializer.KryoSerializer \
--master yarn --deploy-mode cluster --name "AdnRequestSdkEtlDaily.${LOG_TIME}" --executor-memory 10g --driver-memory 6g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --name "AdnRequestSdkEtlDaily.${LOG_TIME}" --executor-memory 10g --driver-memory 6g --executor-cores 5 --num-executors 100 \
../../${JAR} -appIdMapping ${INPUT_MAPPING_PATH} -manualAppIdMapping ${DIM_MANUAL_MAPPING} -output ${TMP_OUTPUT_PATH} -date ${LOG_TIME} -coalesce 2000 ../../${JAR} -appIdMapping ${INPUT_MAPPING_PATH} -manualAppIdMapping ${DIM_MANUAL_MAPPING} -output ${TMP_OUTPUT_PATH} -date ${LOG_TIME} -coalesce 2000
if [[ $? -ne 0 ]]; then if [[ $? -ne 0 ]]; then
......
...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ ...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.sql.shuffle.partitions=4000 \ --conf spark.sql.shuffle.partitions=4000 \
--conf spark.default.parallelism=4000 \ --conf spark.default.parallelism=4000 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 100 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 100 \
../../${JAR} \ ../../${JAR} \
-date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 400 -date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 400
if [ $? -ne 0 ]; then if [ $? -ne 0 ]; then
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnRequestSdkTagDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn.AdnRequestSdkTagDaily \
--conf spark.sql.shuffle.partitions=20 \ --conf spark.sql.shuffle.partitions=20 \
--conf spark.default.parallelism=5 \ --conf spark.default.parallelism=5 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 2 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 2 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 20
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=200 \ --conf spark.default.parallelism=200 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 10 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 10 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100
......
...@@ -37,7 +37,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -37,7 +37,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.sql.files.maxPartitionBytes=536870912 \ --conf spark.sql.files.maxPartitionBytes=536870912 \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 3 --num-executors 200 \ --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 3 --num-executors 200 \
../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000 ../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_other.EtlAdnRequestOthe ...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_other.EtlAdnRequestOthe
--conf spark.storage.memoryFraction=0.4 \ --conf spark.storage.memoryFraction=0.4 \
--conf spark.driver.maxResultSize=5g \ --conf spark.driver.maxResultSize=5g \
--conf spark.executor.extraJavaOptions=-XX:+UseG1GC \ --conf spark.executor.extraJavaOptions=-XX:+UseG1GC \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 40 \
../../${JAR} -input "${INPUT_PATH}/*/*" -output $OUTPUT_PATH ../../${JAR} -input "${INPUT_PATH}/*/*" -output $OUTPUT_PATH
if [ $? -ne 0 ]; then if [ $? -ne 0 ]; then
exit 255 exit 255
......
...@@ -33,7 +33,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -33,7 +33,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.yarn.executor.memoryOverhead=3072 \ --conf spark.yarn.executor.memoryOverhead=3072 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 80 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 80 \
../../${JAR} \ ../../${JAR} \
-date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000 -date $date -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_other.AdnRequestOtherTa ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_request_other.AdnRequestOtherTa
--conf spark.sql.shuffle.partitions=20 \ --conf spark.sql.shuffle.partitions=20 \
--conf spark.default.parallelism=10 \ --conf spark.default.parallelism=10 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 10 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 10
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=200 \ --conf spark.default.parallelism=200 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 20 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 20 \
../../${JAR} \ ../../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100
......
...@@ -27,7 +27,7 @@ hadoop fs -rm -r "$OUTPUT_PATH" ...@@ -27,7 +27,7 @@ hadoop fs -rm -r "$OUTPUT_PATH"
spark-submit --class mobvista.dmp.datasource.adn_request_other.AdnRequestOtherInstall \ spark-submit --class mobvista.dmp.datasource.adn_request_other.AdnRequestOtherInstall \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 200 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 200 \
../../${JAR} \ ../../${JAR} \
-input "${INPUT_PATH}" -output $OUTPUT_PATH -date $date -oldInput $OLD_INPUT_PATH -parallelism 2000 -coalesce 2000 -input "${INPUT_PATH}" -output $OUTPUT_PATH -date $date -oldInput $OLD_INPUT_PATH -parallelism 2000 -coalesce 2000
if [ $? -ne 0 ]; then if [ $? -ne 0 ]; then
......
...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 400 ../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 400
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \
../../${JAR} \ ../../${JAR} \
-date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING} -date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING}
......
...@@ -38,7 +38,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -38,7 +38,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 30 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 30 \
../../${JAR} \ ../../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
' '
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \
../../${JAR} \ ../../${JAR} \
-date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING} -date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING}
......
...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 2 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 2 --num-executors 40 \
../../${JAR} \ ../../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
' '
......
...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -32,7 +32,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=4000 \ --conf spark.default.parallelism=4000 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC " \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC " \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \
../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000 ../../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.adn_adx.AdnAdxDeviceTag \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.adn_adx.AdnAdxDeviceTag \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--conf spark.sql.hive.verifyPartitionPath=true \ --conf spark.sql.hive.verifyPartitionPath=true \
--jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar \ --jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar \
--master yarn --deploy-mode cluster --name AdnAdxDeviceTag --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 32 \ --deploy-mode cluster --name AdnAdxDeviceTag --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 32 \
../${JAR} -outputadxdevtag ${OUTPUT_ADN_ADX_DEVICE_TAG_PATH} \ ../${JAR} -outputadxdevtag ${OUTPUT_ADN_ADX_DEVICE_TAG_PATH} \
-coalesce 80 \ -coalesce 80 \
-today ${dt_today} -yesterday ${dt_yesterday} -today ${dt_today} -yesterday ${dt_yesterday}
......
...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.datasource.adn_adx.AdnTecentAdxDataMidWay \ ...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.datasource.adn_adx.AdnTecentAdxDataMidWay \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.sql.hive.verifyPartitionPath=true \ --conf spark.sql.hive.verifyPartitionPath=true \
--jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar,s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/json-serde-1.3.7-jar-with-dependencies.jar \ --jars s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/hive-hcatalog-core-2.3.3.jar,s3://mob-emr-test/dataplatform/DataWareHouse/offline/myjar/json-serde-1.3.7-jar-with-dependencies.jar \
--master yarn --deploy-mode cluster --name AdnTecentAdxDataMidWay --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --name AdnTecentAdxDataMidWay --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 100 \
../${JAR} -outputadxtmp ${OUTPUT_ODS_ADX_TMP_PATH} -dimadxpkg ${OUTPUT_DIM_ADN_ADX_PKG_PATH} \ ../${JAR} -outputadxtmp ${OUTPUT_ODS_ADX_TMP_PATH} -dimadxpkg ${OUTPUT_DIM_ADN_ADX_PKG_PATH} \
-coalesce 60 \ -coalesce 60 \
-today ${dt_today} -today ${dt_today}
......
...@@ -30,7 +30,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkDaily \ ...@@ -30,7 +30,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkDaily \
--conf spark.default.parallelism=2000 \ --conf spark.default.parallelism=2000 \
--conf spark.driver.maxResultSize=8g \ --conf spark.driver.maxResultSize=8g \
--conf spark.app.coalesce=60000 \ --conf spark.app.coalesce=60000 \
--master yarn --deploy-mode cluster --name adn_sdk_daily --executor-memory 10g --driver-memory 6g --executor-cores 3 --num-executors 300 \ --deploy-mode cluster --name adn_sdk_daily --executor-memory 10g --driver-memory 6g --executor-cores 3 --num-executors 300 \
../${JAR} ../${JAR}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -34,7 +34,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -34,7 +34,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 200 \ --deploy-mode cluster --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 200 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkTagDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkTagDaily \
--conf spark.sql.shuffle.partitions=10 \ --conf spark.sql.shuffle.partitions=10 \
--conf spark.default.parallelism=10 \ --conf spark.default.parallelism=10 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 10 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 10
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkEtlHour \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkEtlHour \
--conf spark.storage.memoryFraction=0.4 \ --conf spark.storage.memoryFraction=0.4 \
--conf spark.driver.maxResultSize=8g \ --conf spark.driver.maxResultSize=8g \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --name adn_sdk_etl_hour.${date}.${hour} --executor-memory 4g --driver-memory 4g --executor-cores 4 --num-executors 20 \ --deploy-mode cluster --name adn_sdk_etl_hour.${date}.${hour} --executor-memory 4g --driver-memory 4g --executor-cores 4 --num-executors 20 \
../${JAR} -coalesce 4000 -date ${date} -hour ${hour} -input ${INPUT_PATH} -output ${OUTPUT_PATH} ../${JAR} -coalesce 4000 -date ${date} -hour ${hour} -input ${INPUT_PATH} -output ${OUTPUT_PATH}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -38,7 +38,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkInstallList \ ...@@ -38,7 +38,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkInstallList \
--conf spark.shuffle.memoryFraction=0.4 \ --conf spark.shuffle.memoryFraction=0.4 \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=268435456 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=268435456 \
--master yarn --deploy-mode cluster --name adn_sdk_install --executor-memory 15g --driver-memory 4g --executor-cores 5 --num-executors 60 \ --deploy-mode cluster --name adn_sdk_install --executor-memory 15g --driver-memory 4g --executor-cores 5 --num-executors 60 \
../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 2000 -coalesce 2000 ../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 2000 -coalesce 2000
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=4000 \ --conf spark.default.parallelism=4000 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 100 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 100 \
../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000 ../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 2000
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 80 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 80 \
../${JAR} \ ../${JAR} \
-date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING} -date ${date} -coalesce 1000 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING}
......
...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \
../${JAR} \ ../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
' '
......
...@@ -34,7 +34,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -34,7 +34,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 150 \ --deploy-mode cluster --executor-memory 10g --driver-memory 6g --executor-cores 4 --num-executors 150 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 2000
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 20 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 20 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 100
......
...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkInstallList \ ...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.adn_sdk.AdnSdkInstallList \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=268435456 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=268435456 \
--conf spark.app.version=1 \ --conf spark.app.version=1 \
--master yarn --deploy-mode cluster --name "adn_sdk_v2_install.${LOG_TIME}" --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 50 \ --deploy-mode cluster --name "adn_sdk_v2_install.${LOG_TIME}" --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 50 \
../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 200 -coalesce 200 ../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 200 -coalesce 200
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=500 \ --conf spark.default.parallelism=500 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 200 ../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 200
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.dm.FixInstallListRuid \
--conf spark.kryoserializer.buffer=64m \ --conf spark.kryoserializer.buffer=64m \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 40 \
../${JAR} \ ../${JAR} \
-date ${date} -coalesce 200 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING} -date ${date} -coalesce 200 -output $OUTPUT_PATH -business ${BUSINESS} -input ${INPUT_MAPPING}
......
...@@ -43,7 +43,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -43,7 +43,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \
../${JAR} \ ../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
' '
......
...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.CalcDeviceAge \ ...@@ -35,7 +35,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.CalcDeviceAge \
--conf spark.storage.memoryFraction=0.4 \ --conf spark.storage.memoryFraction=0.4 \
--conf spark.shuffle.memoryFraction=0.4 \ --conf spark.shuffle.memoryFraction=0.4 \
--conf spark.sql.files.maxPartitionBytes=134217728 \ --conf spark.sql.files.maxPartitionBytes=134217728 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 100 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 100 \
../${JAR} -date ${LOG_TIME} -merge_input ${INPUT_PATH} -dict_input ${FILEDICT} -output ${OUTPUT_PATH} -parallelism 500 ../${JAR} -date ${LOG_TIME} -merge_input ${INPUT_PATH} -dict_input ${FILEDICT} -output ${OUTPUT_PATH} -parallelism 500
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -27,7 +27,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.CalcPackageAge \ ...@@ -27,7 +27,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.CalcPackageAge \
--conf spark.storage.memoryFraction=0.4 \ --conf spark.storage.memoryFraction=0.4 \
--conf spark.shuffle.memoryFraction=0.4 \ --conf spark.shuffle.memoryFraction=0.4 \
--conf spark.sql.files.maxPartitionBytes=134217728 \ --conf spark.sql.files.maxPartitionBytes=134217728 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 100 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 100 \
../${JAR} -inputPath ${INPUT_PATH} -outputPath ${OUTPUT_PATH} -parallelism 1 -low ${LOW} -high ${HIGH} -unbelievable ${UNBELIEVABLE} ../${JAR} -inputPath ${INPUT_PATH} -outputPath ${OUTPUT_PATH} -parallelism 1 -low ${LOW} -high ${HIGH} -unbelievable ${UNBELIEVABLE}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.GetAgeGender \ ...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.GetAgeGender \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.default.parallelism=2000 \ --conf spark.default.parallelism=2000 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 60 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 60 \
../${JAR} -ageOutput ${AGE_OUTPUT_PATH} -genderOutput ${GENDER_OUTPUT_PATH} -date ${LOG_TIME} -business ${business} ../${JAR} -ageOutput ${AGE_OUTPUT_PATH} -genderOutput ${GENDER_OUTPUT_PATH} -date ${LOG_TIME} -business ${business}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -58,7 +58,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.GetAgeGender \ ...@@ -58,7 +58,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.GetAgeGender \
--conf spark.speculation.quantile=0.9 \ --conf spark.speculation.quantile=0.9 \
--conf spark.speculation.multiplier=1.5 \ --conf spark.speculation.multiplier=1.5 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --deploy-mode cluster --executor-memory 6g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../${JAR} -ageOutput ${AGE_OUTPUT_PATH} -genderOutput ${GENDER_OUTPUT_PATH} -date ${GA_TOTAL_DATE} -business ${business} ../${JAR} -ageOutput ${AGE_OUTPUT_PATH} -genderOutput ${GENDER_OUTPUT_PATH} -date ${GA_TOTAL_DATE} -business ${business}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -52,7 +52,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.MergeInstallAge \ ...@@ -52,7 +52,7 @@ spark-submit --class mobvista.dmp.datasource.age_gender.MergeInstallAge \
--conf spark.sql.files.maxPartitionBytes=536870912 \ --conf spark.sql.files.maxPartitionBytes=536870912 \
--conf spark.sql.adaptive.enabled=true \ --conf spark.sql.adaptive.enabled=true \
--conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \ --conf spark.sql.adaptive.advisoryPartitionSizeInBytes=536870912 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 60 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 5 --num-executors 60 \
../${JAR} -date ${LOG_TIME} \ ../${JAR} -date ${LOG_TIME} \
-ga_age_path ${GA_AGE_PATH} -dsp_age_path ${DSP_AGE_PATH} -age_output ${OUTPUT_PATH} -parallelism 2000 -ga_age_path ${GA_AGE_PATH} -dsp_age_path ${DSP_AGE_PATH} -age_output ${OUTPUT_PATH} -parallelism 2000
......
...@@ -27,7 +27,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TODaily \ ...@@ -27,7 +27,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TODaily \
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 20 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 20 \
../../${JAR} \ ../../${JAR} \
-output ${OUTPUT_PATH} -coalesce 200 -dt_dash_today ${dt_dash_today} -output ${OUTPUT_PATH} -coalesce 200 -dt_dash_today ${dt_dash_today}
......
...@@ -23,7 +23,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TOInstallList \ ...@@ -23,7 +23,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TOInstallList \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.network.timeout=720s \ --conf spark.network.timeout=720s \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--master yarn --deploy-mode cluster --name PostBackInstallList --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 30 \ --deploy-mode cluster --name PostBackInstallList --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 30 \
../../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 160 -coalesce 160 ../../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 160 -coalesce 160
......
...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.BaiChuanJob \ ...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.BaiChuanJob \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 6g --executor-cores 2 --num-executors 20 \ --deploy-mode cluster --executor-memory 6g --driver-memory 6g --executor-cores 2 --num-executors 20 \
../${JAR} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} ../${JAR} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliDaily \ ...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliDaily \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 3 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 3 --num-executors 5 \
../${JAR} -date ${LOG_TIME} -partNum 10 -output ${OUTPUT_PATH} -host ${host} -cluster ${cluster} -database ${database} -table ${table} ../${JAR} -date ${LOG_TIME} -partNum 10 -output ${OUTPUT_PATH} -host ${host} -cluster ${cluster} -database ${database} -table ${table}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -36,7 +36,7 @@ hadoop fs -rmr ${store_output_path} ...@@ -36,7 +36,7 @@ hadoop fs -rmr ${store_output_path}
spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTag \
--conf spark.sql.shuffle.partitions=100 \ --conf spark.sql.shuffle.partitions=100 \
--master yarn --deploy-mode cluster --executor-memory 6g --driver-memory 6g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 6g --driver-memory 6g --executor-cores 2 --num-executors 5 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 40 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 40
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliTagDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliTagDaily \
--conf spark.sql.shuffle.partitions=10 \ --conf spark.sql.shuffle.partitions=10 \
--conf spark.default.parallelism=10 \ --conf spark.default.parallelism=10 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 5 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 5 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 5
......
...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \ ...@@ -31,7 +31,7 @@ spark-submit --class mobvista.dmp.datasource.newtag.MatchInterestTagDailyV2 \
--conf spark.default.parallelism=8 \ --conf spark.default.parallelism=8 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 2 \
../${JAR} \ ../${JAR} \
-date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 8 -date ${date} -manualOutput ${output_path} -business ${business} -storeOutput ${store_output_path} -coalesce 8
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliInstallList \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.baichuan.AliInstallList \
--conf spark.yarn.executor.memoryOverhead=2048 \ --conf spark.yarn.executor.memoryOverhead=2048 \
--conf spark.network.timeout=720s \ --conf spark.network.timeout=720s \
--conf spark.default.parallelism=1000 \ --conf spark.default.parallelism=1000 \
--master yarn --deploy-mode cluster --name ali_install_wangjf --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 50 \ --deploy-mode cluster --name ali_install_wangjf --executor-memory 8g --driver-memory 6g --executor-cores 3 --num-executors 50 \
../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 400 -coalesce 400 ../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 400 -coalesce 400
......
...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \ ...@@ -39,7 +39,7 @@ spark-submit --class mobvista.dmp.datasource.dm.DmInstallListOrc \
--conf spark.speculation=true \ --conf spark.speculation=true \
--conf spark.speculation.quantile=0.8 \ --conf spark.speculation.quantile=0.8 \
--conf spark.speculation.multiplier=1.2 \ --conf spark.speculation.multiplier=1.2 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 3 --num-executors 80 \
../${JAR} \ ../${JAR} \
-output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business} -output ${OUTPUT_PATH} -input ${INPUT_PATH} -business ${business}
......
...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \ ...@@ -36,7 +36,7 @@ spark-submit --class mobvista.dmp.common.InstallListLogic \
--conf spark.default.parallelism=400 \ --conf spark.default.parallelism=400 \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 50 \
../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 100 ../${JAR} -date ${LOG_TIME} -business ${business} -output ${OUTPUT} -coalesce 100
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliIosActivitionDaily \ ...@@ -34,7 +34,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliIosActivitionDaily \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \
../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OUTPUT_DAILY_PATH} -coalesce 500 \ ../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OUTPUT_DAILY_PATH} -coalesce 500 \
-yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \ -yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \
-request_count_result "${IOS_REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day} -request_count_result "${IOS_REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day}
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliOaidActivitionDaily \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliOaidActivitionDaily \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \
../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OAID_OUTPUT_DAILY_PATH} -coalesce 500 \ ../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OAID_OUTPUT_DAILY_PATH} -coalesce 500 \
-yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \ -yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \
-request_count_result "${OAID_REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day} -request_count_result "${OAID_REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day}
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionDaily \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionDaily \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \ --deploy-mode cluster --executor-memory 10g --driver-memory 4g --executor-cores 4 --num-executors 60 \
../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OUTPUT_DAILY_PATH} -coalesce 500 \ ../../${JAR} -output ${OUTPUT_PATH} -outputdaily ${ALI_OUTPUT_DAILY_PATH} -coalesce 500 \
-yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \ -yesterday ${yesterday} -today ${dt_today} -dt_dash_today ${dt_dash_today} -dt_dash_rec14day ${dt_dash_rec14day} \
-request_count_result "${REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day} -request_count_result "${REQUEST_COUNT_RESULT}/${dt_today}" -last_req_day ${last_req_day}
......
...@@ -84,7 +84,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionPostBackDail ...@@ -84,7 +84,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionPostBackDail
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 60 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 3 --num-executors 60 \
../${JAR} -output ${OUTPUT_PATH} -iosoutput ${ALI_IOS_OUTPUT} -oaidoutput ${ALI_OAID_OUTPUT} -coalesce 50 \ ../${JAR} -output ${OUTPUT_PATH} -iosoutput ${ALI_IOS_OUTPUT} -oaidoutput ${ALI_OAID_OUTPUT} -coalesce 50 \
-today ${dt_today} -update_date ${dt_dash_today} \ -today ${dt_today} -update_date ${dt_dash_today} \
-dt_dash_rec15day ${dt_dash_rec15day} -syn_to_3s ${ALI_USER_ACTIVATION_SYS_TO3S_PATH} -syn_3s_day ${syn_3s_day} -dt_dash_rec15day ${dt_dash_rec15day} -syn_to_3s ${ALI_USER_ACTIVATION_SYS_TO3S_PATH} -syn_3s_day ${syn_3s_day}
......
...@@ -66,7 +66,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionPostBackDail ...@@ -66,7 +66,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlAliActivitionPostBackDail
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--conf spark.hadoop.mapreduce.input.fileinputformat.input.dir.recursive=true \ --conf spark.hadoop.mapreduce.input.fileinputformat.input.dir.recursive=true \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 70 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 70 \
../../${JAR} -output ${OUTPUT_PATH} -iosoutput ${ALI_IOS_OUTPUT} -oaidoutput ${ALI_OAID_OUTPUT} -coalesce 300 \ ../../${JAR} -output ${OUTPUT_PATH} -iosoutput ${ALI_IOS_OUTPUT} -oaidoutput ${ALI_OAID_OUTPUT} -coalesce 300 \
-today ${dt_today} -update_date ${dt_dash_today} -dt_taobao_postback_day ${dt_taobao_postback_day}\ -today ${dt_today} -update_date ${dt_dash_today} -dt_taobao_postback_day ${dt_taobao_postback_day}\
-dt_dash_rec15day ${dt_dash_rec15day} -syn_to_3s ${ALI_USER_ACTIVATION_SYS_TO3S_PATH} -syn_3s_day ${syn_3s_day} -dt_dash_rec15day ${dt_dash_rec15day} -syn_to_3s ${ALI_USER_ACTIVATION_SYS_TO3S_PATH} -syn_3s_day ${syn_3s_day}
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlH18FromDmInstallListV2 \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlH18FromDmInstallListV2 \
--conf spark.sql.shuffle.partitions=2000 \ --conf spark.sql.shuffle.partitions=2000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 60 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 60 \
../../${JAR} \ ../../${JAR} \
-h18_imei ${IMEI_H_18_GUANGDIANTONG_RES_PATH} -h18_imeimd5 ${IMEIMD5_H_18_GUANGDIANTONG_RES_PATH} \ -h18_imei ${IMEI_H_18_GUANGDIANTONG_RES_PATH} -h18_imeimd5 ${IMEIMD5_H_18_GUANGDIANTONG_RES_PATH} \
-dt_oneday_ago ${dt_oneday_ago} -dt_oneday_ago ${dt_oneday_ago}
......
...@@ -43,7 +43,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlOtherDataFromPostBackDail ...@@ -43,7 +43,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.EtlOtherDataFromPostBackDail
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 150 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 150 \
../../${JAR} \ ../../${JAR} \
-output ${OUTPUT_PATH} \ -output ${OUTPUT_PATH} \
-dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago}
......
...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \ ...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--conf hive.exec.orc.default.stripe.size=268435456 \ --conf hive.exec.orc.default.stripe.size=268435456 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \
../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour} ../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \ ...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--conf hive.exec.orc.default.stripe.size=268435456 \ --conf hive.exec.orc.default.stripe.size=268435456 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \
../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour} ../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \ ...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--conf hive.exec.orc.default.stripe.size=268435456 \ --conf hive.exec.orc.default.stripe.size=268435456 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \
../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour} ../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \ ...@@ -25,7 +25,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayImeiLaHuoCK \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--conf hive.exec.orc.default.stripe.size=268435456 \ --conf hive.exec.orc.default.stripe.size=268435456 \
--conf spark.sql.files.maxPartitionBytes=268435456 \ --conf spark.sql.files.maxPartitionBytes=268435456 \
--master yarn --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \ --deploy-mode cluster --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 10 \
../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour} ../../${JAR} -imeiInput ${IMEIMD5_INPUT} -date ${LOG_TIME} -host ${host} -cluster ${cluster} -database ${database} -table ${table} -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -37,7 +37,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDaily \ ...@@ -37,7 +37,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDaily \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 120 ../../${JAR} \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 120 ../../${JAR} \
-imeioutput "${ALIPAY_IMEIMD5_OUTPUT_PATH}" \ -imeioutput "${ALIPAY_IMEIMD5_OUTPUT_PATH}" \
-today ${dt_today} -last_req_day ${last_req_day} -dt_after_one_day ${dt_after_one_day}\ -today ${dt_today} -last_req_day ${last_req_day} -dt_after_one_day ${dt_after_one_day}\
-input_one_day ${INPUT_ONE_DAY} -input_two_day ${INPUT_TWO_DAY} -input_three_day ${INPUT_THREE_DAY} \ -input_one_day ${INPUT_ONE_DAY} -input_two_day ${INPUT_TWO_DAY} -input_three_day ${INPUT_THREE_DAY} \
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \ ../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \
-output01 ${OUTPUT01} -output02 ${OUTPUT02} -output01 ${OUTPUT01} -output02 ${OUTPUT02}
...@@ -62,7 +62,7 @@ fi ...@@ -62,7 +62,7 @@ fi
# --conf spark.sql.broadcastTimeout=1200 \ # --conf spark.sql.broadcastTimeout=1200 \
# --conf spark.yarn.executor.memoryOverhead=4096 \ # --conf spark.yarn.executor.memoryOverhead=4096 \
# --conf spark.sql.autoBroadcastJoinThreshold=31457280 \ # --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
# --master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ # --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
# ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \ # ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \
# -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT} # -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT}
# #
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \ ../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \
-output01 ${OUTPUT01} -output02 ${OUTPUT02} -output01 ${OUTPUT01} -output02 ${OUTPUT02}
...@@ -62,7 +62,7 @@ fi ...@@ -62,7 +62,7 @@ fi
# --conf spark.sql.broadcastTimeout=1200 \ # --conf spark.sql.broadcastTimeout=1200 \
# --conf spark.yarn.executor.memoryOverhead=4096 \ # --conf spark.yarn.executor.memoryOverhead=4096 \
# --conf spark.sql.autoBroadcastJoinThreshold=31457280 \ # --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
# --master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ # --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
# ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \ # ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \
# -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT} # -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT}
# #
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \ ../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \
-output01 ${OUTPUT01} -output02 ${OUTPUT02} -output01 ${OUTPUT01} -output02 ${OUTPUT02}
...@@ -62,7 +62,7 @@ fi ...@@ -62,7 +62,7 @@ fi
# --conf spark.sql.broadcastTimeout=1200 \ # --conf spark.sql.broadcastTimeout=1200 \
# --conf spark.yarn.executor.memoryOverhead=4096 \ # --conf spark.yarn.executor.memoryOverhead=4096 \
# --conf spark.sql.autoBroadcastJoinThreshold=31457280 \ # --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
# --master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ # --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
# ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \ # ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \
# -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT} # -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT}
# #
......
...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \ ...@@ -33,7 +33,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayTmpDataToDmp \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.yarn.executor.memoryOverhead=4096 \ --conf spark.yarn.executor.memoryOverhead=4096 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \ ../../${JAR} -imeiRequestInput ${IMEIMD5_REQUEST_INPUT_PATH} -imeiResponseInput ${IMEIMD5_RESPONSE_INPUT_PATH} \
-output01 ${OUTPUT01} -output02 ${OUTPUT02} -output01 ${OUTPUT01} -output02 ${OUTPUT02}
...@@ -62,7 +62,7 @@ fi ...@@ -62,7 +62,7 @@ fi
# --conf spark.sql.broadcastTimeout=1200 \ # --conf spark.sql.broadcastTimeout=1200 \
# --conf spark.yarn.executor.memoryOverhead=4096 \ # --conf spark.yarn.executor.memoryOverhead=4096 \
# --conf spark.sql.autoBroadcastJoinThreshold=31457280 \ # --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
# --master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \ # --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 4 --num-executors 40 \
# ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \ # ../../${JAR} -dt_today ${dt_today} -dt_three_days_ago ${dt_three_days_ago} \
# -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT} # -ActivationOutput ${ACTIVATIONOUTPUT} -AcquisitionOutput ${ACQUISITIONOUTPUT}
# #
......
...@@ -20,7 +20,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \ ...@@ -20,7 +20,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \
../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour} ../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \ ...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \
../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour} ../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \ ...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \
../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour} ../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \ ...@@ -19,7 +19,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayLaHuoDF \
--conf spark.kryoserializer.buffer.max=256m \ --conf spark.kryoserializer.buffer.max=256m \
--conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.driver.extraJavaOptions="-XX:+UseG1GC" \
--conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \ --conf spark.executor.extraJavaOptions="-XX:+UseG1GC" \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 10 \
../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour} ../../${JAR} -date ${LOG_TIME} -dt_end_days ${dt_end_days} -partNum 60 -imeiOutput ${IMEIMD5_OUTPUT_PATH} -cluster 'cluster_1st' -hour ${hour}
if [[ $? -ne 0 ]];then if [[ $? -ne 0 ]];then
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \
../../${JAR} \ ../../${JAR} \
-output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \ -output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \
-dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour} -dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour}
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \
../../${JAR} \ ../../${JAR} \
-output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \ -output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \
-dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour} -dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour}
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \
../../${JAR} \ ../../${JAR} \
-output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \ -output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \
-dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour} -dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour}
......
...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \ ...@@ -29,7 +29,7 @@ spark-submit --class mobvista.dmp.datasource.taobao.AlipayOtherDataToDmp \
--conf spark.sql.shuffle.partitions=3000 \ --conf spark.sql.shuffle.partitions=3000 \
--conf spark.sql.broadcastTimeout=1200 \ --conf spark.sql.broadcastTimeout=1200 \
--conf spark.sql.autoBroadcastJoinThreshold=31457280 \ --conf spark.sql.autoBroadcastJoinThreshold=31457280 \
--master yarn --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \ --deploy-mode cluster --executor-memory 8g --driver-memory 4g --executor-cores 5 --num-executors 140 \
../../${JAR} \ ../../${JAR} \
-output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \ -output01 ${OUTPUT_PATH01} -output02 ${OUTPUT_PATH02} \
-dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour} -dt_today ${dt_today} -dt_oneday_ago ${dt_oneday_ago} -hour ${hour}
......
...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TOInstallList \ ...@@ -24,7 +24,7 @@ spark-submit --class mobvista.dmp.datasource.TO.TOInstallList \
--conf spark.network.timeout=720s \ --conf spark.network.timeout=720s \
--conf spark.default.parallelism=100 \ --conf spark.default.parallelism=100 \
--conf spark.read.textfile.tag=1 \ --conf spark.read.textfile.tag=1 \
--master yarn --deploy-mode cluster --name AlipayActivationInstallList --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 30 \ --deploy-mode cluster --name AlipayActivationInstallList --executor-memory 4g --driver-memory 4g --executor-cores 2 --num-executors 30 \
../../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 160 -coalesce 160 ../../${JAR} -input ${INPUT_PATH} -oldInput ${OLD_INPUT_PATH} -output ${OUTPUT_PATH} -date ${dt} -parallelism 160 -coalesce 160
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment