Skip to content
Projects
Groups
Snippets
Help
This project
Loading...
Sign in / Register
Toggle navigation
M
mobvista-dmp
Project
Overview
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
王金锋
mobvista-dmp
Commits
c953965c
Commit
c953965c
authored
Dec 21, 2021
by
WangJinfeng
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
init id_mapping
parent
d8011ba3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
4 additions
and
6 deletions
+4
-6
id_mapping.sh
azkaban/id_mapping/id_mapping.sh
+2
-2
Constant.scala
...n/scala/mobvista/dmp/datasource/id_mapping/Constant.scala
+0
-3
IDMappingGraphx.scala
.../mobvista/dmp/datasource/id_mapping/IDMappingGraphx.scala
+2
-1
No files found.
azkaban/id_mapping/id_mapping.sh
View file @
c953965c
...
...
@@ -24,8 +24,8 @@ spark-submit --class mobvista.dmp.datasource.id_mapping.IDMappingGraphx \
--name
"IDMappingGraphx.
${
LOG_TIME
}
.
${
country
}
.
${
platform
}
"
\
--conf
spark.yarn.executor.memoryOverhead
=
2048
\
--conf
spark.network.timeout
=
720s
\
--conf
spark.sql.shuffle.partitions
=
5
000
\
--conf
spark.default.parallelism
=
5
000
\
--conf
spark.sql.shuffle.partitions
=
10
000
\
--conf
spark.default.parallelism
=
10
000
\
--conf
spark.executor.extraJavaOptions
=
"-XX:+UseG1GC"
\
--master
yarn
--deploy-mode
cluster
--executor-memory
12g
--driver-memory
8g
--executor-cores
5
--num-executors
100
\
../
${
JAR
}
-date
${
LOG_TIME
}
-country
${
country
}
-platform
${
platform
}
-output
${
OUTPUT_PATH
}
-coalesce
500
...
...
src/main/scala/mobvista/dmp/datasource/id_mapping/Constant.scala
View file @
c953965c
...
...
@@ -267,9 +267,6 @@ object Constant {
val
iosIDScoreMap
:
Map
[
String
,
Double
]
=
Map
(
"idfa"
->
1000
,
"sysid"
->
1
,
"xwho"
->
0.9
,
"user_id"
->
0.9
,
"bmosv_osv_upt"
->
0.9
,
"idfv_bundle"
->
0.8
,
"bmosv_upt"
->
0.7
,
"bmosv_ipua_bundle"
->
0.6
,
"bkupid"
->
0.3
)
val
androidCNIDScoreMap
:
Map
[
String
,
Double
]
=
Map
(
"imei"
->
1000
,
"oaid"
->
1000
,
"gaid"
->
1000
,
"sysid"
->
1
,
"xwho"
->
0.9
,
"user_id"
->
0.9
,
"android_pkg"
->
0.8
,
"bmosv_upt"
->
0.7
,
"bmosv_ipua_pkg"
->
0.6
,
"bkupid"
->
0.3
)
val
androidIDScoreMap
:
Map
[
String
,
Double
]
=
Map
(
"gaid"
->
1000
,
"imei"
->
1000
,
"oaid"
->
1000
,
"sysid"
->
1
,
"xwho"
->
0.9
,
"user_id"
->
0.9
,
"android_pkg"
->
0.8
,
"bmosv_upt"
->
0.7
,
"bmosv_ipua_pkg"
->
0.6
,
"bkupid"
->
0.3
)
...
...
src/main/scala/mobvista/dmp/datasource/id_mapping/IDMappingGraphx.scala
View file @
c953965c
...
...
@@ -42,12 +42,13 @@ class IDMappingGraphx extends CommonSparkJob with Serializable {
val
platform
=
commandLine
.
getOptionValue
(
"platform"
)
val
date
=
commandLine
.
getOptionValue
(
"date"
)
val
output
=
commandLine
.
getOptionValue
(
"output"
)
val
result_output
=
commandLine
.
getOptionValue
(
"result_output"
)
val
coalesce
=
Integer
.
parseInt
(
commandLine
.
getOptionValue
(
"coalesce"
))
val
spark
=
MobvistaConstant
.
createSparkSession
(
s
"IDMappingGraphx.$date.$country.$platform"
)
try
{
oldAndTodayIdMapping
(
country
,
platform
,
date
,
spark
,
output
,
output
,
coalesce
)
oldAndTodayIdMapping
(
country
,
platform
,
date
,
spark
,
output
,
result_
output
,
coalesce
)
}
finally
{
if
(
spark
!=
null
)
{
spark
.
stop
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment