From 19ae7d93a0163c65cf572aba16e7b735e7d54762 Mon Sep 17 00:00:00 2001
From: WangJinfeng <wjf20110627@163.com>
Date: Fri, 24 Sep 2021 14:55:22 +0800
Subject: [PATCH] fix craw package tag bug

---
 src/main/scala/mobvista/dmp/datasource/apptag/CrawPkgsSpark.scala | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/src/main/scala/mobvista/dmp/datasource/apptag/CrawPkgsSpark.scala b/src/main/scala/mobvista/dmp/datasource/apptag/CrawPkgsSpark.scala
index 9a26cde..cd987b9 100644
--- a/src/main/scala/mobvista/dmp/datasource/apptag/CrawPkgsSpark.scala
+++ b/src/main/scala/mobvista/dmp/datasource/apptag/CrawPkgsSpark.scala
@@ -32,6 +32,7 @@ class CrawPkgsSpark extends CommonSparkJob with Serializable {
     val pkginstallpath = commandLine.getOptionValue("pkginstallpath")
     val coalesce = commandLine.getOptionValue("coalesce")
     val yesday = commandLine.getOptionValue("yesday")
+    val update_date = MobvistaConstant.sdf1.format(MobvistaConstant.sdf2.parse(yesday))
 
     val spark = SparkSession.builder()
       .appName("CrawPkgsSpark")
@@ -75,7 +76,8 @@ class CrawPkgsSpark extends CommonSparkJob with Serializable {
            |SELECT b.package_name, getPlatform(b.package_name) platform
            |  FROM
            |    (SELECT package_name, COUNT(1) counts
-           |      FROM dwh.dmp_install_list LATERAL VIEW explode(getPkgs(install_list)) dmp_table AS package_name WHERE dt = '$yesday' AND business = '14days'
+           |      FROM dwh.dmp_install_list LATERAL VIEW explode(getPkgs(install_list)) dmp_table AS package_name WHERE dt = '$yesday'
+           |      AND update_date = '$update_date' AND business = '14days'
            |      GROUP BY package_name
            |    ) b
            |    LEFT JOIN
--
libgit2 0.27.1