|
@@ -215,23 +215,31 @@ case class deadbeat_info(s: SparkSession,
|
|
|
sql(
|
|
|
s"""
|
|
|
|SELECT *
|
|
|
- |FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
- |WHERE ds > '$target_last_ds'
|
|
|
- |AND card_num IS NOT NULL
|
|
|
- |UNION ALL
|
|
|
- |SELECT t2.*
|
|
|
|FROM (
|
|
|
- | SELECT DISTINCT CONCAT(name,card_num) AS KEY
|
|
|
- | FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
- | WHERE ds > '$target_last_ds'
|
|
|
- | AND card_num IS NOT NULL
|
|
|
- | ) AS t1
|
|
|
- |JOIN (
|
|
|
| SELECT *
|
|
|
- | FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
- | WHERE ds <= '$target_last_ds'
|
|
|
- | ) AS t2
|
|
|
- |ON t1.KEY = CONCAT(t2.name,t2.card_num)
|
|
|
+ | ,ROW_NUMBER() OVER(PARTITION BY rowkey ORDER BY ds DESC ) AS num
|
|
|
+ | FROM (
|
|
|
+ | SELECT *
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
+ | WHERE ds > '$target_last_ds'
|
|
|
+ | AND card_num IS NOT NULL
|
|
|
+ | UNION ALL
|
|
|
+ | SELECT t2.*
|
|
|
+ | FROM (
|
|
|
+ | SELECT DISTINCT CONCAT(name,card_num) AS my_key
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
+ | WHERE ds > '$target_last_ds'
|
|
|
+ | AND card_num IS NOT NULL
|
|
|
+ | ) AS t1
|
|
|
+ | JOIN (
|
|
|
+ | SELECT *
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
+ | WHERE ds <= '$target_last_ds'
|
|
|
+ | ) AS t2
|
|
|
+ | ON t1.my_key = CONCAT(t2.name,t2.card_num)
|
|
|
+ | ) AS t3
|
|
|
+ | ) AS t4
|
|
|
+ |WHERE t4.num = 1
|
|
|
|""".stripMargin)
|
|
|
.createOrReplaceTempView("tmp_ads_deadbeat_person_all_tmp")
|
|
|
|
|
@@ -263,23 +271,8 @@ case class deadbeat_info(s: SparkSession,
|
|
|
| FROM tmp_ads_deadbeat_person_all_tmp
|
|
|
| GROUP BY name
|
|
|
| ,card_num
|
|
|
- |--- UNION ALL
|
|
|
- |--- SELECT md5(cleanup(CONCAT_WS('',rowkey,name))) AS id
|
|
|
- |--- ,name
|
|
|
- |--- ,card_num
|
|
|
- |--- ,NULL AS birth_year
|
|
|
- |--- ,NULL AS gender
|
|
|
- |--- ,NULL AS province
|
|
|
- |--- ,NULL AS city
|
|
|
- |--- ,NULL AS district
|
|
|
- |--- ,get_empty_map(rowkey,tn,deleted,publish_date) AS labels
|
|
|
- |--- FROM winhc_eci_dev.ads_deadbeat_person
|
|
|
- |--- WHERE ds > $target_last_ds
|
|
|
- |--- AND card_num IS NULL
|
|
|
| )
|
|
|
|""".stripMargin)
|
|
|
- // .show(10000)
|
|
|
-
|
|
|
}
|
|
|
|
|
|
|
|
@@ -315,22 +308,30 @@ case class deadbeat_info(s: SparkSession,
|
|
|
sql(
|
|
|
s"""
|
|
|
|SELECT *
|
|
|
- |FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
- |WHERE ds > '$target_last_ds'
|
|
|
- |UNION ALL
|
|
|
- |SELECT t2.*
|
|
|
|FROM (
|
|
|
- | SELECT DISTINCT cid
|
|
|
- | FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
- | WHERE ds > '$target_last_ds'
|
|
|
- | AND cid is not null
|
|
|
- | ) AS t1
|
|
|
- |JOIN (
|
|
|
| SELECT *
|
|
|
- | FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
- | WHERE ds <= '$target_last_ds'
|
|
|
- | ) AS t2
|
|
|
- |ON t1.cid = t2.cid
|
|
|
+ | ,ROW_NUMBER() OVER(PARTITION BY rowkey ORDER BY ds DESC ) AS num
|
|
|
+ | FROM (
|
|
|
+ | SELECT *
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
+ | WHERE ds > '$target_last_ds'
|
|
|
+ | UNION ALL
|
|
|
+ | SELECT t2.*
|
|
|
+ | FROM (
|
|
|
+ | SELECT DISTINCT cid
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
+ | WHERE ds > '$target_last_ds'
|
|
|
+ | AND cid IS NOT NULL
|
|
|
+ | ) AS t1
|
|
|
+ | JOIN (
|
|
|
+ | SELECT *
|
|
|
+ | FROM winhc_eci_dev.ads_deadbeat_company
|
|
|
+ | WHERE ds <= '$target_last_ds'
|
|
|
+ | ) AS t2
|
|
|
+ | ON t1.cid = t2.cid
|
|
|
+ | ) AS t3
|
|
|
+ | ) AS t4
|
|
|
+ |WHERE t4.num = 1
|
|
|
|""".stripMargin).createOrReplaceTempView("all_deadbeat_tmp_company_tmp")
|
|
|
|
|
|
sql(
|