@@ -1,107 +0,0 @@
-package com.winhc.bigdata.spark.jobs.deadbeat
-import com.winhc.bigdata.spark.udf.{BaseFunc, CompanyMapping}
-import com.winhc.bigdata.spark.utils.BaseUtil.isWindows
-import com.winhc.bigdata.spark.utils.{BaseUtil, LoggingUtils, SparkUtils}
-import org.apache.spark.sql.SparkSession
-import scala.collection.mutable
-/**
- * @Description: Preprocessing of high-consumption-restriction data for the dishonest-debtor and judgment-debtor lookups
- * @author Yan Yongnian
- * @date 2020/10/13
- */
-object zxr_restrict {
- /**
-  * Job entry point: creates a Spark session configured with the project name
-  * and runs the zxr_restrict preprocessing once.
-  *
-  * @param args command-line arguments (not read by this job)
-  */
- def main(args: Array[String]): Unit = {
-   val project = "winhc_eci_dev"
-   println(
-     s"""
-        |project: $project
-        |""".stripMargin)
-   val config = mutable.Map(
-     "spark.hadoop.odps.project.name" -> project,
-     "spark.hadoop.odps.spark.local.partition.amt" -> "100"
-   )
-   val spark: SparkSession = SparkUtils.InitEnv(this.getClass.getSimpleName, config)
-   // Stop the session even when the job throws, so a failed run does not leave it open.
-   try zxr_restrict(spark, project).precalc()
-   finally spark.stop()
- }
-case class zxr_restrict(s: SparkSession, project: String
- ) extends LoggingUtils with CompanyMapping with BaseFunc {
- override protected val spark: SparkSession = s
- /**
-  * Writes the `tn='zxr_restrict'` partition of `ads_deadbeat_company` and the
-  * `tn='zxr_restrict_person'` partition of `ads_deadbeat_person`.
-  *
-  * Both queries keep rows with a non-empty `case_no` and retain one row per
-  * `rowkey`: the one with the greatest `update_time`.
-  *
-  * Side effects: registers functions via `prepareFunctions` / `case_no_trim_udf`,
-  * sets the Spark job description, and executes two INSERT statements.
-  */
- def precalc(): Unit = {
-   prepareFunctions(spark)
-   case_no_trim_udf()
-   // INSERT INTO when BaseUtil.isWindows is true, INSERT OVERWRITE otherwise.
-   // NOTE(review): presumably the Windows branch is for local development runs - confirm.
-   val insertMode = if (isWindows) "INTO" else "OVERWRITE"
-   // High-consumption restriction preprocessing (enterprises).
-   // The target partition is the value BaseUtil.getPartion returns for the incremental table.
-   val companyDs = BaseUtil.getPartion(s"$project.inc_ads_company_zxr_restrict", spark)
-   spark.sparkContext.setJobDescription(s"处理zxr_restrict($companyDs)")
-   // update_time must be projected by both branches of the union: the window's
-   // ORDER BY below cannot resolve a column the subquery does not output.
-   // NOTE(review): assumes both source tables have an update_time column - confirm.
-   sql(
-     s"""
-        |insert $insertMode table $project.ads_deadbeat_company partition(ds='$companyDs',tn='zxr_restrict')
-        |select
-        |    rowkey
-        |    ,cid
-        |    ,name
-        |    ,card_num
-        |    ,publish_date
-        |    ,deleted
-        |from (
-        |    select
-        |        rowkey
-        |        ,new_cid as cid
-        |        ,coalesce(company_name,company_info) as name
-        |        ,identity_num as card_num
-        |        ,case_create_time AS publish_date
-        |        ,case_no
-        |        ,court_name
-        |        ,deleted
-        |        ,row_number() over(partition by rowkey order by update_time desc) num
-        |    from (
-        |        select rowkey,new_cid,company_name,company_info,identity_num,case_create_time,case_no,court_name,deleted,update_time
-        |        from $project.ads_company_zxr_restrict
-        |        where length(case_no) > 0 and ds > '0'
-        |        union all
-        |        select rowkey,new_cid,company_name,company_info,identity_num,case_create_time,case_no,court_name,deleted,update_time
-        |        from $project.inc_ads_company_zxr_restrict
-        |        where length(case_no) > 0 and ds > '0'
-        |    )
-        |  )
-        |where num = 1
-        |""".stripMargin).show(10, false)
-   // High-consumption restriction preprocessing (individuals).
-   // Reads only the partition BaseUtil.getPartion returns for the cloze table and
-   // writes to the same ds value.
-   val personDs = BaseUtil.getPartion(s"$project.ads_company_zxr_restrict_person_cloze", spark)
-   spark.sparkContext.setJobDescription(s"处理zxr_restrict_person($personDs)")
-   // ds is quoted here to match the string partition literal used in the
-   // insert's partition spec, instead of comparing it as a bare number.
-   sql(
-     s"""
-        |insert $insertMode table $project.ads_deadbeat_person partition(ds='$personDs',tn='zxr_restrict_person')
-        |select
-        |    rowkey
-        |    ,cid
-        |    ,name
-        |    ,card_num
-        |    ,publish_date
-        |    ,deleted
-        |from (
-        |    select
-        |        rowkey
-        |        ,new_cid as cid
-        |        ,coalesce(company_name,company_info) as name
-        |        ,identity_num as card_num
-        |        ,case_create_time AS publish_date
-        |        ,case_no
-        |        ,court_name
-        |        ,deleted
-        |        ,row_number() over(partition by rowkey order by update_time desc) num
-        |    from $project.ads_company_zxr_restrict_person_cloze
-        |    where length(case_no) > 0 and ds='$personDs'
-        |  )
-        |where num = 1
-        |""".stripMargin).show(10, false)
- }