@@ -214,7 +214,7 @@ case class deadbeat_info(s: SparkSession,
     spark.udf.register("get_birth_year", get_birth_year _)
     spark.udf.register("agg_label", new person_agg_label)
     spark.udf.register("get_empty_map", get_empty_map _)
-    is_id_card()
+    is_id_card_udf()
     id_card_trim_udf()
 
     def toTime(str: String): String = DateUtils.toMillisTimestamp(str, pattern = "yyyy-MM-dd HH:mm:ss")
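
The only change in this hunk is the rename from `is_id_card()` to `is_id_card_udf()`, matching the `_udf` suffix of `id_card_trim_udf()` on the next line; every call in this block registers a helper as a Spark SQL UDF on the shared session. The helper bodies are not part of this diff, so the sketch below is only an assumed shape (the `is_id_card`/`id_card_trim` UDF names and the validation regex are illustrative, not taken from the repository):

    // Assumed shape of the renamed helpers: each wraps a plain Scala
    // function as a Spark SQL UDF. UDF names and regex are illustrative.
    def is_id_card_udf(): Unit = {
      // 15-digit legacy or 18-digit Chinese ID number; last char may be X.
      spark.udf.register("is_id_card",
        (s: String) => s != null && s.matches("\\d{15}(\\d{2}[0-9Xx])?"))
    }

    def id_card_trim_udf(): Unit = {
      spark.udf.register("id_card_trim",
        (s: String) => if (s == null) null else s.trim.toUpperCase)
    }
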
@@ -229,10 +229,16 @@ case class deadbeat_info(s: SparkSession,
     mapTables("company_dishonest_info") = ("rowkey", "name", "card_num", "pub_date", "status")
     mapTables("company_zxr_final_case") = ("rowkey", "name", "identity_num", "case_create_time", "deleted")
     mapTables("company_zxr_restrict") = ("rowkey", "name", "identity_num", "case_create_time", "status")
-    mapTables.foreach(m => {
-      spark.sparkContext.setJobDescription(s"查老赖(个人)数据预处理:${m._1}")
-      deadbeat_info_pre(spark, project = project, table = m._1, rowkey = m._2._1, cid = null, name = m._2._2, card_num = m._2._3, publish_date = m._2._4, deleted = m._2._5).calc()
-    })
+    val ts = mapTables.map(m => {
+      val name = s"查老赖(个人)数据预处理:${m._1}"
+      val func = () => {
+        spark.sparkContext.setJobDescription(name)
+        deadbeat_info_pre(spark, project = project, table = m._1, rowkey = m._2._1, cid = null, name = m._2._2, card_num = m._2._3, publish_date = m._2._4, deleted = m._2._5).calc()
+        true
+      }
+      (name, func)
+    }).toSeq
+    AsyncExtract.startAndWait(spark, ts)
   }
 
   def person(): Unit = {
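
Both pre-processing hunks make the same move: the sequential `mapTables.foreach` becomes a `map` that builds named thunks of type `(String, () => Boolean)`, and `AsyncExtract.startAndWait` then runs the per-table jobs concurrently instead of back to back (the company hunk below additionally drops a stray `println(m)` debug line and threads a `cid` column through the tuples). `AsyncExtract` itself is defined elsewhere in the repository; a minimal sketch of the contract assumed here, one worker thread per task and a blocking wait for all of them, could look like:

    import java.util.concurrent.{CountDownLatch, Executors}
    import org.apache.spark.sql.SparkSession

    // Minimal sketch of the assumed AsyncExtract contract; the real
    // implementation lives elsewhere in this repo and may differ.
    // `spark` mirrors the call site in the diff, though this sketch
    // does not need it.
    object AsyncExtract {
      def startAndWait(spark: SparkSession, tasks: Seq[(String, () => Boolean)]): Unit = {
        val pool = Executors.newFixedThreadPool(math.max(1, tasks.size))
        val latch = new CountDownLatch(tasks.size)
        tasks.foreach { case (name, func) =>
          pool.execute(new Runnable {
            override def run(): Unit = {
              try {
                if (!func()) println(s"task returned false: $name")
              } catch {
                case e: Throwable => println(s"task failed: $name -> ${e.getMessage}")
              } finally latch.countDown()
            }
          })
        }
        latch.await() // block the caller until every table job has finished
        pool.shutdown()
      }
    }

Setting the job description inside each thunk rather than before it matters once the tasks run concurrently: `setJobDescription` writes a thread-local Spark property, so each worker thread labels its own jobs in the Spark UI without the tasks overwriting one another.
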
@@ -311,11 +317,16 @@ case class deadbeat_info(s: SparkSession,
     mapTables("company_dishonest_info") = ("rowkey", "cid", "name", "card_num", "pub_date", "status")
     mapTables("company_zxr_final_case") = ("rowkey", "cid", "name", "identity_num", "case_create_time", "deleted")
     mapTables("company_zxr_restrict") = ("rowkey", "cid", "name", "identity_num", "case_create_time", "status")
-    mapTables.foreach(m => {
-      println(m)
-      spark.sparkContext.setJobDescription(s"查老赖(企业)数据预处理:${m._1}")
-      deadbeat_info_pre(spark, project = project, table = m._1, rowkey = m._2._1, cid = m._2._2, name = m._2._3, card_num = m._2._4, publish_date = m._2._5, deleted = m._2._6).calc()
-    })
+    val ts = mapTables.map(m => {
+      val name = s"查老赖(企业)数据预处理:${m._1}"
+      val func = () => {
+        spark.sparkContext.setJobDescription(name)
+        deadbeat_info_pre(spark, project = project, table = m._1, rowkey = m._2._1, cid = m._2._2, name = m._2._3, card_num = m._2._4, publish_date = m._2._5, deleted = m._2._6).calc()
+        true
+      }
+      (name, func)
+    }).toSeq
+    AsyncExtract.startAndWait(spark, ts)
   }
 
   def company(): Unit = {