|
@@ -3,6 +3,7 @@ package com.winhc.bigdata.spark.jobs.chance
|
|
|
import com.winhc.bigdata.spark.config.EsConfig
|
|
|
import com.winhc.bigdata.spark.utils.BaseUtil.isWindows
|
|
|
import com.winhc.bigdata.spark.utils.{BaseUtil, LoggingUtils, SparkUtils}
|
|
|
+import org.apache.commons.lang3.StringUtils
|
|
|
import org.apache.spark.internal.Logging
|
|
|
import org.apache.spark.sql.functions.col
|
|
|
import org.apache.spark.sql.types.{MapType, StringType, StructField, StructType}
|
|
@@ -157,32 +158,57 @@ object ChangeExtract {
|
|
|
}
|
|
|
|
|
|
|
|
|
- // winhc_eci_dev company_tm rowkey 20200715 status_new
|
|
|
- // winhc_eci_dev company_patent_list rowkey 20200715 lprs
|
|
|
+ // winhc_eci_dev company_tm rowkey 20200717 status_new
|
|
|
+ // winhc_eci_dev company_patent_list rowkey 20200717 lprs
|
|
|
// winhc_eci_dev company_certificate rowkey 20200707 type
|
|
|
- // winhc_eci_dev company_copyright_works_list rowkey 20200715 type
|
|
|
- // winhc_eci_dev company_copyright_reg_list rowkey 20200715 version
|
|
|
+ // winhc_eci_dev company_copyright_works_list rowkey 20200717 type
|
|
|
+ // winhc_eci_dev company_copyright_reg_list rowkey 20200717 version
|
|
|
// winhc_eci_dev company_employment rowkey 20200630 source
|
|
|
|
|
|
- // winhc_eci_dev company_land_publicity rowkey 20200630 title,location,use_for
|
|
|
- // winhc_eci_dev company_land_announcement rowkey 20200715 e_number,project_name
|
|
|
+ // winhc_eci_dev company_land_publicity rowkey 20200717 title,location,use_for
|
|
|
+ // winhc_eci_dev company_land_announcement rowkey 20200717 e_number,project_name
|
|
|
|
|
|
+ // winhc_eci_dev company_bid_list rowkey 20200717 title
|
|
|
+ // winhc_eci_dev company_land_transfer rowkey 20200717 num,location
|
|
|
|
|
|
|
|
|
// winhc_eci_dev company cid 20200630 legal_entity_id,reg_location,business_scope,reg_status,reg_capital,emails,phones
|
|
|
def main(args: Array[String]): Unit = {
|
|
|
- val Array(project, tableName, rowkey, inc_ds, pf) = args
|
|
|
-
|
|
|
- val config = EsConfig.getEsConfigMap ++ mutable.Map(
|
|
|
- "spark.hadoop.odps.project.name" -> project,
|
|
|
- "spark.hadoop.odps.spark.local.partition.amt" -> "10"
|
|
|
- )
|
|
|
-
|
|
|
-
|
|
|
- val spark = SparkUtils.InitEnv("ChangeExtract", config)
|
|
|
-
|
|
|
- ChangeExtractHandle(spark, project, tableName, rowkey, inc_ds, pf.split(",")).calc
|
|
|
- spark.stop()
|
|
|
+ if (args.length == 5) {
|
|
|
+ val Array(project, tableName, rowkey, inc_ds, pf) = args
|
|
|
+ val config = EsConfig.getEsConfigMap ++ mutable.Map(
|
|
|
+ "spark.hadoop.odps.project.name" -> project,
|
|
|
+ "spark.hadoop.odps.spark.local.partition.amt" -> "10"
|
|
|
+ )
|
|
|
+ val spark = SparkUtils.InitEnv("ChangeExtract", config)
|
|
|
+
|
|
|
+
|
|
|
+ ChangeExtractHandle(spark, project, tableName, rowkey, inc_ds, pf.split(",")).calc
|
|
|
+ spark.stop()
|
|
|
+ } else {
|
|
|
+ val project = "winhc_eci_dev"
|
|
|
+ val config = EsConfig.getEsConfigMap ++ mutable.Map(
|
|
|
+ "spark.hadoop.odps.project.name" -> project,
|
|
|
+ "spark.hadoop.odps.spark.local.partition.amt" -> "10"
|
|
|
+ )
|
|
|
+ val spark = SparkUtils.InitEnv("ChangeExtract", config)
|
|
|
+ val rows =
|
|
|
+ """winhc_eci_dev company_tm rowkey 20200717 status_new
|
|
|
+ |winhc_eci_dev company_patent_list rowkey 20200717 lprs
|
|
|
+ |winhc_eci_dev company_copyright_works_list rowkey 20200717 type
|
|
|
+ |winhc_eci_dev company_copyright_reg_list rowkey 20200717 version
|
|
|
+ |winhc_eci_dev company_land_publicity rowkey 20200717 title,location,use_for
|
|
|
+ |winhc_eci_dev company_land_announcement rowkey 20200717 e_number,project_name
|
|
|
+ |winhc_eci_dev company_bid_list rowkey 20200717 title
|
|
|
+ |winhc_eci_dev company_land_transfer rowkey 20200717 num,location
|
|
|
+ |""".stripMargin
|
|
|
+ for (r <- rows.split("\\r?\\n")) { // accept LF and CRLF so the split does not depend on the line terminators inside the literal
|
|
|
+   if (StringUtils.isNotBlank(r)) { // skip empty and whitespace-only lines (e.g. the trailing margin line)
|
|
|
+     val Array(_, tableName, rowkey, inc_ds, pf) = r.trim.split("\\s+") // first column (project) is ignored; the `project` val above is used instead
|
|
|
+     ChangeExtractHandle(spark, project, tableName, rowkey, inc_ds, pf.split(",")).calc
|
|
|
+   }
|
|
|
+ }
|
|
|
+ spark.stop()
|
|
|
+ }
|
|
|
}
|
|
|
-
|
|
|
}
|