|
df.dropDuplicates("link").withColumn("cids",explode(split(col("cids"), ";")))
|
|
df.dropDuplicates("link").withColumn("cids",explode(split(col("cids"), ";")))
|
|
.select("id","cids","title","link","intro","abs","publish_time","purchaser","proxy","province","base","type","items","create_time","update_time","deleted")
|
|
.select("id","cids","title","link","intro","abs","publish_time","purchaser","proxy","province","base","type","items","create_time","update_time","deleted")
|