|
@@ -0,0 +1,27 @@
|
|
|
+package com.winhc.bigdata.udf;
|
|
|
+
|
|
|
+import com.aliyun.odps.udf.UDF;
|
|
|
+import com.aliyun.odps.utils.StringUtils;
|
|
|
+
|
|
|
+import java.util.regex.Pattern;
|
|
|
+
|
|
|
+/**
|
|
|
+ * @Author: π
|
|
|
+ * @Description: 统一分割符
|
|
|
+ */
|
|
|
+public class StringReplaceChar extends UDF {
|
|
|
+ private static final Pattern pattern = Pattern.compile("[\\u4e00-\\u9fa50-9a-zA-Z]");
|
|
|
+
|
|
|
+ public String evaluate(String val) {
|
|
|
+ return StringUtils.isNotBlank(val) ? val.replaceAll("、",",")
|
|
|
+ .replaceAll(";",",")
|
|
|
+ .replaceAll(",",",")
|
|
|
+ .replaceAll(" ",",")
|
|
|
+ : "";
|
|
|
+ }
|
|
|
+
|
|
|
+ public static void main(String[] args) {
|
|
|
+ String res = new StringReplaceChar().evaluate("中国,人123;za 早上5");
|
|
|
+ System.out.println(res);
|
|
|
+ }
|
|
|
+}
|