89 Commits 9d95ae3a0c ... 8c3744eef3

Author SHA1 Message Date
  许家凯 8c3744eef3 fix: 添加case_no_party_title_parse函数 1 year ago
  许家凯 972c5b8de0 Merge remote-tracking branch 'origin/master' 1 year ago
  许家凯 6e45fb67b4 fix: 添加case_no_party_title_parse函数 1 year ago
  许家凯 75ae988edb feat: 添加case_no_party_title_parse函数 1 year ago
  许家凯 5550426367 feat: 添加cleanup_sort函数 1 year ago
  许家凯 cf4cd06300 feat: 添加注册资本按汇率转换函数 1 year ago
  JimZhang 5b3d07bd49 feat: 公司类型、省市区代码、变更类型清洗 2 years ago
  xufei 119cbf1c29 add udf 2 years ago
  许家凯 e390fa82cc docs: 2 years ago
  许家凯 7c15c6a028 Merge remote-tracking branch 'origin/master' 2 years ago
  许家凯 2354463036 fix: 添加统一信用代码,工商注册号校验函数 2 years ago
  许家凯 ebc1ecdeeb feat: 添加统一信用代码,工商注册号校验函数 2 years ago
  xufei f4016e0cce add udf 2 years ago
  xufei 2d30ff5d0a add udf 2 years ago
  xufei 364fc6df6c add udf 2 years ago
  JimZhang a9de3e6a6a feat: 公司类型返回array 2 years ago
  JimZhang 52311ec3b6 Merge branch 'master' of http://139.224.213.4:3000/bigdata/UDF_Max 2 years ago
  JimZhang 3b8347bd94 feat: 公司类型 2 years ago
  JimZhang 00f940474a feat: 公司类型识别 2 years ago
  JimZhang 4c01e8d9bd Merge branch 'master' of http://139.224.213.4:3000/bigdata/UDF_Max 2 years ago
  JimZhang d87d02bc49 feat: add udf 2 years ago
  JimZhang 720123c4b6 feat: cleanup change info udf 2 years ago
  xufei 08f52b6a9d add udf 2 years ago
  xufei b4cd164df8 add udf 2 years ago
  许家凯 c81a31d40e feat: v7_tyc_company_compare 2 years ago
  许家凯 eeca233cb7 feat: amount_format 2 years ago
  xufei 76d51eab44 add udf 2 years ago
  xufei f2ca305b0b add udf 2 years ago
  xufei 272d573d49 add udf 3 years ago
  xufei 655b09a801 Merge remote-tracking branch 'origin/master' 3 years ago
  xufei 4276faf725 add udf 3 years ago
  xufei ba60a5b796 update 3 years ago
  许家凯 3eb88739dc feat: 添加查找繁体转简体异常问题 3 years ago
  xufei f903f5eb12 注册资本规整 3 years ago
  xufei f063ac3cb2 add udf 3 years ago
  许家凯 65a281eab1 feat: 添加注册资本格式化函数 3 years ago
  xufei 656cd385bb add udf 3 years ago
  xufei a54ecebc03 是否结案判断 3 years ago
  xufei 1fcd8ec891 udf add 3 years ago
  xufei d142c1d774 日期规整 3 years ago
  xufei 70bb4c7967 法人提取 3 years ago
  xufei 7c47868b84 注册资本修复 3 years ago
  xufei c614fad9d8 行业code转name 3 years ago
  许家凯 c0cf3f6dbf feat: add 3 years ago
  许家凯 6bc8605b24 feat: add 3 years ago
  xufei bc7128e507 兼容数值 3 years ago
  xufei 31a105193b url提取 3 years ago
  许家凯 cc0de7ac9b feat: add CompanyZxrRestrictPublishDate 3 years ago
  许家凯 8e92101c86 feat: add FieldsCompare 3 years ago
  xufei d681f21879 更新逻辑 3 years ago
  JimZhang dab2dd7c3e fix: 薪资转换优化特殊情况 3 years ago
  JimZhang d4475bdb2b feat: 薪资转换兼容更多情况 3 years ago
  JimZhang 4fc26d560d feat: 薪资转换 3 years ago
  xufei 081e319f2b 更新逻辑 3 years ago
  xufei d6df72c4c6 Merge remote-tracking branch 'origin/master' 3 years ago
  xufei 83d95e3210 更新逻辑 3 years ago
  xufei 7e542efc63 update 3 years ago
  xufei 5974bba2dc Merge remote-tracking branch 'origin/master' 3 years ago
  xufei d8e9b2799b 更新文书 3 years ago
  xufei f00fd9a773 add func 3 years ago
  xufei b749bbfc09 合并json 3 years ago
  许家凯 4f24d0b327 feat: add 3 years ago
  xufei ea9654db66 更新 3 years ago
  xufei 1f67fb532c 更新 3 years ago
  xufei db7b58a751 更新 3 years ago
  许家凯 f6138cb853 Merge remote-tracking branch 'origin/master' 3 years ago
  许家凯 94e3ab49c2 feat: add 3 years ago
  许家凯 6ba65c3092 feat: pom依赖排除其它包 3 years ago
  许家凯 123e64224a Merge remote-tracking branch 'origin/master' 3 years ago
  许家凯 b3fbe53244 feat: 添加依赖 3 years ago
  晏永年 2239c08589 concat_ws2 4 years ago
  xufei 8ea80cdd2b 添加函数 4 years ago
  许家凯 4b0345cb6e Merge remote-tracking branch 'origin/master' 4 years ago
  许家凯 bf41832bfd feat: 添加一系列函数 4 years ago
  许家凯 862942c7af Merge remote-tracking branch 'origin/master' 4 years ago
  许家凯 4a4fc0569c feat: 添加全角转半角函数 4 years ago
  xufei 1e3ffa72a7 udf更新 4 years ago
  xufei 36615f166c udf更新 4 years ago
  许家凯 d248596eec feat: 添加行业code函数 4 years ago
  许家凯 47a0709bab feat: 添加人名处理函数 4 years ago
  许家凯 8574333003 feat: 添加concat_cleanup函数 4 years ago
  许家凯 8bb16b840c feat: 添加身份证号提取、注册资本提取 4 years ago
  许家凯 83e6eb3f2e feat: 案号规整函数中文括号转英文 4 years ago
  许家凯 b64de49f0c Merge remote-tracking branch 'origin/master' 4 years ago
  许家凯 a87244ee81 feat: 添加案号规整函数 4 years ago
  许家凯 2b0136259b Merge branch 'master' of http://139.224.213.4:3000/bigdata/UDF_Max 4 years ago
  许家凯 329b2abbdc add company_split 4 years ago
  许家凯 b441632a77 添加币种提取udf 4 years ago
  许家凯 fab820d3ce init 4 years ago

+ 16 - 4
src/main/java/com/winhc/bigdata/udf/justice/CaseNoPartyTitleParseUtil.java

@@ -20,15 +20,21 @@ import java.util.*;
 /**
  * @Author: XuJiakai
  * 2023/10/25 9:49
- *
+ * <p>
  * 依据案号生成展示当事人字段
- *
+ * <p>
  * case_no_party_title_parse
  */
 public class CaseNoPartyTitleParseUtil extends UDF {
     private Map<String, Set<CaseNoTitleEntity>> caseNoMap = null;
     private List<String> caseNoSet = null;
 
+    private static Set<String> DEFAULT_CASE_NO_KEYWORD = new HashSet<String>() {{
+        add("民再");
+        add("刑再");
+        add("行再");
+    }};
+
     @Override
     public void setup(ExecutionContext ctx) throws UDFException, IOException {
         Entity<List<String>, Map<String, Set<CaseNoTitleEntity>>> caseNoKeyword = CaseNoPropertiesUtils.getCaseNoKeyword();
@@ -44,11 +50,17 @@ public class CaseNoPartyTitleParseUtil extends UDF {
             return null;
         }
         String caseNoKeyword = getCaseNoKeyword(case_no);
-        if (caseNoKeyword == null) {
+        if (caseNoKeyword == null || DEFAULT_CASE_NO_KEYWORD.contains(caseNoKeyword)) {
             return getPartyTitleDefault(plaintiff_info, defendant_info);
         }
+
+
         Set<CaseNoTitleEntity> caseNoTitleEntities = caseNoMap.get(caseNoKeyword);
 
+        if (caseNoTitleEntities == null) {
+            return getPartyTitleDefault(plaintiff_info, defendant_info);
+        }
+
         Iterator<CaseNoTitleEntity> it = caseNoTitleEntities.iterator();
         CaseNoTitleEntity caseNoTitleEntity = it.hasNext() ? it.next() : null;
 
@@ -129,7 +141,7 @@ public class CaseNoPartyTitleParseUtil extends UDF {
     public static void main(String[] args) throws UDFException, IOException {
         CaseNoPartyTitleParseUtil caseNoPartyTitleParseUtil = new CaseNoPartyTitleParseUtil();
         caseNoPartyTitleParseUtil.setup(null);
-        String evaluate = caseNoPartyTitleParseUtil.evaluate("(2022)鲁0214执保303号", "[{\"name\":\"杨云\",\"litigant_id\":\"\"}]", "[{\"name\":\"李久倩\",\"litigant_id\":\"pb95466c950ea6164f3ce90c234d365a5\"},{\"name\":\"陈全英\",\"litigant_id\":\"p05b849d9da746669f0414d1dd07ad9c4\"},{\"name\":\"江秀波\",\"litigant_id\":\"\"},{\"name\":\"青岛智力高通信息科技有限公司\",\"litigant_id\":\"66b0b993e2ce10f35b63b44c7d3f70f7\"}]");
+        String evaluate = caseNoPartyTitleParseUtil.evaluate("{2021)渝0103民初16256号", "[{\"name\": \"冯忠袁\", \"litigant_id\": \"\"}]", "[]");
         System.out.println(evaluate);
     }
 

+ 2 - 2
src/main/java/com/winhc/bigdata/utils/BaseUtils.java

@@ -1,6 +1,7 @@
 package com.winhc.bigdata.utils;
 
 import cn.hutool.core.io.file.FileReader;
+import cn.hutool.core.io.resource.ResourceUtil;
 import com.alibaba.fastjson.JSONObject;
 import com.alibaba.fastjson.serializer.SerializerFeature;
 
@@ -11,8 +12,7 @@ import com.alibaba.fastjson.serializer.SerializerFeature;
 public class BaseUtils {
 
     public static String readeResourceFile(String pathFromSourceRoot) {
-        FileReader fileReader = new FileReader(pathFromSourceRoot);
-        return fileReader.readString();
+        return ResourceUtil.readUtf8Str(pathFromSourceRoot);
     }
 
     public static String toString(Object o) {

+ 6 - 3
src/main/java/com/winhc/bigdata/utils/CaseNoPropertiesUtils.java

@@ -31,7 +31,7 @@ public class CaseNoPropertiesUtils {
             JSONObject item = ((JSONObject) o);
             recursion(item, null, caseNoMap, caseNoSet);
         }
-        List<String> collect = caseNoSet.stream().sorted(Comparator.comparingInt(String::length).reversed()).collect(Collectors.toList());
+        List<String> collect = caseNoSet.stream().filter(Objects::nonNull).sorted(Comparator.comparingInt(String::length).reversed()).collect(Collectors.toList());
         return Entity.of(collect, caseNoMap);
     }
 
@@ -41,7 +41,11 @@ public class CaseNoPropertiesUtils {
         if (item.containsKey("party_title")) {
             thisPartyTitle = item.getObject("party_title", CaseNoTitleEntity.class);
         }
-        if (item.containsKey("sub_case_type")) {
+        if (item.containsKey("case_no_keyword")) {
+            String caseNoKeyword = item.getString("case_no_keyword");
+            caseNoSet.add(caseNoKeyword);
+        }
+        if (item.containsKey("sub_case_type")&&!item.getJSONArray("sub_case_type").isEmpty()) {
             JSONArray sub_case_type = item.getJSONArray("sub_case_type");
             for (Object o : sub_case_type) {
                 recursion(((JSONObject) o), thisPartyTitle, caseNoMap, caseNoSet);
@@ -49,7 +53,6 @@ public class CaseNoPropertiesUtils {
         } else {
             if (item.containsKey("case_no_keyword")) {
                 String caseNoKeyword = item.getString("case_no_keyword");
-                caseNoSet.add(caseNoKeyword);
                 if (thisPartyTitle != null) {
                     if (caseNoMap.containsKey(caseNoKeyword)) {
                         Set<CaseNoTitleEntity> caseNoTitleEntities = caseNoMap.get(caseNoKeyword);