company_court_open_announcement.py 5.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159
  1. # -*- coding: utf-8 -*-
  2. # @Time : 2023/7/20 16:27
  3. # @Author : XuJiakai
  4. # @File : company_court_open_announcement
  5. # @Software: PyCharm
  6. import os
  7. from data_clean.api.hbase_api import bulk_get
  8. from data_clean.api.mongo_api import insert_one
  9. from data_clean.dim_handle_registry import get_dim_handle
  10. from data_clean.env.const import mongo_table_prefix
  11. from data_clean.exception.ruler_validation_exception import RulerValidationException
  12. from data_clean.utils.base_utils import *
  13. from data_clean.utils.case_utils import case_no_year_datetime
  14. from data_clean.utils.date_utils import str_2_date_time, get_update_time, establish_state_time
  15. from data_clean.utils.party_name_verify_utils import person_name_list_verify
  16. from data_clean.utils.str_utils import json_str_2_list
  17. from data_clean.utils.case_utils import get_case_party
# Must be named `dim_handle`.
# The handle is obtained by passing this module's own file name to get_dim_handle().
dim_handle = get_dim_handle(os.path.basename(__file__))
  20. # @dim_handle.registry_prefix_func
  21. async def prefix_func(dim_data: list):
  22. print("前置程序:", dim_data)
  23. raise ValueError("前置程序错误")
  24. pass
  25. @dim_handle.registry_postfix_func()
  26. async def post_func(dim_data: list):
  27. # print("后置程序:", dim_data)
  28. for r in dim_data:
  29. r['update_time'] = get_update_time()
  30. pass
  31. pass
  32. @dim_handle.registry_row_func
  33. async def party_intersect(row_data: dict) -> dict:
  34. # 判断当事人有交叉
  35. plaintiff_info = json_str_2_list(row_data['plaintiff_info'], "name")
  36. defendant_info = json_str_2_list(row_data['defendant_info'], "name")
  37. inter = list(set(plaintiff_info).intersection(set(defendant_info)))
  38. if len(inter) == 0:
  39. return row_data
  40. else:
  41. raise RulerValidationException("ccoa_001", "当事人有交叉:%s" % inter)
  42. pass
  43. async def _get_max_establish_date(company_ids: list):
  44. company_ids = [i for i in company_ids if i]
  45. res = await bulk_get('ng_rt_company', company_ids)
  46. res = [str_2_date_time(i['ESTIBLISH_TIME']) for i in res if 'ESTIBLISH_TIME' in i and i['ESTIBLISH_TIME']]
  47. if not res:
  48. return None
  49. return max(res)
  50. pass
  51. # 开庭时间相关过滤
  52. @dim_handle.registry_row_func
  53. async def open_ann_date(row_data: dict) -> dict:
  54. import datetime
  55. now = datetime.datetime.now()
  56. delta = datetime.timedelta(days=730) # 两年后
  57. max_date = now + delta
  58. start_date = get_or_none(row_data, 'start_date')
  59. case_no = get_or_none(row_data, 'case_no')
  60. if case_no is None and start_date is None:
  61. raise RulerValidationException("ccoa_007", "案号和开庭时间均为空")
  62. if start_date is None:
  63. return row_data
  64. try:
  65. this_date = str_2_date_time(row_data['start_date'])
  66. if this_date < establish_state_time:
  67. raise RulerValidationException("ccoa_002", "开庭时间早于建国时间:%s" % row_data['start_date'])
  68. if this_date > max_date:
  69. raise RulerValidationException("ccoa_006", "开庭时间在两年后:%s" % row_data['start_date'])
  70. part_keyno = json_str_2_list(row_data['plaintiff_info'], 'litigant_id') + json_str_2_list(
  71. row_data['defendant_info'], 'litigant_id')
  72. part_keyno = [i for i in part_keyno if i and len(i) == 32]
  73. max_establish_date = await _get_max_establish_date(part_keyno)
  74. if max_establish_date and this_date < max_establish_date:
  75. raise RulerValidationException("ccoa_004", "开庭时有公司未成立,最晚一个公司成立日期:%s,开庭时间:%s" % (
  76. max_establish_date, row_data['start_date']))
  77. case_no_year_dt = case_no_year_datetime(case_no)
  78. if case_no_year_dt and this_date < case_no_year_dt:
  79. raise RulerValidationException("ccoa_005", "案号大于开庭时间年份,案号:%s,开庭时间:%s" % (
  80. case_no, row_data['start_date']))
  81. except RulerValidationException as ex:
  82. if case_no is None:
  83. raise ex
  84. await insert_one(mongo_table_prefix + 'info_cooa_start_date_set_none', {
  85. "content": {
  86. "data": {
  87. "company_court_open_announcement": [row_data]
  88. },
  89. }
  90. })
  91. row_data['start_date'] = None
  92. pass
  93. return row_data
  94. pass
  95. @dim_handle.registry_row_func
  96. async def party_unknown(row_data: dict) -> dict:
  97. # 过滤当事人名字异常,Z某某、xxx
  98. plaintiff_info = json_str_2_list(row_data['plaintiff_info'], "name")
  99. defendant_info = json_str_2_list(row_data['defendant_info'], "name")
  100. li = plaintiff_info + defendant_info
  101. flag, error_name = person_name_list_verify(li)
  102. if not flag:
  103. result = await get_case_party(row_data['case_no'], source='open_court')
  104. if result:
  105. row_data['plaintiff_info'] = result['plaintiff_info']
  106. row_data['defendant_info'] = result['defendant_info']
  107. row_data['litigant_info'] = result['litigant_info']
  108. row_data['plaintiff'] = result['plaintiff']
  109. row_data['defendant'] = result['defendant']
  110. row_data['litigant'] = result['litigant']
  111. pass
  112. else:
  113. raise RulerValidationException("ccoa_003", "人名不符合规范:%s" % error_name)
  114. pass
  115. return row_data
  116. async def test():
  117. res = await _get_max_establish_date(
  118. ['bc702f0f5202342a9c1c75fbf9be9aff', 'b79d862faef595f33b166562bb3c18b6', '24cb269450f9262051dfcaa3dc389844'])
  119. print(res)
  120. pass
  121. if __name__ == '__main__':
  122. import asyncio
  123. asyncio.run(test())
  124. pass