Pārlūkot izejas kodu

修复前面有序号过滤错中标人

lsm 2 gadi atpakaļ
vecāks
revīzija
ca1da878cb
1 mainīts fails ar 2 papildinājumiem un 2 dzēšanām
  1. 2 2
      BiddingKG/dl/interface/predictor.py

+ 2 - 2
BiddingKG/dl/interface/predictor.py

@@ -683,7 +683,7 @@ class PREMPredict():
             text = text_list[i]
             if label in [0, 1, 2, 3, 4] and values[label] < 0.5: # 小于阈值的设为其他,让后面的规则召回重新判断
                 label = 5
-            elif label in [2,3,4] and re.search('序号:\d+,', text):
+            elif label in [2,3,4] and re.search('序号:\d+,\w{,2}候选', text):
                 label = 5
             elif label == 2:
                 if re.search('中标单位和.{,25}签订合同', text):
@@ -1350,7 +1350,7 @@ class RoleRulePredictor():
                                                     _weight = _group.split("_")[2] if len(_group.split("_"))==3 else ""
                                                     # _label = {"tenderee": 0, "agency": 1, "winTenderer": 2,
                                                     #           "secondTenderer": 3, "thirdTenderer": 4}.get(_role)
-                                                    if _i_span == 0 and _direct == "left" and re.search('各.{,5}供应商|尊敬的供应商|业绩|拟招|(交易|采购|招标)服务(单位|机构)|第[四五六七4567]|是否中标:否|序号:\d+',  #135463002 拟招一家供应商为宜宾市第三人民医院、李庄同济医院院区提供消防维保服务
+                                                    if _i_span == 0 and _direct == "left" and re.search('各.{,5}供应商|尊敬的供应商|业绩|拟招|(交易|采购|招标)服务(单位|机构)|第[四五六七4567]|是否中标:否|序号:\d+,\w{,2}候选',  #135463002 拟招一家供应商为宜宾市第三人民医院、李庄同济医院院区提供消防维保服务
                                                                                                         list_spans[0]) == None:  # 2021/12/22 修正错误中标召回 例子208668937
                                                         _flag = True
                                                         _label = {"tenderee": 0, "agency": 1, "winTenderer": 2,