|
@@ -6547,8 +6547,8 @@ class TablePremExtractor(object):
|
|
|
return flag,contain_header, header_dic, not_sure_winner
|
|
|
elif 'tenderer' in header_dic and (re.search('(中标|中选|中价|成交|竞得)(人|单位|供应商|公司|企业|厂家|商家?|客户|供?方|银行)',header_dic['tenderer'][1]) or all_winner): # 有中标人,且有明确中标关键词的进行提取
|
|
|
return flag, contain_header, header_dic, not_sure_winner
|
|
|
- elif 'tenderer' in header_dic and 'serviceTime' in header_dic:
|
|
|
- return flag, contain_header, header_dic
|
|
|
+ # elif 'tenderer' in header_dic and 'serviceTime' in header_dic:
|
|
|
+ # return flag, contain_header, header_dic, not_sure_winner
|
|
|
elif len(set(fix_td_list) & self.headerset) >= 2 or (len(set(fix_td_list)) == 2 and len(set(td_list) & self.headerset) >= 1): # 如果包含两个表头以上或 只有两列且包含一个表头
|
|
|
contain_header = True
|
|
|
return flag, contain_header, dict(), not_sure_winner
|