Browse Source

修复表格提取报错

lsm 2 years ago
parent
commit
3e260fbe4b
1 changed file with 1 addition and 1 deletion
  1. 1 1
      BiddingKG/dl/interface/predictor.py

+ 1 - 1
BiddingKG/dl/interface/predictor.py

@@ -5000,7 +5000,7 @@ class TablePremExtractor(object):
         multi_same_package = False # 非连续的重复包号
         package_fix2raw = dict()  # 处理后包号:处理前包号 字典
         link_set = set()
-        not_package = True if re.search('(货物|商品|产品|通用|主要标的)(名称?|内容)', headers['project_name'][1]) and \
+        not_package = True if 'project_name' in headers and re.search('(货物|商品|产品|通用|主要标的)(名称?|内容)', headers['project_name'][1]) and \
                           'package_code' not in headers and 'budget' not in headers and "bid_amount" not in headers else False
         for i in df.index:
             same_package = False  # 连续重复包号,一般是 rowspan 造成;一包 多个采购