|
@@ -5000,7 +5000,7 @@ class TablePremExtractor(object):
|
|
|
multi_same_package = False # 非连续的重复包号
|
|
|
package_fix2raw = dict() # 处理后包号:处理前包号 字典
|
|
|
link_set = set()
|
|
|
- not_package = True if re.search('(货物|商品|产品|通用|主要标的)(名称?|内容)', headers['project_name'][1]) and \
|
|
|
+ not_package = True if 'project_name' in headers and re.search('(货物|商品|产品|通用|主要标的)(名称?|内容)', headers['project_name'][1]) and \
|
|
|
'package_code' not in headers and 'budget' not in headers and "bid_amount" not in headers else False
|
|
|
for i in df.index:
|
|
|
same_package = False # 连续重复包号,一般是 rowspan 造成;一包 多个采购
|