|
@@ -1084,10 +1084,11 @@ class Dataflow_ActivteMQ_extract(Dataflow_extract):
|
|
attachment_len = len(_attachment.get_text()) if _attachment else 0 # 附件内容text长度
|
|
attachment_len = len(_attachment.get_text()) if _attachment else 0 # 附件内容text长度
|
|
main_text_len = all_len - attachment_len # 正文内容text长度
|
|
main_text_len = all_len - attachment_len # 正文内容text长度
|
|
|
|
|
|
- if attachment_len>150000: # 附件内容过长删除(处理超时)
|
|
|
|
- if _attachment is not None:
|
|
|
|
- _attachment.decompose()
|
|
|
|
- attachment_len = 0
|
|
|
|
|
|
+ # if attachment_len>150000: # 附件内容过长删除(处理超时)
|
|
|
|
+ # if _attachment is not None:
|
|
|
|
+ # _attachment.decompose()
|
|
|
|
+ # attachment_len = 0
|
|
|
|
+
|
|
# 正文或附件内容text长度大于limit_text_len才执行article_limit
|
|
# 正文或附件内容text长度大于limit_text_len才执行article_limit
|
|
if main_text_len>limit_text_len or attachment_len>limit_text_len:
|
|
if main_text_len>limit_text_len or attachment_len>limit_text_len:
|
|
_soup = article_limit(_soup,limit_text_len)
|
|
_soup = article_limit(_soup,limit_text_len)
|
|
@@ -1362,8 +1363,6 @@ class Dataflow_ActivteMQ_extract(Dataflow_extract):
|
|
if budget_unexpected or winprice_unexpected:
|
|
if budget_unexpected or winprice_unexpected:
|
|
return True,_reason
|
|
return True,_reason
|
|
|
|
|
|
-
|
|
|
|
-
|
|
|
|
return False,_reason
|
|
return False,_reason
|
|
|
|
|
|
|
|
|