Эх сурвалжийг харах

修复数据遗漏的问题

luojiehua 1 жил өмнө
parent
commit
6dfcf98d40

+ 2 - 1
BaseDataMaintenance/maintenance/dataflow_mq.py

@@ -765,7 +765,8 @@ class Dataflow_ActivteMQ_extract(Dataflow_extract):
                     _soup = BeautifulSoup(_dochtmlcon,"lxml")
                     if len(_dochtmlcon)>200000:
                         _find = _soup.find("div",attrs={"class":"richTextFetch"})
-                        _find.decompose()
+                        if _find is not None:
+                            _find.decompose()
                     else:
                         _soup = article_limit(_soup,50000)
                     _dochtmlcon = str(_soup)