|
@@ -754,8 +754,8 @@ class Dataflow_ActivteMQ_extract(Dataflow_extract):
|
|
|
|
|
|
html_len = len(_dochtmlcon)
|
|
|
if html_len>200000:
|
|
|
- if int(item.get("docid"))==325618927:
|
|
|
- save(item,"325618927.pk")
|
|
|
+ if int(item.get("docid"))==329546490:
|
|
|
+ save(item,"329546490.pk")
|
|
|
log("docid %s dochtmlcon too long len %d "%(str(item.get("docid")),html_len))
|
|
|
try:
|
|
|
_dochtmlcon = re.sub("<html>|</html>|<body>|</body>", "", _dochtmlcon)
|