Quellcode durchsuchen

kvtree识别优化

luojiehua vor 5 Monaten
Ursprung
Commit
cdc8a19e20
1 geänderte Datei mit 8 neuen und 1 gelöschten Zeile
  1. 8 1
      BiddingKG/dl/interface/html_2_kvtree.py

+ 8 - 1
BiddingKG/dl/interface/html_2_kvtree.py

@@ -297,6 +297,13 @@ def tree_reposition(tree,sentence_index=None):
             obj["wordOffset_end"] = wordOffset_end
             wordOffset_begin = wordOffset_end
 
+            list_kv = obj.get("kv",[])
+            for _d in list_kv:
+                _d["position"]["key_begin_sentence"] = sentence_index
+                _d["position"]["key_end_sentence"] = sentence_index
+                _d["position"]["value_begin_sentence"] = sentence_index
+                _d["position"]["value_end_sentence"] = sentence_index
+
         else:
             sentence_index += 1
             obj["sentence_index"] = sentence_index
@@ -1720,7 +1727,7 @@ if __name__ == '__main__':
     _pd = Html2KVTree(html_content)
     _pd.print_tree(_pd.tree,"-|")
 
-    list_kv = _pd.extract_kv("资格条件")
+    list_kv = _pd.extract_kv("资质要求")
     print(list_kv)
 
     #获取预处理后的所有句子,该句子与kv值对应