medical_product.py 931 B

1234567891011121314151617181920212223242526272829303132
  1. import re
  2. import sys,os
  3. import pandas as pd
  4. class MedicalProduct():
  5. def __init__(self):
  6. self.file_path = os.path.join(os.path.dirname(__file__),"医疗产品关键词.xlsx")
  7. df = pd.read_excel(self.file_path)
  8. self.list_medical_keyword = [str(a) for a in df["product_name"].tolist()]
  9. self.legal_keyword = []
  10. for _keyword in self.list_medical_keyword:
  11. try:
  12. if re.compile(_keyword):
  13. self.legal_keyword.append(_keyword)
  14. except:
  15. pass
  16. print("|".join(self.legal_keyword))
  17. self.medical_pattern = re.compile("|".join(self.legal_keyword))
  18. def is_medical_product(self,content):
  19. if self.medical_pattern.search(content):
  20. return True
  21. else:
  22. return False
  23. if __name__ == '__main__':
  24. MP = MedicalProduct()
  25. print(MP.is_medical_product("0.211ml离心管"))