cleanAgency.py 763 B

12345678910111213141516171819202122232425262728293031
  1. #coding:utf8
  2. import pandas as pd
  3. import re
  4. def clean():
  5. filename = "20230227都大于100.xlsx"
  6. df = pd.read_excel(filename)
  7. _count = 0
  8. df_data = {"name":[],
  9. "zbn":[],
  10. "dln":[],
  11. "sn":[]}
  12. for name,zbn,dln,sn in zip(df["nicknames"],df["zhao_biao_number"],df["dai_li_number"],df["same_number"]):
  13. if dln>10000 and re.search("招标|咨询",name) is not None:
  14. _count += 1
  15. print(_count,name,zbn,dln,sn)
  16. df_data["name"].append(name)
  17. df_data["zbn"].append(zbn)
  18. df_data["dln"].append(dln)
  19. df_data["sn"].append(sn)
  20. df = pd.DataFrame(df_data)
  21. df.to_excel("daili_check.xlsx")
  22. if __name__ == '__main__':
  23. clean()