convert_test.py 3.0 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374
  1. import base64
  2. import json
  3. import os
  4. import sys
  5. import time
  6. from multiprocessing.context import Process
  7. sys.path.append(os.path.dirname(os.path.abspath(__file__)) + "/../")
  8. from format_convert.utils import get_platform, request_post, get_md5_from_bytes
  9. def test_one(p, from_remote=False):
  10. start_time = time.time()
  11. with open(p, "rb") as f:
  12. file_bytes = f.read()
  13. file_base64 = base64.b64encode(file_bytes)
  14. _md5 = get_md5_from_bytes(file_bytes)
  15. data = {"file": file_base64, "type": p.split(".")[-1], "filemd5": 100}
  16. if from_remote:
  17. # _url = 'http://121.46.18.113:15010/convert'
  18. _url = 'http://192.168.2.102:15010/convert'
  19. # _url = 'http://172.16.160.65:15010/convert'
  20. result = json.loads(request_post(_url, data, time_out=10000))
  21. else:
  22. print("only support remote!")
  23. print(_md5)
  24. print("result_text", result.get("result_text")[0][:20])
  25. print("is_success", result.get("is_success"))
  26. print(time.time()-start_time)
  27. def test_duplicate(path_list, process_no=None):
  28. start_time = time.time()
  29. for i in range(500):
  30. if i % 10 == 0:
  31. if process_no is not None:
  32. print("Process", process_no, i*len(path_list), time.time()-start_time)
  33. else:
  34. print("Loop", i*len(path_list), time.time()-start_time)
  35. for p in path_list:
  36. test_one(p, from_remote=True)
  37. if __name__ == '__main__':
  38. if get_platform() == "Windows":
  39. # file_path = "C:/Users/Administrator/Desktop/error7.jpg"
  40. # file_path = "D:/BIDI_DOC/比地_文档/2022/Test_Interface/20210609202634853485.xlsx"
  41. # file_path = "D:/BIDI_DOC/比地_文档/2022/Test_ODPS/1624325845476.pdf"
  42. file_path = "C:/Users/Administrator/Downloads/1652672734044.jpg"
  43. else:
  44. file_path = "test1.doc"
  45. test_one(file_path, from_remote=True)
  46. # if get_platform() == "Windows":
  47. # # file_path_list = ["D:/BIDI_DOC/比地_文档/2022/Test_Interface/1623328459080.doc",
  48. # # "D:/BIDI_DOC/比地_文档/2022/Test_Interface/94961e1987d1090e.xls",
  49. # # "D:/BIDI_DOC/比地_文档/2022/Test_Interface/11111111.rar"]
  50. # # file_path_list = ["D:/BIDI_DOC/比地_文档/2022/Test_Interface/1623328459080.doc",
  51. # # "D:/BIDI_DOC/比地_文档/2022/Test_Interface/94961e1987d1090e.xls"]
  52. # # file_path_list = ["D:/BIDI_DOC/比地_文档/2022/Test_Interface/1623423836610.pdf"]
  53. # file_path_list = ["C:/Users/Administrator/Downloads/广东中检达元检测技术有限公司.pdf",
  54. # "C:/Users/Administrator/Desktop/error11.pdf",
  55. # "C:/Users/Administrator/Desktop/error9.pdf",
  56. # "C:/Users/Administrator/Desktop/error16.jpg",
  57. # "C:/Users/Administrator/Desktop/error9.jpg",]
  58. # else:
  59. # file_path_list = ["1623423836610.pdf"]
  60. # for j in range(10):
  61. # p = Process(target=test_duplicate, args=(file_path_list, j, ))
  62. # p.start()
  63. # p.join()