import requests import re import simhash url = "https://www.qimao.com/shuku/a-a-a-a-a-a-a-click-1/" def get_hexxor(s1, _0x4e08d8): _0x5a5d3b = '' for i in range(len(s1)): if i % 2 != 0: continue _0x401af1 = int(s1[i: i+2], 16) _0x105f59 = int(_0x4e08d8[i: i+2], 16) _0x189e2c_10 = (_0x401af1 ^ _0x105f59) print("i==",_0x401af1,_0x105f59,_0x189e2c_10) print("i==",hex(_0x401af1),hex(_0x105f59),hex(_0x189e2c_10)) _0x189e2c = hex(_0x189e2c_10)[2:] print("_0x189e2c",_0x189e2c) if len(_0x189e2c) == 1: _0x189e2c = '0' + _0x189e2c print("_0x189e2c",_0x189e2c) _0x5a5d3b += _0x189e2c return _0x5a5d3b def get_unsbox(arg1): _0x4b082b = [0xf, 0x23, 0x1d, 0x18, 0x21, 0x10, 0x1, 0x26, 0xa, 0x9, 0x13, 0x1f, 0x28, 0x1b, 0x16, 0x17, 0x19, 0xd, 0x6, 0xb, 0x27, 0x12, 0x14, 0x8, 0xe, 0x15, 0x20, 0x1a, 0x2, 0x1e, 0x7, 0x4, 0x11, 0x5, 0x3, 0x1c, 0x22, 0x25, 0xc, 0x24] print(_0x4b082b) _0x4da0dc = [] _0x12605e = '' for i in _0x4b082b: print('i--',i,i-1) _0x4da0dc.append(arg1[i-1]) _0x12605e = "".join(_0x4da0dc) return _0x12605e # 第一次请求获取js代码 headers = {"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.105 Safari/537.36"} r = requests.get(url, headers=headers) # 重js中匹配出 arg1 arg1 = re.findall("arg1=\'(.*?)\'", r.text)[0] # 参数生成 s1 = get_unsbox(arg1) print("===",arg1,s1) _0x4e08d8 = "3000176000856006061501533003690027800375" _0x12605e = get_hexxor(s1, _0x4e08d8) print(s1, _0x12605e) # 二次请求携带cookie 获取html文件 headers = {"User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.105 Safari/537.36", "cookie": "acw_sc__v2=%s" % _0x12605e} r = requests.get(url, headers=headers) # print(r.text)