网址:fanyi.baidu.com
接口:https://fanyi.baidu.com/ait/text/translateIncognitoAi
参数:Acs-Token
请求分析
打开devtool,随便输入单词,发包找请求堆栈:
进去,下断点,再次发包,发现参数已经生成:
跟栈分析
顺着堆栈找,注意这是异步堆栈,代码有很多重复执行的地方,真正的逻辑是for-case,例如:
下断点:
再次发包,然后单步跟栈:
进去:
这样可以直接跳到调用函数:
跟过来:
进到run内:
发现有点类似虚拟机的分发机制:
插桩
直接进去看看
然后开始插桩,不过不会插太多,只插特殊的:
只插这样的,将运行结果赋值给了e.V
进去:
不插,再回来:
进去
插上,日志断点,就这样,有个3,4个就行了,一些重要特殊断点:
日志分析
然后放开断点让他执行,看日志,发现已经生成:
然后搜索(去掉两个时间戳前缀)
经过在线验证是aes-cbc加密:
但是发现明文中好像还有加密内容,例如d0,d78
对于d0
依然全局搜索:
答案已经很清晰了
对于d78
经验证,是sha1加密:
___false_0__0 好像是环境检测,固定就行了
源码
from curl_cffi import requests
import time, re, base64
from hashlib import sha1
from Crypto.Cipher import AES
from Crypto.Util.Padding import paddef aes_cbc_encrypt_str(plaintext: str, key_n: str | bytes, iv_n: str | bytes) -> str:if isinstance(key_n, str):key_n = key_n.encode('utf-8')if isinstance(iv_n, str):iv_n = iv_n.encode('utf-8')cipher = AES.new(key_n, AES.MODE_CBC, iv_n) # noqapadded_plaintext = pad(plaintext.encode('utf-8'), AES.block_size)ciphertext = cipher.encrypt(padded_plaintext)return base64.b64encode(ciphertext).decode('utf-8')def update_response_cookies(response1, need_upgrade_cookies: bool | dict = None):if need_upgrade_cookies is None:need_upgrade_cookies = {}cookies_str = str(response1.cookies)raw_cookies = re.compile(r'<Cookies\[(.*?)]>').findall(cookies_str)if raw_cookies:for raw in raw_cookies[0].split(','):temp = raw.strip().split(' ')[1].split('=')need_upgrade_cookies.update({temp[0]: temp[1]})return need_upgrade_cookieselse:return need_upgrade_cookiesclass BaiDuTranslate:def __init__(self):self.key_str = 'kwoigaeecyumqcya'self.iv_str = '1234567887654321'self.headers = {'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6','Cache-Control': 'no-cache','Connection': 'keep-alive','Content-Type': 'application/json','Origin': 'https://fanyi.baidu.com','Pragma': 'no-cache','Referer': 'https://fanyi.baidu.com/','Sec-Fetch-Dest': 'empty','Sec-Fetch-Mode': 'cors','Sec-Fetch-Site': 'same-origin','User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/147.0.0.0 Safari/537.36 Edg/147.0.0.0','accept': 'text/event-stream','sec-ch-ua': '"Microsoft Edge";v="147", "Not.A/Brand";v="8", "Chromium";v="147"','sec-ch-ua-mobile': '?0','sec-ch-ua-platform': '"Windows"',}self.get_cookies()def get_cookies(self):response = requests.get('https://www.baidu.com/', cookies={}, headers=self.headers)self.cookies = update_response_cookies(response)print(self.cookies)def to_base(self, num, base=32):self.none = Noneif num == 0:return '0'digits = '0123456789abcdefghijklmnopqrstuvwxyz' # 0-9, a-zresult = ''while num > 0:result = digits[num % base] + resultnum //= basereturn resultdef get_acs_token(self, client_time: int):base_str = self.to_base(client_time)salt_str_head = f'if2glnrf99c{base_str}'salt_str = f'{salt_str_head}___false_0__0'd78 = int(sha1(salt_str.encode()).hexdigest()[:4], 16)param_str = f'{{"d0":"{salt_str_head}","ua":"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/147.0.0.0 Safari/537.36 Edg/147.0.0.0","baiduid":"{self.cookies['BAIDUID']}","platform":"Win32","d23":1,"hfe":"","d1":"","d2":0,"d420":0,"clientTs":{client_time},"version":"1.4.0.3","extra":"","odkp":0,"hf":"","d78":{d78},"h0":false,"h1":0}}'acs_token = f'1777312805494_{client_time}_{aes_cbc_encrypt_str(param_str, self.key_str, self.iv_str)}' # 这里的前缀时间戳还有待考究return acs_tokendef translate(self, word: str, from_: str = 'en', to_: str = 'zh'): # 自行添加语言方向处理逻辑start_time = int(time.time() * 1000)end_time = start_time + 1cal_end_time = start_time + 3001acs_token = self.get_acs_token(cal_end_time)self.headers['Acs-Token'] = acs_tokenjson_data = {'needNewlineCombine': False,'disableCache': False,'isAi': False,'sseStartTime': start_time,'query': word,'from': from_,'to': to_,'reference': '','corpusIds': [],'needPhonetic': True,'domain': 'common','detectLang': '','isIncognitoAI': False,'milliTimestamp': end_time,}response = requests.post('https://fanyi.baidu.com/ait/text/translate', cookies=self.cookies, headers=self.headers, json=json_data)print(response.text) # 自行添加结果处理逻辑⚡ 完整逆向流程展示 · 仅供技术研究
