使用requests库爬取百度翻译

使用requests库爬取百度翻译

  1. 首先查看pc端百度翻译接口发现有内部有签名机制(http://fanyi.baidu.com/v2transapi)
    这里写图片描述
  2. 尝试切换到移动端看看结果
    这里写图片描述

根据移动端接口爬取接口数据

"""
url http://fanyi.baidu.com/v2transapi
请求方式 POST

"from":"en",
"to":"zh",
"query":"set",
"transtype":"realtime",
"simple_means_flag":"3",
"sign":"710765.932700",
"token":"3d4a5f2c17cd9be756c8f1612dd9136d",

# 内部有签名机制
# 办法: 1.尝试切换到移动端看看结果
"""
import requests
import json
from pprint import pprint


url = "http://fanyi.baidu.com/basetrans"

query = input("请输入翻译内容:")

data = {
    "query": query,
    "from": "en",
    "to": "zh"
}

headers = {
    "User-Agent":"Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) AppleWebKit/601.1.46 (KHTML, like Gecko) Version/9.0 Mobile/13B143 Safari/601.1",
    "Referer":"http://fanyi.baidu.com/?aldtype=16047",
    "X-Requested-With":"XMLHttpRequest",
    "Cookie":"BAIDUID=775A15033E10D619BB7FCF036B0788C4:FG=1; BIDUPSID=775A15033E10D619BB7FCF036B0788C4; PSTM=1530600959; FP_UID=c8da812881e10f57a2f4b43003b180ad; PSINO=1; H_PS_PSSID=1453_26259_21092_20927; BDORZ=B490B5EBF6F3CD402E515D22BCDA1598; locale=zh; REALTIME_TRANS_SWITCH=1; FANYI_WORD_SWITCH=1; HISTORY_SWITCH=1; SOUND_SPD_SWITCH=1; SOUND_PREFER_SWITCH=1; to_lang_often=%5B%7B%22value%22%3A%22en%22%2C%22text%22%3A%22%u82F1%u8BED%22%7D%2C%7B%22value%22%3A%22zh%22%2C%22text%22%3A%22%u4E2D%u6587%22%7D%5D; from_lang_often=%5B%7B%22value%22%3A%22zh%22%2C%22text%22%3A%22%u4E2D%u6587%22%7D%2C%7B%22value%22%3A%22en%22%2C%22text%22%3A%22%u82F1%u8BED%22%7D%5D; Hm_lvt_afd111fa62852d1f37001d1f980b6800=1530878230; Hm_lpvt_afd111fa62852d1f37001d1f980b6800=1530878230; Hm_lvt_64ecd82404c51e03dc91cb9e8c025574=1530877102,1530877124,1530878230; Hm_lpvt_64ecd82404c51e03dc91cb9e8c025574=1530878230"
}

# 区别 如果是get => params,post =>data
response = requests.post(url,data=data,headers=headers)

result = json.loads(response.text)
# print(result)
print("翻译结果:{}".format(result['trans'][0]['dst']))

猜你喜欢

转载自blog.csdn.net/qq_31603575/article/details/81006079