这是我的代码,它总是返回 503
帮我检查一下请求头(headers),这样就不会被亚马逊屏蔽了
# Pool of browser User-Agent strings; one entry is picked at random when the
# header set below is built (currently a single Chrome 120 / macOS string).
# NOTE(review): the conditions of use quoted alongside this snippet prohibit
# robots and data-extraction tools -- confirm automated access is permitted.
user_agents = [
    (
        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/120.0.0.0 Safari/537.36"
    ),
]

# Request headers sent with every call. The User-Agent is chosen once, at
# module import time, so all requests in one run share the same value.
headers = {
    "User-Agent": random.choice(user_agents),
    "authority": "www.amazon.com",
    "accept": (
        "text/html,application/xhtml+xml,application/xml;q=0.9,"
        "image/avif,image/webp,image/apng,*/*;q=0.8,"
        "application/signed-exchange;v=b3;q=0.7"
    ),
    "accept-language": "en-US,en;q=0.9,vi;q=0.8",
    "cache-control": "max-age=0",
    # Client-hint style headers (device / network / viewport).
    "sec-ch-device-memory": "8",
    "downlink": "1.3",
    "dpr": "2",
    "ect": "3g",
    "rtt": "250",
    "sec-ch-dpr": "2",
    "sec-ch-ua": '"Chromium";v="120", "Google Chrome";v="120", "Not=A?Brand";v="99"',
    "sec-ch-ua-mobile": "?0",
    "sec-ch-ua-platform": '"macOS"',
    "sec-ch-viewport-width": "1680",
    # Fetch-metadata headers.
    "sec-fetch-dest": "document",
    "sec-fetch-mode": "navigate",
    "sec-fetch-site": "same-origin",
    "sec-fetch-user": "?1",
    "upgrade-insecure-requests": "1",
    "viewport-width": "1680",
}
def send_request(url, headers, *, retries=25, timeout=10.0, backoff=1.0):
    """Send a GET request to *url*, retrying on failure.

    Cookies are loaded once via ``load_cookies_from_file()`` and reused for
    every attempt. An attempt counts as failed when ``requests`` raises a
    ``RequestException`` -- this includes the ``HTTPError`` produced by
    ``raise_for_status()`` for 4xx/5xx responses such as 503.

    Args:
        url: Address to fetch.
        headers: Mapping of HTTP headers to send with each attempt.
        retries: Maximum number of attempts (default 25, as before).
        timeout: Seconds to wait for the server per attempt. Without a
            timeout ``requests`` may block indefinitely on a stalled
            connection.
        backoff: Base delay in seconds between attempts. The delay doubles
            after each failure and is capped at 30 seconds, so a server
            that is already refusing requests is not hit in a tight loop.

    Returns:
        The successful ``requests.Response``, or ``None`` when every attempt
        failed.
    """
    # Local import: the file's import block is not part of this snippet.
    import time

    max_delay = 30.0
    cookies = load_cookies_from_file()
    for attempt in range(retries):
        try:
            response = requests.get(
                url, headers=headers, cookies=cookies, timeout=timeout
            )
            response.raise_for_status()
        except requests.RequestException as e:
            print(f"error {e}. sending new request..")
        else:
            return response
        # Pause before the next attempt; no point sleeping after the last one.
        if attempt + 1 < retries:
            time.sleep(min(backoff * 2 ** attempt, max_delay))
    return None
Amazon.com 的使用许可不允许使用机器人访问其服务:
本许可不包括任何亚马逊服务或其内容的转售或商业使用;任何产品列表、描述或价格的收集和使用;对任何亚马逊服务或其内容的任何衍生使用;为了任何第三方的利益而下载、复制或以其他方式使用帐户信息;或任何数据挖掘、机器人或类似数据收集和提取工具的使用。