运行以下代码时得到了 HTTP 400 错误,我不明白为什么无法打开这个 URL:
from bs4 import BeautifulSoup
import requests
import lxml
import pandas as pd
import re
search_url = f'https://www.booking.com/reviewlist.en-gb.html?aid=304142&label=gen173nr-1DCAsoAkIbY2VudHJvLXlhcy1pc2xhbmQtYWJ1LWRoYWJpSDNYBGhsiAEBmAEJuAEGyAEM2AED6AEBiAIBqAIDuAKEwOrxBcACAQ&sid=61a721d17d76bc82ccf82c3c3d92de7c&cc1=ae&dist=1&pagename=centro-yas-island-abu-dhabi&srpvid=fee14d92dc160043&type=total&rows=10&offset=0'
page = requests.get(search_url)
print(page)
if page.status_code == requests.codes.ok:
    soup = BeautifulSoup(page.text, 'lxml')
    # get_property_attributes(soup)
else:
    print('open error')
输出:<Response [400]>
请给我一些解决这个问题的建议。
发布于 2020-02-05 14:29:58
尝试在请求中添加headers参数:
from bs4 import BeautifulSoup
import requests
import lxml
import pandas as pd
import re
# Review-list URL for one property; the query string is copied verbatim from the question.
search_url = 'https://www.booking.com/reviewlist.en-gb.html?aid=304142&label=gen173nr-1DCAsoAkIbY2VudHJvLXlhcy1pc2xhbmQtYWJ1LWRoYWJpSDNYBGhsiAEBmAEJuAEGyAEM2AED6AEBiAIBqAIDuAKEwOrxBcACAQ&sid=61a721d17d76bc82ccf82c3c3d92de7c&cc1=ae&dist=1&pagename=centro-yas-island-abu-dhabi&srpvid=fee14d92dc160043&type=total&rows=10&offset=0'
# Send a browser-like User-Agent: the same request without this header came back as 400.
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.130 Safari/537.36'}
# An explicit timeout keeps the script from blocking forever on a stalled connection.
page = requests.get(search_url, headers=headers, timeout=10)
print(page)
if page.status_code == requests.codes.ok:
    # Parse the returned HTML with the lxml parser backend.
    soup = BeautifulSoup(page.text, 'lxml')
    # get_property_attributes(soup)
else:
    print('open error')
# Output:
<Response [200]>
https://stackoverflow.com/questions/60077904
复制相似问题