import time

import requests
from bs4 import BeautifulSoup

#url = 'http://www.tr
def get_attractions(url, data=None):
    """Fetch one listing page and print a record for each attraction on it.

    The page is downloaded with ``requests`` and parsed with BeautifulSoup's
    ``lxml`` parser. Three CSS selections (title links, 160px-wide images,
    category links) are paired up positionally into one dict per attraction.

    Args:
        url: Address of the page to download.
        data: Unused; kept in the signature so existing callers that pass it
            continue to work.

    Returns:
        A list of the dicts that were printed, each with the keys
        ``'title'``, ``'img'`` and ``'cate'``.

    Raises:
        requests.exceptions.RequestException: If the download fails or does
            not respond within the timeout.
    """
    # Without a timeout, requests waits indefinitely on an unresponsive server.
    wb_data = requests.get(url, timeout=30)
    time.sleep(4)  # fixed delay after each request to throttle the scraper
    soup = BeautifulSoup(wb_data.text, 'lxml')

    # NOTE(review): the original selector read 'div.PRoperty_title'. The stray
    # capitals look like a paste artifact, and class selectors are
    # case-sensitive, so it is spelled in lowercase here -- confirm against
    # the live page markup.
    titles = soup.select('div.property_title > a[target="_blank"]')
    imgs = soup.select('img[width="160"]')
    cates = soup.select('div.p13n_reasoning_v2 > a')

    # zip() stops at the shortest of the three lists, so surplus matches in
    # the longer lists are dropped silently.
    attractions = []
    for title, img, cate in zip(titles, imgs, cates):
        # Use a fresh local name rather than rebinding the `data` parameter.
        record = {
            'title': title.get_text(),
            'img': img.get('src'),
            'cate': list(cate.stripped_strings),
        }
        print(record)
        attractions.append(record)
    return attractions
# Scrape each listing page in turn.
# NOTE(review): `urls` is not defined in the visible part of this file --
# confirm it is assigned before this loop runs.
for page_url in urls:
    get_attractions(page_url)
新手學習Python,了解網頁元素,難點:元素定位
新聞熱點
疑難解答