python爬蟲學習(一)requests+bs4爬取圖片
阿新 • • 發佈:2021-06-24
"""Download the wallpapers linked from a bizhi360.com category page.

The script fetches the listing page, follows every link found in the first
``<ul>`` element, locates the download link and the title on each detail page
and saves the image as ``<title>.jpg`` in the current working directory.
"""
import re
import sys
import time
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

BASE_URL = "http://www.bizhi360.com/"
LIST_URL = urljoin(BASE_URL, "meinv/")
# requests never times out unless told to; without this a stalled server
# would block the script indefinitely.
REQUEST_TIMEOUT = 10  # seconds
# Pause between detail pages so the site is not hammered.
DOWNLOAD_DELAY = 1  # seconds
# Path separators, characters rejected by common file systems, and control
# characters (including newlines that page titles may carry).
_UNSAFE_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]')


def safe_filename(title, default="image"):
    """Return *title* reduced to something usable as a single file name.

    Surrounding whitespace is dropped, unsafe characters are replaced with
    ``_`` and *default* is returned when nothing usable remains.
    """
    cleaned = _UNSAFE_FILENAME_CHARS.sub("_", str(title).strip()).strip(" .")
    return cleaned or default


def fetch_soup(session, page_url):
    """Fetch *page_url* and return it parsed with ``html.parser``.

    Raises:
        requests.RequestException: on connection errors, timeouts or a
            non-2xx HTTP status.
    """
    resp = session.get(page_url, timeout=REQUEST_TIMEOUT)
    resp.raise_for_status()
    resp.encoding = "utf-8"
    return BeautifulSoup(resp.text, "html.parser")


def download_image(session, detail_url):
    """Save the image offered on one detail page.

    Returns:
        True when an image was written, False when the page lacks the
        expected title or download link.

    Raises:
        requests.RequestException: when the page or the image cannot be
            fetched.
        OSError: when the image file cannot be written.
    """
    detail = fetch_soup(session, detail_url)
    content = detail.find("div", class_="content")
    link = content.find("a", class_="download") if content is not None else None
    heading = detail.find("h1", class_="title")
    # Attribute values are read directly with .get(); it yields None when the
    # attribute is absent.
    href = link.get("href") if link is not None else None
    if heading is None or not href:
        return False

    title = heading.text
    print(title)
    # Resolve against the detail page so relative download links work too.
    img_url = urljoin(detail_url, href)
    img_resp = session.get(img_url, timeout=REQUEST_TIMEOUT)
    # Do not store an HTML error page under an image name.
    img_resp.raise_for_status()
    print(img_url)

    img_name = safe_filename(title) + ".jpg"
    # Response.content is bytes, hence binary mode.
    with open(img_name, mode="wb") as f:
        f.write(img_resp.content)
    return True


def main():
    """Crawl the listing page and download every linked wallpaper."""
    with requests.Session() as session:
        listing = fetch_soup(session, LIST_URL)
        ul = listing.find("ul")
        if ul is None:
            print(f"no <ul> element found on {LIST_URL}", file=sys.stderr)
            return

        for anchor in ul.find_all("a"):
            href = anchor.get("href")
            if not href:
                continue
            # Joined against the site root, as the original concatenation
            # did, but without producing "//" or mangling absolute links.
            detail_url = urljoin(BASE_URL, href)
            try:
                if not download_image(session, detail_url):
                    print(f"skipped {detail_url}: no title or download link",
                          file=sys.stderr)
            except (requests.RequestException, OSError) as exc:
                # One broken page must not abort the remaining downloads.
                print(f"skipped {detail_url}: {exc}", file=sys.stderr)
            time.sleep(DOWNLOAD_DELAY)


if __name__ == "__main__":
    main()