1. 程式人生 > 其它 > Python 爬蟲學習(一):requests + bs4 爬取圖片

Python 爬蟲學習(一):requests + bs4 爬取圖片

import re
import time
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup

# Site root; relative links found on the listing page are resolved against it.
BASE_URL = "http://www.bizhi360.com/"
# Listing page whose first <ul> holds the links to the per-image detail pages.
LIST_URL = BASE_URL + "meinv/"
# Seconds to wait for any single HTTP response before giving up.
REQUEST_TIMEOUT = 10
# Pause between detail pages so the site is not hammered with requests.
CRAWL_DELAY = 1

# Characters that are not allowed in file names on common file systems.
_UNSAFE_FILENAME_CHARS = re.compile(r'[\\/:*?"<>|\x00-\x1f]+')


def safe_filename(title: str, extension: str = ".jpg") -> str:
    """Return a file name derived from *title* that is safe to create on disk.

    Runs of path separators, reserved punctuation and control characters are
    replaced by a single underscore. A title that ends up empty becomes
    ``"untitled"`` so the result is never just the extension.
    """
    cleaned = _UNSAFE_FILENAME_CHARS.sub("_", str(title)).strip(" ._")
    return (cleaned or "untitled") + extension


def fetch_soup(page_url: str) -> "BeautifulSoup":
    """Download *page_url* and return it parsed with ``html.parser``.

    Raises:
        requests.RequestException: on connection errors, timeouts or a
            non-2xx HTTP status.
    """
    response = requests.get(page_url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    # The script decodes every page as UTF-8 instead of trusting the headers.
    response.encoding = "utf-8"
    return BeautifulSoup(response.text, "html.parser")


def download_wallpaper(detail_url: str) -> "str | None":
    """Save the image linked from one detail page into the working directory.

    The image URL is read from the ``a.download`` link inside ``div.content``
    and the file name is taken from the ``h1.title`` text.

    Returns:
        The name of the written file, or ``None`` when the page does not
        contain the expected download link or title.

    Raises:
        requests.RequestException: if the detail page or the image cannot be
            fetched.
    """
    detail_page = fetch_soup(detail_url)

    content = detail_page.find("div", class_="content")
    download_link = content.find("a", class_="download") if content else None
    heading = detail_page.find("h1", class_="title")
    if download_link is None or heading is None or not download_link.get("href"):
        return None

    title = heading.text.strip()
    print(title)

    # Attribute values are read straight off the tag with .get().
    img_url = urljoin(detail_url, download_link.get("href"))
    img_resp = requests.get(img_url, timeout=REQUEST_TIMEOUT)
    # Without this an HTML error page would be stored as a ".jpg".
    img_resp.raise_for_status()
    print(img_url)

    img_name = safe_filename(title)
    # Image data is bytes, so the file is opened in binary mode.
    with open(img_name, mode="wb") as f:
        f.write(img_resp.content)
    return img_name


def main() -> None:
    """Walk the listing page and download the image behind every link."""
    main_page = fetch_soup(LIST_URL)

    ul = main_page.find("ul")
    if ul is None:
        raise SystemExit(f"no <ul> found on {LIST_URL}")

    # href=True skips anchors without a target instead of requesting ".../None".
    for anchor in ul.find_all("a", href=True):
        # urljoin copes with both "/path" and "path" style links.
        url_detail = urljoin(BASE_URL, anchor.get("href"))
        try:
            if download_wallpaper(url_detail) is None:
                print(f"skipped {url_detail}: download link or title not found")
        except requests.RequestException as exc:
            # One broken page should not abort the whole crawl.
            print(f"skipped {url_detail}: {exc}")
        time.sleep(CRAWL_DELAY)


if __name__ == "__main__":
    main()