我的代碼
from bs4 import BeautifulSoup
import requests
import time
import urllib
# Listing URL prefix; get_more_pages appends the page number to it.
url = 'https://knewone.com/discover?page='
def get_page(url, data=None, folder_path='/Users/zhoujiangfeng/Pictures/jandan/'):
    """Download every cover image found on one listing page.

    Fetches ``url``, selects the ``a.cover-inner > img`` elements and saves
    the resource behind each element's ``src`` attribute into
    ``folder_path``. Prints ``done`` once the page has been processed.

    Args:
        url: Address of the page to scrape.
        data: Unused; kept so existing callers keep working.
        folder_path: Directory that receives the downloaded files. It is
            created when it does not exist yet.

    Raises:
        requests.HTTPError: If the page request returns an error status.
    """
    # Imported locally so the ``urllib.request`` submodule is guaranteed to
    # be loaded; a bare ``import urllib`` does not load it on its own.
    import os
    import urllib.request

    # A timeout keeps the crawl from hanging forever on a stalled connection.
    wb_data = requests.get(url, timeout=30)
    wb_data.raise_for_status()
    soup = BeautifulSoup(wb_data.text, 'lxml')

    # <img> tags without a src attribute yield None and cannot be downloaded.
    download_links = [
        src
        for src in (img.get('src') for img in soup.select('a.cover-inner > img'))
        if src
    ]

    os.makedirs(folder_path, exist_ok=True)
    # Guarantee a trailing separator so plain concatenation below stays
    # inside the target directory whatever the caller passed.
    target_dir = os.path.join(folder_path, '')

    for item in download_links:
        # The file name is a fixed-position slice taken from the end of the
        # link; links too short to produce a name are skipped.
        file_name = item[-21:-16]
        if not file_name:
            continue
        # Use urllib to download the image to local disk
        urllib.request.urlretrieve(item, target_dir + file_name)
    print('done')
def get_more_pages(start,end):
    """Scrape a run of consecutive listing pages.

    Calls ``get_page`` for every page number from ``start`` up to, but not
    including, ``end``, pausing two seconds after each page.
    """
    for page_suffix in map(str, range(start, end)):
        page_address = url + page_suffix
        get_page(page_address)
        # Pause between requests before moving on to the next page.
        time.sleep(2)
# Scrape listing pages 1 through 9 (the end argument is exclusive).
get_more_pages(1,10)
總結
- 注意圖片鏈接的信息,需以圖片格式后綴名保存(截取相應位數)
- 使用urllib庫的方法下載圖片到本地
最后編輯于 :
©著作權歸作者所有,轉載或內容合作請聯系作者