-
http://www.pythonscraping.com/pages/warandpeace.html
- 提取以上網頁中所有的對話(顯示為紅色字體)
-
http://www.pythonscraping.com/pages/page3.html
- 提取以上網頁中禮物標題(title)和禮物花費(cost)
- 查詢禮物“Dead Parrot” 的花費(cost)
import requests
from bs4 import BeautifulSoup
# Pages scraped by this script.
url_1 = 'http://www.pythonscraping.com/pages/warandpeace.html'
url_2 = 'http://www.pythonscraping.com/pages/page3.html'

# A timeout keeps the script from hanging forever on an unresponsive server,
# and raise_for_status() stops an HTTP error page from being parsed as data.
r1 = requests.get(url_1, timeout=10)
r1.raise_for_status()
r2 = requests.get(url_2, timeout=10)
r2.raise_for_status()

soup1 = BeautifulSoup(r1.content, 'html.parser')
soup2 = BeautifulSoup(r2.content, 'html.parser')

# 1) Extract all dialogue on the first page (the text shown in red,
#    i.e. every <span class="red">).
redText = soup1.find_all("span", {"class": "red"})
for item in redText:
    print(item.text)

# 2) Extract each gift's title and cost from the second page.
items = soup2.find_all('tr', {"class": "gift"})

# Title: text of the first <td> in each gift row.
for item in items:
    print(item.td.text)

# Cost: text of the third <td> in each gift row. Selecting the direct <td>
# children (rather than indexing the raw child list) keeps the index stable
# even if whitespace text nodes appear between the cells.
for item in items:
    cells = item.find_all('td', recursive=False)
    print(cells[2].text)