# 方法一 (Method 1):
import requests
# 引用requests庫
from bs4 import BeautifulSoup
# 引用BeautifulSoup庫
# Fetch the Xiachufang "explore" page. The timeout keeps the script from
# hanging indefinitely on a stalled connection, and raise_for_status() stops
# an HTTP error page from being parsed as if it were the recipe listing.
res_foods = requests.get('http://www.xiachufang.com/explore/', timeout=10)
res_foods.raise_for_status()
# Parse the returned HTML with the built-in parser.
bs_foods = BeautifulSoup(res_foods.text, 'html.parser')
# Collect every <div class="info pure-u"> element; each one is treated as the
# smallest parent container holding the data of a single recipe.
list_foods = bs_foods.find_all('div', class_='info pure-u')
# Accumulates one [name, URL, ingredients] list per recipe.
list_all = []
for food in list_foods:
    # First <a> inside the container: its text is the dish name and its
    # href is the site-relative link to the recipe.
    tag_a = food.find('a')
    # <p class="ing ellipsis"> inside the container: its text is the
    # ingredient list.
    tag_p = food.find('p', class_='ing ellipsis')
    if tag_a is None or tag_p is None:
        # find() returns None when the tag is absent; skip containers that
        # do not have the expected layout instead of crashing.
        continue
    # strip() removes the surrounding newline/indent padding regardless of
    # its exact length (fixed slices such as [17:-13] break as soon as the
    # page template's whitespace changes).
    name = tag_a.text.strip()
    # Build the absolute URL from the site-relative href.
    URL = 'http://www.xiachufang.com' + tag_a['href']
    ingredients = tag_p.text.strip()
    # Bundle name, URL and ingredients into one record.
    list_all.append([name, URL, ingredients])
# Print every collected record, one per line.
for i in list_all:
    print(i)
# 方法二 (Method 2):
import requests
# Print every entry collected in list_all, one per line.
for i in list_all:
    print(i)