Python-微信小程序信息的爬取

本文轉載自：查看原文 | 2020-06-03 10:39 | 561 | Python

import csv
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup
from lxml import html
# Request headers carrying a desktop-browser User-Agent string.
Header = {
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 10.0; WOW64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/79.0.3928.4 Safari/537.36'
    ),
}
def getdata(url):
    """Fetch one article page and append its fields to the CSV file.

    The title (``h1.ph``), summary (``div.blockquote``) and publication time
    (``span.time``) are printed and then appended as one row to
    ``微信小程序.csv``. An element that is missing from the page is recorded
    as an empty string instead of raising ``AttributeError``; a page on which
    none of the three elements is found is skipped.

    Args:
        url: Absolute URL of the article page.

    Raises:
        requests.RequestException: If the request fails or times out.
    """
    # Send the same headers as parse_page and bound the wait so that a
    # stalled connection cannot hang the whole crawl.
    resp = requests.get(url, headers=Header, timeout=10)
    # Let requests guess the charset from the body, as parse_page does.
    resp.encoding = resp.apparent_encoding
    soup = BeautifulSoup(resp.text, "lxml")

    title = soup.find('h1', class_='ph')
    summary = soup.find('div', class_='blockquote')
    published = soup.find('span', class_='time')
    # find() returns None when nothing matches; fall back to "".
    row = [node.text if node is not None else "" for node in (title, summary, published)]

    if not any(row):
        print(f"skipped (no article fields found): {url}")
        return

    for value in row:
        print(value)

    # Append to the CSV file. An explicit encoding keeps the write from
    # depending on the platform locale; "utf-8-sig" puts a BOM at the start
    # of a new file so spreadsheet tools detect UTF-8.
    with open("微信小程序.csv", "a", newline="", encoding="utf-8-sig") as cf:
        csv.writer(cf).writerow(row)

def parse_page(url):
    """Crawl every article linked from one listing page.

    Downloads the listing page, selects the article anchors under the
    ``itemContainer`` element and calls ``getdata`` on each resolved link.

    Args:
        url: Absolute URL of the listing page.

    Raises:
        requests.RequestException: If the request fails or times out.
    """
    # Bound the wait so that a stalled connection cannot hang the crawl.
    resp = requests.get(url, headers=Header, timeout=10)
    resp.encoding = resp.apparent_encoding
    ht = html.fromstring(resp.text)
    informations = ht.xpath('//*[@id="itemContainer"]/div/div/h3/a')
    # Follow the hyperlinks found on this page.
    for inf in informations:
        href = inf.get('href')
        if not href:
            # An anchor without an href has nothing to follow.
            continue
        # urljoin resolves relative, root-relative and absolute hrefs
        # correctly, which plain string concatenation does not.
        url2 = urljoin("http://www.wxapp-union.com/", href)
        getdata(url2)
    # NOTE: this message is printed once per listing page.
    print('微信小程序全部爬取完成')
def began(first_page=1, last_page=107):
    """Crawl the listing pages from ``first_page`` to ``last_page`` inclusive.

    Args:
        first_page: Number of the first listing page to crawl.
        last_page: Number of the last listing page to crawl. The default of
            107 is the page count recorded when the script was written;
            pass a different value if the site's page count has changed.
    """
    url = "http://www.wxapp-union.com/portal.php?mod=list&catid=1&page={}"
    for i in range(first_page, last_page + 1):
        parse_page(url.format(i))
# Start the crawl only when this file is executed as a script.
if __name__ == "__main__":
    began()

免責聲明！

本站轉載的文章為個人學習借鑒使用，本站對版權不負任何法律責任。如果侵犯了您的隱私權益，請聯繫本站郵箱 yoyou2525@163.com 刪除。

猜您在找：
- scrapy爬取微信小程序社區教程（crawlspider）
- python實戰===爬取所有微信好友的信息
- Python-爬取某條微博下的圖片評論
- Python爬取微信好友
- 微信小程序爬坑日記
- 統計微信好友信息小程序
- 微信小程序之藍牙廣播信息
- 微信小程序信息展示
- 微信小程序 --- 獲取設備信息
- 微信小程序獲取個人信息