按關鍵字搜索並爬取微信公眾號文章


#!/usr/bin/python3
# -*- coding:utf-8 -*-

import re
import json
import time
import requests
from bs4 import BeautifulSoup
from urllib.request import quote


"""
from urllib.request import quote
url = 'http://www.example.com/api.php?text=中文在这里'

# 不帶附加參數
print('>>> %s' % quote(url))
>>> http%3A//www.example.com/api.php%3Ftext%3D%E4%B8%AD%E6%96%87%E5%9C%A8%E8%BF%99%E9%87%8C

# 附帶不轉換字符參數
print('>>> %s' % quote(url, safe='/:?='))
>>> http://www.example.com/api.php?text=%E4%B8%AD%E6%96%87%E5%9C%A8%E8%BF%99%E9%87%8C
"""

"""
https://httpbin.org/ip
"""


class WeixinSpider():
    """Search Sogou's WeChat index for a keyword and list the found articles.

    The crawl has two stages: the Sogou result page yields links to account
    profile pages, and each profile page embeds a ``msgList`` JSON object
    describing that account's recent articles.
    """

    # Byte markers of the "enter captcha" page. The Traditional spelling is
    # the one this file originally checked for.
    # NOTE(review): the live pages are presumably served in Simplified
    # Chinese, so that spelling is checked too - confirm on a real page.
    CAPTCHA_MARKERS = ('輸入驗證碼'.encode('utf-8'), '输入验证码'.encode('utf-8'))

    # Captures the JSON object assigned to ``msgList`` in a profile page.
    MSG_LIST_PATTERN = re.compile(r'var msgList = (.*?}}]})', re.S)

    def __init__(self,key):
        """Store the search keyword and the fixed crawl settings.

        :param key: keyword to search for.
        """
        self.key = key
        self.sougou_search_url = "http://weixin.sogou.com/weixin?type=1&query={}&ie=utf8&s_from=input&page={}&_sug_=n&_sug_type_="
        # Header that imitates a desktop browser.
        self.headers = {'User-Agent':'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36'}
        # Proxy pool endpoint: its response body is used as the proxy address.
        self.proxy_url = 'http://10.0.0.9:8000'

    def get_proxy(self):
        """Ask the proxy pool for an address and build a ``requests`` proxies dict.

        :return: dict with ``http`` and ``https`` entries for the proxy.
        :raises requests.RequestException: if the pool cannot be reached
            within the timeout.
        """
        # strip(): stray whitespace or a trailing newline in the reply would
        # otherwise end up inside the proxy URL.
        text = requests.get(self.proxy_url, timeout=3).text.strip()
        proxy = {
            'http':'http://{}'.format(text),
            # NOTE(review): recent requests/urllib3 releases may treat an
            # ``https://`` proxy URL as "speak TLS to the proxy" - confirm
            # that the pool really hands out HTTPS-capable proxies.
            'https':'https://{}'.format(text)
        }
        print('當前代理IP是:http://{}'.format(text))
        return proxy

    def _next_proxy(self):
        """Return a fresh proxies dict, or None when the pool is unreachable."""
        try:
            return self.get_proxy()
        except requests.RequestException as e:
            print('異常:{}'.format(str(e)))
            # Fall back to a direct connection, like the very first attempt.
            return None

    def get_search_response(self,url,proxy=None,total=3):
        """Download ``url``, switching to a new proxy after every failure.

        An attempt fails when the request raises or when the body looks like
        a captcha page.

        :param url: address to fetch.
        :param proxy: proxies dict for the first attempt (None = direct).
        :param total: maximum number of attempts.
        :return: raw response bytes, or None when every attempt failed.
        """
        attempts_left = total
        while attempts_left > 0:
            attempts_left -= 1
            try:
                content = requests.get(url,headers=self.headers,proxies=proxy,timeout=3).content
            except requests.RequestException as e:
                print('異常:{}'.format(str(e)))
                print('代理異常,重試...')
            else:
                # Compare bytes so an undecodable body cannot raise here.
                if not any(marker in content for marker in self.CAPTCHA_MARKERS):
                    return content
            # Only fetch another proxy if there is an attempt left to use it.
            if attempts_left > 0:
                proxy = self._next_proxy()
        return None

    def get_wx_hkmovie(self,sougou_response):
        """Extract the account profile links from a Sogou result page.

        :param sougou_response: raw page bytes, or None.
        :return: list of ``href`` values; empty when nothing usable is found.
        """
        if not sougou_response:
            return []
        soup = BeautifulSoup(sougou_response.decode('utf-8', errors='replace'),'lxml')
        links = []
        for box in soup.find_all('div',class_='txt-box'):
            title = box.find('p',class_='tit')
            anchor = title.find('a') if title is not None else None
            # Skip result boxes that lack the expected title link.
            if anchor is not None and anchor.get('href'):
                links.append(anchor['href'])
        return links

    def get_wx_article(self,response):
        """Parse the ``msgList`` JSON object embedded in a profile page.

        :param response: raw page bytes, or None.
        :return: the decoded dict, or ``{}`` when the page is missing, has no
            ``msgList`` assignment, or the captured text is not valid JSON.
        """
        if not response:
            return {}
        match = self.MSG_LIST_PATTERN.search(response.decode('utf-8', errors='replace'))
        if match is None:
            return {}
        try:
            parsed = json.loads(match.group(1))
        except ValueError:
            return {}
        return parsed if isinstance(parsed, dict) else {}

    def time_format(self,timestamp):
        """Format a Unix timestamp as ``YYYY-mm-dd HH:MM:SS`` in local time."""
        return time.strftime("%Y-%m-%d %H:%M:%S",time.localtime(timestamp))

    def parse_article(self,response):
        """Print one line per article and return the articles as dicts.

        Entries without ``app_msg_ext_info`` are skipped because they carry
        none of the article fields read here.

        :param response: dict as returned by :meth:`get_wx_article`.
        :return: list of dicts with ``author``, ``title``, ``datetime``
            (formatted, or None) and ``url`` (absolute, or None).
        """
        prefix = "https://mp.weixin.qq.com"
        articles = []
        for article in (response or {}).get('list') or []:
            ext_info = article.get('app_msg_ext_info')
            if not ext_info:
                continue
            comm_info = article.get('comm_msg_info') or {}
            article_author = ext_info.get('author')
            article_url = ext_info.get('content_url')
            article_title = ext_info.get('title')
            article_addtime = comm_info.get('datetime')
            print("作者:{},標題:{},時間:{},鏈接:{}".format(article_author,article_title,article_addtime,article_url))
            full_url = article_url
            if article_url and article_url.startswith('/'):
                full_url = prefix + article_url
            articles.append({
                'author': article_author,
                'title': article_title,
                # time.localtime(None) would silently mean "now", so keep None.
                'datetime': None if article_addtime is None else self.time_format(article_addtime),
                'url': full_url,
            })
        return articles

    def main(self, page=10):
        """Run the crawl: search, open every account found, print its articles.

        :param page: Sogou result page number to request.
        """
        # Percent-encode the keyword so characters such as '&' or '#' cannot
        # break the query string.
        search_url = self.sougou_search_url.format(quote(self.key, safe=''), page)
        content = self.get_search_response(search_url)
        if content is None:
            print('搜索頁獲取失敗(重試用盡或出現驗證碼)')
            return
        for url in self.get_wx_hkmovie(content):
            print(url)
            html = self.get_search_response(url)
            article_dict = self.get_wx_article(html)
            if not article_dict:
                print('未能解析文章列表(可能出現驗證碼),跳過:{}'.format(url))
                continue
            self.parse_article(article_dict)
if __name__ == '__main__':
    # Read the search keyword from the prompt, then run the crawl with it.
    keyword = input('>>> ')
    WeixinSpider(keyword).main()

  

 

 1 D:\soft\work\python35\python.exe D:/soft/work/work/20170925/sougou.py
 2 >>> python
 3 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=IstVuOsMvC9JxSgNijn*x0hCsKSj9gxcQUZMYTSLsJ3DmCdT1iL*xhnLEy8kMUsDjAPhuZ1FOmLYm0tB-cUIPQ==
 4 作者:陳章,標題:2017年9月6日,時間:1504691232,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4c0t9dSZy-x7--ObsKVye0p4xpKHPQc5Rmu9Y6BKiGRPq4xK72Rrm-F1uQWc*nQN-iwUn4QC93JQyAYeDvvYka0=
 5 作者:陳章,標題:2017年9月5日,時間:1504602088,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4UzdgZNoGvCUZEA-mb9rhHB3SVBTF0wXcdeKnAqHDvS36jN0ZwHyiQNml-OHtr63Yyg6eJM*Zy9uCtBWUmG74nk=
 6 作者:陳章,標題:2017年9月4日,時間:1504518038,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4f9bHpSovDnfkNgXYqbRiEgyHgP7bqDJy3wK8At*i9FvaNUmiRiMYRQzSLUqefyak-j1dc6Ds3rOI5LSw73A5dE=
 7 作者:陳章,標題:2017年8月28日技術日記,時間:1503978338,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4bdAel5vdI1YrLxks1Gy4I2SH61DPdV11BucznpftjztJwNs3ayroyisMmPAg3zic5Z-MnRD9PyOtxuDgPFNSNg=
 8 作者:陳章,標題:2017年8月26日,時間:1503755794,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4eY0iFeJudhV5TXqM0IRKyKNuCfpNtrvxojLcqmwPAeHpc3fNrR9rLlXizeNsQc8N7rbP4ZDxur5SlIxpCkxsQs=
 9 作者:陳章,標題:2017年8月13日,時間:1502617504,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4fZrEzQRRP*oLpMdmGaumkAxOuwOJlddlONwv63YQ-HIG5q3CojJOKoCxyXoAkknPk65GZfyTygnKuc8YoYRlUE=
10 作者:CheungChan,標題:selenium調用chromedriver禁用flash時遇到的深坑,時間:1500627064,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4UjEBWliLF9GsgOv59rAWexEQjU2jJNXDFUJ6rWDF8nXxkinRHg0Sun8ujpdSvk*3qq*lbyu6JF3-v14fY3xxco=
11 作者:CheungChan,標題:python項目簡單實現自定義配置覆蓋默認配置,時間:1500448400,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4ezoLAjpY8xq9mXBTbuSJ-gMlCJUD5LqqzAEqJI6KerR8pcn3S9VVYVjH-wuNhqBDYOHFFKvnNOTD1hUJtvIvYo=
12 作者:ChuengChan,標題:配置vim為pythonIDE小結,時間:1492775424,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4YsXsdEBiCcX2wa5VhFHn9Q1Qrv33qzRuIrHr1qXW-UJ8JAz4s3SFveedBlI6I1KdHofhqkw5KxMZ922aErbVZ4=
13 作者:CheungChan,標題:django框架orm層api簡單總結,時間:1484032960,鏈接:/s?timestamp=1508164694&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PLMzzNSuVV3Q6b5Nw6Bo7IjXNSyDo1XVgJk8v8r09UQm6Uu667lTnMKEbeQAJa5k4TNDFYDGyFOOB*SZdRl4DDLseGEEqm1K4a8lDkoaBrARYyxccQurYHD8ks3Lt*7aPuONMMQbE*9Wjl2mwP0BOB8=
14 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=DGakM4MrDnvd01JM6ApX3Yv*jmKeiIhex*DYA5PVyAcknJYfetZdWu4uD7bKW4Jg3NmhsTMxk3yu4hURxVP9UA==
15 作者:檸檬,標題:Python 運算符,時間:1479204290,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CkKjbQpKLD9LrI7Zs3hl90UuQo77q5EPfuRKcPtcpT6vn9PfzIsman4DhSHvSPa6HSDNVxZ7ct1vYV-bgxiQJEI=
16 作者:檸檬,標題:Python 變量類型,時間:1479115697,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3Cmg9ce6bARZs-nWzuhz5EujlCnZxQ3hDMFcnsNtMgZUUOUWTDVA83CZRsqUkyIxOqkjiLb4sbwseLOoIkPy-2j8=
17 作者:檸檬,標題:Python 環境搭建,時間:1478769596,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CkWwl3doZOH1*7N0fAlrlQjh1ACsDT1dxQU5f5T-FBbzpZG7Z6SMyMx5pdIWQNAQluTmxLspgWLK4K3Zcw6Pkw0=
18 作者:檸檬,標題:Python 簡介,時間:1478687814,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CvKG5Dmbi8u0AaNe7tiK544KRYVnEbh4Jk6tTKfBpkVD*ikrK7eXBFH*PzhX7K3MPjYweYNOZtZfmnEn3arfOks=
19 作者:,標題:MySQL NULL 值處理,時間:1472011203,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3Cruu1pv-zT3jYImOcFJ30TyPuzQRcinWOZln6ow6UsPGRUyNQnNrS45LeelGmwy*8o8wvG4hweTnyqxD7iiXN6Q=
20 作者:,標題:Mysql 連接的使用,時間:1471930374,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CkC9bfF7-9OYosjOt-*q-7Ddb7umB8cPzFqi1ZOQoi6iW9wEqNIeIM1Q6htJVQZSp*ibkwbDgm57NnUKIzvKeSg=
21 作者:,標題:MySQL LIKE 語句,時間:1471829721,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CkvBo5gNgAP8glRJnkFyMoCgNjnDacndoVYwpNspE4XUgAIRIeA1XvgJRzIm5YTh8EpKlSs3JVhALDaua1vQGhg=
22 作者:,標題:MySQL DELETE 語句,時間:1471492609,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3Cn5RdI-eO450bpGe3AS61y5xIaiQ5DR3dSYLIX2nUNzb*vdyABRmvm9ljNjxUU1nOx4MNjfSpMKiz3eE5MowxhQ=
23 作者:,標題:MySQL UPDATE 語句,時間:1471416786,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CnxL*5wvdLCQNdbop-csF-jUx6RGBbxqaLZPjrTt8aj0xn*THQBfo2bv75XO5Fnl6JLKAFS2p-fexRRhM8DC2Fs=
24 作者:,標題:MySQL where 子句,時間:1471321727,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMicQqaMwtoB3yG1IgRxJIq2S9*xCw9eG5kVERmL-3jc3CvugD5bCSl54FX2F4jr*bxAkHntPTJ6Qlpq9CYfR1LRlu954d2eCkcd8Qkv*iucuCkEfEA6tOGS6yAzbAm8LDHc=
25 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=lAKlFlXYoTKA9eFAhmlPH4RWSEJYea9WxpFAzwgjUByqf1jijpjdCsILg8NWliN*w8NYPTX*kx-hBd5gFEZ2wg==
26 作者:小成老師,標題:搞事情,猜猜小成老師最近要發什么大招?,時間:1492007521,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyTy8SUxNynpwaC-SYeiYgG7-A69KDbNXliPTARb5BIZ3JqtNruMpdZoakPfNeBXRuMQ2XHiJ2abXGGSUrA7Kmen0=
27 作者:,標題:每一個中國人,都應該讀一下《論持久戰》(深度),時間:1491645931,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT9xnPAwDLTiv9dYovIue3caKvzUGZHn6EZdZnLyDGfV4F9CkwNauojMIShwM5cDQYdCVAQGLDds3*aGSCeqItdY=
28 作者:,標題:最可怕的不是失業,而是你沒有考慮過失業!,時間:1487684264,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT1OhJ90nh6iPbTK59arcaMepvVgc8tmElih1aiEVA1iSLJONWE-4m3qJMRBgu2tCSBV4i4KRYk-3s7QH4uupHJ0=
29 作者:sunedu,標題:別再上“一萬小時定律”的當了,科學家說它很不靠譜,時間:1487474925,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT2ZTaamVZCyq4yS7lGKYD9gDXTwM*dPLWCewge7zXslPPfu7xivwNWa-nKOzj3NTobFn6IPJV01SiO36ZlaZnIM=
30 作者:,標題:“4E ”認證體系與繼續教育,時間:1486557161,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT6XPYd7JBDfgyk07l5ojGTIUve0YJdDVm8ID-IqwnJ368i5H2ML*UGctef1KToN0EtJvC69RA-QBCX5hxg9WmBo=
31 作者:小成老師,標題:金融理財概述及CFP資格認證制度,時間:1486305736,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT98NAfm5pqQ5GxssI2AZDN*4fUTZmCxudyPsbMNhf0GZhxp1Z*r*KRMRdZQ8TIs*FtwrJ51-yGcqOOg1-gcuBwg=
32 作者:小成老師,標題:小成老師AFP助學計划,時間:1486219932,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyTy7WSNv*rEBQlTAtBYs0yqgWQNwLNhaJeuwSRPgDYpIpJElK-NUpS8jXYJh-E6jvI9cOt77J0*RXVOubaDz*27Y=
33 作者:夢想規划師,標題:說一說理財中風險那些事兒,時間:1486127244,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT4QZinRr5xTaN0tdINK2uzxZFlV0uuQix3aa6Q4Le*inqOsQ-2BcD0Y4QAHDTK575VucKqDLmqEhN-MPCKhoMzQ=
34 作者:曾成,標題:該不該買萬能保險?,時間:1479574339,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT6DMjqyRnz2vHL-awMOzHzYEQhmWgaZLD*uOEcuop8GS3NV-KZpxgcKojYxmOCOJgiaeV4dhoTg1zVZeSWQvJI4=
35 作者:,標題:你投P2P,還是學點風險管理吧,時間:1479521555,鏈接:/s?timestamp=1508164695&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PHvZZO8-O9A090T4EnDOMid71vderF-o*M5WZeqTL9xKa9Uv-oZFjGTZNsMui0EyT0ZEQVVASfWg84ZSYQOpm7xdiAFU40Foo17VEDOn7T4XTck1dnL3XhS2pc*NWbrt4ID6B6iB9ARQSoI-yyLm0EA=
36 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=1aWiNfiMZEaNavn5O-rtgID-YtbD9cnY4x0w1oZaH5GMxtN-TSUduOg6EUI3xmjouGa0g-dZ3ToEnExZsGYf-A==
37 作者:,標題:動態生成網頁下載—渲染類,時間:1497412525,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7AIM0G-Kmb47P*BFkGRgsBmxAjvE1LQnsao0NhkptIIBCLRk65XyOiWvJZ3NalWe6iQZ1iFLtSAaXXoHotmF5yo=
38 作者:,標題:多進程並發爬蟲,時間:1496979039,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7Ai3OVjtOijUYYDfiItUnxGlFbLzt3N2iDbdNSN2*mks8vmrl0kKv1ndf3tE1EKk9sUstGv4kJlGsrOnF19dBDE=
39 作者:,標題:鏈接爬蟲,時間:1496633905,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7C0dKXO*KdnHmx6ZctteXjRYYH1kRxSD9qssqnCus*H3trP*YkMa532VZ8V00DJVIYeIbW5Wv5zxvYmYOVWqf-k=
40 作者:,標題:堆排序,時間:1496320156,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7PAuhh51XxdAMcsZ4EuqDp7nTH*rgueVWIh3D9xntz9C*nYahdcAP4cz5MaPbynTjZ6hED0fhFTetBO3ZYKPKSs=
41 作者:,標題:糗事百科小爬蟲,時間:1496211976,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7Azs0C-5nzr1P-nRr9CV51o3am*cazrOno90q4Dh6jeadJjDeOVVIKOC*ukBAWL14haJBtTMXuv22jRVU*9tlYA=
42 作者:,標題:scrapy框架中的headers類,時間:1495845289,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7Gbq27ajqgH429Bif5nj-wzKaBjSB*QInnwIjCiDcW5707S9q5XvUYPzMGSENDWITwwq77ERgPXEmvYLnfM*eLg=
43 作者:,標題:生成密碼文件,時間:1495787373,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7Gp7ocbsrZCHuJbgjursT5*bELP--5G8vBY98RAAEJNWub9YARTILP0fxnOmljg*k58Yx6I6YJdBCcm-6NE3z1M=
44 作者:,標題:scrapy爬蟲,時間:1495612119,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7M0yMWUG*nsyDTx*WKfs80icVgDUTuh04Mtc0OnI6MfZcHJHFvQlQwnPLX2tdsuikwfEuwSGvDWo51Zod77w7hI=
45 作者:,標題:猜數字,時間:1495524656,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7ARgprB663iFp1OP7YBS0DOxdEr-YXbeJW3UiAr4fW7p1jy*0YSv3hpyq744Oq4Z58Md2JTKuYhXwbPCpG3BTUM=
46 作者:,標題:測試瀏覽器速度,時間:1495444483,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfyIB6Zj32AM8mGX*OGODZYfgR1E-ArNpwhQXjCA57P7KjEtUXbP7Yp9Mn-kZWpdEraeYZKbxRkoA3BBksRyxh4*yqWlhWewnWvX1xPfrQVPoqmz-cEl1bjPzDGANZmosM=
47 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=AcFuowV3ZjTBxLCcXCX7-NBm-D0-YaKnreBiywa*sAnjb*qfdmtNhF-H9UNfcqTclwu5KHP56X3MNkL3f1y11w==
48 作者:貝克田庄,標題:Python爬取貼吧圖片,時間:1507790324,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc5*NqoM6yTCr4gLxSWKHvu*pmy1ml39cfe4LPTw-3yYuNrpJQnoC9Loy3Lvv2AZHjSoXSbLmS-FhlRd-85vglKg=
49 作者:,標題:編寫更好Python程序的5個技巧,時間:1507553279,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc3NBP-Hw1NoI8MHbNqfETFqdtzyzeSM3hhMq6JCaAF-tSTHXoG361zV1gIp2zFgFkVdYEhDtwjEqnuG5snFjRUM=
50 作者:冰是睡着的水,標題:500 行 Python 代碼構建一個輕量級爬蟲框架,時間:1507460022,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDccwLP6o*MQnF*rODy8JWF0lE2ha3dqyFZihjJcy28yYVyrpje-rWYObI4xLiyhAyW7-gc*gvSV1Cq5HO46xQYfXo=
51 作者:凡夢,標題:Android和Python之間的小秘密,時間:1505977153,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc7JpMl6NMhfDhyUCzP1oz-93FU363iqTMdyGSGEUBGfomppvTxRK6YBJQFx2N5o-F5vGgEoc5XO-ytYVi4uASHA=
52 作者:,標題:Python多線程學習,時間:1505905972,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc-lXkRCCxbqDfC-clFpxCWIfHwFMxLpPIIHADCe-Zf1mRau31gb7U9ihHmi7zZpzXTGzEDy9vQb7-7dWWikoTFE=
53 作者:,標題:十一去哪里?Python來幫你!,時間:1505139904,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc*2OpPausstVFAwxXXXvC8OV1ebFmMpJ8*Q7w-0CFWNnffkjCTVbQ8bWLYwyBwGu1-IR4HLCYdl*LQFj7-iMnK8=
54 作者:凡夢,標題:還不會Python正則表達式?看這篇文章試試,時間:1504964495,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDccz6DSCXiqZknbS5BSRtXRLZWqPaPQTZws0q0QI5-RUGm727trbP6sCken8lavDHyFGUIkSO*7E5c2noK9MR1E4s=
55 作者:,標題:Python開發簡單爬蟲,時間:1504794202,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc4Mp3qAW0gTtVCTnWP7aGukR3RTpeZ7DrypIY-efrMcKqfP4e2fsyTvT4hP32i*JMp-GjAB2bLIU296ZR3b8A3I=
56 作者:凡夢,標題:Python模擬登陸12306,時間:1504614650,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc0-vdhMcXi5lFDwCICBYako-zP27ZNK7OiBQmyyTP9LOIiqfAAbGwoZ6bCmOG5gLgwD-z*YR-UxAGwuXdz6hrOs=
57 作者:,標題:為什么說Python是偉大的入門語言,時間:1504510781,鏈接:/s?timestamp=1508164696&src=3&ver=1&signature=iIJXEqJtxS0IG1vEt7P4PPnNGBHjYYzvJr9xPZnOhRfYgAeU2MNQZidKCzP8jXBtl0jT2sVXsh1zP09j8bDcc9LWxZSOiUiU-n*7XW1wnFKzi*vvLrK2luaD*zacqViw2NkSe9IobfvEP-JORVZ087jIKdUhWFzwwdRgGTPixP0=
58 http://mp.weixin.qq.com/profile?src=3&timestamp=1508164694&ver=1&signature=03sGuUKmFI3W4EMT3e3kC-yoRJ6M*dEwlIkVwjz83qgF6kARbIVC*MRgelmDe7UQ5CmjKv*ZmJ**zjOAUTuIdA==
59 Traceback (most recent call last):
60 ...
執行結果

 

由於請求過於頻繁,就會出現如下所示驗證碼:

 

樓主學藝不精,沒有做驗證碼識別  ==''

 


免責聲明!

本站轉載的文章為個人學習借鑒使用,本站對版權不負任何法律責任。如果侵犯了您的隱私權益,請聯系本站郵箱yoyou2525@163.com刪除。



 
粵ICP備18138465號   © 2018-2025 CODEPRJ.COM