使用 ghost.py 通过搜搜的微信搜索来爬取微信公众账号的信息
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
|
# -*- coding: utf-8 -*-
"""Print the <h4> entries of a WeChat search-results page using ghost.py.

The script opens the search URL given on the command line, waits for the
"#wxmore a" element, and then repeats up to MAX_PAGES times:

1. parse the current page content with BeautifulSoup and print every
   <h4> element;
2. empty the "#wxbox" container so already-printed entries are not
   printed again on the next round;
3. click "#wxmore a" (presumably the "more results" link -- confirm
   against the live page) and wait for a ".wx-rb3" element to appear.

NOTE: this is Python 2 code (``reload(sys)`` / ``sys.setdefaultencoding``).
"""
import datetime
import sys
import time

# Python 2 only: force the implicit str<->unicode codec to UTF-8 so that
# printing non-ASCII tags does not raise UnicodeEncodeError.
reload(sys)
sys.setdefaultencoding("utf-8")

from bs4 import BeautifulSoup
from ghost import Ghost

# Upper bound on how many times the "more" link is clicked.
MAX_PAGES = 30

# The original snippet used `url` without ever defining it; take it from
# the command line instead of failing with a NameError.
if len(sys.argv) < 2:
    sys.exit("usage: %s <search-url>" % sys.argv[0])
url = sys.argv[1]

ghost = Ghost(wait_timeout=20)
page, resources = ghost.open(url)
# Do not start scraping before the "more" link exists on the page.
result, resources = ghost.wait_for_selector("#wxmore a")

for _ in range(MAX_PAGES):
    soup = BeautifulSoup(ghost.content)
    for wx in soup.find_all("h4"):
        # Single-argument form prints identically on Python 2 and 3.
        print(wx)

    # Clear the result container so the next batch replaces, rather than
    # appends to, what has already been printed.
    page, resources = ghost.evaluate(""" var div1 = document.getElementById("wxbox"); div1.innerHTML = ''; """)
    ghost.click("#wxmore a")
    # Block until the newly loaded batch has been rendered.
    result, resources = ghost.wait_for_selector(".wx-rb3")
以上所述就是本文的全部内容了，希望对大家学习 Python 能够有所帮助。