# -*- coding: utf-8 -*-
"""Print the <h4> elements of a paginated page rendered with Ghost.py.

The script opens ``url`` in a headless Ghost browser and waits for the
``#wxmore a`` link to exist.  It then repeats ``MAX_PAGES`` times:

1. parse the current page content and print every ``<h4>`` element,
2. empty the ``#wxbox`` container via JavaScript,
3. click ``#wxmore a`` and wait until a ``.wx-rb3`` element is present.
"""
import datetime
import sys
import time

from bs4 import BeautifulSoup
from ghost import Ghost

# Python 2 only: site.py removes sys.setdefaultencoding at start-up and
# reload(sys) brings it back.  Presumably this is here so that printing tags
# containing non-ASCII text does not fail with the default ASCII codec.
# Neither name exists on Python 3, hence the version guard.
if sys.version_info[0] == 2:
    reload(sys)  # noqa: F821 - builtin on Python 2
    sys.setdefaultencoding("utf-8")

# Number of print / clear / click rounds performed before the script stops.
MAX_PAGES = 30

ghost = Ghost(wait_timeout=20)
# NOTE(review): this URL ends in ".jpg", yet the script immediately waits for
# the HTML selector "#wxmore a" - confirm that this is the intended page.
url = "http://www.51sjk.com/Upload/Articles/1/0/320/320926_20220812160250886.jpg"
page, resources = ghost.open(url)
result, resources = ghost.wait_for_selector("#wxmore a")

for _ in range(MAX_PAGES):
    # Name the parser explicitly so the result does not depend on which
    # optional parser libraries happen to be installed.
    soup = BeautifulSoup(ghost.content, "html.parser")
    for wx in soup.find_all("h4"):
        print(wx)

    # Empty the container before requesting more content; presumably so the
    # next round only sees newly loaded entries - verify against the page.
    page, resources = ghost.evaluate(
        """
        var div1 = document.getElementById("wxbox");
        div1.innerHTML = '';
        """)
    ghost.click("#wxmore a")
    result, resources = ghost.wait_for_selector(".wx-rb3")
用户登录
还没有账号?立即注册
用户注册
投稿取消
文章分类: |
|
还能输入300字
上传中....