python webkit 异步抓取页面数据

最新推荐文章于 2024-05-10 09:39:05 发布

原创 · 最新推荐文章于 2024-05-10 09:39:05 发布 · 7.7k 阅读

2 ·

CC 4.0 BY-SA版权

文章标签：

#Python #WebKit #JavaScript #URL

python 专栏收录该内容

11 篇文章

订阅专栏

#!/usr/bin/python
from ghost import Ghost


class FetcherCartoon:
    """Fetch the image URL of a cartoon page by rendering it in WebKit."""

    def getCartoonUrl(self, url):
        """Return the ``src`` attribute of the page's ``cp_image`` element.

        The page at *url* is opened with Ghost and a JavaScript snippet
        is evaluated in it to read the attribute.

        Args:
            url: Address of the page to open.

        Returns:
            ``False`` when *url* is ``None``; otherwise the value produced
            by evaluating the JavaScript snippet in the loaded page.
        """
        if url is None:
            # The original spelled this `false`, which is an undefined name
            # in Python and raised NameError instead of returning.
            return False
        # TODO: add further validation of url

        ghost = Ghost()
        # Load the page in WebKit.
        # NOTE(review): presumably this lets the page's scripts populate the
        # element before it is read - confirm against the Ghost docs.
        ghost.open(url)
        # Execute JavaScript in the page and pull out the attribute we want.
        # evaluate() yields a (result, resources) pair; only the result is
        # needed here.
        result, _resources = ghost.evaluate(
            "document.getElementById('cp_image').getAttribute('src');"
        )
        return result


if __name__ == "__main__":
    # Demo: fetch the image URL for one sample page and print it.
    url = 'http://www.dm5.com/m136836-p3/'
    fetcher = FetcherCartoon()

    result = fetcher.getCartoonUrl(url)
    # Function-call form of print works on both Python 2 and Python 3
    # for a single argument; the bare `print result` statement is a
    # syntax error on Python 3.
    print(result)