python webkit 异步抓取页面数据

最新推荐文章于 2022-04-25 17:50:07 发布

转载 · 最新推荐文章于 2022-04-25 17:50:07 发布 · 1k 阅读

python 专栏收录该内容

37 篇文章

订阅专栏

http://blog.youkuaiyun.com/cabing2005/article/details/9764379

http://nightly.webkit.org/

[python]view plaincopy 
   
 #!/usr/bin/python  
 from ghost import Ghost  
   
 # Fetcher that looks up the image address of a comic page (see getCartoonUrl).
 class FetcherCartoon:

[python]view plaincopy 
   
 def getCartoonUrl(self, url):
     """Return the ``src`` attribute of the page's ``cp_image`` element.

     Opens *url* with Ghost and evaluates a JavaScript expression in the
     loaded page that reads the ``src`` attribute of the element whose id
     is ``cp_image``.

     Args:
         url: Address of the page to load.

     Returns:
         ``False`` when *url* is ``None``; otherwise the first item of the
         pair returned by ``ghost.evaluate`` (the JavaScript result).
     """
     if url is None:
         # Previously `return false`, an undefined name that raised NameError.
         return False
     # TODO: add further validation of url

     ghost = Ghost()
     # Load the page in WebKit before querying its DOM.
     ghost.open(url)
     # Execute JavaScript inside the page to pull out the image address.
     # The second item of the returned pair is not needed here.
     result, _resources = ghost.evaluate(
         "document.getElementById('cp_image').getAttribute('src');")
     return result

[python]view plaincopy 
   
 if __name__ == "__main__":
     # Demo entry point: fetch and print the image address of one sample page.
     url = 'http://www.dm5.com/m136836-p3/'
     fetcher = FetcherCartoon()
     result = fetcher.getCartoonUrl(url)
     # The parenthesised form is valid on both Python 2 and Python 3,
     # unlike the original `print result` statement.
     print(result)