from lxml import etree
text = """
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
<meta http-equiv="X-UA-Compatible" content="chrome=1,IE=edge">
<meta name="renderer" content="webkit"/>
<meta name="applicable-device" content="pc">
<meta name="domain_verify"
content="pmrgi33nmfuw4ir2ejyws5ltnbuweyljnnss4y3pnurcyithovuwiir2ejqwmyrtguzdgobsmezdgnbyheywcmzthbrdmmtemu4tamrqg5rtmirmej2gs3lfknqxmzjchiytkmrzgq4demjugaydcnd5">
<title>糗事百科 - 超搞笑的原创糗事笑话分享社区</title>
<meta name="keywords" content="笑话,搞笑,笑话大全 爆笑,笑话大全,糗事百科,幽默笑话,爆笑笑话"/>
<meta name="description" content="糗事百科是一个原创的糗事笑话分享社区,糗百网友分享的搞笑段子、搞笑图片大全,都是糗友最珍贵的开心经历,爆笑糗事笑话只在糗事百科!"/>
<meta http-equiv="mobile-agent" content="format=xhtml;url=//www.qiushibaike.com/">
<meta http-equiv="mobile-agent" content="format=html5;url=//www.qiushibaike.com/">
<link rel="canonical" href="//www.qiushibaike.com"/>
<meta name="robots" content="noarchive">
<link href="//static.qiushibaike.com/css/dist/web/v4/app.min.css?v=09995bc651774a8592961850d011e4f1"
media="screen, projection" rel="stylesheet" type="text/css"/>
<script type="text/javascript">
// Baidu Automatic push content
var _hmt = _hmt || [];
(function () {
var hm = document.createElement("script");
hm.src = "https://hm.baidu.com/hm.js?2670efbdd59c7e3ed3749b458cafaa37";
var s = document.getElementsByTagName("script")[0];
s.parentNode.insertBefore(hm, s);
})();
// 收集运营上缓存证据
window.config = {
'user_time': '2019-06-21 15:49:56',
'version': '2017-09-04 14:36'
}
</script>
</head>
<body>
<div id="content" class="main">
<div class="content-block clearfix">
<!-- 左边sidebar -->
<!-- 头部 -->
<div class="col0">
<div class="index-col0" id="sidebarLeft">
<div id="index_header" class="index-head">
<ul>
<li>
<a href="/" class="logo-area">
<div class="index-logo"></div>
<h1 class="hidden">糗事百科</h1>
</a>
</li>
<li><a id="menu-hover" href="/" target="_blank" rel="nofollow">热门</a></li>
<li><a href="/hot/" target="_blank">24小时</a></li>
<li><a href="/imgrank/" target="_blank">热图</a></li>
<li><a href="/text/" target="_blank">文字</a></li>
<li><a href="/history/" target="_blank">穿越</a></li>
<li><a href="/pic/" target="_blank">糗图</a></li>
<li><a href="/textnew/" target="_blank">新鲜</a></li>
</ul>
</div>
<!-- 左边栏广告1 -->
<div class="index-side-left-AD1">
<img src="//static.qiushibaike.com/images/web/v4/left_code.png?v=0a1153c06294049ad2da58efa408072e"
alt="糗百二维码">
</div>
</div>
</div>
<div class="col1 new-style-col1">
<!-- 相关推荐 -->
<div class="recommend-article" style="margin-top:-10px;">
<ul>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121160564'>
<a class="recmd-left video" href="/article/121160564" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/U1EPUBQH6Q4MW8KF_hd.jpg?imageView2/1/w/150/h/112"
alt="乔老爷子,过审应该没">
<div class="recmd-tag">5:00</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121160564" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">乔老爷子,过审应该没问题吧</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>859</span><span>好笑</span>
<span>·</span>
<span>28</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/11533687" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1153/11533687/thumb/20160215065133.jpg?imageView2/1/w/50/h/50"
alt="来自火星的芒"/>
<span class="recmd-name">来自火星...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121143605'>
<a class="recmd-left video" href="/article/121143605" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/SG4JCNRS318AQUA4_hd.jpg?imageView2/1/w/150/h/112"
alt="公交坐反!女大学生“">
<div class="recmd-tag">0:43</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121143605" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">公交坐反!女大学生“暴雨梨花式”哭着报警……</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>1767</span><span>好笑</span>
<span>·</span>
<span>64</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/33618126" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3361/33618126/thumb/20190412191806.jpg?imageView2/1/w/50/h/50"
alt="风吹裙边跑"/>
<span class="recmd-name">风吹裙边...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121196122'>
<a class="recmd-left multi" href="/article/121196122" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/XL84XIOSK8NL1G2W.jpg?imageView2/1/w/150/h/112"
alt="仿佛带了个黑头套">
<div class="recmd-tag">8图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121196122" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">仿佛带了个黑头套</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>282</span><span>好笑</span>
<span>·</span>
<span>1</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/33262784" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3326/33262784/thumb/20181229123534.jpg?imageView2/1/w/50/h/50"
alt="零點糗事"/>
<span class="recmd-name">零點糗事</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_word" id='qiushi_tag_121188685'>
<a class="recmd-left word" href="/article/121188685" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-word','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="亲兄弟俩承包了镇子上"/>
<div class="recmd-tag">纯文</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121188685" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">亲兄弟俩承包了镇子上所有机关单位的旱厕保洁,把粪便集中处理,而后卖给温室蔬菜大棚,两头赚钱,生意红火。到了年底决算分成,就请我们几个关系好的吃一顿。我开玩笑问他</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>1542</span><span>好笑</span>
<span>·</span>
<span>21</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/32129742" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3212/32129742/thumb/2016091014150661.JPEG?imageView2/1/w/50/h/50"
alt="寒山宽洪"/>
<span class="recmd-name">寒山宽洪</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121176489'>
<a class="recmd-left multi" href="/article/121176489" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/article/gif/AIPCP6FB6502WD2H.jpg?imageView2/1/w/150/h/112"
alt="在土里挖出来20多万">
<div class="recmd-tag">9图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121176489" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">在土里挖出来20多万块,真是不敢想象</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>279</span><span>好笑</span>
<span>·</span>
<span>3</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/30683297" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3068/30683297/thumb/20190526180344.jpg?imageView2/1/w/50/h/50"
alt="傻妞也"/>
<span class="recmd-name">傻妞也</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_word" id='qiushi_tag_121196402'>
<a class="recmd-left word" href="/article/121196402" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-word','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="前几天喝醉了,上了我"/>
<div class="recmd-tag">纯文</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121196402" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">前几天喝醉了,上了我哥们的女朋友。那天在哥们家吃晚饭,结果多喝了点他们让我上楼休息,我迷迷糊糊就摸到哥们卧室去,也没开灯看直接倒了下去。然后就听见“嗯~”的一声</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>3752</span><span>好笑</span>
<span>·</span>
<span>81</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/17589011" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1758/17589011/thumb/20150930000606.jpg?imageView2/1/w/50/h/50"
alt="泥介夫"/>
<span class="recmd-name">泥介夫</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121197238'>
<a class="recmd-left video" href="/article/121197238" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/R0S1T15DM8BY94N8_hd.jpg?imageView2/1/w/150/h/112"
alt="夏天的味道……">
<div class="recmd-tag">0:13</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121197238" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">夏天的味道……</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>575</span><span>好笑</span>
<span>·</span>
<span>13</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/13843355" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1384/13843355/thumb/20190125133956.jpg?imageView2/1/w/50/h/50"
alt="东临~天下"/>
<span class="recmd-name">东临~天...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121224238'>
<a class="recmd-left multi" href="/article/121224238" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/RYXLGVB3X0BXHM3R.jpg?imageView2/1/w/150/h/112"
alt="剪了个喜字,总觉得哪">
<div class="recmd-tag">7图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121224238" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">剪了个喜字,总觉得哪里不对劲</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>443</span><span>好笑</span>
<span>·</span>
<span>10</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/33262784" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3326/33262784/thumb/20181229123534.jpg?imageView2/1/w/50/h/50"
alt="零點糗事"/>
<span class="recmd-name">零點糗事</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121175631'>
<a class="recmd-left video" href="/article/121175631" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/KV1H5KJB9ES392NG_hd.jpg?imageView2/1/w/150/h/112"
alt="扭个头都是半自动的!">
<div class="recmd-tag">0:09</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121175631" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">扭个头都是半自动的!</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>507</span><span>好笑</span>
<span>·</span>
<span>2</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/18815995" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1881/18815995/thumb/20181125161931.jpg?imageView2/1/w/50/h/50"
alt="带翅膀的老司机"/>
<span class="recmd-name">带翅膀的...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_image" id='qiushi_tag_121198312'>
<a class="recmd-left image" href="/article/121198312" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-image','chick'])">
<img src="//pic.qiushibaike.com/system/pictures/12119/121198312/small/CYS2UJZLB4OXIN6A.jpg?imageView2/1/w/150/h/112"
alt="咦?貌似哪里不对啊">
<div class="recmd-tag">1图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121198312" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">咦?貌似哪里不对啊<img
src="https://static.qiushibaike.com/static/images/emoji/qb_s_18.png"
align="absmiddle"></a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>313</span><span>好笑</span>
<span>·</span>
<span>2</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/10633497" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1063/10633497/thumb/20180416103701.JPEG?imageView2/1/w/50/h/50"
alt="日邢一珊"/>
<span class="recmd-name">日邢一珊</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_word" id='qiushi_tag_121190457'>
<a class="recmd-left word" href="/article/121190457" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-word','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="最近在听一部评书,单"/>
<div class="recmd-tag">纯文</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121190457" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">最近在听一部评书,单老师的《花木兰》。侄子突然问我,花木兰女扮男装进军营为什么没被发现呢?我说古代男女都是长头发,穿上盔甲看不出来吧!侄子突然问我“阿爷无大儿”</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>887</span><span>好笑</span>
<span>·</span>
<span>16</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/16168389" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1616/16168389/thumb/20190603150145.jpg?imageView2/1/w/50/h/50"
alt="爱泡泡的|胡子哥"/>
<span class="recmd-name">爱泡泡的...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_image" id='qiushi_tag_121169819'>
<a class="recmd-left image" href="/article/121169819" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-image','chick'])">
<img src="//pic.qiushibaike.com/system/pictures/12116/121169819/small/OF2LVLEFHYVGRX7C.jpg?imageView2/1/w/150/h/112"
alt="当问女朋友是不是生气">
<div class="recmd-tag">1图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121169819" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">当问女朋友是不是生气了的时候……</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>267</span><span>好笑</span>
<span>·</span>
<span>1</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/39040667" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3904/39040667/thumb/20180802133508.jpg?imageView2/1/w/50/h/50"
alt="又一盏素酒"/>
<span class="recmd-name">又一盏素...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121225948'>
<a class="recmd-left video" href="/article/121225948" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/S46BJAVICSFPP7HT_hd.jpg?imageView2/1/w/150/h/112"
alt="女生最喜欢做什么运动">
<div class="recmd-tag">1:06</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121225948" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">女生最喜欢做什么运动?美女真厉害,听完后我笑了</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>313</span><span>好笑</span>
<span>·</span>
<span>3</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/33262784" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3326/33262784/thumb/20181229123534.jpg?imageView2/1/w/50/h/50"
alt="零點糗事"/>
<span class="recmd-name">零點糗事</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121187416'>
<a class="recmd-left multi" href="/article/121187416" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/Y953B0C3PXC5YRQF.jpg?imageView2/1/w/150/h/112"
alt="奢侈一次,一包干吃,">
<div class="recmd-tag">2图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121187416" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">奢侈一次,一包干吃,一包泡着吃</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>238</span><span>好笑</span>
<span>·</span>
<span>3</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/19580707" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/1958/19580707/thumb/20170121104313.JPEG?imageView2/1/w/50/h/50"
alt="海天交汇的地方"/>
<span class="recmd-name">海天交汇...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_video" id='qiushi_tag_121156127'>
<a class="recmd-left video" href="/article/121156127" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-video','chick'])">
<img src="//qiubai-video-web.qiushibaike.com/3H7151416U31S09A_hd.jpg?imageView2/1/w/150/h/112"
alt="狮子始终是兽王[笑">
<div class="recmd-tag">2:39</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121156127" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">狮子始终是兽王<img
src="https://static.qiushibaike.com/static/images/emoji/qb_s_44.png"
align="absmiddle">[捂脸]</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>2382</span><span>好笑</span>
<span>·</span>
<span>209</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/38730746" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3873/38730746/thumb/2018062112485553.JPEG?imageView2/1/w/50/h/50"
alt="撩汉大婶"/>
<span class="recmd-name">撩汉大婶</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121154394'>
<a class="recmd-left multi" href="/article/121154394" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/W2RWFRN8QJY18AKY.jpg?imageView2/1/w/150/h/112"
alt="剩九个男的那个你可能">
<div class="recmd-tag">9图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121154394" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">剩九个男的那个你可能不知道什么叫女生帅起来就没有男生什么事了??我们可以内部消化的</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>325</span><span>好笑</span>
<span>·</span>
<span>2</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/33712263" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3371/33712263/thumb/20190606231542.jpg?imageView2/1/w/50/h/50"
alt="一枕清霜゛"/>
<span class="recmd-name">一枕清霜...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_word" id='qiushi_tag_121153722'>
<a class="recmd-left word" href="/article/121153722" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-word','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="因为平时有点儿强迫症"/>
<div class="recmd-tag">纯文</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121153722" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">因为平时有点儿强迫症,每次超市买完东西,找回零钱和小票,都是把钱放回钱包后,小票随手一撕。今天汽车站买车票。我递上去50。票45元,售票员把车票跟5元钱还给我之</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>1475</span><span>好笑</span>
<span>·</span>
<span>17</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/37507340" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3750/37507340/thumb/20190301191037.jpg?imageView2/1/w/50/h/50"
alt="奔跑的小土狼"/>
<span class="recmd-name">奔跑的小...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121156339'>
<a class="recmd-left multi" href="/article/121156339" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/J7Y6P0EDH23F2U15.jpg?imageView2/1/w/150/h/112"
alt="每一次看都笑疯:小时">
<div class="recmd-tag">4图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121156339" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">每一次看都笑疯:小时候,公鸡,泻药,澡堂……</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>266</span><span>好笑</span>
<span>·</span>
<span>1</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/38160879" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3816/38160879/thumb/20180909233849.jpg?imageView2/1/w/50/h/50"
alt="蜀南熟男"/>
<span class="recmd-name">蜀南熟男</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_image" id='qiushi_tag_121163209'>
<a class="recmd-left image" href="/article/121163209" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-image','chick'])">
<img src="//pic.qiushibaike.com/system/pictures/12116/121163209/small/IW3FRO7F2YLHAOWL.jpg?imageView2/1/w/150/h/112"
alt="跆拳道和军体拳">
<div class="recmd-tag">1图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121163209" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">跆拳道和军体拳</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>4522</span><span>好笑</span>
<span>·</span>
<span>187</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/27553574" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/2755/27553574/thumb/20180427153625.JPEG?imageView2/1/w/50/h/50"
alt="砸妳家玻璃"/>
<span class="recmd-name">砸妳家玻...</span>
</a>
</div>
</div>
</li>
<!-- 相关推荐item -->
<li class="item typs_multi" id='qiushi_tag_121215338'>
<a class="recmd-left multi" href="/article/121215338" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-multi','chick'])">
<img src="//pic.qiushibaike.com/article/image/NQ562MF4D5Z6B2H4.jpg?imageView2/1/w/150/h/112"
alt="萌妹成“悍将”屡获焊">
<div class="recmd-tag">3图</div>
</a>
<div class="recmd-right">
<a class="recmd-content" href="/article/121215338" target="_blank"
onclick="_hmt.push(['_trackEvent','web-list-user','chick'])">萌妹成“悍将”屡获焊大奖☞~1998年出生的郑莲身高1米62,体重不足百斤,讲起话来细声细语。但就是这样一个萌妹子,却是第45届世界技能大赛焊接项目选拔赛场上唯</a>
<div class="recmd-detail clearfix">
<div class="recmd-num">
<span>1415</span><span>好笑</span>
<span>·</span>
<span>56</span><span>评论</span>
</div>
<a class="recmd-user" href="/users/31064729" target="_blank">
<img src="//pic.qiushibaike.com/system/avtnew/3106/31064729/thumb/20190207212637.jpg?imageView2/1/w/50/h/50"
alt="绦子"/>
<span class="recmd-name">绦子</span>
</a>
</div>
</div>
</li>
</ul>
</div>
<!-- 全局翻页组件 -->
<ul class="pagination">
<li>
<a href="/8hr/" rel="nofollow">
<span class="prev">
<
</span>
</a>
</li>
<li>
<a href="/8hr/" rel="nofollow">
<span class="page-numbers">
1
</span>
</a>
</li>
<li>
<span class="current">
2
</span>
</li>
<li>
<a href="/8hr/page/3/" rel="nofollow">
<!--<a href="/8hr/page/3/" rel="nofollow">-->
<span class="page-numbers">
3
</span>
</a>
</li>
<li>
<a href="/8hr/page/4/" rel="nofollow">
<!--<a href="/8hr/page/4/" rel="nofollow">-->
<span class="page-numbers">
4
</span>
</a>
</li>
<li>
<a href="/8hr/page/5/" rel="nofollow">
<!--<a href="/8hr/page/5/" rel="nofollow">-->
<span class="page-numbers">
5
</span>
</a>
</li>
<li>
<span class="dots">
…
</span>
</li>
<li>
<a href="/8hr/page/13/" rel="nofollow">
<!--<a href="/8hr/page/13/" rel="nofollow">-->
<span class="page-numbers">
13
</span>
</a>
</li>
<li>
<a href="/8hr/page/3/" rel="nofollow">
<!--<a href="/8hr/page/3/" rel="nofollow">-->
<span class="next">
下一页
</span>
</a>
</li>
</ul>
</div>
<div class="col2">
<div id="sidebar" class="sidebar">
<div class="sidebar-hot clearfix">
<h3>今日10大糗图</h3>
<ul>
<li class="item clearfix image">
<a href="/article/121203925" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/system/pictures/12120/121203925/small/UHUC2M0J7QA2T9G1.jpg?imageView2/1/w/150/h/107"
alt="师兄,难道你忘记《青春修炼手册》了吗?"/>
</span></div>
<div><p>师兄,难道你忘记《青</p></div>
</a>
<a href="/article/121128146" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//qiubai-video-web.qiushibaike.com/article/gif/V7FFFG2GCP511VSU.jpg?imageView2/1/w/150/h/107"
alt="遇到这样的损友,小哥欲哭无泪"/>
</span></div>
<div><p>遇到这样的损友,小哥</p></div>
</a>
</li>
<li class="item clearfix multi">
<a href="/article/121167734" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/article/image/B758MBZ9TQI936HO.jpg?imageView2/1/w/150/h/107"
alt="据说,猫来穷狗来富,大晚上的来了两只小猫咪,怎么办,我都够穷了,不能再穷了,再穷没饭吃了"/>
</span></div>
<div><p>据说,猫来穷狗来富,</p></div>
</a>
<a href="/article/121178919" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//qiubai-video-web.qiushibaike.com/article/gif/DVOMJQBI0C8TB19H.jpg?imageView2/1/w/150/h/107"
alt="太会装B了,单身狗赶紧跑开..."/>
</span></div>
<div><p>太会装B了,单身狗赶</p></div>
</a>
</li>
<li class="item clearfix image">
<a href="/article/121162065" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/system/pictures/12116/121162065/small/2TSCKXZ4DY2NQAJ4.jpg?imageView2/1/w/150/h/107"
alt="知道自己为什么没钱吗?自己看"/>
</span></div>
<div><p>知道自己为什么没钱吗</p></div>
</a>
<a href="/article/121129363" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/article/image/161U4SKFS4DP3QH5.jpg?imageView2/1/w/150/h/107"
alt="红糖水是谎言经期除了让女朋友喝热水之外这些方法更管用"/>
</span></div>
<div><p>红糖水是谎言经期除了</p></div>
</a>
</li>
<li class="item clearfix multi">
<a href="/article/121134347" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/article/image/QNAZ1BPU6MQ1GSYL.jpg?imageView2/1/w/150/h/107" alt="论:如何作死"/>
</span></div>
<div><p>论:如何作死</p></div>
</a>
<a href="/article/121123012" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiutu','chick'])">
<div><span>
<img src="//pic.qiushibaike.com/system/pictures/12112/121123012/small/GDW7PM12K2TW0PFD.jpg?imageView2/1/w/150/h/107"
alt="说假期期间,男子张某开车从山西前往湖北。想着长途开车容易疲劳,于是张某花1000元请了代驾。第二天凌晨车快到目的地时,张某担心代驾会疲劳,于是主动换代驾休息自己"/>
</span></div>
<div><p>说假期期间,男子张某</p></div>
</a>
</li>
</ul>
</div>
<div class="sidebar-text clearfix">
<h3>今日10大糗事</h3>
<ul>
<li class="item clearfix word">
<a class="sidebar-left" href="/article/121187526" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="初中,扯了上铺两米多"/>
<div class="top">
<div class="top-icon top1-icon"></div>
</div>
</a>
<a class="sidebar-right" href="/article/121187526"
title="初中,扯了上铺两米多的卫生纸去厕所蹲坑,隔壁蹲坑没带纸,问我借纸,我就给了他差不多一米的纸,他在哪里愣了一会没说话,了事走人的时候回头跟我说:“哥们,以后有什么"
target="_blank" onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<p>初中,扯了上铺两米多的卫生纸去厕所蹲坑,隔壁蹲坑没带纸,问我借纸,我就给了他差不多一米的纸,他在哪里愣了一会没说话,了事走人的时候回头跟我说:“哥们,以后有什么</p>
<div>
<span>5745</span><span>好笑</span>
</div>
</a>
</li>
<li class="item clearfix word">
<a class="sidebar-left" href="/article/121167144" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="北冥有狗,其名为哈。"/>
<div class="top">
<div class="top-icon top2-icon"></div>
</div>
</a>
<a class="sidebar-right" href="/article/121167144"
title="北冥有狗,其名为哈。外形冷峻,内心傻瓜,三更半夜,呜呜啦啦,主人不在,专门拆家,床单沙发,稀里哗啦,钢铁横梁,犹如泥巴!哈之大,一锅顿不下。化儿为犬,其名为奇。"
target="_blank" onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<p>北冥有狗,其名为哈。外形冷峻,内心傻瓜,三更半夜,呜呜啦啦,主人不在,专门拆家,床单沙发,稀里哗啦,钢铁横梁,犹如泥巴!哈之大,一锅顿不下。化儿为犬,其名为奇。</p>
<div>
<span>581</span><span>好笑</span>
</div>
</a>
</li>
<li class="item clearfix word">
<a class="sidebar-left" href="/article/121184548" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="去男友家一般叫他爸妈"/>
<div class="top">
<div class="top-icon top3-icon"></div>
</div>
</a>
<a class="sidebar-right" href="/article/121184548"
title="去男友家一般叫他爸妈是叔叔阿姨,或者伯父伯母是吧?那他舅公舅母,舅舅舅妈我是跟着叫呢还是全都叫叔叔阿姨???[撞到玻璃][撞到玻璃]"
target="_blank" onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<p>去男友家一般叫他爸妈是叔叔阿姨,或者伯父伯母是吧?那他舅公舅母,舅舅舅妈我是跟着叫呢还是全都叫叔叔阿姨???<img
src="https://static.qiushibaike.com/static/images/emoji/qb_s_19.png"
align="absmiddle"><img
src="https://static.qiushibaike.com/static/images/emoji/qb_s_19.png"
align="absmiddle"></p>
<div>
<span>447</span><span>好笑</span>
</div>
</a>
</li>
<li class="item clearfix word">
<a class="sidebar-left" href="/article/121171105" rel="nofollow" target="_blank"
onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<img src="//static.qiushibaike.com/images/web/v4/textDefault.png?v=12eaf94cfd4d3ae0423a3925bb5bbf9c"
alt="儿子上幼儿园大班,老"/>
<div class="top">
<div class="top-icon top4-icon"></div>
</div>
</a>
<a class="sidebar-right" href="/article/121171105"
title="儿子上幼儿园大班,老师说要培养孩子爱护花草的兴趣,说是可以陶冶情操,有益身心健康!于是要求每个孩子在学校养一盆盆栽!让我觉得纳闷的是:为什么我在街上买的十块钱一"
target="_blank" onclick="_hmt.push(['_trackEvent','web-sidebar-qiushi','chick'])">
<p>儿子上幼儿园大班,老师说要培养孩子爱护花草的兴趣,说是可以陶冶情操,有益身心健康!于是要求每个孩子在学校养一盆盆栽!让我觉得纳闷的是:为什么我在街上买的十块钱一</p>
<div>
<span>2951</span><span>好笑</span>
</div>
</a>
</li>
</ul>
</div>
</div>
</div>
</div>
</div>
<div class="foot">
<div class="foot-nav clearfix">
<div class="foot-nav-col">
<h3>
关于
</h3>
<ul>
<li>
<a href="https://hr.qiushibaike.com/about.html" target="_blank" rel="nofollow">
关于糗百
</a>
</li>
<li>
<a href="https://hr.qiushibaike.com/social.html" target="_blank" rel="nofollow">
加入我们
</a>
</li>
<li>
<a href="https://hr.qiushibaike.com/about.html?tag=3" target="_blank" rel="nofollow">
联系方式
</a>
</li>
</ul>
</div>
<div class="foot-nav-col">
<h3>
帮助
</h3>
<ul>
<li>
<a href="//about.qiushibaike.com/feedback.html" target="_blank" rel="nofollow">
在线反馈
</a>
</li>
<li>
<a href="//about.qiushibaike.com/agreement.html" target="_blank" rel="nofollow">
用户协议
</a>
</li>
<li>
<a href="//about.qiushibaike.com/policy.html" target="_blank" rel="nofollow">
隐私政策
</a>
</li>
</ul>
</div>
<div class="foot-nav-col">
<h3>
下载
</h3>
<ul>
<li>
<a href="https://android.myapp.com/myapp/detail.htm?apkName=qsbk.app"
target="_blank" rel="external nofollow">
Android 客户端
</a>
</li>
<li>
<a href="https://itunes.apple.com/cn/app/id422853458" target="_blank" rel="external nofollow">
iPhone 客户端
</a>
</li>
</ul>
</div>
<div class="foot-nav-col">
<h3>
关注
</h3>
<ul>
<li>
<a href="#" class="foot-wechat">
微信
<div class="foot-wechat-tips">
<span class="foot-wechat-icon"></span>
手机扫描二维码关注
</div>
</a>
</li>
<li>
<a href="http://weibo.com/qiushibaike" target="_blank" rel="external nofollow">
新浪微博
</a>
</li>
<li>
<a href="http://user.qzone.qq.com/1492495058" target="_blank" rel="external nofollow">
QQ空间
</a>
</li>
</ul>
</div>
<div class="foot-nav-col">
<h3>
组织
</h3>
<ul>
<li>
<a href="http://user.qzone.qq.com/1492495058/blog/1408597608" target="_blank"
rel="external nofollow">
官方粉丝群
</a>
</li>
<li>
<a href="https://www.qiushibaike.com/users/37042475" target="_blank"
rel="external nofollow">
<img style="vertical-align: middle;height: 16px;margin-top: -2px;"
src="//static.qiushibaike.com/images/beian.png?v=d0289dc0a46fc5b15b3363ffa78cf6c7">
首都网警
</a>
</li>
</ul>
</div>
</div>
<div class="foot-copyrights">
<!-- <p>© Qiushibaike.com 糗事百科版权所有</p>
<p>
<span>京ICP备14028348号-1</span>
<span>京ICP证140448号</span>
<span>京网文[2017]2369-247号</span>
<span>
<a style='color:#333' target="_blank" href="http://www.beian.gov.cn/portal/registerSystemInfo?recordcode=11010502031601" rel="nofollow"><img style='vertical-align: top;' src="/static/images/beian.png?v=d0289dc0a46fc5b15b3363ffa78cf6c7" />京公网安备11010502031601号</a>
</span>
</p>
<p style="margin-top:8px">友际无限(北京)科技有限公司</p>
<p style="margin-top:8px">
<span>互联网违法和不良信息举报电话:010-84872896</span>
<span>邮箱:kefu@qiushibaike.com</span>
</p> -->
<p>互联网ICP备案:京ICP备14028348号-1</p>
<p>
<span>广播电视节目制作经营许可证:(京)字第08319号</span>
<span>网络文化经营许可证:
<a style='color:#333' target="_blank" href="http://sq.ccm.gov.cn:80/ccnt/sczr/service/business/emark/toDetail/"
rel="nofollow">
<img src="//static.qiushibaike.com/images/wenhuajingying.png?v=f5f3976cf4be787ad2be202a19d40823"
style='width: 20px; height: 20px; vertical-align: top;'>京网文[2017]2369-247号</a>
</span>
</p>
<p style="margin-top: 8px">电信与信息服务业务经营许可证:京ICP证140448号</p>
<p style="margin-top: 8px"><span>营业性演出许可证:京演(机构)(2018)1940号</span></p>
<p>
<span>计算机信息网络国际联网单位备案:<a style='color:#333' target="_blank"
href="http://www.beian.gov.cn/portal/registerSystemInfo?recordcode=11010502031601"
rel="nofollow"><img style='vertical-align: top;'
src="//static.qiushibaike.com/images/beian.png?v=d0289dc0a46fc5b15b3363ffa78cf6c7"/>京公网安备11010502031601号</a></span>
</p>
<br>
<p style="margin-top: 8px">友际无限(北京)科技有限公司</p>
<p>
<span>违法和不良信息举报电话:0755-86967540</span>
<span>邮箱:kefu@qiushibaike.com</span>
</p>
<br>
<p style="margin-top: 8px">© Qiushibaike.com 糗事百科版权所有</p>
</div>
</div>
<div class="float-nav">
<a class="float-nav-backtop" href="#" rel="nofollow">
<span class="float-nav-backtop-icon"></span>
</a>
</div>
<!--[if gte IE 6]>
<script type="text/javascript" src="//static.qiushibaike.com/js/src/web/json3.js?v=3a7f66a11a09842cd7555fad039657be"></script>
<![endif]-->
<script type="text/javascript"
src="//static.qiushibaike.com/js/dist/web/libs.min.js?v=bc8ddd36f0e7fed7c27f437c17f23ce0"></script>
<script type="text/javascript"
src="//static.qiushibaike.com/js/dist/web/v4/app.min.js?v=7e878079cd125ff96cc30319763052d9"></script>
<script type="text/javascript">
// Google Analytics
(function (i, s, o, g, r, a, m) {
i['GoogleAnalyticsObject'] = r;
i[r] = i[r] || function () {
(i[r].q = i[r].q || []).push(arguments)
}, i[r].l = 1 * new Date();
a = s.createElement(o),
m = s.getElementsByTagName(o)[0];
a.async = 1;
a.src = g;
m.parentNode.insertBefore(a, m)
})(window, document, 'script', 'https://www.google-analytics.com/analytics.js', 'ga');
ga('create', 'UA-8780108-1', 'auto');
ga('send', 'pageview');
</script>
<script type="text/javascript" async src="//pagead2.googlesyndication.com/pagead/js/adsbygoogle.js"></script>
<script type="text/javascript" src="https://cbjs.baidu.com/js/m.js"></script>
<script type="text/javascript">
window.broadJson = '[]'
</script>
<!-- <script type="text/javascript" src="//static.qiushibaike.com/js/dist/web/v3/adsAdmin.min.js?v=9c42f35ae43e17caf141e9d6ebe32cbb"></script> -->
</body>
</html>
"""
def parse_text():
    """Parse the module-level HTML string ``text`` and print the serialized tree.

    The string is parsed with ``etree.HTML``. The resulting tree is
    serialized as UTF-8 instead of relying on ``etree.tostring``'s default
    ASCII output, which would turn every non-ASCII character (the Chinese
    page text) into a numeric character reference such as ``&#31967;``.
    """
    html_element = etree.HTML(text)
    # Explicit UTF-8 keeps the original characters readable after decoding.
    print(etree.tostring(html_element, encoding='utf-8').decode('utf-8'))
def parse_file():
    """Parse the file ``file3.html`` and print the serialized tree.

    ``etree.parse`` is called without a ``parser`` argument, so lxml uses its
    default XML parser; markup that is not well-formed XML will fail to
    parse here. The tree is serialized as UTF-8 so that non-ASCII text is
    printed as real characters rather than numeric character references.
    """
    html2 = etree.parse('file3.html')
    # Explicit UTF-8 keeps non-ASCII characters readable after decoding.
    print(etree.tostring(html2, encoding='utf-8').decode('utf-8'))
"""
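Notes:
1. A standard HTML string: parse it with etree.HTML(text), then print the tree via etree.tostring(html_element) decoded as 'utf-8'.
2. To parse an HTML file, use lxml.etree.parse. This function uses the XML parser by default, so it fails with a parse error on non-standard 'HTML' markup;
in that case you need to create an 'HTML' parser yourself and pass it to the parse call.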
"""
def parse_lago_file():
    """Parse the irregular HTML file ``lagou.html`` and print it.

    An explicit ``etree.HTMLParser`` (UTF-8) is handed to ``etree.parse`` so
    the file is read with the HTML parser instead of the default XML parser.
    The tree is then serialized as UTF-8 bytes, decoded, and printed.
    Nothing is returned.
    """
    html_parser = etree.HTMLParser(encoding='utf-8')
    tree = etree.parse('lagou.html', parser=html_parser)
    serialized = etree.tostring(tree, encoding='utf-8')
    print(serialized.decode('utf-8'))
if __name__ == "__main__":
    # Run the in-memory string demo only when executed as a script.
    parse_text()