# 运行环境:Python 3.6
import requests
from lxml import etree
def getAddr(idNum, timeout=10):
    """Look up the region information for an ID-card number.

    Sends the number to the third-party ip138 ID-card search page and
    returns the text of every ``<td class="tdc2">`` cell in the HTML reply.

    Args:
        idNum: The ID-card number to look up. It is converted with ``str()``
            before being sent, so both strings and integers are accepted.
        timeout: Seconds to wait for the remote server. Forwarded to
            ``requests.get``; without it the call could block forever.

    Returns:
        A list of strings, one per text node directly inside the matching
        table cells. The list is empty when the page has no such cells or
        the response body is empty.

    Raises:
        requests.exceptions.RequestException: If the request fails or
            times out.
    """
    # Third-party lookup endpoint found online.
    url = "http://qq.ip138.com/idsearch/index.asp"

    # Let requests build the query string so the value is URL-encoded
    # instead of being concatenated into the URL verbatim.
    query = {"action": "idcard", "userid": str(idNum)}
    res = requests.get(url, params=query, timeout=timeout)

    # The page is served in a GB-family Chinese encoding. GBK is a superset
    # of GB2312, so it decodes the same bytes identically while also
    # handling characters that strict GB2312 would turn into replacements.
    res.encoding = "gbk"

    body = res.text
    if not body.strip():
        # Nothing to parse, hence no matching cells.
        return []

    html = etree.HTML(body)
    if html is None:
        # NOTE(review): lxml appears to return None when it cannot build a
        # tree from the input; treat that the same as "no cells found".
        return []

    # Pull the text nodes out of the result cells.
    return html.xpath('//td[@class="tdc2"]/text()')
# Demo run: query a sample ID number and print the extracted cell texts.
address_cells = getAddr("235407195106112745")
print(address_cells)
"""
备注:
新版etree导入方式
import lxml.html
etree = lxml.html.etree
"""
# 浏览器打开:
# 代码运行结果: