# Cheat sheet: two ways to extract data from a page's HTML text.
# NOTE(review): `html` is not defined in this snippet -- presumably the page
# source as a string, supplied by earlier code; confirm before running.

# --- re ---
import re

# The empty pattern is a placeholder: fill in the real expression.
# re.S (DOTALL) makes "." match newline characters as well.
pattern = re.compile(r'', re.S)
r_list = pattern.findall(html)

# --- lxml + xpath ---
from lxml import etree

parse_html = etree.HTML(html)
# The empty XPath string is a placeholder: fill in the real expression.
# This rebinds r_list, replacing the regex result assigned above.
r_list = parse_html.xpath('')