from html.parser import HTMLParser
class HeadingParser(HTMLParser):
    """HTML parser that prints the text content of every ``<h1>`` element.

    Feed markup with ``feed()``. Each opening ``<h1>`` prints the line
    ``Found a Heading 1``; every text chunk encountered until the matching
    ``</h1>`` is printed on its own line. Text outside ``<h1>`` elements is
    ignored.
    """

    # True while the parser is between an opening <h1> and its closing tag.
    # This is a class-level default; the handlers assign through ``self``,
    # so each instance gets its own value on first write.
    inHeading = False

    def handle_starttag(self, tag: str, attrs: list) -> None:
        """Announce an opening ``<h1>`` and start echoing its text.

        Args:
            tag: Name of the start tag (``HTMLParser`` passes it lowercased).
            attrs: Attribute ``(name, value)`` pairs of the tag; unused here.
        """
        if tag == "h1":
            self.inHeading = True
            print("Found a Heading 1")

    def handle_data(self, data: str) -> None:
        """Print a text chunk, but only while inside an ``<h1>`` element.

        Args:
            data: Text found between tags.
        """
        if self.inHeading:
            print(data)

    def handle_endtag(self, tag: str) -> None:
        """Stop echoing text once the closing ``</h1>`` is reached.

        Args:
            tag: Name of the end tag (``HTMLParser`` passes it lowercased).
        """
        if tag == "h1":
            self.inHeading = False
hParser = HeadingParser()
# Read the whole document up front. The context manager guarantees the file
# is closed even if reading or UTF-8 decoding raises.
with open("headings.html", "r", encoding="utf-8") as file:
    html = file.read()
hParser.feed(html)
# Signal end-of-input so any text the parser is still buffering (e.g. an
# unterminated construct at the end of the file) gets processed.
hParser.close()


# Web-page residue from the site this snippet was copied from (not code):
# 被折叠的 条评论
# 为什么被折叠?



