import requests
from lxml import etree
# Download the boxoffice2019 page and print the first four cells of each
# table row, one row per output line.
url = 'http://www.boxofficecn.com/boxoffice2019'
headers = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/108.0.0.0 Safari/537.36 Edg/108.0.1462.46"}

# requests applies no timeout by default; set one so an unresponsive server
# cannot block the script forever.
resp = requests.get(url, headers=headers, timeout=10)
# Stop on HTTP 4xx/5xx instead of silently parsing an error page.
resp.raise_for_status()

page = etree.HTML(resp.text)

# The slice drops the first and last matched rows (presumably a header row
# and a trailing summary row -- confirm against the live page).
# NOTE(review): the XPath requires an explicit <tbody> in the served markup;
# verify it is present in the raw HTML and not only in the browser's DOM.
trs = page.xpath("//table/tbody/tr")[1:-1]

for tr in trs:
    # Each xpath() call returns a list holding the cell's direct text nodes
    # (an empty list when the cell has none).
    num = tr.xpath('./td[1]/text()')
    year = tr.xpath('./td[2]/text()')
    name = tr.xpath('./td[3]/text()')
    money = tr.xpath('./td[4]/text()')
    if name:
        # str.join returns a new string, so the result must be rebound;
        # the bare expression previously here had no effect.
        name = "".join(name)
    print(num, year, name, money)