# Crawl function: fetch a single page of comments.
def get_comment(dat, timeout=30):
    """Fetch one page of comments and return it as a DataFrame.

    POSTs ``dat`` as form data to the module-level ``url`` (sending the
    module-level ``header`` as request headers) and reads the records found
    under ``result -> list`` in the JSON response.

    Args:
        dat: Form payload forwarded to ``requests.post`` as ``data``.
        timeout: Seconds to wait for the server before giving up, so a
            stalled connection cannot hang the whole crawl.

    Returns:
        A ``pandas.DataFrame`` with one row per record and the columns
        ``mark``, ``content``, ``commentorId``, ``userNickName``,
        ``termId`` and ``gmtModified``, in that order.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        KeyError: If the response lacks ``result``/``list`` or a record
            lacks one of the expected fields.
    """
    fields = ('mark', 'content', 'commentorId',
              'userNickName', 'termId', 'gmtModified')

    res = requests.post(url, headers=header, data=dat, timeout=timeout)
    # Fail loudly on an HTTP error instead of trying to parse an error page.
    res.raise_for_status()
    records = res.json()['result']['list']

    # One column per field; dict insertion order fixes the column order.
    return pd.DataFrame(
        {field: [record[field] for record in records] for field in fields}
    )
# Smoke test: fetch one page using the request payload `dat` defined earlier.
test = get_comment(dat)

# Crawl the data: request 49 pages (pageIndex 0..48) of 20 comments each.
# NOTE(review): confirm whether the API's pageIndex is 0- or 1-based.
pages = []
for i in range(49):
    dat_new = {
        'courseId': '1002421002',
        'pageIndex': i,
        'pageSize': '20',
        'orderBy': '3',
    }
    comment = get_comment(dat_new)
    pages.append(comment)

# DataFrame.append was removed in pandas 2.0 and re-copied every accumulated
# row on each iteration; concatenating once is the supported, linear-time
# equivalent. As before, each page keeps its own row index (no re-numbering).
comments = pd.concat(pages)