library(XML)
library(xml2)
library(rvest)
library(stringr)
# Build the rate.tmall.com review-list request URL for page `i`.
# The separator before the page parameter must be "&currentPage=": the
# sequence "&curren" is easily mangled into the currency sign when the URL
# passes through an HTML-entity decoder, which drops the page parameter.
url[i] <- paste0(
  "https://rate.tmall.com/list_detail_rate.htm",
  "?itemId=544568867374&spuId=719363051&sellerId=661559176",
  "&order=3&currentPage=", i, "&append=0&content=1"
)
}
#利用jsonlite包抓取
download <- function(url){
web <- read_html(url,encoding = "GBK")
# 抓取内容
List <- web %>% html_nodes("p") %>% html_text %>%
str_replace('\"rateDetail\":',"") %>% fromJSON()
# 获取评论页数
List$pag
library(xml2)
library(rvest)
library(stringr)
library(jsonlite)
# Locate the URL to crawl: open the browser dev tools (F12), switch to the
# Network tab, refresh with F5 and look for the request that returns reviews.
# The page index `i` is sent as the "currentPage" query parameter; the
# separator must be "&currentPage=" ("&curren" is easily mangled into the
# currency sign by an HTML-entity decoder, which drops the page parameter).
url[i] <- paste0(
  "https://rate.tmall.com/list_detail_rate.htm",
  "?itemId=544568867374&spuId=719363051&sellerId=661559176",
  "&order=3&currentPage=", i, "&append=0&content=1"
)
}
#利用jsonlite包抓取
download <- function(url){
web <- read_html(url,encoding = "GBK")
# 抓取内容
List <- web %>% html_nodes("p") %>% html_text %>%
str_replace('\"rateDetail\":',"") %>% fromJSON()
# 获取评论页数
List$pag