Build the URL with paste0 from its fixed fragments plus the year and the page number. The URL can be assembled like this:
# Concatenate the URL fragments with the season and page number in between.
url <- paste0(url1, year, url2, page, url3)
Then read every page and combine the resulting tables into one with do.call(rbind, ...):
library(XML)
# Season and result page to request.
year <- 2013
page <- 1

# Fixed URL fragments: `year` is inserted between url1 and url2, and `page`
# between url2 and url3 (see the paste0() calls that use them).
url1 <- "http://www.nfl.com/stats/categorystats?tabSeq=1&season="
url2 <- "&seasonType=REG&experience=&Submit=Go&archive=false&conference=null&d-447263-p="
url3 <- "&statisticPositionCategory=DEFENSIVE_BACK&qualified=true"
# Download one page of the listing and return its table.
#
# Args:
#   page: page number spliced into the URL (default 1).
#   year: season spliced into the URL (default 2013).
#
# The address is assembled from the globals url1, url2 and url3. The value
# returned is the `result` element of the list produced by readHTMLTable().
getTable <- function(page=1, year=2013) {
  page_url <- paste0(url1, year, url2, page, url3)
  tables <- readHTMLTable(page_url, header = FALSE)
  tables$result
}
# Fetch pages 1 to 8 of the 2013 season and stack the per-page tables
# row-wise into a single table.
do.call(
  rbind,
  lapply(seq_len(8), function(p) getTable(page = p, year = 2013))
)
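Alternatively, instead of hard-coding the number of pages, extract the URL of the next page with an XPath query, and keep following it until there is no next page.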
# Return the address of the page that follows `url`.
#
# Args:
#   url: address of the page to inspect. Defaults to the global `url_base`,
#        which must already exist when getNext() is called without arguments.
#
# Returns:
#   A single character string: "http://www.nfl.com" followed by the href of
#   the first "next" navigation link, or "" when no such link is found.
getNext <-
  function(url=url_base){
    doc <- htmlParse(url)
    xpath_next <- "//*[@class='linkNavigation floatRight']/*[contains(., 'next')]"
    # xmlGetAttr() yields NULL for a matched node that has no href; unlist()
    # drops those so they are never pasted into the result as "NULL".
    hrefs <- unique(unlist(xpathSApply(doc, xpath_next, xmlGetAttr, "href")))
    if (length(hrefs) > 0) {
      # Keep only the first link so callers always receive a scalar.
      paste0("http://www.nfl.com", hrefs[[1]])
    } else {
      ""
    }
  }
# Walk the paginated listing starting at `url_base`, following the "next"
# link returned by getNext() until it returns "", and collect each page's
# `result` table into `res`.
#
# NOTE(review): `url_base` is not defined in this snippet; it has to be set
# to the address of the first page before this loop runs.
#
# The loop advances its own `page_url` variable instead of overwriting
# `url_base`, so the starting address survives and the loop can be re-run.
# Each page is currently downloaded twice: once by readHTMLTable() and once
# by htmlParse() inside getNext().
pages <- list()
page_url <- url_base
while (TRUE) {
  tab <- readHTMLTable(page_url, header = FALSE)
  # Collect the pages and bind once afterwards rather than calling rbind()
  # on a growing result at every iteration.
  pages[[length(pages) + 1L]] <- tab$result
  page_url <- getNext(page_url)
  if (!nzchar(page_url)) {
    break
  }
}
# Keep the original empty-list value when no table was collected at all.
res <- if (length(pages) > 0) do.call(rbind, pages) else list()