# bat_ave.R
# Compute career batting totals and batting average (H / AB) for every player
# in the batting table and write the result to "bat_ave.csv".
#
# Input:  "Batting.csv", downloaded from
#         http://www.seanlahman.com/baseball-archive/statistics/
#         Columns used: playerID, AB, H.
# Output: "bat_ave.csv" with columns playerID, AB, H, AVE, one row per player
#         with at least one at-bat. Row names are each player's position in
#         the sorted list of all player IDs.
x <- read.csv("Batting.csv", as.is = TRUE)

# Fail loudly on a malformed input instead of silently summing NULL to 0.
stopifnot(all(c("playerID", "AB", "H") %in% names(x)))

# Distinct players in sorted order; this fixes the row order of the output.
# Using explicit factor levels keeps that order and drops rows whose playerID
# is NA from every group.
player_ids <- sort(unique(x$playerID))
player <- factor(x$playerID, levels = player_ids)

# Sum `values` within each level of `groups`, ignoring NA values.
# Returns an unnamed double vector with one element per level, in level order
# (and a zero-length vector when there are no levels).
career_total <- function(values, groups) {
  vapply(
    split(values, groups), sum, numeric(1),
    na.rm = TRUE, USE.NAMES = FALSE
  )
}

career_ab <- career_total(x$AB, player)
career_h <- career_total(x$H, player)

# The average is undefined for players without any at-bats; leave it NA.
career_ave <- rep(NA_real_, length(player_ids))
has_ab <- career_ab > 0
career_ave[has_ab] <- career_h[has_ab] / career_ab[has_ab]

# Build the table directly as a data frame so the numeric columns are never
# coerced to character (which a shared matrix with playerID would force).
bat_ave2 <- data.frame(
  playerID = player_ids,
  AB = career_ab,
  H = career_h,
  AVE = career_ave,
  stringsAsFactors = FALSE
)

# Keep only players with a defined batting average.
bat_ave3 <- bat_ave2[!is.na(bat_ave2$AVE), ]
write.csv(bat_ave3, "bat_ave.csv")