# bat_ave.R

# Career batting averages per player.
#
# Input:  Batting.csv, downloaded from
#         http://www.seanlahman.com/baseball-archive/statistics/
# Output: bat_ave.csv with columns playerID, AB, H, AVE (plus row names),
#         one row per player who has at least one at-bat.

# Total at-bats and hits per player and derive the batting average.
#
# batting: data frame with columns `playerID`, `AB` and `H`
#          (one row per player stint).
#
# Returns a data frame with one row per distinct non-missing playerID, ordered
# by sort(playerID), with columns:
#   playerID - character player identifier
#   AB       - total at-bats (missing values are ignored)
#   H        - total hits (missing values are ignored)
#   AVE      - H / AB, or NA when the player has no at-bats
compute_bat_ave <- function(batting) {
  stopifnot(all(c("playerID", "AB", "H") %in% names(batting)))

  # Compute the sorted ID list once and group by it, instead of re-sorting
  # and re-scanning the whole table for every player.
  ids <- sort(unique(as.character(batting$playerID)))
  player <- factor(as.character(batting$playerID), levels = ids)

  # Sum one statistic per player; as.numeric() keeps the totals as doubles.
  career_total <- function(stat) {
    vapply(
      split(as.numeric(stat), player),
      sum,
      numeric(1),
      na.rm = TRUE,
      USE.NAMES = FALSE
    )
  }

  at_bats <- career_total(batting$AB)
  hits <- career_total(batting$H)

  # The average is undefined without at-bats; leave it as NA in that case.
  average <- rep(NA_real_, length(ids))
  has_at_bats <- at_bats > 0
  average[has_at_bats] <- hits[has_at_bats] / at_bats[has_at_bats]

  # Build typed columns directly, so numbers never pass through a character
  # matrix and need no conversion back.
  data.frame(
    playerID = ids,
    AB = at_bats,
    H = hits,
    AVE = average,
    stringsAsFactors = FALSE
  )
}

x <- read.csv("Batting.csv", as.is = TRUE)

# All players, including those without a defined average.
bat_ave2 <- compute_bat_ave(x)

# Keep only players with a defined batting average.
bat_ave3 <- bat_ave2[!is.na(bat_ave2$AVE), ]

# Row names are written (the write.csv default) to keep the file layout
# unchanged for existing consumers of bat_ave.csv.
write.csv(bat_ave3, "bat_ave.csv")