# Packages used throughout this script: ggplot2 supplies qplot()/ggplot(),
# dplyr supplies %>%, mutate(), arrange() and desc().
library(ggplot2)
library(dplyr)

# Load the project data, keeping text columns as character vectors instead of
# converting them to factors. `FALSE` is spelled out because `F` is an
# ordinary variable that can be reassigned.
project <- read.csv("project.csv", stringsAsFactors = FALSE)

# Print the full data frame to the console.
project

# Open the data in the spreadsheet-style viewer.
View(project)

# Quick look at the distribution of `area`.
qplot(project$area)

# `page` by `area`, with bars filled by `completion`.
# This used to map `fill = project$comple`, but `comple` is only derived
# further down the script, so on a fresh top-to-bottom run `$` partial
# matching silently resolved it to the `completion` column. The column is now
# named explicitly and referenced without `$`, as aes() expects.
# NOTE(review): assumes project.csv has no column of its own called `comple`;
# to fill by the A/B/C band instead, re-run this plot after `comple` exists.
ggplot(data = project, aes(x = area, y = page, fill = completion)) +
  geom_col()

# Frequency of each `stand` value, as a table and as a quick plot.
table(project$stand)

qplot(project$stand)

# ---- floormaterial: inspect, then recode ----
# Raw values, storage class, and frequency of each code.
project[["floormaterial"]]
class(project[["floormaterial"]])
table(project[["floormaterial"]])

# Code 2 is turned into NA; every other value is kept as is.
project[["floormaterial"]] <- with(
  project,
  ifelse(floormaterial == 2, NA, floormaterial)
)

# How many entries are now missing vs. present.
table(is.na(project[["floormaterial"]]))

# Code 1 becomes "turf", any other non-missing value becomes "sand";
# NA stays NA because the comparison itself yields NA.
project[["floormaterial"]] <- with(
  project,
  ifelse(floormaterial == 1, "turf", "sand")
)

# ---- stand: inspect, then blank out the 9999 code ----
# `stand` by `area`, drawn before any cleaning.
ggplot(project, aes(area, stand)) +
  geom_col()

# Numeric summary and missing-value count before recoding.
summary(project[["stand"]])
table(is.na(project[["stand"]]))

# Replace 9999 with NA, then recount missing values.
project[["stand"]] <- with(project, ifelse(stand == 9999, NA, stand))
table(is.na(project[["stand"]]))

# ---- completion: inspect, then band into A / B / C ----
# Summary of `completion` and how many values are missing.
summary(project[["completion"]])
table(is.na(project[["completion"]]))

# Add `comple`: "A" when completion > 2015, "B" when completion > 2010
# (and not above 2015), otherwise "C". Missing completion stays NA.
project <- mutate(
  project,
  comple = ifelse(
    completion > 2015,
    "A",
    ifelse(completion > 2010, "B", "C")
  )
)

# Size of each band, as a table and as a quick plot.
table(project[["comple"]])
qplot(project$comple)


# The ten rows of `project` with the largest `area`, largest first.
# arrange() is a data-frame verb, so the pipeline has to start from `project`
# and name the column bare inside desc(); piping the `project$area` vector
# into arrange() fails because a plain vector has no arrange() method.
top10 <- project %>%
  arrange(desc(area)) %>%
  head(10)
