# Attach the packages used by this document.
# library() is used rather than require(): require() only returns FALSE (with a
# warning) when a package is missing, so the script would carry on and fail
# later with an unrelated "could not find function" error. library() stops
# immediately with a clear message instead.
# Any package that is not installed yet needs install.packages("<pkg>") once
# per machine.
library(tidyverse)
library(dplyr)
library(lubridate)
library(rvest)
library(stringr)
library(knitr)
library(ggplot2)
library(gridExtra)

# Load the saved data objects into the global environment. Paths are relative
# to this document's location.
# NOTE(review): the code below reads `classified` and `athletic_summary`,
# presumably restored by the files of the same name -- confirm the object
# names stored in each .RData file.
load("../data/honors.RData")
load("../data/athletic_summary.RData")
load("../data/students.RData")
load("../data/roster.RData")
load("../data/classified.RData")
load("../data/ethnic_summary.RData")

# Default knitr chunk options for the whole document: tidy the displayed code
# and hide package/startup messages in the rendered output.
knitr::opts_chunk$set(tidy = TRUE, message = FALSE)

Motivation and Approaches


Disclaimers and Limitations


Data


Data Tidying and Maneuvering


Two-proportion z-test

-

# Two-proportion z-test comparing the share of rows with latin == 1 between
# the hispanic == 1 and hispanic == 0 subsets of `classified`.

# Row counts per `latin` value within each subset. n() counts the rows of the
# current group directly, instead of taking the length of an arbitrary column.
# Inside filter() the name `hispanic` refers to the column of `classified`,
# which takes precedence over the `hispanic` table created here.
hispanic <- classified %>%
  filter(hispanic == 1) %>%
  group_by(latin) %>%
  summarize(value = n())
non_hispanic <- classified %>%
  filter(hispanic == 0) %>%
  group_by(latin) %>%
  summarize(value = n())

# Successes (x) are the latin == 1 counts; trials (n) are the subset sizes.
# sum(value[latin %in% 1]) yields 0 when a subset has no latin == 1 rows,
# whereas filter(...)$value would yield a zero-length vector and leave x
# shorter than n. %in% is used so that a missing `latin` value is never
# treated as a match or propagated as NA.
prop.test(
  x = c(
    sum(hispanic$value[hispanic$latin %in% 1]),
    sum(non_hispanic$value[non_hispanic$latin %in% 1])
  ),
  n = c(sum(hispanic$value), sum(non_hispanic$value))
)

t-tests

# Split `athletic_summary` on its `athlete` flag. Inside filter() the name
# `athlete` refers to the column, so the second call is unaffected by the
# `athlete` table assigned just before it.
athlete <- filter(athletic_summary, athlete == 1)
non_athlete <- filter(athletic_summary, athlete == 0)

# Two-sample t-test (t.test defaults) on the `ratio` column of the two groups.
t.test(x = athlete$ratio, y = non_athlete$ratio)

Thoughts and Potential Future Work



hs97/kane2017 documentation built on May 17, 2019, 5:55 p.m.