25 lines
1.2 KiB
R
25 lines
1.2 KiB
R
|
library(tidyverse)
|
||
|
|
||
|
enrollment_data <- read_csv(file = "/home/ben/Documents/Data analysis/map/data/Enrollement_2022-2023/enrollment_by_gradelevel_certified_2022-23.csv")
|
||
|
enrollment_data_wide <-
|
||
|
enrollment_data %>%
|
||
|
mutate(district_school = paste0(DISTRICT_CODE, SCHOOL_CODE),
|
||
|
variable_name = paste0(GROUP_BY, "__", GROUP_BY_VALUE)) %>%
|
||
|
mutate(variable_name = str_replace_all(variable_name, "[ ]", "_")) %>%
|
||
|
pivot_wider(id_cols = c(district_school, GRADE_LEVEL, SCHOOL_NAME, DISTRICT_NAME), names_from = variable_name, values_from = PERCENT_OF_GROUP)
|
||
|
|
||
|
write_csv(enrollment_data_wide, file = "/home/ben/Documents/Data analysis/map/data/Enrollement_2022-2023/enrollment_by_gradelevel_certified_2022-23_wide.csv")
|
||
|
|
||
|
|
||
|
# school comparison
|
||
|
schools <- data.frame(Name = c("East High", "West High", "Memorial High", "LaFollette High"),
|
||
|
district_school = c(32690150,32690840,32690360,32690420))
|
||
|
|
||
|
enrollment_data_wide %>%
|
||
|
filter(district_school %in% schools$district_school) %>%
|
||
|
group_by(district_school)
|
||
|
summarise(mean_econ_disadv = mean(as.double('Economic_Status__Econ_Disadv'), na.rm = TRUE))
|
||
|
ggplot() +
|
||
|
geom_col(aes(x = SCHOOL_NAME,
|
||
|
y = mean_econ_disadv))
|