eohi/.history/eohi1/regression e1 - edu x ehi_20251020101841.r
2025-12-23 15:47:09 -05:00

35 lines
795 B
R

# Session setup: a large scipen penalty makes R print numbers in fixed
# notation instead of scientific notation.
options(scipen = 999)
library(dplyr)

# Load the raw data.
# NOTE(review): absolute, machine-specific path; the script only runs where
# this folder exists.
setwd("C:/Users/irina/Documents/DND/EOHI/eohi1")
df <- read.csv("ehi1.csv")

# Keep the three analysis variables, then store education as a factor.
data <- select(df, eohiDGEN_mean, ehi_global_mean, demo_edu)
data <- mutate(data, demo_edu = as.factor(demo_edu))
# Quick sanity checks on the analysis data frame
str(data)                          # structure: column names, types, values
colSums(is.na(data))               # count of missing values in each column
vapply(data, class, character(1))  # class of each column
levels(data[["demo_edu"]])         # education categories in factor-level order
# Create one 0/1 indicator column per education level.
# The `- 1` removes the intercept, so model.matrix() returns a column for
# EVERY level of demo_edu; no reference level is dropped at this step. The
# reference column has to be left out later, when the model is specified.
# model.frame(..., na.action = na.pass) keeps rows where demo_edu is NA (their
# indicators become NA). The default na.omit would drop those rows and make
# the cbind() below fail on a row-count mismatch.
edu_frame <- model.frame(~ demo_edu, data = data, na.action = na.pass)
dummy_vars <- model.matrix(~ demo_edu - 1, data = edu_frame)
dummy_df <- as.data.frame(dummy_vars)

# Meaningful column names, assigned by position: the i-th name labels the
# i-th element of levels(data$demo_edu).
# NOTE(review): as.factor() sorts the levels, so confirm that this order
# matches levels(data$demo_edu) before trusting the labels.
edu_dummy_names <- c(
  "edu_highschool", # intended reference level (omit it from the model)
  "edu_trade",
  "edu_college",
  "edu_uni_undergrad",
  "edu_uni_masters",
  "edu_uni_phd",
  "edu_prof"
)

# Stop early if the data do not contain exactly one level per name; otherwise
# surplus columns would silently end up with NA names.
if (ncol(dummy_df) != length(edu_dummy_names)) {
  stop(
    "demo_edu has ", ncol(dummy_df), " levels but ",
    length(edu_dummy_names), " dummy names were supplied.",
    call. = FALSE
  )
}
colnames(dummy_df) <- edu_dummy_names

# Add the indicator columns to the analysis data
data <- cbind(data, dummy_df)