# R script (40 lines, 1.0 KiB)
# Load ehi1.csv, keep the analysis variables, derive a sex dummy and a
# mean-centered age, and print descriptives for both.

# Strongly prefer fixed over scientific notation in printed output.
options(scipen = 999)

library(dplyr)

# NOTE(review): hard-coded, machine-specific working directory; the relative
# path passed to read.csv() below is resolved against it. Consider a
# project-relative path instead.
setwd("C:/Users/irina/Documents/DND/EOHI/eohi1")

df <- read.csv("ehi1.csv")

# Keep the analysis variables. filter() retains only rows where the condition
# is TRUE, so rows with a missing demo_sex are dropped together with the
# "Prefer not to say" rows.
data <- df %>%
  select(
    eohiDGEN_mean, ehi_global_mean,
    demo_sex, demo_age_1, edu3,
    AOT_total, CRT_correct, CRT_int,
    bs_28, bs_easy, bs_hard,
    cal_selfActual, cal_global
  ) %>%
  filter(demo_sex != "Prefer not to say")

# Structure, missing-value counts and column classes ----
# Wrapped in print() so the output also appears when the script is source()d.
str(data)
print(colSums(is.na(data)))
print(vapply(
  data,
  function(col) paste(class(col), collapse = "/"),
  character(1)
))

# Create dummy variable for sex (0 = Male, 1 = Female) ----
# Any value other than "Male"/"Female" becomes NA rather than being silently
# counted as Male.
data <- data %>%
  mutate(
    sex_dummy = case_when(
      demo_sex == "Female" ~ 1,
      demo_sex == "Male" ~ 0,
      TRUE ~ NA_real_
    )
  )

# Verify the dummy coding (NA column shown if any value was left uncoded)
print(table(data$demo_sex, data$sex_dummy, useNA = "ifany"))

# Descriptives ----

# Descriptives for age
print(summary(data$demo_age_1))
print(sd(data$demo_age_1, na.rm = TRUE))

# Center demo_age_1 (subtract the mean of the non-missing values)
data$age_centered <- data$demo_age_1 - mean(data$demo_age_1, na.rm = TRUE)

# Verify the centering (mean should be ~0)
print(summary(data$age_centered))

# Descriptives for sex (frequency table and proportions)
print(table(data$demo_sex))
print(prop.table(table(data$demo_sex)))

# Descriptives for sex dummy variable
print(table(data$sex_dummy, useNA = "ifany"))