- Import the original data and perform a least-squares (LS) regression
- This regression is the oracle model
# Load the wage data from CSV; the first row is read as column names
# (read.csv's default behaviour).
wages_f <- read.csv("../data/fakedata/wages_df.csv")

# Fit the oracle model by least squares: log(WAGE) regressed on SEX, a
# quadratic in EXPERIENCE, EDUCATION, OCCUPATION (treated as a factor)
# and UNION.
lm0 <- lm(
  formula = log(WAGE) ~ SEX + EXPERIENCE + I(EXPERIENCE^2) +
    EDUCATION + as.factor(OCCUPATION) + UNION,
  data = wages_f
)