# Read the raw credit-risk table from the CSV file (path is relative to the
# working directory).
credit_data <- read_csv("credit_risk_dataset.csv")

# Build the analysis table: keep six borrower/loan columns, then discard every
# row that has a missing value in any of the kept columns.
clean_credit <- na.omit(
  select(
    credit_data,
    person_age, person_income, person_emp_length,
    loan_intent, loan_int_rate, loan_amnt
  )
)
# Inspect the cleaned table: column names, types, and the first few values.
# The lines prefixed with `#>` are the output recorded from a previous run,
# kept as comments so the script still parses and runs.
# NOTE(review): the first person_emp_length value shown below is 123, which
# looks like an outlier worth checking -- the unit is not established here.
glimpse(clean_credit)
#> Rows: 28,638
#> Columns: 6
#> $ person_age <dbl> 22, 21, 25, 23, 24, 21, 26, 24, 24, 21, 22, 21, 23, …
#> $ person_income <dbl> 59000, 9600, 9600, 65500, 54400, 9900, 77100, 78956,…
#> $ person_emp_length <dbl> 123, 5, 1, 4, 8, 2, 8, 5, 8, 6, 6, 2, 2, 4, 2, 7, 0,…
#> $ loan_intent <chr> "PERSONAL", "EDUCATION", "MEDICAL", "MEDICAL", "MEDI…
#> $ loan_int_rate <dbl> 16.02, 11.14, 12.87, 15.23, 14.27, 7.14, 12.42, 11.1…
#> $ loan_amnt <dbl> 35000, 1000, 5500, 35000, 35000, 2500, 35000, 35000,…

# Number of rows left after dropping incomplete rows.
nrow(clean_credit)
#> [1] 28638