library(tidyverse)
## ── Attaching core tidyverse packages ──────────────────────── tidyverse 2.0.0 ──
## ✔ dplyr 1.2.0 ✔ readr 2.1.6
## ✔ forcats 1.0.1 ✔ stringr 1.6.0
## ✔ ggplot2 4.0.2 ✔ tibble 3.3.1
## ✔ lubridate 1.9.4 ✔ tidyr 1.3.2
## ✔ purrr 1.2.1
## ── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag() masks stats::lag()
## ℹ Use the conflicted package (<http://conflicted.r-lib.org/>) to force all conflicts to become errors
library(readxl)
# Load the district-level workbook from the working directory.
TEA_Data <- readxl::read_excel(path = "district.xls")

# Descriptive statistics for DZRVLOCP (the printed result is kept below).
TEA_Data %>%
  pull(DZRVLOCP) %>%
  pastecs::stat.desc()
## nbr.val nbr.null nbr.na min max
## 1202.0000000 8.0000000 5.0000000 -6.2000000 97.6000000
## range sum median mean SE.mean
## 103.8000000 45584.3000000 35.3000000 37.9237105 0.6928507
## CI.mean.0.95 var std.dev coef.var
## 1.3593323 577.0105864 24.0210447 0.6334044

# Descriptive statistics for DPETALLC.
TEA_Data %>%
  pull(DPETALLC) %>%
  pastecs::stat.desc()
## nbr.val nbr.null nbr.na min max range
## 1.207000e+03 0.000000e+00 0.000000e+00 4.000000e+00 1.937270e+05 1.937230e+05
## sum median mean SE.mean CI.mean.0.95 var
## 5.402928e+06 8.840000e+02 4.476328e+03 3.594000e+02 7.051187e+02 1.559062e+08
## std.dev coef.var
## 1.248624e+04 2.789393e+00

# Histogram of the raw DZRVLOCP values. The argument expression is left as-is
# because hist() builds its default title and x-axis label from it.
hist(TEA_Data$DZRVLOCP)

# Keep only the rows where DZRVLOCP is present.
TEA_Data <- TEA_Data %>%
  drop_na(DZRVLOCP)

# List the rows with a negative DZRVLOCP; sqrt() is undefined for these.
TEA_Data %>%
  filter(DZRVLOCP < 0)
## # A tibble: 2 × 137
## DISTNAME DISTRICT DZCNTYNM REGION DZRATING DZCAMPUS DPETALLC DPETBLAP DPETHISP
## <chr> <chr> <chr> <chr> <chr> <dbl> <dbl> <dbl> <dbl>
## 1 TRIUMPH… 071803 071 EL … 19 A 2 198 2.5 95.5
## 2 FORT EL… 242906 242 WHE… 16 A 1 159 0 7.5
## # ℹ 128 more variables: DPETWHIP <dbl>, DPETINDP <dbl>, DPETASIP <dbl>,
## # DPETPCIP <dbl>, DPETTWOP <dbl>, DPETECOP <dbl>, DPETLEPP <dbl>,
## # DPETSPEP <dbl>, DPETBILP <dbl>, DPETVOCP <dbl>, DPETGIFP <dbl>,
## # DA0AT21R <dbl>, DA0912DR21R <dbl>, DAGC4X21R <dbl>, DAGC5X20R <dbl>,
## # DAGC6X19R <dbl>, DA0GR21N <dbl>, DA0GS21N <dbl>, DDA00A001S22R <dbl>,
## # DDA00A001222R <dbl>, DDA00AR01S22R <dbl>, DDA00AR01S22R <dbl>,
## # DDA00AR01222R <dbl>, DDA00AR01322R <dbl>, DDA00AM01S22R <dbl>, …

# Square-root transform of DZRVLOCP.
# Calling sqrt() directly on the negative values listed above returns NaN and
# raises a "NaNs produced" warning. Those inputs are set to NA explicitly
# instead, so the rows are kept, the new column is missing for them, and the
# transform runs without warnings.
# NOTE(review): if the negative values should instead be excluded or shifted
# (e.g. sqrt(x - min(x))), change it here — confirm with the analysis plan.
TEA_Data <- TEA_Data %>%
  mutate(
    DZRVLOCP_transformed = sqrt(replace(DZRVLOCP, DZRVLOCP < 0, NA_real_))
  )