# Load the birth-weight data set from a local CSV file into `bw`.
# NOTE(review): this absolute Windows path ties the script to one machine;
# consider a project-relative path if the script is shared.
bw <- read.csv("D://PHAN TICH R//DU LIEU TS THACH//birthwt.csv")

# Number of rows and columns read.
dim(bw)
## [1] 189 11

# Last 10 rows of the data. The call (and its pasted output) used to appear
# twice in a row; a single call is enough.
tail(bw, 10)
## id low age lwt race smoke ptl ht ui ftv bwt
## 180 71 1 17 120 2 0 0 0 0 2 2438
## 181 75 1 26 154 3 0 1 1 0 1 2442
## 182 76 1 20 105 3 0 0 0 0 3 2450
## 183 77 1 26 190 1 1 0 0 0 0 2466
## 184 78 1 14 101 3 1 1 0 0 0 2466
## 185 79 1 28 95 1 1 0 0 0 2 2466
## 186 81 1 14 100 3 0 0 0 0 2 2495
## 187 82 1 23 94 3 1 0 0 0 0 2495
## 188 83 1 17 142 2 0 0 1 0 0 2495
## 189 84 1 21 130 1 1 0 1 0 3 2495
# Task 5: DATA EDITING -- create the new variable mwt (kg).
# NOTE(review): presumably lwt is recorded in pounds and 0.45 is a rounded
# pound-to-kilogram factor (the exact factor is about 0.4536) -- confirm before
# relying on mwt for anything precision-sensitive.
# The assignment used to be written twice; once is sufficient.
bw$mwt <- bw$lwt * 0.45

# Add a text label for the numeric race code: 1 -> "white", 2 -> "black",
# 3 -> "other". Any other code (or NA) yields NA. The result is stored as a
# character column, recoded in one vectorised step instead of three masked
# assignments.
bw$ethnicity <- as.character(
  factor(bw$race, levels = 1:3, labels = c("white", "black", "other"))
)

# Cross-check the recoding: every race code should map to exactly one label.
table(bw$ethnicity, bw$race)
##
## 1 2 3
## black 0 26 0
## other 0 0 67
## white 96 0 0
# bw1: only the columns id, low and bwt, all rows.
bw1 <- bw[c("id", "low", "bwt")]

# bw3: rows where low equals 1. which() discards rows whose comparison is NA,
# so no all-NA rows are introduced.
bw3 <- bw[which(bw$low == 1), , drop = FALSE]

# Frequency of each value of low in the full data.
table(bw$low)
##
## 0 1
## 130 59

# bw4: rows where both low and smoke equal 1.
bw4 <- bw[which(bw$low == 1 & bw$smoke == 1), , drop = FALSE]

# Sanity check: the only remaining combination should be low = 1, smoke = 1.
table(bw4$low, bw4$smoke)
##
## 1
## 1 30

# bw5 uses exactly the same filter as bw4, so it is taken from bw4 directly.
bw5 <- bw4
dim(bw5)
## [1] 30 13