library(foreign)
# Read the Stata survey file and keep a fixed, position-based set of columns.
data <- read.dta("enaho01a-2018-300.dta")
data1 <- data[, c(1:10, 254, 286:289, 312, 316:318, 475:476)]
# Composite key: the first six columns concatenated row by row.
data1$Codigo <- do.call(paste0, unname(as.list(data1[, 1:6])))
# Same key with the seventh column appended
# (presumably the person code within the household -- confirm).
data1$Codigopersona <- paste0(data1$Codigo, data1[, 7])
# ---- Population aged 6 and over (MAYORES DE 6 AÑOS) ----
# Keep only rows with an answer to p314a. Per the original author's note, the
# missing answers belong to children under 6.
data1 <- data1[!is.na(data1$p314a), ]

# Deprivation flags: 0 when the answer is "si", 1 for any other answer, and NA
# when the answer is missing. They are built as numerics directly, so no
# position-based conversion step is needed afterwards.
data1$INTERNET <- as.numeric(data1$p314a != "si")
data1$COMPRAR_PRODUCTOS <- as.numeric(data1$p316_3 != "si")
data1$BANCA_ELECTRONICA <- as.numeric(data1$p316_4 != "si")
data1$EDUCACION_FORMAL <- as.numeric(data1$p316_5 != "si")
data1$TRANSACCION_OE <- as.numeric(data1$p316_6 != "si")
# Constant 1 per row.
data1$persona <- 1

# Columns are addressed by name rather than by position, so this step keeps
# working if the column selection made earlier in the script changes.
activity_cols <- c(
  "COMPRAR_PRODUCTOS", "BANCA_ELECTRONICA",
  "EDUCACION_FORMAL", "TRANSACCION_OE"
)
# A missing activity answer is treated as "did not do the activity" (flag = 1).
data1[activity_cols][is.na(data1[activity_cols])] <- 1

# POB_DIG is "1" when at least one of the four activity flags is 1.
# NOTE(review): this is an OR, so lacking any single activity is enough to be
# flagged -- confirm this is the intended definition.
data1$POB_DIG <- ifelse(
  data1$COMPRAR_PRODUCTOS == 1 | data1$BANCA_ELECTRONICA == 1 |
    data1$EDUCACION_FORMAL == 1 | data1$TRANSACCION_OE == 1,
  "1", "0"
)
# POB_DIG2 is "1" only when POB_DIG is "1" and the INTERNET flag is also 1.
data1$POB_DIG2 <- ifelse(data1$POB_DIG == "1" & data1$INTERNET == 1, "1", "0")
# Frequency of each POB_DIG value.
# The figures below appear to be console output pasted from an earlier run:
#       0       1
#     637  119404
table(data1[["POB_DIG"]])
# Frequency of each POB_DIG2 value (pasted output, as above):
#       0       1
#   50558   69483
table(data1[["POB_DIG2"]])
library(openxlsx)
# Read the district lookup table and discard its 1st and 5th columns.
Ubigeo <- read.xlsx("UBIGEOS.xlsx")
Ubigeo <- Ubigeo[, -c(1, 5)]
# A repeated key in the lookup would duplicate survey rows in the left join
# below and inflate every weighted total computed afterwards.
if (anyDuplicated(Ubigeo$UBIGEO_INEI) > 0) {
  warning("UBIGEO_INEI has duplicated codes; the merge will duplicate rows",
          call. = FALSE)
}
# Recode district 120699 as 120609 before joining
# (presumably so that it matches a code present in the lookup -- confirm).
data1$ubigeo[data1$ubigeo == "120699"] <- "120609"
# Left join: every survey row is kept; unmatched districts get NA in the
# lookup columns. TRUE is spelled out because T can be reassigned.
data1 <- merge(data1, Ubigeo,
               by.x = "ubigeo", by.y = "UBIGEO_INEI", all.x = TRUE)
# Nationwide sum of factora07 for each POB_DIG2 value.
nacional_pob_dig <- as.data.frame(xtabs(factora07 ~ POB_DIG2, data = data1))

# Sum of factora07 for every POB_DIG2 x ubigeo combination (long format).
distrito_pob_dig <- as.data.frame(
  xtabs(factora07 ~ POB_DIG2 + ubigeo, data = data1)
)
# Split the long table by flag value, then join the halves side by side so
# that each district has one row with both totals.
distri1 <- distrito_pob_dig[distrito_pob_dig$POB_DIG2 == "1", ]
distri2 <- distrito_pob_dig[distrito_pob_dig$POB_DIG2 == "0", ]
Distri <- merge(distri1[, c("ubigeo", "Freq")],
                distri2[, c("ubigeo", "Freq")],
                by = "ubigeo")
# After the merge the columns are: key, total for flag "1", total for flag "0".
names(Distri) <- c("Ubigeo", "pobre_digital", "acceso_digital")
Distri$poblacion <- rowSums(Distri[, c("pobre_digital", "acceso_digital")])
# Share of the district total that carries flag "1".
Distri$brecha_digital <- Distri$pobre_digital / Distri$poblacion
# Attach the lookup columns; TRUE is spelled out because T can be reassigned.
Distri <- merge(Distri, Ubigeo,
                by.x = "Ubigeo", by.y = "UBIGEO_INEI", all.x = TRUE)
# Sum of factora07 for every POB_DIG2 x Departamento combination (long format).
# NOTE(review): rows whose Departamento is NA are presumably left out of this
# table by xtabs' default NA handling -- confirm.
pob_dig <- as.data.frame(
  xtabs(factora07 ~ POB_DIG2 + Departamento, data = data1)
)
# One half per flag value, joined side by side on Departamento.
depa1 <- pob_dig[pob_dig[["POB_DIG2"]] == "1", ]
depa2 <- pob_dig[pob_dig[["POB_DIG2"]] == "0", ]
Depa <- merge(depa1[c("Departamento", "Freq")],
              depa2[c("Departamento", "Freq")],
              by = "Departamento")
# After the merge the columns are: key, total for flag "1", total for flag "0".
names(Depa) <- c("Departamento", "pobre_digital", "acceso_digital")
Depa$poblacion <- rowSums(Depa[c("pobre_digital", "acceso_digital")])
# Share of the department total that carries flag "1".
Depa$brecha_digital <- with(Depa, pobre_digital / poblacion)