setwd("/cloud/project/datos")
datos <- read.csv("Petroleo_Ontaro.csv", header=T, dec=".", sep=";")
#tipo de pozo
c_tipo <- datos$WELL_TYPE
TDFc_tipo <- table(c_tipo)
TDFc_tipo
## c_tipo
## Brine Well
## 31 34
## Brine Well Natural Gas Well Brine Well Oil Well
## 4 5
## Cavern Storage Well Compressed Air Energy Storage Well
## 124 2
## Disposal Well Dry Hole
## 129 4544
## Gas Show Gas Well Oil Show
## 2728 56
## Historical Injection Well Historical Oil Well
## 49 1210
## Injection Well Licensed
## 235 2
## Location Natural Gas Storage Well
## 935 333
## Natural Gas Well Observation Well
## 9330 176
## Oil and Gas Show Oil and Gas Well
## 795 253
## Oil Show Oil Well
## 976 2101
## Oil Well Gas Show Other
## 53 19
## Private Gas Well Solution Mining Well
## 1057 204
## Source Well Stratigraphic Test
## 10 1271
Tabla <- as.data.frame(TDFc_tipo)
hi <- Tabla$Freq/sum(Tabla$Freq)
hi
## [1] 1.162529e-03 1.275032e-03 1.500038e-04 1.875047e-04 4.650116e-03
## [6] 7.500188e-05 4.837621e-03 1.704043e-01 1.023026e-01 2.100053e-03
## [11] 1.837546e-03 4.537613e-02 8.812720e-03 7.500188e-05 3.506338e-02
## [16] 1.248781e-02 3.498837e-01 6.600165e-03 2.981325e-02 9.487737e-03
## [21] 3.660092e-02 7.878947e-02 1.987550e-03 7.125178e-04 3.963849e-02
## [26] 7.650191e-03 3.750094e-04 4.766369e-02
sum(hi)
## [1] 1
hi_porc <- hi*100
sum(hi_porc)
## [1] 100
Tabla_tipo <- data.frame(Tabla, hi_porc)
total <- data.frame(c_tipo="Total",
Freq=sum(Tabla_tipo$Freq),
hi_porc="100%")
Tabla_tipofinal <- rbind(Tabla_tipo, total)
colnames(Tabla_tipofinal)[colnames(Tabla_tipofinal)=="c_tipo"] <- "Tipo de Pozo"
names(Tabla_tipofinal)
## [1] "Tipo de Pozo" "Freq" "hi_porc"
colnames(Tabla_tipofinal)[colnames(Tabla_tipofinal)=="Freq"] <- "ni"
names(Tabla_tipofinal)
## [1] "Tipo de Pozo" "ni" "hi_porc"
colnames(Tabla_tipofinal)[colnames(Tabla_tipofinal)=="hi_porc"] <- "hi"
names(Tabla_tipofinal)
## [1] "Tipo de Pozo" "ni" "hi"
Tabla_tipo <- Tabla_tipo[order(-Tabla_tipo$Freq), ]
Tabla_top10tipo <- head(Tabla_tipo, 10)
barplot(Tabla_top10tipo$Freq,
main = "Gráfica No2.01: Distribucion de Tipo de Pozo",
xlab = "Tipo",
ylab = "Cantidad",
col = "#CDC8B1",
cex.names = 0.5,
cex.axis = 0.9,
names.arg = Tabla_top10tipo$c_tipo,
las = 2
)

barplot(Tabla_top10tipo$Freq,
main = "Gráfica No2.02: Distribucion de Tipo de Pozo (Global)",
xlab = "Tipo",
ylab = "Cantidad",
col = "#CDC8B1",
cex.names = 0.5,
cex.axis = 0.9,
names.arg = Tabla_top10tipo$c_tipo,
las = 2,
ylim = c(0, 26666)
)

barplot(Tabla_top10tipo$hi_porc,
main = "Gráfica No2.03: Distribucion de Tipo de Pozo",
xlab = "Tipo",
ylab = "Porcentaje",
col = "#CDC8B1",
cex.names = 0.5,
cex.axis = 0.9,
names.arg = Tabla_top10tipo$c_tipo,
las = 2
)

barplot(Tabla_top10tipo$hi_porc,
main = "Gráfica No2.04: Distribucion de Tipo de Pozo (Global)",
xlab = "Tipo",
ylab = "Porcentaje",
col = "#CDC8B1",
cex.names = 0.5,
cex.axis = 0.9,
names.arg = Tabla_top10tipo$c_tipo,
las = 2,
ylim = c(0, 100)
)

Colores <- colorRampPalette(rainbow(11))
etiquetas <- paste(round(Tabla_top10tipo$hi_porc),"%", sep = "")
pie(Tabla_top10tipo$hi_porc,
radius = 0.5,
col = Colores(10),
main = "Gráfica No2.05: Distribucion de Tipo de Pozo",
labels = etiquetas)
legend("bottomleft", title = "Leyenda", legend = Tabla_top10tipo$c_tipo,
cex = 0.5, fill = Colores(10), title.cex = 0.8)
