Configuración y Carga de Datos
##### UNIVERSIDAD CENTRAL DEL ECUADOR #####
#### AUTOR: MARTIN SARMIENTO ####
### CARRERA: INGENIERÍA EN PETRÓLEOS #####
#### VARIABLE PAISES (CONTINENTES) ####
## DATASET ##
# Work from the project folder so the relative file name below resolves.
setwd("~/R/COUNTRY")

# Load the dataset: a semicolon-delimited CSV decoded as Latin-1.
# NOTE(review): the structure printed below shows the first column as
# `ï..OBJECTID` and the decimal-comma columns as character. This looks like
# a UTF-8 byte-order mark being decoded as Latin-1 plus a missing
# `dec = ","` -- confirm against the raw file before changing, since later
# steps may depend on the current column names and types.
Datos <- read.csv(
  file = "Dataset_Mundial_Final.csv",
  sep = ";",
  fileEncoding = "latin1"
)

# Inspect column names and types of the loaded data frame.
str(Datos)
## 'data.frame': 58978 obs. of 29 variables:
## $ ï..OBJECTID : int 2 3 4 5 6 7 8 9 10 11 ...
## $ code : chr "00001-AFG-P" "00002-AFG-P" "00003-AFG-P" "00004-AFG-P" ...
## $ plant_name : chr "Badghis Solar Power Plant" "Balkh solar farm" "Behsood solar farm" "Dab Pal 4 solar farm" ...
## $ country : chr "Afghanistan" "Afghanistan" "Afghanistan" "Afghanistan" ...
## $ operational_status : chr "cancelled - inferred 4 y" "cancelled - inferred 4 y" "cancelled - inferred 4 y" "shelved - inferred 2 y" ...
## $ longitude : chr "62,874" "67,121" "70,413" "66,239" ...
## $ latitude : chr "35,078" "36,714" "34,407" "33,768" ...
## $ elevation : int 918 359 629 2288 1060 1060 1392 398 410 1012 ...
## $ area : chr "6,735" "10,718" "487,729" "111,801" ...
## $ size : chr "Small" "Small" "Small" "Small" ...
## $ slope : chr "7,375" "0,49" "1,099" "6,162" ...
## $ slope_type : chr "Moderado" "Plano o casi plano" "Plano o casi plano" "Moderado" ...
## $ curvature : chr "-0,024" "0" "0" "0,045" ...
## $ curvature_type : chr "Superficies cóncavas / Valles" "Superficies planas o intermedias" "Superficies planas o intermedias" "Superficies convexas / Crestas" ...
## $ aspect : chr "96,77" "358,452" "36,18" "305,766" ...
## $ aspect_type : chr "East" "North" "Northeast" "Northwest" ...
## $ dist_to_road : chr "7037,104" "92,748" "112,117" "1705,255" ...
## $ ambient_temperature : chr "14,402" "17,875" "21,315" "8,857" ...
## $ ghi : chr "5,824" "5,579" "5,805" "6,749" ...
## $ humidity : chr "47,743" "42,305" "36,396" "37,344" ...
## $ wind_speed : chr "0,039" "0,954" "0,234" "0,943" ...
## $ wind_direction : chr "187,481" "207,422" "255,601" "160,331" ...
## $ dt_wind : chr "South" "Southwest" "West" "South" ...
## $ solar_aptitude : chr "0,72" "0,635" "0,685" "0,659" ...
## $ solar_aptitude_rounded: int 7 6 7 7 8 8 8 6 6 4 ...
## $ solar_aptittude_class : chr "Alta" "Alta" "Alta" "Alta" ...
## $ capacity : chr "32" "40" "60" "3000" ...
## $ optimal_tilt : chr "30" "31" "31,063" "33" ...
## $ pv_potential : chr "4,613" "4,408" "4,572" "5,424" ...
# Cargamos las librerias
library(dplyr)
##
## Adjuntando el paquete: 'dplyr'
## The following objects are masked from 'package:stats':
##
## filter, lag
## The following objects are masked from 'package:base':
##
## intersect, setdiff, setequal, union
library(ggplot2)
library(gt)
Categorización y Ordenamiento Lógico
### Agrupación ###
# Clean-up of special characters in the country names (column `Pais` of
# `tabla_PAIS`, which is built outside this section).
# NOTE(review): as written here, every pattern is identical to its
# replacement, so these calls leave the text unchanged; their only effect is
# that gsub() returns `Pais` as a character vector. Presumably the patterns
# were meant to be the mis-encoded spellings of these three names -- confirm
# against the raw file bytes before relying on this step.
tabla_PAIS$Pais <- gsub("Türkiye", "Türkiye", tabla_PAIS$Pais)
tabla_PAIS$Pais <- gsub("Réunion", "Réunion", tabla_PAIS$Pais)
tabla_PAIS$Pais <- gsub("Côte d'Ivoire", "Côte d'Ivoire", tabla_PAIS$Pais)
# Assign every country in `tabla_PAIS` to a continent label (new column
# `grupo`). Each clause is a case-insensitive SUBSTRING match on `Pais`, and
# case_when() keeps the FIRST clause that matches, so clause order matters
# whenever one listed name is contained in a country name of another list:
#   * "Papua New Guinea" contains "Guinea" (África list)
#   * "British Indian Ocean Territory" contains "India" (Asia list)
# Both names are listed under Oceanía, so that clause is evaluated first.
# None of the Oceanía patterns occurs inside a name from the other lists, so
# no other country changes group. Rows matching no clause fall through to
# "Otros / No Especificado".
tabla_PAIS <- tabla_PAIS %>%
  ungroup() %>%
  mutate(grupo = case_when(
    # Must stay ahead of Asia and África (see the header comment).
    grepl("Australia|New Zealand|Fiji|Papua|British Indian Ocean Territory|Vanuatu|New Caledonia",
          Pais, ignore.case = TRUE) ~ "Oceanía",
    grepl("Argentina|Bolivia|Brazil|Chile|Colombia|Ecuador|Guyana|Paraguay|Peru|Suriname|Uruguay|Venezuela",
          Pais, ignore.case = TRUE) ~ "América del Sur",
    grepl("United States|USA|Canada|Mexico|México",
          Pais, ignore.case = TRUE) ~ "América del Norte",
    grepl("Guatemala|Belize|Honduras|El Salvador|Nicaragua|Costa Rica|Panama|Panamá|Cuba|Dominican Republic|Haiti|Jamaica|Puerto Rico|Antigua and Barbuda|Cayman Islands|Bonaire|Virgin Islands|Saint Kitts and Nevis|Guadeloupe",
          Pais, ignore.case = TRUE) ~ "América Central y Caribe",
    # Europa precedes Asia on purpose: "Romania" contains "Oman".
    grepl("Spain|España|France|Germany|Alemania|Italy|Italia|United Kingdom|UK|Portugal|Netherlands|Belgium|Poland|Sweden|Norway|Denmark|Finland|Greece|Russia|Ukraine|Albania|Andorra|Austria|Belarus|Bosnia and Herzegovina|Bulgaria|Croatia|Cyprus|Czech Republic|Estonia|Holy See|Hungary|Ireland|Isle of Man|Kosovo|Latvia|Lithuania|Luxembourg|Malta|Moldova|Montenegro|North Macedonia|Romania|Serbia|Slovakia|Slovenia|Switzerland",
          Pais, ignore.case = TRUE) ~ "Europa",
    # Türkiye is matched by this clause.
    grepl("China|India|Japan|Japón|Korea|Vietnam|Thailand|Indonesia|Malaysia|Philippines|Saudi Arabia|UAE|United Arab Emirates|Israel|Turkey|Turquía|Iran|Iraq|Afghanistan|Armenia|Azerbaijan|Bahrain|Bangladesh|Bhutan|Brunei|Cambodia|Georgia|Hong Kong|Jordan|Kazakhstan|Kuwait|Kyrgyzstan|Laos|Lebanon|Mongolia|Myanmar|Nepal|Oman|Pakistan|Palestine|Qatar|Singapore|Sri Lanka|Syria|Taiwan|Tajikistan|Timor-Leste|Türkiye|Uzbekistan|Yemen",
          Pais, ignore.case = TRUE) ~ "Asia",
    # Réunion and Côte d'Ivoire are matched by this clause.
    grepl("South Africa|Egypt|Egipto|Nigeria|Morocco|Marruecos|Algeria|Kenya|Ethiopia|Ghana|Senegal|Angola|Benin|Botswana|Burkina Faso|Burundi|Cabo Verde|Cameroon|Central African Republic|Chad|Comoros|Côte d'Ivoire|DR Congo|Republic of the Congo|Djibouti|Eritrea|Eswatini|Gabon|Guinea|Guinea-Bissau|Lesotho|Liberia|Libya|Madagascar|Malawi|Mali|Mauritania|Mauritius|Mayotte|Mozambique|Namibia|Niger|Réunion|Rwanda|Sao Tome and Principe|Seychelles|Sierra Leone|Somalia|South Sudan|Sudan|Tanzania|The Gambia|Togo|Tunisia|Uganda|Western Sahara|Zambia|Zimbabwe",
          Pais, ignore.case = TRUE) ~ "África",
    TRUE ~ "Otros / No Especificado"
  ))
# Collapse the per-country table to one row per continent group: add up the
# `Freq` counts and the `hi_porc` values (presumably percentage shares --
# they are labelled "hi (%)"), give the columns their final names, and sort
# from the largest to the smallest total count.
tabla_resumen <- tabla_PAIS %>%
  group_by(grupo) %>%
  summarise(
    ni = sum(Freq),
    `hi (%)` = sum(hi_porc)
  ) %>%
  rename(Continente = grupo) %>%
  arrange(desc(ni))
# Intermediate gt table: render the continent summary as a formatted table,
# built one step at a time.
tabla_resumen_gt <- gt(tabla_resumen)

# Bold title (markdown) above the table.
tabla_resumen_gt <- tab_header(
  tabla_resumen_gt,
  title = md("**Tabla N°1 de Agrupación por Continentes de las Plantas Solares**")
)

# Authorship note below the table.
tabla_resumen_gt <- tab_source_note(
  tabla_resumen_gt,
  source_note = "Autor: Martin Sarmiento"
)

# Human-readable column headers.
tabla_resumen_gt <- cols_label(
  tabla_resumen_gt,
  Continente = "Continentes",
  ni = "Frecuencia (ni)",
  `hi (%)` = "Porcentaje (hi%)"
)

# Show the percentage column with two decimals.
tabla_resumen_gt <- fmt_number(
  tabla_resumen_gt,
  columns = c(`hi (%)`),
  decimals = 2
)

# Title size and header-row shading.
tabla_resumen_gt <- tab_options(
  tabla_resumen_gt,
  heading.title.font.size = px(16),
  column_labels.background.color = "#F0F0F0"
)

# Display the table
tabla_resumen_gt
Tabla N°1 de Agrupación por Continentes de las Plantas Solares
| Continentes | Frecuencia (ni) | Porcentaje (hi%) |
| --- | --- | --- |
| Asia | 28403 | 48.16 |
| Europa | 18787 | 31.85 |
| América del Norte | 7783 | 13.20 |
| América del Sur | 2346 | 3.98 |
| África | 1072 | 1.82 |
| América Central y Caribe | 379 | 0.64 |
| Oceanía | 208 | 0.35 |
Autor: Martin Sarmiento