## Propuesta
library(tidyverse)
library(readxl)
grafica_error <- read_excel("graficamala1.xlsx") %>%
ggplot( aes(x = Año , y = Amapolas_erradicadas)) +
geom_point()+
geom_line()
grafica_error
-Global
library(readxl)
library(janitor)
library(tidyverse)
library(Hmisc)
Global_pib <- read_excel("pib_global.xlsx") %>%
ggplot( aes(x = Año , y = PIB, color = PIB)) +
geom_line()+
geom_point()
Global_pib
library(readxl)
Alemania_pib <- read_excel("pib_alemania.xlsx") %>%
ggplot( aes(x = Año , y = PIB, color = PIB)) +
geom_line()+
geom_point()
Alemania_pib
library(janitor)
library(tidyverse)
library(Hmisc)
data_hurtos <- read_csv(
file = "HURTO_A_CABEZAS_DE_GANADO_PER_ODO_DEL_01_DE_ENERO__AL_31_DE_DICIEMBRE_A_O_2019.csv"
) %>%
clean_names() %>%
filter(cantidad == 1) %>%
mutate_if(is.character, tolower) %>%
mutate_if(is.character, capitalize) %>%
mutate_if(is.character, as.factor) %>%
mutate(dia = factor(dia,
levels = c("Lunes", "Martes", "Miércoles", "Jueves",
"Viernes", "Sábado", "Domingo"))) %>%
select(-codigo_dane)
head(data_hurtos)
library(ggplot2)
library(dplyr)
data_hurtos %>%
group_by(dia,zona) %>%
summarise(cantidad = n()) %>%
ggplot( aes(x = dia , y = cantidad, color = zona, group = zona)) +
geom_point() +
geom_line()
data_hurtos %>%
group_by(clase_de_empleado, zona) %>%
summarise(total = sum(cantidad)) %>%
ggplot(mapping = aes( x = reorder(clase_de_empleado, total) , y = total)) +
facet_wrap(facets = ~zona, scales = "free" , ncol = 2) +
geom_point()+
coord_flip()
data_hurtos %>%
group_by(dia,zona, departamento) %>%
summarise(cantidad = n()) %>%
ggplot(mapping = aes(x = dia, y = cantidad, color = zona, group = zona )) +
geom_line ()+
geom_point()+
facet_wrap(facets = ~departamento, scales = "free", ncol = 4)+
theme(legend.position = "top", axis.text.x = element_text(angle = 45, hjust = 1))
data_hurtos %>%
group_by( dia, departamento) %>%
summarise(total = sum(cantidad)) %>%
ggplot(mapping = aes( x = total)) +
facet_wrap(facets = ~departamento, scales = "free" , ncol = 4) +
geom_density()
# Accidentalidad Motos Medellín 2015-2020
library(janitor)
library(tidyverse)
library(Hmisc)
data_motos <- read_csv("Accidentalidad_con_motos_municipio_de_Medell_n_actualizado_a_julio_2020.csv") %>%
clean_names() %>%
mutate(fecha_accidente = as.Date(fecha_accidente, format = "%m/%d/%Y")) %>%
mutate_if(is.character, tolower) %>%
mutate_if(is.character, capitalize) %>%
mutate_if(is.character, as.factor)
head(data_motos)
data_motos %>%
filter(zona %in% c("Comuna 1", "Comuna 2", "Comuna 3", "Comuna 4", "Comuna 5",
"Comuna 6", "Comuna 7", "Comuna 8", "Comuna 9",
"Comuna 10", "Comuna 11", "Comuna 12", "Comuna 13",
"Comuna 14", "Comuna 15", "Comuna 16")) %>%
group_by(zona) %>%
count(name = "total") %>%
ggplot(mapping = aes(x = reorder(zona,total), y = total)) +
geom_col(fill = "red3") +
coord_flip() +
labs(x = "comuna",
y = "total",
title = "accidentes en moto por comuna")
data_motos %>%
group_by( hora_accidente) %>%
count(name = "total") %>%
ggplot(mapping = aes(x = hora_accidente, y = total)) +
geom_smooth(se = FALSE) +
labs(x = "total",
y = "hora",
title = "accidentes en moto hora")
-¿El patrón de comportamiento observado en el gráfico anterior es el mismo para todas las comunas?
data_motos %>%
filter(zona %in% c("Comuna 1", "Comuna 2", "Comuna 3", "Comuna 4",
"Comuna 5", "Comuna 6", "Comuna 7", "Comuna 8",
"Comuna 9", "Comuna 10", "Comuna 11", "Comuna 12"
, "Comuna 13", "Comuna 14", "Comuna 15", "Comuna 16")) %>%
group_by( hora_accidente,zona) %>%
count(name = "total") %>%
ggplot(mapping = aes(x = hora_accidente, y = total)) +
geom_smooth(se = FALSE) +
facet_wrap(facets = ~zona, scales = "free" , ncol = 4)
labs(x = "total",
y = "hora",
title = "accidentes en moto hora")
## $x
## [1] "total"
##
## $y
## [1] "hora"
##
## $title
## [1] "accidentes en moto hora"
##
## attr(,"class")
## [1] "labels"
library(tidyverse)
data_nutri <- read_csv("datos_kaggle_nutrition.csv")
data_nutri
library(readxl)
data_grupos <- read_excel("datos_kaggel_grupos_definitivo.xlsx")
data_grupos %>%
clean_names()
library(tidyverse)
data_grupos1 <- data_grupos %>%
mutate(grupo = as.factor(grupo),
name = as.factor(name)) %>%
clean_names() %>%
mutate(calories_kcal = as.numeric(calories_kcal),
manganese_mg = as.numeric(manganese_mg),
phosphorus_g = as.numeric(phosphorus_g),
potassium_g = as.numeric(potassium_g),
sodium_g = as.numeric(sodium_g),
vitamin_a_iu = as.numeric(vitamin_a_iu),
magnesium_mg = as.numeric( magnesium_mg),
protein_g = as.numeric(protein_g),
total_fat_g = as.numeric(total_fat_g),
total_fiber_g = as.numeric(total_fiber_g),
cholesterol_mg = as.numeric(cholesterol_mg),
vitamin_c_mg = as.numeric(vitamin_c_mg),
vitamin_d_iu = as.numeric(vitamin_d_iu),
vitamin_k_ug = as.numeric(vitamin_k_ug),
folate_ug = as.numeric(folate_ug),
calcium_g= as.numeric(calcium_g),
choline_mg = as.numeric(choline_mg),
iron_mg = as.numeric(iron_mg),
selenium_ug = as.numeric(selenium_ug),
carbohydrates_g = as.numeric(carbohydrates_g))
data_grupos1
data_grupos1 %>%
select(grupo,calories_kcal:zinc_mg) %>%
pivot_longer(cols = -grupo, names_to= "variable", values_to= "valores") %>%
ggplot(mapping = aes(x=valores, color = grupo, fill = grupo ))+
facet_wrap(facets = ~variable, scales = "free", ncol = 4)+
geom_density(alpha = 0.5)+
scale_x_log10()