df <- read.table("http://gauss.inf.um.es/datos/paMunMur0015DF.csv", sep = ";", header = T)
head(df)
## codMun Mun year pobTotal pobHom pobMuj
## 1 1 Abanilla 2000 6106 3050 3056
## 2 1 Abanilla 2001 6033 3030 3003
## 3 1 Abanilla 2002 6040 3045 2995
## 4 1 Abanilla 2003 6239 3151 3088
## 5 1 Abanilla 2004 6145 3084 3061
## 6 1 Abanilla 2005 6265 3171 3094
str(df)
## 'data.frame': 720 obs. of 6 variables:
## $ codMun : int 1 1 1 1 1 1 1 1 1 1 ...
## $ Mun : Factor w/ 45 levels "Ãguilas","Abanilla",..: 2 2 2 2 2 2 2 2 2 2 ...
## $ year : int 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 ...
## $ pobTotal: int 6106 6033 6040 6239 6145 6265 6333 6568 6642 6589 ...
## $ pobHom : int 3050 3030 3045 3151 3084 3171 3212 3350 3390 3315 ...
## $ pobMuj : int 3056 3003 2995 3088 3061 3094 3121 3218 3252 3274 ...
Tenemos 720 observaciones de 6 variables: 5 son números enteros y 1 es un factor.
a2000 <- df[df$year == 2000,]
head(a2000)
## codMun Mun year pobTotal pobHom pobMuj
## 1 1 Abanilla 2000 6106 3050 3056
## 17 2 Abarán 2000 12241 6111 6130
## 33 3 Ãguilas 2000 27559 13719 13840
## 49 4 Albudeite 2000 1369 690 679
## 65 5 Alcantarilla 2000 33453 16464 16989
## 81 6 Aledo 2000 997 505 492
Mujeres_by_year <- aggregate(. ~ year, data = df[, c(3,6)], sum)
Mujeres_by_year
## year pobMuj
## 1 2000 579203
## 2 2001 594621
## 3 2002 610757
## 4 2003 629435
## 5 2004 642637
## 6 2005 658743
## 7 2006 673279
## 8 2007 685791
## 9 2008 703110
## 10 2009 714911
## 11 2010 723352
## 12 2011 728488
## 13 2012 731722
## 14 2013 732207
## 15 2014 730929
## 16 2015 731854
muni <- df[df$Mun == "Alguazas",]
muni <- muni[, -c(1,2)]
apply(muni[, -1], 2, mean)
## pobTotal pobHom pobMuj
## 8464.125 4353.625 4110.500
library(tables)
## Warning: package 'tables' was built under R version 3.3.3
## Loading required package: Hmisc
## Warning: package 'Hmisc' was built under R version 3.3.2
## Loading required package: lattice
## Loading required package: survival
## Warning: package 'survival' was built under R version 3.3.2
## Loading required package: Formula
## Warning: package 'Formula' was built under R version 3.3.2
## Loading required package: ggplot2
## Warning: package 'ggplot2' was built under R version 3.3.2
##
## Attaching package: 'Hmisc'
## The following objects are masked from 'package:base':
##
## format.pval, round.POSIXt, trunc.POSIXt, units
tabular(~ (Hombres_2015 = pobHom) * ((Media = mean) + (SD = sd) + (Mediana = median) + (Min. = min) + (Max. = max)), data=df[df$year == 2015,])
##
## Hombres_2015
## Media SD Mediana Min. Max.
## 16343 34857 7954 270 215177
tt <- tabular(~ (Hombres_2015 = pobHom) * ((Media = mean) + (SD = sd) + (Mediana = median) + (Min. = min) + (Max. = max)), data=df[df$year == 2015,])
html(tt)
Hombres_2015 | |||||
---|---|---|---|---|---|
Media | SD | Mediana | Min. | Max. | |
16343 | 34857 | 7954 | 270 | 215177 |
plot(muni$pobTotal ~ muni$year, ylim = c(0, max(muni$pobTotal)), xlab = "Año", ylab = "Número de habitantes", main = "Población de Alguazas", type = "l", col = "black", lwd = 5)
lines(muni$pobHom ~ muni$year, col = "blue")
lines(muni$pobMuj ~ muni$year, col = "blue", lty = 3)
legend("bottomright", c("total", "hombres", "mujeres"), title = "Poblaciones", fill = c("black", "blue", "blue"), col = c("black", "blue", "blue"), lty = c(1, 1, 3), lwd = c(5, 1, 1))