###installar paquetes: install.packages("gapminder"), install.packages("dplyr"), install.packages("ggplot2")

### cargar paquetes
library(gapminder)
library(dplyr)
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(ggplot2)


###DATAFRAME
gapminder
## # A tibble: 1,704 × 6
##    country     continent  year lifeExp      pop gdpPercap
##    <fct>       <fct>     <int>   <dbl>    <int>     <dbl>
##  1 Afghanistan Asia       1952    28.8  8425333      779.
##  2 Afghanistan Asia       1957    30.3  9240934      821.
##  3 Afghanistan Asia       1962    32.0 10267083      853.
##  4 Afghanistan Asia       1967    34.0 11537966      836.
##  5 Afghanistan Asia       1972    36.1 13079460      740.
##  6 Afghanistan Asia       1977    38.4 14880372      786.
##  7 Afghanistan Asia       1982    39.9 12881816      978.
##  8 Afghanistan Asia       1987    40.8 13867957      852.
##  9 Afghanistan Asia       1992    41.7 16317921      649.
## 10 Afghanistan Asia       1997    41.8 22227415      635.
## # … with 1,694 more rows
##Mutar variable lifeExp de años a meses
gapminder<-gapminder%>%
  mutate(lifeExp=lifeExp*12)%>%
  print()
## # A tibble: 1,704 × 6
##    country     continent  year lifeExp      pop gdpPercap
##    <fct>       <fct>     <int>   <dbl>    <int>     <dbl>
##  1 Afghanistan Asia       1952    346.  8425333      779.
##  2 Afghanistan Asia       1957    364.  9240934      821.
##  3 Afghanistan Asia       1962    384. 10267083      853.
##  4 Afghanistan Asia       1967    408. 11537966      836.
##  5 Afghanistan Asia       1972    433. 13079460      740.
##  6 Afghanistan Asia       1977    461. 14880372      786.
##  7 Afghanistan Asia       1982    478. 12881816      978.
##  8 Afghanistan Asia       1987    490. 13867957      852.
##  9 Afghanistan Asia       1992    500. 16317921      649.
## 10 Afghanistan Asia       1997    501. 22227415      635.
## # … with 1,694 more rows
##crea nueva variable llamada ID2 
gapminder<-gapminder%>%
  mutate(ID2= c(1:1704))%>%
  print()
## # A tibble: 1,704 × 7
##    country     continent  year lifeExp      pop gdpPercap   ID2
##    <fct>       <fct>     <int>   <dbl>    <int>     <dbl> <int>
##  1 Afghanistan Asia       1952    346.  8425333      779.     1
##  2 Afghanistan Asia       1957    364.  9240934      821.     2
##  3 Afghanistan Asia       1962    384. 10267083      853.     3
##  4 Afghanistan Asia       1967    408. 11537966      836.     4
##  5 Afghanistan Asia       1972    433. 13079460      740.     5
##  6 Afghanistan Asia       1977    461. 14880372      786.     6
##  7 Afghanistan Asia       1982    478. 12881816      978.     7
##  8 Afghanistan Asia       1987    490. 13867957      852.     8
##  9 Afghanistan Asia       1992    500. 16317921      649.     9
## 10 Afghanistan Asia       1997    501. 22227415      635.    10
## # … with 1,694 more rows
##crear una nueva variable derivada de variables disponibles
gapminder<-gapminder%>%
  mutate(gdp=gdpPercap*pop)%>%
  print()
## # A tibble: 1,704 × 8
##    country     continent  year lifeExp      pop gdpPercap   ID2          gdp
##    <fct>       <fct>     <int>   <dbl>    <int>     <dbl> <int>        <dbl>
##  1 Afghanistan Asia       1952    346.  8425333      779.     1  6567086330.
##  2 Afghanistan Asia       1957    364.  9240934      821.     2  7585448670.
##  3 Afghanistan Asia       1962    384. 10267083      853.     3  8758855797.
##  4 Afghanistan Asia       1967    408. 11537966      836.     4  9648014150.
##  5 Afghanistan Asia       1972    433. 13079460      740.     5  9678553274.
##  6 Afghanistan Asia       1977    461. 14880372      786.     6 11697659231.
##  7 Afghanistan Asia       1982    478. 12881816      978.     7 12598563401.
##  8 Afghanistan Asia       1987    490. 13867957      852.     8 11820990309.
##  9 Afghanistan Asia       1992    500. 16317921      649.     9 10595901589.
## 10 Afghanistan Asia       1997    501. 22227415      635.    10 14121995875.
## # … with 1,694 more rows
##quien tiene el GDP mas alto?
gapminder%>%
  filter(year==2007)%>%
  arrange(desc(gdp))%>%
  print()
## # A tibble: 142 × 8
##    country        continent  year lifeExp        pop gdpPercap   ID2     gdp
##    <fct>          <fct>     <int>   <dbl>      <int>     <dbl> <int>   <dbl>
##  1 United States  Americas   2007    939.  301139947    42952.  1620 1.29e13
##  2 China          Asia       2007    876. 1318683096     4959.   300 6.54e12
##  3 Japan          Asia       2007    991.  127467972    31656.   804 4.04e12
##  4 India          Asia       2007    776. 1110396331     2452.   708 2.72e12
##  5 Germany        Europe     2007    953.   82400996    32170.   576 2.65e12
##  6 United Kingdom Europe     2007    953.   60776238    33203.  1608 2.02e12
##  7 France         Europe     2007    968.   61083916    30470.   540 1.86e12
##  8 Brazil         Americas   2007    869.  190010647     9066.   180 1.72e12
##  9 Italy          Europe     2007    967.   58147733    28570.   780 1.66e12
## 10 Mexico         Americas   2007    914.  108700891    11978.   996 1.30e12
## # … with 132 more rows
## Plot
gapminder%>%
  filter(year==2007)%>%
  ggplot( aes(x= pop, y=gdp))+
  geom_point()+
  scale_x_log10()+
  scale_y_log10()+
  geom_smooth()
## `geom_smooth()` using method = 'loess' and formula 'y ~ x'