Las librerías
library (dplyr)
library (readr)
library (fdth)
Los datos
# Load the Star Wars characters data set from the course repository.
# stringsAsFactors = TRUE is set explicitly: the str()/summary() output shown
# in this document lists the text columns as factors, which read.csv() only
# produces by default on R < 4.0.0. Pinning it keeps results the same on any
# R version.
url.datos <- paste0(
  "https://raw.githubusercontent.com/rpizarrog/",
  "Curso-Titulacion-Data-Science-/master/2020/datos/starwars.csv"
)
datos <- read.csv(url.datos, stringsAsFactors = TRUE)
datos
## X name height mass hair_color skin_color
## 1 1 Luke Skywalker 172 77.0 blond fair
## 2 2 C-3PO 167 75.0 <NA> gold
## 3 3 R2-D2 96 32.0 <NA> white, blue
## 4 4 Darth Vader 202 136.0 none white
## 5 5 Leia Organa 150 49.0 brown light
## 6 6 Owen Lars 178 120.0 brown, grey light
## 7 7 Beru Whitesun lars 165 75.0 brown light
## 8 8 R5-D4 97 32.0 <NA> white, red
## 9 9 Biggs Darklighter 183 84.0 black light
## 10 10 Obi-Wan Kenobi 182 77.0 auburn, white fair
## 11 11 Anakin Skywalker 188 84.0 blond fair
## 12 12 Wilhuff Tarkin 180 NA auburn, grey fair
## 13 13 Chewbacca 228 112.0 brown unknown
## 14 14 Han Solo 180 80.0 brown fair
## 15 15 Greedo 173 74.0 <NA> green
## 16 16 Jabba Desilijic Tiure 175 1358.0 <NA> green-tan, brown
## 17 17 Wedge Antilles 170 77.0 brown fair
## 18 18 Jek Tono Porkins 180 110.0 brown fair
## 19 19 Yoda 66 17.0 white green
## 20 20 Palpatine 170 75.0 grey pale
## 21 21 Boba Fett 183 78.2 black fair
## 22 22 IG-88 200 140.0 none metal
## 23 23 Bossk 190 113.0 none green
## 24 24 Lando Calrissian 177 79.0 black dark
## 25 25 Lobot 175 79.0 none light
## 26 26 Ackbar 180 83.0 none brown mottle
## 27 27 Mon Mothma 150 NA auburn fair
## 28 28 Arvel Crynyd NA NA brown fair
## 29 29 Wicket Systri Warrick 88 20.0 brown brown
## 30 30 Nien Nunb 160 68.0 none grey
## 31 31 Qui-Gon Jinn 193 89.0 brown fair
## 32 32 Nute Gunray 191 90.0 none mottled green
## 33 33 Finis Valorum 170 NA blond fair
## 34 34 Jar Jar Binks 196 66.0 none orange
## 35 35 Roos Tarpals 224 82.0 none grey
## 36 36 Rugor Nass 206 NA none green
## 37 37 Ric Olié 183 NA brown fair
## 38 38 Watto 137 NA black blue, grey
## 39 39 Sebulba 112 40.0 none grey, red
## 40 40 Quarsh Panaka 183 NA black dark
## 41 41 Shmi Skywalker 163 NA black fair
## 42 42 Darth Maul 175 80.0 none red
## 43 43 Bib Fortuna 180 NA none pale
## 44 44 Ayla Secura 178 55.0 none blue
## 45 45 Dud Bolt 94 45.0 none blue, grey
## 46 46 Gasgano 122 NA none white, blue
## 47 47 Ben Quadinaros 163 65.0 none grey, green, yellow
## 48 48 Mace Windu 188 84.0 none dark
## 49 49 Ki-Adi-Mundi 198 82.0 white pale
## 50 50 Kit Fisto 196 87.0 none green
## 51 51 Eeth Koth 171 NA black brown
## 52 52 Adi Gallia 184 50.0 none dark
## 53 53 Saesee Tiin 188 NA none pale
## 54 54 Yarael Poof 264 NA none white
## 55 55 Plo Koon 188 80.0 none orange
## 56 56 Mas Amedda 196 NA none blue
## 57 57 Gregar Typho 185 85.0 black dark
## 58 58 Cordé 157 NA brown light
## 59 59 Cliegg Lars 183 NA brown fair
## 60 60 Poggle the Lesser 183 80.0 none green
## 61 61 Luminara Unduli 170 56.2 black yellow
## 62 62 Barriss Offee 166 50.0 black yellow
## 63 63 Dormé 165 NA brown light
## 64 64 Dooku 193 80.0 white fair
## 65 65 Bail Prestor Organa 191 NA black tan
## 66 66 Jango Fett 183 79.0 black tan
## 67 67 Zam Wesell 168 55.0 blonde fair, green, yellow
## 68 68 Dexter Jettster 198 102.0 none brown
## 69 69 Lama Su 229 88.0 none grey
## 70 70 Taun We 213 NA none grey
## 71 71 Jocasta Nu 167 NA white fair
## 72 72 Ratts Tyerell 79 15.0 none grey, blue
## 73 73 R4-P17 96 NA none silver, red
## 74 74 Wat Tambor 193 48.0 none green, grey
## 75 75 San Hill 191 NA none grey
## 76 76 Shaak Ti 178 57.0 none red, blue, white
## 77 77 Grievous 216 159.0 none brown, white
## 78 78 Tarfful 234 136.0 brown brown
## 79 79 Raymus Antilles 188 79.0 brown light
## 80 80 Sly Moore 178 48.0 none pale
## 81 81 Tion Medon 206 80.0 none grey
## 82 82 Finn NA NA black dark
## 83 83 Rey NA NA brown light
## 84 84 Poe Dameron NA NA brown light
## 85 85 BB8 NA NA none none
## 86 86 Captain Phasma NA NA unknown unknown
## 87 87 Padmé Amidala 165 45.0 brown light
## eye_color birth_year gender homeworld species
## 1 blue 19.0 male Tatooine Human
## 2 yellow 112.0 <NA> Tatooine Droid
## 3 red 33.0 <NA> Naboo Droid
## 4 yellow 41.9 male Tatooine Human
## 5 brown 19.0 female Alderaan Human
## 6 blue 52.0 male Tatooine Human
## 7 blue 47.0 female Tatooine Human
## 8 red NA <NA> Tatooine Droid
## 9 brown 24.0 male Tatooine Human
## 10 blue-gray 57.0 male Stewjon Human
## 11 blue 41.9 male Tatooine Human
## 12 blue 64.0 male Eriadu Human
## 13 blue 200.0 male Kashyyyk Wookiee
## 14 brown 29.0 male Corellia Human
## 15 black 44.0 male Rodia Rodian
## 16 orange 600.0 hermaphrodite Nal Hutta Hutt
## 17 hazel 21.0 male Corellia Human
## 18 blue NA male Bestine IV Human
## 19 brown 896.0 male <NA> Yoda's species
## 20 yellow 82.0 male Naboo Human
## 21 brown 31.5 male Kamino Human
## 22 red 15.0 none <NA> Droid
## 23 red 53.0 male Trandosha Trandoshan
## 24 brown 31.0 male Socorro Human
## 25 blue 37.0 male Bespin Human
## 26 orange 41.0 male Mon Cala Mon Calamari
## 27 blue 48.0 female Chandrila Human
## 28 brown NA male <NA> Human
## 29 brown 8.0 male Endor Ewok
## 30 black NA male Sullust Sullustan
## 31 blue 92.0 male <NA> Human
## 32 red NA male Cato Neimoidia Neimodian
## 33 blue 91.0 male Coruscant Human
## 34 orange 52.0 male Naboo Gungan
## 35 orange NA male Naboo Gungan
## 36 orange NA male Naboo Gungan
## 37 blue NA male Naboo <NA>
## 38 yellow NA male Toydaria Toydarian
## 39 orange NA male Malastare Dug
## 40 brown 62.0 male Naboo <NA>
## 41 brown 72.0 female Tatooine Human
## 42 yellow 54.0 male Dathomir Zabrak
## 43 pink NA male Ryloth Twi'lek
## 44 hazel 48.0 female Ryloth Twi'lek
## 45 yellow NA male Vulpter Vulptereen
## 46 black NA male Troiken Xexto
## 47 orange NA male Tund Toong
## 48 brown 72.0 male Haruun Kal Human
## 49 yellow 92.0 male Cerea Cerean
## 50 black NA male Glee Anselm Nautolan
## 51 brown NA male Iridonia Zabrak
## 52 blue NA female Coruscant Tholothian
## 53 orange NA male Iktotch Iktotchi
## 54 yellow NA male Quermia Quermian
## 55 black 22.0 male Dorin Kel Dor
## 56 blue NA male Champala Chagrian
## 57 brown NA male Naboo Human
## 58 brown NA female Naboo Human
## 59 blue 82.0 male Tatooine Human
## 60 yellow NA male Geonosis Geonosian
## 61 blue 58.0 female Mirial Mirialan
## 62 blue 40.0 female Mirial Mirialan
## 63 brown NA female Naboo Human
## 64 brown 102.0 male Serenno Human
## 65 brown 67.0 male Alderaan Human
## 66 brown 66.0 male Concord Dawn Human
## 67 yellow NA female Zolan Clawdite
## 68 yellow NA male Ojom Besalisk
## 69 black NA male Kamino Kaminoan
## 70 black NA female Kamino Kaminoan
## 71 blue NA female Coruscant Human
## 72 unknown NA male Aleen Minor Aleena
## 73 red, blue NA female <NA> <NA>
## 74 unknown NA male Skako Skakoan
## 75 gold NA male Muunilinst Muun
## 76 black NA female Shili Togruta
## 77 green, yellow NA male Kalee Kaleesh
## 78 blue NA male Kashyyyk Wookiee
## 79 brown NA male Alderaan Human
## 80 white NA female Umbara <NA>
## 81 black NA male Utapau Pau'an
## 82 dark NA male <NA> Human
## 83 hazel NA female <NA> Human
## 84 brown NA male <NA> Human
## 85 black NA none <NA> Droid
## 86 unknown NA female <NA> <NA>
## 87 brown 46.0 female Naboo Human
# Compact overview of the data frame: one line per column with its type and
# first values.
str(datos)
## 'data.frame': 87 obs. of 11 variables:
## $ X : int 1 2 3 4 5 6 7 8 9 10 ...
## $ name : Factor w/ 87 levels "Ackbar","Adi Gallia",..: 46 15 62 21 44 54 10 64 12 53 ...
## $ height : int 172 167 96 202 150 178 165 97 183 182 ...
## $ mass : num 77 75 32 136 49 120 75 32 84 77 ...
## $ hair_color: Factor w/ 12 levels "auburn","auburn, grey",..: 5 NA NA 10 7 8 7 NA 4 3 ...
## $ skin_color: Factor w/ 31 levels "blue","blue, grey",..: 7 9 29 28 17 17 17 30 17 7 ...
## $ eye_color : Factor w/ 15 levels "black","blue",..: 2 15 11 15 4 2 2 11 4 3 ...
## $ birth_year: num 19 112 33 41.9 19 52 47 NA 24 57 ...
## $ gender : Factor w/ 4 levels "female","hermaphrodite",..: 3 NA NA 3 1 3 1 NA 3 3 ...
## $ homeworld : Factor w/ 48 levels "Alderaan","Aleen Minor",..: 40 40 28 40 1 40 40 40 40 38 ...
## $ species : Factor w/ 37 levels "Aleena","Besalisk",..: 11 6 6 11 11 11 11 6 11 11 ...
# Per-column summary of the data frame (the NA counts per column are reported
# in the output below).
summary(datos)
## X name height mass
## Min. : 1.0 Ackbar : 1 Min. : 66.0 Min. : 15.00
## 1st Qu.:22.5 Adi Gallia : 1 1st Qu.:167.0 1st Qu.: 55.60
## Median :44.0 Anakin Skywalker : 1 Median :180.0 Median : 79.00
## Mean :44.0 Arvel Crynyd : 1 Mean :174.4 Mean : 97.31
## 3rd Qu.:65.5 Ayla Secura : 1 3rd Qu.:191.0 3rd Qu.: 84.50
## Max. :87.0 Bail Prestor Organa: 1 Max. :264.0 Max. :1358.00
## (Other) :81 NA's :6 NA's :28
## hair_color skin_color eye_color birth_year gender
## none :37 fair :17 brown :21 Min. : 8.00 female :19
## brown :18 light :11 blue :19 1st Qu.: 35.00 hermaphrodite: 1
## black :13 dark : 6 yellow :11 Median : 52.00 male :62
## white : 4 green : 6 black :10 Mean : 87.57 none : 2
## blond : 3 grey : 6 orange : 8 3rd Qu.: 72.00 NA's : 3
## (Other): 7 pale : 5 red : 5 Max. :896.00
## NA's : 5 (Other):36 (Other):13 NA's :44
## homeworld species
## Naboo :11 Human :35
## Tatooine :10 Droid : 5
## Alderaan : 3 Gungan : 3
## Coruscant: 3 Kaminoan: 2
## Kamino : 3 Mirialan: 2
## (Other) :47 (Other) :35
## NA's :10 NA's : 5
Tabla de distribución por género
# Frequency table for the categorical column `gender`.
# The former `breaks = "Sturges"` argument was dropped: class-interval rules
# only apply to numeric data in fdt(); fdt_cat() has no `breaks` parameter.
tabla.frecuencias <- fdt_cat(datos$gender)
tabla.frecuencias
## Category f rf rf(%) cf cf(%)
## male 62 0.74 73.81 62 73.81
## female 19 0.23 22.62 81 96.43
## none 2 0.02 2.38 83 98.81
## hermaphrodite 1 0.01 1.19 84 100.00
Tabla de distribución por planeta
# Frequency table for the categorical column `homeworld`.
# The former `breaks = "Sturges"` argument was dropped: class-interval rules
# only apply to numeric data in fdt(); fdt_cat() has no `breaks` parameter.
tabla.frecuencias <- fdt_cat(datos$homeworld)
tabla.frecuencias
## Category f rf rf(%) cf cf(%)
## Naboo 11 0.14 14.29 11 14.29
## Tatooine 10 0.13 12.99 21 27.27
## Alderaan 3 0.04 3.90 24 31.17
## Coruscant 3 0.04 3.90 27 35.06
## Kamino 3 0.04 3.90 30 38.96
## Corellia 2 0.03 2.60 32 41.56
## Kashyyyk 2 0.03 2.60 34 44.16
## Mirial 2 0.03 2.60 36 46.75
## Ryloth 2 0.03 2.60 38 49.35
## Aleen Minor 1 0.01 1.30 39 50.65
## Bespin 1 0.01 1.30 40 51.95
## Bestine IV 1 0.01 1.30 41 53.25
## Cato Neimoidia 1 0.01 1.30 42 54.55
## Cerea 1 0.01 1.30 43 55.84
## Champala 1 0.01 1.30 44 57.14
## Chandrila 1 0.01 1.30 45 58.44
## Concord Dawn 1 0.01 1.30 46 59.74
## Dathomir 1 0.01 1.30 47 61.04
## Dorin 1 0.01 1.30 48 62.34
## Endor 1 0.01 1.30 49 63.64
## Eriadu 1 0.01 1.30 50 64.94
## Geonosis 1 0.01 1.30 51 66.23
## Glee Anselm 1 0.01 1.30 52 67.53
## Haruun Kal 1 0.01 1.30 53 68.83
## Iktotch 1 0.01 1.30 54 70.13
## Iridonia 1 0.01 1.30 55 71.43
## Kalee 1 0.01 1.30 56 72.73
## Malastare 1 0.01 1.30 57 74.03
## Mon Cala 1 0.01 1.30 58 75.32
## Muunilinst 1 0.01 1.30 59 76.62
## Nal Hutta 1 0.01 1.30 60 77.92
## Ojom 1 0.01 1.30 61 79.22
## Quermia 1 0.01 1.30 62 80.52
## Rodia 1 0.01 1.30 63 81.82
## Serenno 1 0.01 1.30 64 83.12
## Shili 1 0.01 1.30 65 84.42
## Skako 1 0.01 1.30 66 85.71
## Socorro 1 0.01 1.30 67 87.01
## Stewjon 1 0.01 1.30 68 88.31
## Sullust 1 0.01 1.30 69 89.61
## Toydaria 1 0.01 1.30 70 90.91
## Trandosha 1 0.01 1.30 71 92.21
## Troiken 1 0.01 1.30 72 93.51
## Tund 1 0.01 1.30 73 94.81
## Umbara 1 0.01 1.30 74 96.10
## Utapau 1 0.01 1.30 75 97.40
## Vulpter 1 0.01 1.30 76 98.70
## Zolan 1 0.01 1.30 77 100.00
Tabla de distribución por especie
# Frequency table for the categorical column `species`.
# The former `breaks = "Sturges"` argument was dropped: class-interval rules
# only apply to numeric data in fdt(); fdt_cat() has no `breaks` parameter.
tabla.frecuencias <- fdt_cat(datos$species)
tabla.frecuencias
## Category f rf rf(%) cf cf(%)
## Human 35 0.43 42.68 35 42.68
## Droid 5 0.06 6.10 40 48.78
## Gungan 3 0.04 3.66 43 52.44
## Kaminoan 2 0.02 2.44 45 54.88
## Mirialan 2 0.02 2.44 47 57.32
## Twi'lek 2 0.02 2.44 49 59.76
## Wookiee 2 0.02 2.44 51 62.20
## Zabrak 2 0.02 2.44 53 64.63
## Aleena 1 0.01 1.22 54 65.85
## Besalisk 1 0.01 1.22 55 67.07
## Cerean 1 0.01 1.22 56 68.29
## Chagrian 1 0.01 1.22 57 69.51
## Clawdite 1 0.01 1.22 58 70.73
## Dug 1 0.01 1.22 59 71.95
## Ewok 1 0.01 1.22 60 73.17
## Geonosian 1 0.01 1.22 61 74.39
## Hutt 1 0.01 1.22 62 75.61
## Iktotchi 1 0.01 1.22 63 76.83
## Kaleesh 1 0.01 1.22 64 78.05
## Kel Dor 1 0.01 1.22 65 79.27
## Mon Calamari 1 0.01 1.22 66 80.49
## Muun 1 0.01 1.22 67 81.71
## Nautolan 1 0.01 1.22 68 82.93
## Neimodian 1 0.01 1.22 69 84.15
## Pau'an 1 0.01 1.22 70 85.37
## Quermian 1 0.01 1.22 71 86.59
## Rodian 1 0.01 1.22 72 87.80
## Skakoan 1 0.01 1.22 73 89.02
## Sullustan 1 0.01 1.22 74 90.24
## Tholothian 1 0.01 1.22 75 91.46
## Togruta 1 0.01 1.22 76 92.68
## Toong 1 0.01 1.22 77 93.90
## Toydarian 1 0.01 1.22 78 95.12
## Trandoshan 1 0.01 1.22 79 96.34
## Vulptereen 1 0.01 1.22 80 97.56
## Xexto 1 0.01 1.22 81 98.78
## Yoda's species 1 0.01 1.22 82 100.00
Tabla de distribución de la columna mass
# Frequency table for the numeric column `mass`; the number of class intervals
# is chosen with Sturges' rule.
# na.rm = TRUE: `mass` contains missing values (28 NA's in summary(datos)), so
# their removal is requested explicitly instead of relying on a default.
# NOTE(review): recent fdth releases document na.rm = FALSE as the default for
# fdt() -- confirm against the installed version.
tabla.frecuencias <- fdt(datos$mass, breaks = "Sturges", na.rm = TRUE)
tabla.frecuencias
## Class limits f rf rf(%) cf cf(%)
## [14.85,208.6686) 58 0.98 98.31 58 98.31
## [208.6686,402.4871) 0 0.00 0.00 58 98.31
## [402.4871,596.3057) 0 0.00 0.00 58 98.31
## [596.3057,790.1243) 0 0.00 0.00 58 98.31
## [790.1243,983.9429) 0 0.00 0.00 58 98.31
## [983.9429,1177.761) 0 0.00 0.00 58 98.31
## [1177.761,1371.58) 1 0.02 1.69 59 100.00
# Bar chart of the absolute frequency (f) of each class interval, labelled
# with the interval limits from the frequency table.
barplot(
  height = tabla.frecuencias[["table"]][["f"]],
  names.arg = tabla.frecuencias[["table"]][["Class limits"]]
)
Tabla de distribución de la columna height
# Frequency table for the numeric column `height`; the number of class
# intervals is chosen with Sturges' rule.
# The column is now referenced by its full name: `datos$heigh` only worked
# through partial matching of `$` on data frames, which breaks silently if
# another column starting with "heigh" is ever added (and fails on tibbles).
# na.rm = TRUE: `height` contains missing values (6 NA's in summary(datos)), so
# their removal is requested explicitly instead of relying on a default.
# NOTE(review): recent fdth releases document na.rm = FALSE as the default for
# fdt() -- confirm against the installed version.
tabla.frecuencias <- fdt(datos$height, breaks = "Sturges", na.rm = TRUE)
tabla.frecuencias
## Class limits f rf rf(%) cf cf(%)
## [65.34,90.5025) 3 0.04 3.70 3 3.70
## [90.5025,115.665) 5 0.06 6.17 8 9.88
## [115.665,140.827) 2 0.02 2.47 10 12.35
## [140.827,165.99) 9 0.11 11.11 19 23.46
## [165.99,191.152) 43 0.53 53.09 62 76.54
## [191.152,216.315) 14 0.17 17.28 76 93.83
## [216.315,241.477) 4 0.05 4.94 80 98.77
## [241.477,266.64) 1 0.01 1.23 81 100.00
# Bar chart of the absolute frequency (f) of each class interval, labelled
# with the interval limits from the frequency table.
barplot(
  height = tabla.frecuencias[["table"]][["f"]],
  names.arg = tabla.frecuencias[["table"]][["Class limits"]]
)