ANALISIS DEMOGRAFI_TUGAS 2
#baca data
demografi <- read.csv("D:/KULIAH UIN/SMT 2/MACHINE LEARNING/tugas 2/P2-Demographic-Data.csv")
head(demografi)
## Country.Name Country.Code Birth.rate Internet.users
## 1 Aruba ABW 10.244 78.9
## 2 Afghanistan AFG 35.253 5.9
## 3 Angola AGO 45.985 19.1
## 4 Albania ALB 12.877 57.2
## 5 United Arab Emirates ARE 11.044 88.0
## 6 Argentina ARG 17.716 59.9
## Income.Group
## 1 High income
## 2 Low income
## 3 Upper middle income
## 4 Upper middle income
## 5 High income
## 6 High income
summary(demografi)
## Country.Name Country.Code Birth.rate Internet.users
## Length:195 Length:195 Min. : 7.90 Min. : 0.90
## Class :character Class :character 1st Qu.:12.12 1st Qu.:14.52
## Mode :character Mode :character Median :19.68 Median :41.00
## Mean :21.47 Mean :42.08
## 3rd Qu.:29.76 3rd Qu.:66.22
## Max. :49.66 Max. :96.55
## Income.Group
## Length:195
## Class :character
## Mode :character
##
##
##
#Data dengan Angka Kelahiran di atas 2
filter_br <- demografi$Birth.rate > 2
head(demografi[filter_br,])
## Country.Name Country.Code Birth.rate Internet.users
## 1 Aruba ABW 10.244 78.9
## 2 Afghanistan AFG 35.253 5.9
## 3 Angola AGO 45.985 19.1
## 4 Albania ALB 12.877 57.2
## 5 United Arab Emirates ARE 11.044 88.0
## 6 Argentina ARG 17.716 59.9
## Income.Group
## 1 High income
## 2 Low income
## 3 Upper middle income
## 4 Upper middle income
## 5 High income
## 6 High income
head(demografi[demografi$Birth.rate > 40,])
## Country.Name Country.Code Birth.rate Internet.users Income.Group
## 3 Angola AGO 45.985 19.1 Upper middle income
## 12 Burundi BDI 44.151 1.3 Low income
## 15 Burkina Faso BFA 40.551 9.1 Low income
## 66 Gambia, The GMB 42.525 14.0 Low income
## 116 Mali MLI 44.138 3.5 Low income
## 128 Niger NER 49.661 1.7 Low income
head(demografi[demografi$Income.Group == "High income",])
## Country.Name Country.Code Birth.rate Internet.users Income.Group
## 1 Aruba ABW 10.244 78.9000 High income
## 5 United Arab Emirates ARE 11.044 88.0000 High income
## 6 Argentina ARG 17.716 59.9000 High income
## 8 Antigua and Barbuda ATG 16.447 63.4000 High income
## 9 Australia AUS 13.200 83.0000 High income
## 10 Austria AUT 9.400 80.6188 High income
MENCARI BERDASARKAN NEGARA
head(demografi[demografi$Country.Code == "AFG ",])
## [1] Country.Name Country.Code Birth.rate Internet.users Income.Group
## <0 rows> (or 0-length row.names)
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 4.0.5
qplot(data = demografi, x=Internet.users, y = Birth.rate, size=I(4), colour=I("blue"))
#
qplot(data = demografi, x=Internet.users, y = Birth.rate, size=I(3), colour=Income.Group)
Berdasarkan Negara
#Scatter Plot antara Pengguna.Internet & Angka.Kelahiran dan dikategorikan berdasarkan Wilayah Negara
qplot(data = demografi, x= Internet.users, y= Birth.rate, size=I(3), colour=Country.Name)
A. Membuat Scatter Plot dengan Kategori Berdasarkan Wilayah Negara
Country.Code <- c("ABW","AFG","AGO","ALB","ARE","ARG","ARM","ATG","AUS","AUT","AZE","BDI","BEL","BEN","BFA","BGD","BGR","BHR","BHS","BIH","BLR","BLZ","BMU","BOL","BRA","BRB","BRN","BTN","BWA","CAF","CAN","CHE","CHL","CHN","CIV","CMR","COG","COL","COM","CPV","CRI","CUB","CYM","CYP","CZE","DEU","DJI","DNK","DOM","DZA","ECU","EGY","ERI","ESP","EST","ETH","FIN","FJI","FRA","FSM","GAB","GBR","GEO","GHA","GIN","GMB","GNB","GNQ","GRC","GRD","GRL","GTM","GUM","GUY","HKG","HND","HRV","HTI","HUN","IDN","IND","IRL","IRN","IRQ","ISL","ISR","ITA","JAM","JOR","JPN","KAZ","KEN","KGZ","KHM","KIR","KOR","KWT","LAO","LBN","LBR","LBY","LCA","LIE","LKA","LSO","LTU","LUX","LVA","MAC","MAR","MDA","MDG","MDV","MEX","MKD","MLI","MLT","MMR","MNE","MNG","MOZ","MRT","MUS","MWI","MYS","NAM","NCL","NER","NGA","NIC","NLD","NOR","NPL","NZL","OMN","PAK","PAN","PER","PHL","PNG","POL","PRI","PRT","PRY","PYF","QAT","ROU","RUS","RWA","SAU","SDN","SEN","SGP","SLB","SLE","SLV","SOM","SRB","SSD","STP","SUR","SVK","SVN","SWE","SWZ","SYC","SYR","TCD","TGO","THA","TJK","TKM","TLS","TON","TTO","TUN","TUR","TZA","UGA","UKR","URY","USA","UZB","VCT","VEN","VIR","VNM","VUT","PSE","WSM","YEM","ZAF","COD","ZMB","ZWE")
Country.Name <- c("Amerika","Asia","Afrika","Eropa","Middle East","Amerika","Asia","Amerika","Oceania","Eropa","Asia","Afrika","Eropa","Afrika","Afrika","Asia","Eropa","Middle East","Amerika","Eropa","Eropa","Amerika","Amerika","Amerika","Amerika","Amerika","Asia","Asia","Afrika","Afrika","Amerika","Eropa","Amerika","Asia","Afrika","Afrika","Afrika","Amerika","Afrika","Afrika","Amerika","Amerika","Amerika","Eropa","Eropa","Eropa","Afrika","Eropa","Amerika","Afrika","Amerika","Afrika","Afrika","Eropa","Eropa","Afrika","Eropa","Oceania","Eropa","Oceania","Afrika","Eropa","Asia","Afrika","Afrika","Afrika","Afrika","Afrika","Eropa","Amerika","Amerika","Amerika","Oceania","Amerika","Asia","Amerika","Eropa","Amerika","Eropa","Asia","Asia","Eropa","Middle East","Middle East","Eropa","Middle East","Eropa","Amerika","Middle East","Asia","Asia","Afrika","Asia","Asia","Oceania","Asia","Middle East","Asia","Middle East","Afrika","Afrika","Amerika","Eropa","Asia","Afrika","Eropa","Eropa","Eropa","Asia","Afrika","Eropa","Afrika","Asia","Amerika","Eropa","Afrika","Eropa","Asia","Eropa","Asia","Afrika","Afrika","Afrika","Afrika","Asia","Afrika","Oceania","Afrika","Afrika","Amerika","Eropa","Eropa","Asia","Oceania","Middle East","Asia","Amerika","Amerika","Asia","Oceania","Eropa","Amerika","Eropa","Amerika","Oceania","Middle East","Eropa","Eropa","Afrika","Middle East","Afrika","Afrika","Asia","Oceania","Afrika","Amerika","Afrika","Eropa","Afrika","Afrika","Amerika","Eropa","Eropa","Eropa","Afrika","Afrika","Middle East","Afrika","Afrika","Asia","Asia","Asia","Asia","Oceania","Amerika","Afrika","Eropa","Afrika","Afrika","Eropa","Amerika","Amerika","Asia","Amerika","Amerika","Amerika","Asia","Oceania","Middle East","Oceania","Middle East","Afrika","Afrika","Afrika","Afrika")
# Membuat Data Frame
dataset_demographic <- data.frame(Country.Code, Country.Name)
head(dataset_demographic)
## Country.Code Country.Name
## 1 ABW Amerika
## 2 AFG Asia
## 3 AGO Afrika
## 4 ALB Eropa
## 5 ARE Middle East
## 6 ARG Amerika
MENYATUKAN 2 DATA : DI ATAS
merge_dataset <- merge(demografi, dataset_demographic, by.x="Country.Code", by.y ="Country.Code")
head(merge_dataset)
## Country.Code Country.Name.x Birth.rate Internet.users
## 1 ABW Aruba 10.244 78.9
## 2 AFG Afghanistan 35.253 5.9
## 3 AGO Angola 45.985 19.1
## 4 ALB Albania 12.877 57.2
## 5 ARE United Arab Emirates 11.044 88.0
## 6 ARG Argentina 17.716 59.9
## Income.Group Country.Name.y
## 1 High income Amerika
## 2 Low income Asia
## 3 Upper middle income Afrika
## 4 Upper middle income Eropa
## 5 High income Middle East
## 6 High income Amerika
B. Scatter Plot Angka Kelahiran dan Pengguna Internet Berdasarkan Wilayah Negara.
scatterplot2 <- ggplot(merge_dataset, aes(x = Birth.rate, y = Internet.users, shape = Country.Name, color=Country.Name))+
geom_point()
scatterplot2