Latihan VDE W9

Visualisasi Data Penumpang Titanic

library(dplyr)
## Warning: package 'dplyr' was built under R version 4.4.3
## 
## Attaching package: 'dplyr'
## The following objects are masked from 'package:stats':
## 
##     filter, lag
## The following objects are masked from 'package:base':
## 
##     intersect, setdiff, setequal, union
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 4.4.3
# Load the Titanic passenger data set from a local CSV file.
titanic <- read.csv(file = "C:/Users/user/Downloads/titanic2.csv.csv")

Contoh Visualisasi

Perbandingan Jenis Kelamin Penumpang Titanic

# 1. Bar chart counting the passengers in each Sex category.
ggplot(data = titanic) +
  geom_bar(mapping = aes(x = Sex), fill = "purple") +
  labs(title = "Perbandingan Jenis Kelamin Penumpang")

Perbandingan Data Selamat atau Tidak Berdasarkan Kelas

# 2. Share of each Survived value within every passenger class (Pclass).
# position = "fill" stacks the bars and rescales each one to height 1, so the
# y-axis shows proportions rather than counts. The default axis/legend labels
# ("count", "factor(Pclass)", "factor(Survived)") are replaced so the y-axis
# is not mislabelled and raw code expressions do not leak into the figure.
ggplot(titanic, aes(x = factor(Pclass), fill = factor(Survived))) +
  geom_bar(position = "fill") +
  labs(
    title = "Proporsi Survival berdasarkan Kelas",
    x = "Kelas",
    y = "Proporsi",
    fill = "Survived"
  )

Distribusi Umur Penumpang

# 3. Histogram of passenger ages using 30 bins.
# Age contains missing values (177 rows were dropped in the recorded run);
# na.rm = TRUE removes them silently instead of warning on every render.
ggplot(titanic, aes(x = Age)) +
  geom_histogram(bins = 30, fill = "pink", na.rm = TRUE) +
  labs(title = "Distribusi Umur Penumpang")

Boxplot Umur Penumpang Berdasarkan Status Selamat

# Box plot of Age for each Survived value, with outlier points drawn in red.
# Age contains missing values (177 rows were dropped in the recorded run);
# na.rm = TRUE removes them silently instead of warning on every render.
# Explicit x/fill labels replace the default "factor(Survived)" text.
ggplot(titanic, aes(x = factor(Survived), y = Age, fill = factor(Survived))) +
  geom_boxplot(outlier.color = "red", na.rm = TRUE) +
  labs(title = "Boxplot", x = "Survived", fill = "Survived")

Outlier: umur penumpang yang tidak selamat.

Scatterplot Umur dan Harga Tiket

# Scatter plot of Fare against Age with a fitted linear trend line.
# Rows with missing Age (177 in the recorded run) are dropped by both layers;
# na.rm = TRUE makes that removal silent instead of warning twice per render.
# The smoothing formula is spelled out so geom_smooth() does not have to
# announce the default (y ~ x) it would otherwise pick.
ggplot(titanic, aes(x = Age, y = Fare)) +
  geom_point(na.rm = TRUE) +
  geom_smooth(method = "lm", formula = y ~ x, colour = "blue", na.rm = TRUE) +
  labs(title = "Pengaruh Umur terhadap Harga Tiket")