df<-read.delim("c:\\R\\Data\\data1.txt")
dim(df)
## [1] 1925 26
head(df);tail(df)
## Q1 Q2 Q3 Q4 Q5 Q6 Q7 Q8 Q9 Q10 Q11 Q12 Q13 Q14 Q15 Q16 Q17 Q18 Q19 Q20 Gender
## 1 4 4 2 3 4 2 2 4 4 4 4 4 4 4 4 4 4 4 4 4 0
## 2 4 4 4 4 4 3 2 4 4 4 4 4 4 4 4 4 3 4 2 1 0
## 3 4 4 4 4 2 4 4 4 4 2 4 4 4 4 3 4 4 4 4 3 0
## 4 5 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 0
## 5 4 4 4 4 4 4 4 4 2 4 4 4 4 4 4 4 4 4 4 4 0
## 6 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 4 0
## EDU BF BM Happiness Peace
## 1 1 3.4 3.2 4.0 4.0
## 2 1 4.0 3.4 4.0 2.8
## 3 2 3.6 3.6 3.8 3.8
## 4 1 4.2 4.0 4.0 4.0
## 5 2 4.0 3.6 4.0 4.0
## 6 1 4.0 4.0 4.0 4.0
## Q1 Q2 Q3 Q4 Q5 Q6 Q7 Q8 Q9 Q10 Q11 Q12 Q13 Q14 Q15 Q16 Q17 Q18 Q19 Q20
## 1920 4 4 3 4 4 2 2 3 4 2 2 4 3 4 4 3 4 4 3 4
## 1921 2 2 2 1 2 2 2 2 2 2 1 3 2 1 3 2 2 2 2 2
## 1922 3 2 2 2 3 1 1 1 1 1 3 3 3 4 4 4 4 5 2 2
## 1923 5 4 4 4 4 2 2 2 2 3 3 4 3 4 3 3 3 4 4 4
## 1924 4 4 4 2 2 4 2 4 4 3 3 2 3 4 3 4 4 4 3 4
## 1925 3 3 1 1 2 1 1 1 1 1 4 4 3 2 2 3 4 4 3 2
## Gender EDU BF BM Happiness Peace
## 1920 1 3 3.8 2.6 3.4 3.6
## 1921 1 2 1.8 2.0 2.0 2.0
## 1922 0 2 2.4 1.0 3.4 3.4
## 1923 0 2 4.2 2.2 3.4 3.6
## 1924 1 2 3.2 3.4 3.0 3.8
## 1925 0 3 2.0 1.0 3.0 3.2
str(df)
## 'data.frame': 1925 obs. of 26 variables:
## $ Q1 : int 4 4 4 5 4 4 4 4 4 4 ...
## $ Q2 : int 4 4 4 4 4 4 2 2 4 4 ...
## $ Q3 : int 2 4 4 4 4 4 4 4 4 2 ...
## $ Q4 : int 3 4 4 4 4 4 4 4 4 2 ...
## $ Q5 : int 4 4 2 4 4 4 4 4 2 4 ...
## $ Q6 : int 2 3 4 4 4 4 4 4 1 2 ...
## $ Q7 : int 2 2 4 4 4 4 4 4 3 4 ...
## $ Q8 : int 4 4 4 4 4 4 5 5 2 2 ...
## $ Q9 : int 4 4 4 4 2 4 5 5 3 4 ...
## $ Q10 : int 4 4 2 4 4 4 5 5 2 4 ...
## $ Q11 : int 4 4 4 4 4 4 5 5 4 4 ...
## $ Q12 : int 4 4 4 4 4 4 5 5 3 4 ...
## $ Q13 : int 4 4 4 4 4 4 5 5 4 4 ...
## $ Q14 : int 4 4 4 4 4 4 5 5 5 4 ...
## $ Q15 : int 4 4 3 4 4 4 4 2 3 4 ...
## $ Q16 : int 4 4 4 4 4 4 5 2 4 4 ...
## $ Q17 : int 4 3 4 4 4 4 2 2 4 4 ...
## $ Q18 : int 4 4 4 4 4 4 4 4 4 4 ...
## $ Q19 : int 4 2 4 4 4 4 4 2 4 2 ...
## $ Q20 : int 4 1 3 4 4 4 4 2 4 2 ...
## $ Gender : int 0 0 0 0 0 0 0 0 1 0 ...
## $ EDU : int 1 1 2 1 2 1 1 1 4 3 ...
## $ BF : num 3.4 4 3.6 4.2 4 4 3.6 3.6 3.6 3.2 ...
## $ BM : num 3.2 3.4 3.6 4 3.6 4 4.6 4.6 2.2 3.2 ...
## $ Happiness: num 4 4 3.8 4 4 4 4.8 4.4 3.8 4 ...
## $ Peace : num 4 2.8 3.8 4 4 4 3.8 2.4 4 3.2 ...
summary(df)
## Q1 Q2 Q3 Q4
## Min. :1.000 Min. :1.000 Min. :1.000 Min. :1.000
## 1st Qu.:3.000 1st Qu.:3.000 1st Qu.:2.000 1st Qu.:2.000
## Median :4.000 Median :3.000 Median :3.000 Median :3.000
## Mean :3.536 Mean :3.291 Mean :2.928 Mean :3.061
## 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000
## Max. :5.000 Max. :5.000 Max. :5.000 Max. :5.000
## Q5 Q6 Q7 Q8
## Min. :1.000 Min. :1.000 Min. :1.000 Min. :1.000
## 1st Qu.:2.000 1st Qu.:2.000 1st Qu.:2.000 1st Qu.:2.000
## Median :3.000 Median :3.000 Median :3.000 Median :3.000
## Mean :3.041 Mean :2.796 Mean :3.086 Mean :3.049
## 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000
## Max. :5.000 Max. :5.000 Max. :5.000 Max. :5.000
## Q9 Q10 Q11 Q12 Q13
## Min. :1.000 Min. :1.000 Min. :1.00 Min. :1.000 Min. :1.000
## 1st Qu.:2.000 1st Qu.:2.000 1st Qu.:3.00 1st Qu.:3.000 1st Qu.:3.000
## Median :3.000 Median :3.000 Median :4.00 Median :4.000 Median :4.000
## Mean :3.066 Mean :2.883 Mean :3.47 Mean :3.421 Mean :3.588
## 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.00 3rd Qu.:4.000 3rd Qu.:4.000
## Max. :5.000 Max. :5.000 Max. :5.00 Max. :5.000 Max. :5.000
## Q14 Q15 Q16 Q17
## Min. :1.000 Min. :1.000 Min. :1.000 Min. :1.000
## 1st Qu.:3.000 1st Qu.:3.000 1st Qu.:3.000 1st Qu.:3.000
## Median :4.000 Median :4.000 Median :4.000 Median :4.000
## Mean :3.716 Mean :3.542 Mean :3.791 Mean :3.516
## 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000
## Max. :5.000 Max. :5.000 Max. :5.000 Max. :5.000
## Q18 Q19 Q20 Gender
## Min. :1.000 Min. :1.000 Min. :1.000 Min. :0.0000
## 1st Qu.:4.000 1st Qu.:3.000 1st Qu.:3.000 1st Qu.:0.0000
## Median :4.000 Median :3.000 Median :3.000 Median :0.0000
## Mean :3.804 Mean :3.364 Mean :3.349 Mean :0.4099
## 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:4.000 3rd Qu.:1.0000
## Max. :5.000 Max. :5.000 Max. :5.000 Max. :1.0000
## EDU BF BM Happiness
## Min. :1.000 Min. :1.000 Min. :1.000 Min. :1.400
## 1st Qu.:2.000 1st Qu.:2.600 1st Qu.:2.400 1st Qu.:3.000
## Median :3.000 Median :3.200 Median :3.000 Median :3.600
## Mean :2.616 Mean :3.172 Mean :2.976 Mean :3.547
## 3rd Qu.:3.000 3rd Qu.:3.800 3rd Qu.:3.600 3rd Qu.:4.000
## Max. :4.000 Max. :5.000 Max. :5.000 Max. :5.000
## Peace
## Min. :1.200
## 1st Qu.:3.200
## Median :3.600
## Mean :3.564
## 3rd Qu.:4.000
## Max. :5.000
df1<-df[,c(21:26)]
summary(df1)
## Gender EDU BF BM
## Min. :0.0000 Min. :1.000 Min. :1.000 Min. :1.000
## 1st Qu.:0.0000 1st Qu.:2.000 1st Qu.:2.600 1st Qu.:2.400
## Median :0.0000 Median :3.000 Median :3.200 Median :3.000
## Mean :0.4099 Mean :2.616 Mean :3.172 Mean :2.976
## 3rd Qu.:1.0000 3rd Qu.:3.000 3rd Qu.:3.800 3rd Qu.:3.600
## Max. :1.0000 Max. :4.000 Max. :5.000 Max. :5.000
## Happiness Peace
## Min. :1.400 Min. :1.200
## 1st Qu.:3.000 1st Qu.:3.200
## Median :3.600 Median :3.600
## Mean :3.547 Mean :3.564
## 3rd Qu.:4.000 3rd Qu.:4.000
## Max. :5.000 Max. :5.000
attach(df1)
mean(Happiness)
## [1] 3.547065
t.test(Happiness, Peace, paired = TRUE)
##
## Paired t-test
##
## data: Happiness and Peace
## t = -1.1468, df = 1924, p-value = 0.2516
## alternative hypothesis: true difference in means is not equal to 0
## 95 percent confidence interval:
## -0.04660127 0.01221166
## sample estimates:
## mean of the differences
## -0.01719481
wilcox.test(Happiness, mu=3.5)
##
## Wilcoxon signed rank test with continuity correction
##
## data: Happiness
## V = 1029154, p-value = 2.782e-06
## alternative hypothesis: true location is not equal to 3.5
options(scipen=999)
wilcox.test(Happiness-Peace)
##
## Wilcoxon signed rank test with continuity correction
##
## data: Happiness - Peace
## V = 596154, p-value = 0.3322
## alternative hypothesis: true location is not equal to 0
library(ggplot2)
library(gapminder)
library(tidyverse)
## -- Attaching packages --------------------------------------- tidyverse 1.3.1 --
## v tibble 3.1.6 v dplyr 1.0.8
## v tidyr 1.2.0 v stringr 1.4.0
## v readr 2.1.2 v forcats 0.5.1
## v purrr 0.3.4
## -- Conflicts ------------------------------------------ tidyverse_conflicts() --
## x dplyr::filter() masks stats::filter()
## x dplyr::lag() masks stats::lag()
library(ggplot2)
ggplot(gapminder, aes(x=gdpPercap, y=lifeExp, col=continent))+geom_point() + scale_x_log10()

ggplot(gapminder, aes(x=gdpPercap, y=lifeExp, col=continent, size=pop))+geom_point() + scale_x_log10()

ggplot(gapminder, aes(x=gdpPercap, y=lifeExp, col=continent, size=pop))+geom_point(alpha=0.5) + scale_x_log10()

ggplot(gapminder, aes(x=gdpPercap, y=lifeExp, col=continent, size=pop))+geom_point(alpha=0.5) + scale_x_log10() + facet_wrap(~year)
