require(pacman)
## Loading required package: pacman
p_load(mosaic,dplyr)
# Download the account-balance data set from the course server.
# The file is whitespace-separated, has one header row, uses "." as the
# decimal mark and "NA" for missing values.
df <- read.table(
  file = "http://ansatte.uit.no/oystein.myrland/BED2011/data/saldo.txt",
  header = TRUE,
  sep = "",
  dec = ".",
  na.strings = "NA"
)
# Quick look at the data: per-column summary, then the first and last six rows.
# Lines starting with "##" are the console output recorded when the script ran.
summary(object = df)
## saldo id alder minibank
## Min. :-20373 Min. : 1 Min. :15.00 Min. :-20.00
## 1st Qu.: 8009 1st Qu.: 8922 1st Qu.:33.00 1st Qu.: 13.00
## Median : 13503 Median :17844 Median :39.00 Median : 20.00
## Mean : 13549 Mean :17844 Mean :39.58 Mean : 19.42
## 3rd Qu.: 19037 3rd Qu.:26766 3rd Qu.:46.00 3rd Qu.: 26.00
## Max. : 52174 Max. :35687 Max. :80.00 Max. : 63.00
## kjonn
## Min. :0.0000
## 1st Qu.:0.0000
## Median :1.0000
## Mean :0.5045
## 3rd Qu.:1.0000
## Max. :1.0000
head(df, n = 6L)
## saldo id alder minibank kjonn
## 1 8364.37 1 36 16 1
## 2 -76.09 2 27 13 1
## 3 29307.41 3 33 6 1
## 4 6004.50 4 38 44 1
## 5 -5418.38 5 25 11 1
## 6 7264.75 6 57 23 1
tail(df, n = 6L)
## saldo id alder minibank kjonn
## 35682 15557.06 35682 46 21 1
## 35683 6389.66 35683 42 1 0
## 35684 14604.77 35684 29 26 0
## 35685 1130.60 35685 25 7 0
## 35686 11941.11 35686 44 31 0
## 35687 21958.79 35687 42 28 1
# Mean balance and its standard deviation over the whole sample (exercise 1).
# The first call is the plain vector form. The next two use mosaic's formula
# interface: `data = df` only has an effect when the first argument is a
# formula, so it must not be combined with an already-extracted `df$saldo`.
mean(df$saldo)
## [1] 13548.77
mean(~saldo, data = df)
## [1] 13548.77
sd(~saldo, data = df)
## [1] 8134.177
# Median balance over the whole sample (exercise 2)
median(df$saldo)
## [1] 13502.57
# Per-gender statistics of the balance.
# Gender coding as labelled in this script: kjonn == 0 is men, kjonn == 1 is
# women. kjonn is numeric, so it is compared with numbers rather than strings.
# The subsets are built once so every statistic below uses the same rows.
menn <- filter(df, kjonn == 0)
kvinner <- filter(df, kjonn == 1)

# Mean balance and standard deviation, men
mean(~saldo, data = menn)
## [1] 13602.82
sd(~saldo, data = menn)
## [1] 8170.188
# Mean balance and standard deviation, women
mean(~saldo, data = kvinner)
## [1] 13495.69
sd(~saldo, data = kvinner)
## [1] 8098.527
# Largest balance, men.
# The formula `~saldo` is required here: passing `df$saldo` together with
# `data =` evaluates the full column and silently ignores the filtered data.
max(~saldo, data = menn)
## (re-run to record output; the earlier 52174.47 was the whole-sample maximum)
# Smallest balance, men and then women
min(~saldo, data = menn)
## (re-run to record output; the earlier -20372.64 was the whole-sample minimum)
min(~saldo, data = kvinner)
## (re-run to record output; the earlier -20372.64 was the whole-sample minimum)
# Histogram of the balance, both genders (exercise 7)
histogram(
  ~saldo,
  data = df,
  main = "Saldo"
)

# Histogram of the balance, men (rows with kjonn equal to 0)
histogram(
  ~saldo,
  data = filter(df, kjonn == "0"),
  main = "Saldo Menn"
)

# Histogram of the balance, women (rows with kjonn equal to 1)
histogram(
  ~saldo,
  data = filter(df, kjonn == "1"),
  main = "Saldo Kvinner"
)

# Quartiles of the balance: number of observations, the median, and the
# default five-point quantiles (0%, 25%, 50%, 75%, 100%).
nrow(df)
## [1] 35687
median(df[["saldo"]])
## [1] 13502.57
quantile(df[["saldo"]])
## 0% 25% 50% 75% 100%
## -20372.64 8008.88 13502.57 19037.35 52174.47
# Number of observations per gender code (kjonn). These are counts, not
# shares; divide by nrow(df) to obtain the share of each gender.
# The formula interface keeps the variable name as the table label, whereas
# passing the bare vector df$kjonn labels the table with a generic "X".
tally(~kjonn, data = df)
## kjonn
## 0 1
## 17683 18004