# Attach pacman with library() so a missing installation stops the script right
# here; require() would only return FALSE and let the p_load() call below fail
# with a less obvious error.
library(pacman)
# Attach mosaic and dplyr through pacman (mosaic first, then dplyr).
p_load(mosaic, dplyr)
# Read the whitespace-separated account data into `df`: the first row holds the
# column names, "NA" marks missing values and "." is the decimal separator.
df <- read.table(
  "http://ansatte.uit.no/oystein.myrland/BED2011/data/saldo.txt",
  header = TRUE, sep = "", na.strings = "NA", dec = "."
)

# Quick inspection of the loaded data. Lines starting with `## ` are the
# console output recorded when the script was run.
# Per-column summary statistics (min, quartiles, mean, max) for all five
# columns: saldo, id, alder, minibank, kjonn.
summary(df)
##      saldo              id            alder          minibank     
##  Min.   :-20373   Min.   :    1   Min.   :15.00   Min.   :-20.00  
##  1st Qu.:  8009   1st Qu.: 8922   1st Qu.:33.00   1st Qu.: 13.00  
##  Median : 13503   Median :17844   Median :39.00   Median : 20.00  
##  Mean   : 13549   Mean   :17844   Mean   :39.58   Mean   : 19.42  
##  3rd Qu.: 19037   3rd Qu.:26766   3rd Qu.:46.00   3rd Qu.: 26.00  
##  Max.   : 52174   Max.   :35687   Max.   :80.00   Max.   : 63.00  
##      kjonn       
##  Min.   :0.0000  
##  1st Qu.:0.0000  
##  Median :1.0000  
##  Mean   :0.5045  
##  3rd Qu.:1.0000  
##  Max.   :1.0000
# First six rows of the data.
head(df)
##      saldo id alder minibank kjonn
## 1  8364.37  1    36       16     1
## 2   -76.09  2    27       13     1
## 3 29307.41  3    33        6     1
## 4  6004.50  4    38       44     1
## 5 -5418.38  5    25       11     1
## 6  7264.75  6    57       23     1
# Last six rows of the data; the final row number shows 35687 observations.
tail(df)
##          saldo    id alder minibank kjonn
## 35682 15557.06 35682    46       21     1
## 35683  6389.66 35683    42        1     0
## 35684 14604.77 35684    29       26     0
## 35685  1130.60 35685    25        7     0
## 35686 11941.11 35686    44       31     0
## 35687 21958.79 35687    42       28     1
# Exercise 1: mean balance over all accounts, computed once on the raw column
# and once through the formula interface.
mean(df[["saldo"]])
## [1] 13548.77
mean(~saldo, data = df)
## [1] 13548.77
# Standard deviation of the balance over all accounts.
sd(~saldo, data = df)
## [1] 8134.177
# Exercise 2: median balance over all accounts.
median(df[["saldo"]])
## [1] 13502.57
# Mean and standard deviation of the balance for men (kjonn == 0).
mean(~ saldo, data = filter(df, kjonn == 0))
## [1] 13602.82
sd(~ saldo, data = filter(df, kjonn == 0))
## [1] 8170.188
# Mean and standard deviation of the balance for women (kjonn == 1).
mean(~ saldo, data = filter(df, kjonn == 1))
## [1] 13495.69
sd(~ saldo, data = filter(df, kjonn == 1))
## [1] 8098.527
# Largest and smallest balance per gender.
# NOTE: an earlier version passed `df$saldo` together with `data = filter(...)`.
# Its recorded results were identical for both genders and equal to the overall
# extremes reported by summary()/quantile(), i.e. the filter had no effect.
# The formula interface evaluates `saldo` inside the filtered data, exactly as
# the per-gender mean()/sd() calls in this script do. The previously recorded
# output came from the unfiltered calls and was removed; re-run to record the
# per-gender values.
# Largest balance among men (kjonn == 0).
max(~saldo, data = filter(df, kjonn == 0))
# Smallest balance among men (kjonn == 0).
min(~saldo, data = filter(df, kjonn == 0))
# Smallest balance among women (kjonn == 1).
min(~saldo, data = filter(df, kjonn == 1))
# Exercise 7: histogram of the balance for both genders combined.
histogram(~ saldo, data = df, main = "Saldo")

# Histogram of the balance for men (kjonn == 0).
histogram(~ saldo, data = filter(df, kjonn == 0), main = "Saldo Menn")

# Histogram of the balance for women (kjonn == 1).
histogram(~ saldo, data = filter(df, kjonn == 1), main = "Saldo Kvinner")

# Quartiles of the balance.
# Number of observations (one balance per row).
nrow(df)
## [1] 35687
# Median balance, i.e. the 50% quantile shown again in the table below.
median(df[["saldo"]])
## [1] 13502.57
# Minimum, lower quartile, median, upper quartile and maximum.
quantile(df[["saldo"]], probs = seq(0, 1, 0.25))
##        0%       25%       50%       75%      100% 
## -20372.64   8008.88  13502.57  19037.35  52174.47
# Share of women/men.
# Number of accounts per gender (0 = men, 1 = women, following the labels used
# elsewhere in this script).
tally(df$kjonn)
## X
##     0     1 
## 17683 18004
# The heading asks for shares, which the raw counts do not show directly;
# format = "proportion" rescales the table to fractions of the total.
tally(~kjonn, data = df, format = "proportion")