Haven
Haven contains functions that let R import SPSS, SAS, Stata, and
other foreign files.
Documentation can be viewed here
# Check whether haven is already installed; install it only when missing.
# requireNamespace() tests availability without attaching the package.
if (!requireNamespace("haven", quietly = TRUE)) {
  # If it's not installed, tell R to install it (with its dependencies).
  install.packages("haven", dependencies = TRUE)
}
# Whether it was already there or has just been installed, load it.
# library() stops with an error if the package still cannot be loaded.
library(haven)
Tidyverse
Tidyverse contains many functions useful for cleaning, tidying, and
manipulating data.
Documentation can be viewed here
# Install tidyverse only when it is missing, then attach it.
# requireNamespace() tests availability without attaching the package.
if (!requireNamespace("tidyverse", quietly = TRUE)) {
  install.packages("tidyverse", dependencies = TRUE)
}
# library() stops with an error if the package still cannot be loaded.
library(tidyverse)
psych
psych provides useful functions for summarizing and visualizing
data
Documentation can be viewed here
# Install psych only when it is missing, then attach it.
# requireNamespace() tests availability without attaching the package.
if (!requireNamespace("psych", quietly = TRUE)) {
  install.packages("psych", dependencies = TRUE)
}
# Use library() rather than require(): require() only warns and returns
# FALSE when loading fails, so a failed install would go unnoticed until a
# psych function is first called.
library(psych)
corrr
quick and easy correlations
Documentation can be viewed here
# Install corrr only when it is missing, then attach it.
# requireNamespace() tests availability without attaching the package.
if (!requireNamespace("corrr", quietly = TRUE)) {
  install.packages("corrr", dependencies = TRUE)
}
# Use library() rather than require(): require() only warns and returns
# FALSE when loading fails, so a failed install would go unnoticed until a
# corrr function is first called.
library(corrr)
GGally
quick and easy correlation plots (e.g., the ggpairs() plot matrix)
Documentation can be viewed here
# Install GGally only when it is missing, then attach it.
# requireNamespace() tests availability without attaching the package.
if (!requireNamespace("GGally", quietly = TRUE)) {
  install.packages("GGally", dependencies = TRUE)
}
# Use library() rather than require(): require() only warns and returns
# FALSE when loading fails, so a failed install would go unnoticed until a
# GGally function is first called.
library(GGally)
Import an SPSS file
Use the read_sav() function from the Haven package to import an SPSS
file into R.
Documentation can be viewed here
# Download the SPSS (.sav) file from OSF and read it into `dataset`.
dataset <- read_sav(file = "https://osf.io/98mt6/download")
Clean dataset
View dataset
Use the View() function to look at your dataset like you would in
SPSS or Excel
Documentation can be viewed here
# Uncomment the next line to open the data viewer in an interactive session.
# View(dataset)
View questions or ‘labels’
This is useful if you used haven to import an SPSS file created by
Qualtrics
Documentation can be viewed here
# For every column, pull out its "label" attribute (the question text that
# haven attaches on import); columns without a label yield NULL.
map(dataset, function(column) attr(column, "label"))
Remove columns
Use the select() function to de-select a column.
Put ‘-’ before the column name to remove a column (you can list more
than one column).
Just type the column name to keep only that column (you can list more
than one column).
Documentation can be viewed here
# Drop the IPAddress column and keep everything else.
dataset <- dataset %>%
  select(-IPAddress)
Remove practice runs
Use the slice() function to remove rows.
Put the range of rows you’d like to remove with minus signs in
front.
Documentation can be viewed here
# Remove the first three rows (the practice runs); negative positions in
# slice() mean "drop these rows".
dataset <- dataset %>%
  slice(-(1:3))
Recode variables
Use the tidyverse, mutate, and case_when to recode variables
Documentation can be viewed here
Recode to a factor
# Recode the numeric CoinFlip codes (1 = "Heads", 2 = "Tails") into a factor.
# case_when() on its own returns a character vector, so the result is wrapped
# in factor() to make the new column an actual factor with a fixed level
# order. Any CoinFlip value other than 1 or 2 becomes NA.
dataset <- dataset %>%
  mutate(
    CoinFlipFactor = factor(
      case_when(
        CoinFlip == 1 ~ "Heads",
        CoinFlip == 2 ~ "Tails"
      ),
      levels = c("Heads", "Tails")
    )
  )
Recode to a dummy variable
# Build a 0/1 indicator for heads: 1 when CoinFlip is 1, 0 when it is 2,
# and NA for any other value.
dataset <- mutate(
  dataset,
  FlipHeadsDummy = case_when(
    CoinFlip == 1 ~ 1,
    CoinFlip == 2 ~ 0
  )
)
Summarize variables
Use the describe() function of the psych package to summarize
data
Documentation can be viewed here
# Pick the variables to summarize, then hand them to psych's describe().
describe(select(dataset, CoinFlip, FFM_5, Potter3))
Create Composite Variable
Psych
Documentation can be viewed here
Agreeableness
# Collect the nine items that make up the Agreeableness scale.
Agreeableness <- data.frame(
  dataset$FFM_2, dataset$FFM_7, dataset$FFM_12,
  dataset$FFM_17, dataset$FFM_22, dataset$FFM_27,
  dataset$FFM_32, dataset$FFM_37, dataset$FFM_42
)
# Scoring key: the numbers are column positions in the data frame above;
# a minus sign marks an item as reverse-keyed.
Agreeableness.keys <- make.keys(
  Agreeableness,
  list(Agreeableness = c(-1, 2, -3, 4, 5, -6, 7, -8, 9))
)
# Score the items with the key and keep the per-respondent scores.
Agreeableness.scales <- scoreItems(Agreeableness.keys, Agreeableness)
Agreeableness.scores <- Agreeableness.scales$scores
# `[, ]` drops the score matrix (one scale, so presumably one column) to a
# plain vector before it is stored in the dataset.
dataset$Agreeableness <- Agreeableness.scores[, ]
# Print the alpha reliability reported for the scale.
Agreeableness.scales$alpha
Conscientiousness
# Collect the nine items that make up the Conscientiousness scale.
Conscientiousness <- data.frame(
  dataset$FFM_3, dataset$FFM_8, dataset$FFM_13,
  dataset$FFM_18, dataset$FFM_23, dataset$FFM_28,
  dataset$FFM_33, dataset$FFM_38, dataset$FFM_43
)
# Scoring key: the numbers are column positions in the data frame above;
# a minus sign marks an item as reverse-keyed.
my.keys <- make.keys(
  Conscientiousness,
  list(Conscientiousness = c(1, -2, 3, -4, -5, 6, 7, 8, -9))
)
# Score the items with the key and keep the per-respondent scores.
my.scales <- scoreItems(my.keys, Conscientiousness)
my.scores <- my.scales$scores
# `[, ]` drops the score matrix (one scale, so presumably one column) to a
# plain vector before it is stored in the dataset.
dataset$Conscientiousness <- my.scores[, ]
# Print the alpha reliability reported for the scale.
my.scales$alpha
Neuroticism
# Collect the eight items that make up the Neuroticism scale.
Neuroticism <- data.frame(
  dataset$FFM_4, dataset$FFM_9, dataset$FFM_14,
  dataset$FFM_19, dataset$FFM_24, dataset$FFM_29,
  dataset$FFM_34, dataset$FFM_39
)
# Scoring key: the numbers are column positions in the data frame above;
# a minus sign marks an item as reverse-keyed.
my.keys <- make.keys(
  Neuroticism,
  list(Neuroticism = c(1, -2, 3, 4, -5, 6, -7, 8))
)
# Score the items with the key and keep the per-respondent scores.
my.scales <- scoreItems(my.keys, Neuroticism)
my.scores <- my.scales$scores
# `[, ]` drops the score matrix (one scale, so presumably one column) to a
# plain vector before it is stored in the dataset.
dataset$Neuroticism <- my.scores[, ]
# Print the alpha reliability reported for the scale.
my.scales$alpha
Openness
# Collect the ten items that make up the Openness scale.
Openness <- data.frame(
  dataset$FFM_5, dataset$FFM_10, dataset$FFM_15,
  dataset$FFM_20, dataset$FFM_25, dataset$FFM_30,
  dataset$FFM_35, dataset$FFM_40, dataset$FFM_41,
  dataset$FFM_44
)
# Scoring key: the numbers are column positions in the data frame above;
# a minus sign marks an item as reverse-keyed.
my.keys <- make.keys(
  Openness,
  list(Openness = c(1, 2, 3, 4, 5, 6, -7, 8, -9, 10))
)
# Score the items with the key and keep the per-respondent scores.
my.scales <- scoreItems(my.keys, Openness)
my.scores <- my.scales$scores
# `[, ]` drops the score matrix (one scale, so presumably one column) to a
# plain vector before it is stored in the dataset.
dataset$Openness <- my.scores[, ]
# Print the alpha reliability reported for the scale.
my.scales$alpha
Tidyverse
Documentation can be viewed here
and here
# Compute extraversion as the per-respondent mean of its eight items.
# Items 6, 21 and 31 are reverse-scored by subtracting them from 6.
# NOTE(review): the `6 - x` reversal presumably assumes a 1-5 response
# scale - confirm against the questionnaire.
# NOTE(review): the correlation code further down selects a column named
# `Extraversion`, while this block creates `extraversionTidy` - confirm
# which name is intended.
dataset <- dataset %>%
  rowwise() %>%
  mutate(
    extraversionTidy = mean(c(
      FFM_1, 6 - FFM_6, FFM_11, FFM_16,
      6 - FFM_21, FFM_26, 6 - FFM_31, FFM_36
    ))
  ) %>%
  # rowwise() is a form of grouping that sticks to the data frame; remove it
  # so later verbs operate on whole columns again instead of row by row.
  ungroup()
Correlations
Calculate correlations
Explore correlations
Documentation can be viewed here
# Correlate the five trait scores, then tidy the output for reading:
# shave() blanks one redundant triangle of the matrix and fashion() formats
# the values for display.
select(
  dataset,
  Openness, Conscientiousness, Extraversion, Agreeableness, Neuroticism
) %>%
  correlate() %>%
  shave() %>%
  fashion()
Calculate p-values
Documentation can be viewed here
# Keep only the five trait scores for the significance tests.
Big5df <- select(
  dataset,
  Openness, Conscientiousness, Extraversion, Agreeableness, Neuroticism
)
# Pearson correlations on pairwise-complete data, with Holm-adjusted
# p-values and confidence intervals.
corr.test(
  x = Big5df,
  y = NULL,
  use = "pairwise",
  method = "pearson",
  adjust = "holm",
  alpha = 0.05,
  ci = TRUE
)
Deciding between Pearson and Spearman correlations
Documentation can be viewed here
# Draw the GGally pairs plot for the five trait scores to inspect their
# distributions and pairwise relationships.
ggpairs(
  select(
    dataset,
    Openness, Conscientiousness, Extraversion, Agreeableness, Neuroticism
  )
)
t-tests
Documentation can be viewed here
independent samples t-tests
# Compare Agreeableness between the two CoinFlipFactor groups.
t.test(Agreeableness ~ CoinFlipFactor, data = dataset)
paired samples t-tests
# Compare each respondent's Agreeableness score with their own Neuroticism
# score (paired test).
with(
  dataset,
  t.test(Agreeableness, Neuroticism, paired = TRUE)
)
