Diane, Jane, and Kimberly.
Everything before 15 - analysis is a syntax to match all children.
I know errors happen all the time. Therefore, these codes were made available here if someone wants to review or check the consistency.
In the e-mail that you found this link, I attached an excel file in which you’ll be able to check this file.

Please notice that this report refers to birth to three only
If you don’t want to check any code, please click here

1 load package

pacman::p_load(tidyverse, janitor)

2 Data handling

3 get all ASQ4 data

read_excel_allsheets <- function(filename) {
    sheets <- readxl::excel_sheets(filename) #get all sheet names
    x <- lapply(sheets, function(X) readxl::read_excel(filename, sheet = X))
    names(x) <- sheets #get names only
    x #return
}
#get the excel file
excel_list <- read_excel_allsheets("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/Final ALL ASQ4 for AEPS 2019_2020.xlsx")
#transform into vectors
list2env(setNames(excel_list, #list
                  paste0("ds_",janitor::make_clean_names(names(excel_list)))),  #fixing different names and other patterns
         envir=.GlobalEnv) #where?

4 Create a backup

backup_asq4_demo <- ds_asq4_demo 
backup_asq4_items <- ds_asq4_items

#remove all attributes

#ds_asq4_demo[] <- lapply(ds_asq4_demo, function(x) { attributes(x) <- NULL; x })
#backup_asq4_items[] <- lapply(backup_asq4_items, function(x) { attributes(x) <- NULL; x })

5 clean names

ds_asq4_demo <- clean_names(ds_asq4_demo)
ds_asq4_items <- clean_names(ds_asq4_items)

6 merge datasets

ds_asq <- left_join(ds_asq4_demo, ds_asq4_items, by = c("asq4_id"))

7 Compute totals

7.1 Change variable computational level

ds_asq <- ds_asq %>% 
  mutate_at(vars(c1:c6, gm1:gm6, fm1:fm6, ps1:ps6, p1:p6), ~as.numeric(.))

7.2 Compute totals for each ASQ-4 domain

ds_asq<-ds_asq %>% 
  mutate(com_sum = rowSums(select(.,c1:c6))) %>% 
  mutate(gm_sum = rowSums(select(.,gm1:gm6))) %>% 
  mutate(fm_sum = rowSums(select(.,fm1:fm6))) %>% 
  mutate(ps_sum = rowSums(select(.,ps1:ps6))) %>% 
  mutate(per_sum = rowSums(select(.,p1:p6)))

8 AEPS Demographics

aeps_1_demo <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 2)
#fix names
aeps_1_demo <- clean_names(aeps_1_demo)
#remove empty columns and rows
aeps_1_demo <- remove_empty(aeps_1_demo, which = c("rows", "cols"), quiet = TRUE)
#remove useless rows
aeps_1_demo <- aeps_1_demo %>% filter(!is.na(childs_id))

#add new features to merge
aeps_1_demo <- aeps_1_demo %>% 
  mutate(aeps_file_number = 1) %>% #same as ds_asq
  mutate(spread_sheet = spread_sheet_id_1) %>% #same as full dataset!
  mutate(aeps_sprdsheet_id_number = spread_sheet_id_1) #same as ds_asq

9 1.AEPSBirthToThreeFormNoN 2 Grace 9.13.2019

10 First file 1 - Fine motor (1)

10.1 get data

aeps_1_fine <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 3)
#clear excel attributes
aeps_1_fine[] <- lapply(aeps_1_fine, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_fine <- clean_names(aeps_1_fine)
#remove empty columns and rows
aeps_1_fine <- remove_empty(aeps_1_fine, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_fine <- aeps_1_fine %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_fine <- aeps_1_fine %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_fine <- aeps_1_fine %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_fine <- aeps_1_fine %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_fine[[1]] <- as.numeric(aeps_1_fine[[1]])

10.2 Tranform it to long format

spec <- tibble(`.name` = names(aeps_1_fine)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
           `.name` %>% str_detect("spread") ~ "spread_sheet",
           `.name` %>% str_detect("score")  ~ "score",
           `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_fine_long <- aeps_1_fine %>%
  pivot_longer_spec(spec)

10.3 Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.

aeps_1_fine_long <- aeps_1_fine_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())

11 First file 1 - Gross motor (2)

11.1 get data

aeps_1_gross <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 4)
#clear excel attributes
aeps_1_gross[] <- lapply(aeps_1_gross, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_gross <- clean_names(aeps_1_gross)
#remove empty columns and rows
aeps_1_gross <- remove_empty(aeps_1_gross, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_gross <- aeps_1_gross %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_gross <- aeps_1_gross %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_gross <- aeps_1_gross %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_gross <- aeps_1_gross %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_gross[[1]] <- as.numeric(aeps_1_gross[[1]])

11.2 Tranform it to long format

spec <- tibble(`.name` = names(aeps_1_gross)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
    `.name` %>% str_detect("spread") ~ "spread_sheet",
    `.name` %>% str_detect("score")  ~ "score",
    `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_gross_long <- aeps_1_gross %>%
  pivot_longer_spec(spec)

11.3 Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.

aeps_1_gross_long <- aeps_1_gross_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())

12 First file 1 - Adaptive (3)

12.1 get data

aeps_1_adaptive <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 5)
#clear excel attributes
aeps_1_adaptive[] <- lapply(aeps_1_adaptive, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_adaptive <- clean_names(aeps_1_adaptive)
#remove empty columns and rows
aeps_1_adaptive <- remove_empty(aeps_1_adaptive, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_adaptive <- aeps_1_adaptive %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_adaptive <- aeps_1_adaptive %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_adaptive <- aeps_1_adaptive %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_adaptive <- aeps_1_adaptive %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_adaptive[[1]] <- as.numeric(aeps_1_adaptive[[1]])

12.2 Tranform it to long format

spec <- tibble(`.name` = names(aeps_1_adaptive)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
    `.name` %>% str_detect("spread") ~ "spread_sheet",
    `.name` %>% str_detect("score")  ~ "score",
    `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_adaptive_long <- aeps_1_adaptive %>%
  pivot_longer_spec(spec)

12.3 Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.

aeps_1_adaptive_long <- aeps_1_adaptive_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())

13 Merge AEPS spreadsheets datasets

Just checking if we have 22 children in each dataset

aeps_1_fine_long %>% count(spread_sheet)
aeps_1_gross_long %>% count(spread_sheet)
aeps_1_adaptive_long %>% count(spread_sheet)

I’ll use bind_rows to put each dataset on top of the another. First, fine long with gross long

ds_aeps_birth_three <- bind_rows(
  aeps_1_fine_long,
  aeps_1_gross_long)

Now, this resultant ds with adaptive

ds_aeps_birth_three <- bind_rows(
  ds_aeps_birth_three,
  aeps_1_adaptive_long)

14 Merge AEPS with AEPS demographics

I’ll get aeps_1_demo to add to this partially full dataset the child’ ID

ds_aeps_birth_three <- left_join(ds_aeps_birth_three, aeps_1_demo)

First, i’ll add two key variables present in the ASQ-4 dataset to guarantee the merging will be correct

ds_aeps_birth_three <- ds_aeps_birth_three %>% 
  mutate(aeps_file_number = 1) %>% 
  mutate(aeps_sprdsheet_id_number = spread_sheet) %>% 
  rename(asq4_id = childs_id) %>% 
  mutate(asq4_id = as.numeric(asq4_id)) #in ASQ4 dataset, this variable is numeric

Create a full dataset with ASQ-4 and AEPS

ds_birth_three_aeps_asq <- left_join(
  ds_aeps_birth_three,
  ds_asq,
  by = "asq4_id"
)

14.1 Manual check

ds_birth_three_aeps_asq %>% 
  filter(spread_sheet == "15") %>% View()

14.2 Save as excel

It seems everything worked! (Saturday, 13 March, 2021)
Ask Kimberly

15 Analyses - birth to three

Diane, Jane, and Kimberly. From this line on, I will:
(1) Present a plot and a table with the ASQ-4 summative results
(2) Present a plot and a table with the AEPS summative results (I read elsewhere and it seems that AEPS items need to be summed as well)
(3) Run all correlation analyses between the ASQ-4 summative scores and the AEPS summative scores

You’ll notice that the correlation results are too low. I’m wondering if something was under the radar in my code or if I’m missing some point.
I have sent an e-mail in which I present an excel file to make some points clearer.

15.1 ASQ-4 analysis

15.1.1 Plot

The graph below describes the distribution of all ASQ4 results.

15.1.2 Summary table

The table below reports the ASQ-4 results. I did not group the results by age interval.

com_sum (N=22) fm_sum (N=22) gm_sum (N=22) per_sum (N=22) ps_sum (N=22) Total (N=110) p value
value 0.328
   Mean (SD) 51.250 (10.683) 46.818 (12.492) 52.045 (9.084) 46.818 (9.580) 48.636 (10.821) 49.114 (10.631)
   Range 15.000 - 60.000 15.000 - 60.000 35.000 - 60.000 20.000 - 60.000 20.000 - 60.000 15.000 - 60.000
ds_birth_three_aeps_asq %>%
  select(asq4_id, everything()) %>% #just for checking
  distinct(asq4_id, .keep_all = T) %>% #use only one information (we have 22 children here)
  select(ends_with("_sum")) %>% 
  janitor::remove_empty(c("cols")) %>% #remove empty columns
  pivot_longer(everything(.)) %>% 
  arsenal::tableby(name ~ value, .) %>% 
  summary()

15.2 AEPS domains and skills

The following results will present the AEPS findings.

15.2.1 Descriptive table

The following table will present the descriptives of each participant and activitiy

How to interpret these results?
ASQ4id = 500 (it’s a child in the dataset) He or She has 18 results in domain adaptative and skill = Feeding.
If you access the excel file, it will be these same values.

15.2.2 Plot total scores

If I understood everything right (I’ve consulted https://pt.slideshare.net/BrookesPubCo/aeps-intro-webinar-slideshare),
each participant needs to have a score reflecting his/her ability.
Therefore, I summed up the scores obtained in each skill of each domain (e.g.: Reach, Grab, and Release from Fine motor).

ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score)) %>% #create the summative score
  select(asq4_id,domain, skill, raw_score) %>% #select before pivoting
      pivot_longer(-c(asq4_id, raw_score, skill),
                   values_to = "domain") %>% 
  select(-name) %>% 
  ggplot(., aes(x = domain, y = raw_score, fill = skill)) +
  #geom_col(position = position_dodge2(preserve = "single")) +
  geom_bar(stat = "summary", position = "dodge", width = 0.8) +
  theme_bw()
`summarise()` has grouped output by 'asq4_id', 'domain'. You can override using the `.groups` argument.

15.2.3 Summary total scores

The following table presents the same information presented above. However, I imagine you’ll be able to check if everything is correct.

ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score)) %>% #create the summative score
  select(asq4_id,domain, skill, raw_score) %>% #select before pivoting
      pivot_longer(-c(asq4_id, raw_score, skill),
                   values_to = "domain") %>% 
  select(-name) %>% 
  group_by(domain, skill) %>% 
  summarise(mean(raw_score), sd(raw_score), n()) %>% 
  mutate_if(is.numeric,round,2)

summarise() has grouped output by ‘asq4_id’, ‘domain’. You can override using the .groups argument. summarise() has grouped output by ‘domain’. You can override using the .groups argument. mutate_if() ignored the following grouping variables: Column domain

How to interpret these results?
Example:
when considering all children in domain (fine motor), and skill (A. Reach, Grab, Release), the mean result is 34.82
I double checked the excel file and this result is correct

15.3 Correlations AEPS ASQ-4

The following tables will present the correlation between each ASQ-4 domain and its AEPS parallel.
I’m using the summative score of the ASQ-4 and also the summative score of AEPS. Diane, please let me know if that’s the way to achieve the AEPS results.

Please don’t consider the three following chunks. They are programming syntaxes.

15.3.1 Create a summative score (Ask Diane)

cor_ds_1 <- ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score))
`summarise()` has grouped output by 'asq4_id', 'domain'. You can override using the `.groups` argument.

15.3.2 Create a dataframe to gather all data

15.3.3 Merge these data and remove useless vectors

cor_ds <- left_join(cor_ds_1,cor_ds_2)
Joining, by = "asq4_id"

15.4 ASQ Fine motor vs AEPS Fine motor

library(corrr) #correlation 

Correlation between ASQ Fine motor and AEPS Fine motor I’m using the same child!

How to interpret these results?
The correlation between the ASQ-4 fine motor and AEPS fine motor (skill: Reach and Grab) is -0.22 (makes no sense to me)
The correlation between the ASQ-4 fine motor and AEPS fine motor (skill: Functional use) is -0.05 (makes no sense to me)

I have attached an excel file in which I mannually ran these correlations and the results match

15.5 ASQ gross motor AEPS gross motor

Correlation between ASQ Gross motor and AEPS Gross motor I’m using the data from same children.

How to interpret these results?
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: A. Movement and Locomotion) is -0.17 (makes no sense to me)
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: B. Balance in Sitting) is -0.06 (makes no sense to me)
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: C. Balance & Mobility) is 0.03 (makes no sense to me)
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: D. Play Skills) is 0.04 (makes no sense to me)

15.6 ASQ Personal-Social AEPS adaptive

**Jane: Just to refresh my memory. In the dataset, PS means problem-solving and P means Personal and Social, right?
Correlation between ASQ Personal-Social and AEPS Adaptive I’m using the data from same children.

How to interpret these results?
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: A. Feeding) is 0.34 (makes sense!!)
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: B. Personal Hygiene) is 0.27 (makes sense!!)
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: C. Undressing) is 0.30 (makes sense!!)

end of report

---
title: "Diane - AEPS & ASQ-4"
output:
  html_notebook:
    toc: yes
    toc_float: yes
    number_sections: yes
    theme: united
    highlight: textmate
editor_options: 
  chunk_output_type: inline
---

```{r global options, include = FALSE}
knitr::opts_chunk$set(echo = FALSE, 
                      warning = FALSE, 
                      messages = FALSE, 
                      include = TRUE,
                      results = "hide")
```

<div class="alert alert-success">
**Diane, Jane, and Kimberly. **   
Everything before `15 - analysis` is a syntax to match all children.   
I know errors happen all the time. Therefore, these codes were made available here if someone wants to review or check the consistency.   
In the e-mail that you found this link, I attached an excel file in which you'll be able to check this file.   

**Please notice that this report refers to birth to three only**     
**If you don't want to check any code, please click [here](#analyses)**
</div>


# load package
```{r}
pacman::p_load(tidyverse, janitor)
```

# Data handling

# get all ASQ4 data

```{r}
read_excel_allsheets <- function(filename) {
    sheets <- readxl::excel_sheets(filename) #get all sheet names
    x <- lapply(sheets, function(X) readxl::read_excel(filename, sheet = X))
    names(x) <- sheets #get names only
    x #return
}
#get the excel file
excel_list <- read_excel_allsheets("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/Final ALL ASQ4 for AEPS 2019_2020.xlsx")
#transform into vectors
list2env(setNames(excel_list, #list
                  paste0("ds_",janitor::make_clean_names(names(excel_list)))),  #fixing different names and other patterns
         envir=.GlobalEnv) #where?
```

# Create a backup

```{r}
backup_asq4_demo <- ds_asq4_demo 
backup_asq4_items <- ds_asq4_items
```


#remove all attributes 

```{r}
#ds_asq4_demo[] <- lapply(ds_asq4_demo, function(x) { attributes(x) <- NULL; x })
#backup_asq4_items[] <- lapply(backup_asq4_items, function(x) { attributes(x) <- NULL; x })
```

# clean names 

```{r}
ds_asq4_demo <- clean_names(ds_asq4_demo)
ds_asq4_items <- clean_names(ds_asq4_items)
```

# merge datasets 

```{r}
ds_asq <- left_join(ds_asq4_demo, ds_asq4_items, by = c("asq4_id"))
```

# Compute totals

## Change variable computational level 

```{r}
ds_asq <- ds_asq %>% 
  mutate_at(vars(c1:c6, gm1:gm6, fm1:fm6, ps1:ps6, p1:p6), ~as.numeric(.))
```

## Compute totals for each ASQ-4 domain
```{r}
ds_asq<-ds_asq %>% 
  mutate(com_sum = rowSums(select(.,c1:c6))) %>% 
  mutate(gm_sum = rowSums(select(.,gm1:gm6))) %>% 
  mutate(fm_sum = rowSums(select(.,fm1:fm6))) %>% 
  mutate(ps_sum = rowSums(select(.,ps1:ps6))) %>% 
  mutate(per_sum = rowSums(select(.,p1:p6)))
```


# AEPS Demographics

```{r}
aeps_1_demo <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 2)
```

```{r}
#fix names
aeps_1_demo <- clean_names(aeps_1_demo)
#remove empty columns and rows
aeps_1_demo <- remove_empty(aeps_1_demo, which = c("rows", "cols"), quiet = TRUE)
#remove useless rows
aeps_1_demo <- aeps_1_demo %>% filter(!is.na(childs_id))

#add new features to merge
aeps_1_demo <- aeps_1_demo %>% 
  mutate(aeps_file_number = 1) %>% #same as ds_asq
  mutate(spread_sheet = spread_sheet_id_1) %>% #same as full dataset!
  mutate(aeps_sprdsheet_id_number = spread_sheet_id_1) #same as ds_asq
```



# 1.AEPSBirthToThreeFormNoN 2 Grace 9.13.2019

# First file 1 - Fine motor (1)

## get data

```{r}
aeps_1_fine <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 3)
```
```{r}
#clear excel attributes
aeps_1_fine[] <- lapply(aeps_1_fine, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_fine <- clean_names(aeps_1_fine)
#remove empty columns and rows
aeps_1_fine <- remove_empty(aeps_1_fine, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_fine <- aeps_1_fine %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_fine <- aeps_1_fine %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_fine <- aeps_1_fine %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_fine <- aeps_1_fine %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_fine[[1]] <- as.numeric(aeps_1_fine[[1]])
```


## Tranform it to long format

```{r}
spec <- tibble(`.name` = names(aeps_1_fine)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
           `.name` %>% str_detect("spread") ~ "spread_sheet",
           `.name` %>% str_detect("score")  ~ "score",
           `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_fine_long <- aeps_1_fine %>%
  pivot_longer_spec(spec)
```

## Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.  

```{r}
aeps_1_fine_long <- aeps_1_fine_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())
```


# First file 1 - Gross motor (2)

## get data

```{r}
aeps_1_gross <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 4)
```
```{r}
#clear excel attributes
aeps_1_gross[] <- lapply(aeps_1_gross, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_gross <- clean_names(aeps_1_gross)
#remove empty columns and rows
aeps_1_gross <- remove_empty(aeps_1_gross, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_gross <- aeps_1_gross %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_gross <- aeps_1_gross %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_gross <- aeps_1_gross %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_gross <- aeps_1_gross %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_gross[[1]] <- as.numeric(aeps_1_gross[[1]])
```


## Tranform it to long format

```{r}
spec <- tibble(`.name` = names(aeps_1_gross)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
    `.name` %>% str_detect("spread") ~ "spread_sheet",
    `.name` %>% str_detect("score")  ~ "score",
    `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_gross_long <- aeps_1_gross %>%
  pivot_longer_spec(spec)
```

## Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.  

```{r}
aeps_1_gross_long <- aeps_1_gross_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())
```



# First file 1 - Adaptive (3)

## get data

```{r}
aeps_1_adaptive <- readxl::read_excel("C:/Users/luisf/Dropbox/ASQ4_AEPS Data for Luis 2.2021/Luis Feb 2021/copy KM Cleaned AEPS 3.5.21/1.Cleaned AEPSBirthToThreeFormNoN 2 Grace 9.13.2019.xlsx", sheet = 5)
```

```{r}
#clear excel attributes
aeps_1_adaptive[] <- lapply(aeps_1_adaptive, function(x) { attributes(x) <- NULL; x })
#fix names
aeps_1_adaptive <- clean_names(aeps_1_adaptive)
#remove empty columns and rows
aeps_1_adaptive <- remove_empty(aeps_1_adaptive, which = c("rows", "cols"), quiet = TRUE)
#create a skill
aeps_1_adaptive <- aeps_1_adaptive %>% 
  mutate(skill = .[[1]]) %>% #this is the first column )in this case -- fine motor (sub)domain
  select(1,skill, everything())
#With this new variable (skill), just keep if is a letter
aeps_1_adaptive <- aeps_1_adaptive %>% 
  mutate(skill = if_else(str_detect(skill, "[a-z]"), .[[1]],  NA_character_)) %>% #if skill is a letter, otherwise missing
  fill(skill)
#remove first line (it's almost all na)
aeps_1_adaptive <- aeps_1_adaptive %>% 
  filter(!str_detect(.[[1]], "[a-z]"))
#transform to numeric
aeps_1_adaptive <- aeps_1_adaptive %>% mutate(!! names(.)[1] := as.numeric(!! rlang::sym(names(.)[1]))) 
#aeps_1_adaptive[[1]] <- as.numeric(aeps_1_adaptive[[1]])
```


## Tranform it to long format

```{r}
spec <- tibble(`.name` = names(aeps_1_adaptive)) %>%
  slice(-c(1:2)) %>%
  mutate(`.value` = case_when(
    `.name` %>% str_detect("spread") ~ "spread_sheet",
    `.name` %>% str_detect("score")  ~ "score",
    `.name` %>% str_detect("confirm") ~ "confirm")
  )
# apply the spec
aeps_1_adaptive_long <- aeps_1_adaptive %>%
  pivot_longer_spec(spec)
```

## Add domain

This chunk will get all domains and number skills. It will be useful to merge all ds in the future.  

```{r}
aeps_1_adaptive_long <- aeps_1_adaptive_long %>% 
  mutate(domain = names(.)[[1]]) %>% 
  rename(number_skill = names(.)[[1]]) %>% 
  select(domain, number_skill, everything())
```


# Merge AEPS spreadsheets datasets

Just checking if we have 22 children in each dataset  
```{r}
aeps_1_fine_long %>% count(spread_sheet)
aeps_1_gross_long %>% count(spread_sheet)
aeps_1_adaptive_long %>% count(spread_sheet)
```

I'll use `bind_rows` to put each dataset on top of the another. 
First, fine long with gross long


```{r}
ds_aeps_birth_three <- bind_rows(
  aeps_1_fine_long,
  aeps_1_gross_long)
```

Now, this resultant ds with adaptive

```{r}
ds_aeps_birth_three <- bind_rows(
  ds_aeps_birth_three,
  aeps_1_adaptive_long)
```


# Merge AEPS with AEPS demographics

I'll get `aeps_1_demo` to add to this partially full dataset the child' ID

```{r}
ds_aeps_birth_three <- left_join(ds_aeps_birth_three, aeps_1_demo)
```

First, i'll add two key variables present in the ASQ-4 dataset to guarantee the merging will be correct

```{r}
ds_aeps_birth_three <- ds_aeps_birth_three %>% 
  mutate(aeps_file_number = 1) %>% 
  mutate(aeps_sprdsheet_id_number = spread_sheet) %>% 
  rename(asq4_id = childs_id) %>% 
  mutate(asq4_id = as.numeric(asq4_id)) #in ASQ4 dataset, this variable is numeric
```


Create a full dataset with ASQ-4 and AEPS

```{r}
ds_birth_three_aeps_asq <- left_join(
  ds_aeps_birth_three,
  ds_asq,
  by = "asq4_id"
)
```


## Manual check

```{r}
ds_birth_three_aeps_asq %>% 
  filter(spread_sheet == "15") %>% View()
```


## Save as excel

```{r}
write.csv(ds_birth_three_aeps_asq, file = "ds_birth_three_aeps_asq.csv", row.names = F)
```


> It seems everything worked! (Saturday, 13 March, 2021)  
Ask Kimberly

# Analyses - birth to three {#analyses}


<div class="alert alert-success">
Diane, Jane, and Kimberly. 
From this line on, I will:    
**(1)** Present a plot and a table with the ASQ-4 summative results   
**(2)** Present a plot and a table with the  AEPS summative results (I read elsewhere and it seems that AEPS items need to be summed as well)   
**(3)** Run all correlation analyses between the ASQ-4 summative scores and the AEPS summative scores   

You'll notice that the correlation results are too low. I'm wondering if something was under the radar in my code or if I'm missing some point.  
I have sent an e-mail in which I present an excel file to make some points clearer.
</div>


## ASQ-4 analysis

### Plot 

<div class="alert alert-info">
The graph below describes the distribution of all ASQ4 results.
</div>

```{r}
ds_birth_three_aeps_asq %>%
  select(asq4_id, everything()) %>% #just for checking
  distinct(asq4_id, .keep_all = T) %>% #use only one information (we have 22 children here)
  select(ends_with("_sum")) %>% 
  janitor::remove_empty("cols") %>% #remove empty columns
  pivot_longer(everything(.)) %>% 
  ggplot(., aes(name, value)) +
  geom_boxplot() +
  theme_bw()
```
### Summary table  

<div class="alert alert-info">
The table below reports the ASQ-4 results. I did not group the results by age interval.      
</div>

```{r, results = "asis"}
ds_birth_three_aeps_asq %>%
  select(asq4_id, everything()) %>% #just for checking
  distinct(asq4_id, .keep_all = T) %>% #use only one information (we have 22 children here)
  select(ends_with("_sum")) %>% 
  janitor::remove_empty(c("cols")) %>% #remove empty columns
  pivot_longer(everything(.)) %>% 
  arsenal::tableby(name ~ value, .) %>% 
  summary()
```



## AEPS domains and skills

<div class="alert alert-info">
The following results will present the AEPS findings.   
</div>

### Descriptive table  


<div class="alert alert-info">
The following table will present the descriptives of each participant and activitiy 
</div>


```{r}
ds_birth_three_aeps_asq %>% 
  select(asq4_id, everything()) %>% 
  group_by(asq4_id) %>% 
  arrange(asq4_id) %>% 
  count(domain, skill)
```
<div class="alert alert-danger">
How to interpret these results?      
ASQ4id = 500 (it's a child in the dataset)
He or She has 18 results in domain `adaptative` and skill = `Feeding`.   
If you access the excel file, it will be these same values.  
</div>



### Plot total scores  

<div class="alert alert-info">
If I understood everything right (I've consulted https://pt.slideshare.net/BrookesPubCo/aeps-intro-webinar-slideshare),    
each participant needs to have a score reflecting his/her ability.    
Therefore, I summed up the scores obtained in each skill of each domain (e.g.: Reach, Grab, and Release from Fine motor). 
</div>


```{r}
ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score)) %>% #create the summative score
  select(asq4_id,domain, skill, raw_score) %>% #select before pivoting
      pivot_longer(-c(asq4_id, raw_score, skill),
                   values_to = "domain") %>% 
  select(-name) %>% 
  ggplot(., aes(x = domain, y = raw_score, fill = skill)) +
  #geom_col(position = position_dodge2(preserve = "single")) +
  geom_bar(stat = "summary", position = "dodge", width = 0.8) +
  theme_bw()
  
```

### Summary total scores 

<div class="alert alert-info">
The following table presents the same information presented above. However, I imagine you'll be able to check if everything is correct.   
</div>

```{r, results = "asis"}
ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score)) %>% #create the summative score
  select(asq4_id,domain, skill, raw_score) %>% #select before pivoting
      pivot_longer(-c(asq4_id, raw_score, skill),
                   values_to = "domain") %>% 
  select(-name) %>% 
  group_by(domain, skill) %>% 
  summarise(mean(raw_score), sd(raw_score), n()) %>% 
  mutate_if(is.numeric,round,2)
```

<div class="alert alert-danger">
How to interpret these results?      
Example:   
when considering **all children** in domain (fine motor), and skill (A. Reach, Grab, Release), the mean result is 34.82   
I double checked the excel file and this result is correct   
</div>



## Correlations AEPS ASQ-4 

<div class="alert alert-info">
The following tables will present the correlation between each ASQ-4 domain and its AEPS parallel.   
I'm using the summative score of the ASQ-4 and also the summative score of AEPS.  Diane, please let me know if that's the way to achieve the AEPS results.   
</div>

> Please don't consider the three following chunks. They are programming syntaxes.  

### Create a summative score (Ask Diane)

```{r}
cor_ds_1 <- ds_birth_three_aeps_asq %>% 
  group_by(asq4_id,domain, skill) %>%  #grop for having each score for each participant
  summarise(raw_score = sum(score))
```

### Create a dataframe to gather all data 

```{r}
cor_ds_2 <- ds_birth_three_aeps_asq %>%
  select(asq4_id, everything()) %>% #just for checking
  distinct(asq4_id, .keep_all = T) %>% #use only one information (we have 22 children here)
  select(asq4_id,ends_with("_sum")) %>% 
  janitor::remove_empty("cols") %>% #remove empty columns
  pivot_longer(-asq4_id, names_to = "asq4") 
```


### Merge these data and remove useless vectors  
```{r}
cor_ds <- left_join(cor_ds_1,cor_ds_2)
rm(cor_ds_1, cor_ds_2)
```


## ASQ Fine motor vs AEPS Fine motor

```{r}
library(corrr) #correlation 
```

<div class="alert alert-info">
Correlation between *ASQ Fine motor* and *AEPS Fine motor*
I'm using the same child! 
</div>


```{r, warning=FALSE, message = FALSE  }
cor_ds %>% 
  filter(asq4 == "fm_sum", domain == "fine_motor")%>%
  group_by(skill) %>% 
  select(raw_score, value) %>% 
  nest() %>% 
  mutate(data = map(data, purrr::compose(stretch, correlate))) %>% 
  unnest(cols = -skill) %>% 
  na.omit  %>% 
  distinct(skill, .keep_all = T)
```

<div class="alert alert-danger">
How to interpret these results?      
The correlation between the ASQ-4 fine motor and AEPS fine motor (skill: Reach and Grab) is -0.22 (makes no sense to me)   
The correlation between the ASQ-4 fine motor and AEPS fine motor (skill: Functional use) is -0.05 (makes no sense to me)   

**I have attached an excel file in which I mannually ran these correlations and the results match**
</div>

## ASQ gross motor AEPS gross motor


<div class="alert alert-info">
Correlation between *ASQ Gross motor* and *AEPS Gross motor*
I'm using the data from same children.    
</div>


```{r, warning=FALSE, message = FALSE  }
cor_ds %>% 
  filter(asq4 == "gm_sum", domain == "gross_motor") %>%
  group_by(skill) %>% 
  select(raw_score, value) %>% 
  nest() %>% 
  mutate(data = map(data, purrr::compose(stretch, correlate))) %>% 
  unnest(cols = -skill) %>% 
  na.omit  %>% 
  distinct(skill, .keep_all = T)
```

<div class="alert alert-danger">
How to interpret these results?      
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: A. Movement and Locomotion) is -0.17 (makes no sense to me)     
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: B. Balance in Sitting) is -0.06 (makes no sense to me)     
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: C. Balance & Mobility) is 0.03 (makes no sense to me)      
The correlation between the ASQ-4 gross motor and AEPS gross motor (skill: D. Play Skills) is 0.04 (makes no sense to me) 
</div>

## ASQ Personal-Social AEPS adaptive

<div class="alert alert-info">
**Jane: Just to refresh my memory. In the dataset, PS means problem-solving and P means Personal and Social, right?   
Correlation between *ASQ Personal-Social* and *AEPS Adaptive*
I'm using the data from same children.    
</div>

```{r, warning=FALSE, message = FALSE  }
cor_ds %>% 
  filter(asq4 == "per_sum", domain == "adaptive_area") %>%
  group_by(skill) %>% 
  select(raw_score, value) %>% 
  nest() %>% 
  mutate(data = map(data, purrr::compose(stretch, correlate))) %>% 
  unnest(cols = -skill) %>% 
  na.omit  %>% 
  distinct(skill, .keep_all = T)
```

<div class="alert alert-danger">
How to interpret these results?      
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: A. Feeding) is 0.34 (makes sense!!)     
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: B. Personal Hygiene) is 0.27 (makes sense!!)     
The correlation between the ASQ-4 Personal and Social and AEPS Adaptive (skill: C. Undressing) is 0.30 (makes sense!!)     
</div>   

end of report