Here, we will begin to analyse the guild-level temporal activity of Southeast Asian wildlife. Species are grouped by their respective guilds which consist of their typical feeding habits (i.e., carnivore, herbivore and omnivore) and their body size (i.e., small (<4kg), medium (4-20kg), large (>20kg)).

Load the relevant packages and dataframe

#Load the packages
library(tidyverse);library(activity);library(overlap);library(lubridate);library(plyr)

## ── Attaching packages ─────────────────────────────────────── tidyverse 1.3.1 ──

## ✔ ggplot2 3.3.6     ✔ purrr   0.3.4
## ✔ tibble  3.1.7     ✔ dplyr   1.0.9
## ✔ tidyr   1.2.0     ✔ stringr 1.4.0
## ✔ readr   2.1.2     ✔ forcats 0.5.1

## ── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
## ✖ dplyr::filter() masks stats::filter()
## ✖ dplyr::lag()    masks stats::lag()

## This is overlap devel version 0.3.4.
## For overview type ?overlap; for changes do news(p='overlap').

## 
## Attaching package: 'lubridate'

## The following objects are masked from 'package:base':
## 
##     date, intersect, setdiff, union

## ------------------------------------------------------------------------------

## You have loaded plyr after dplyr - this is likely to cause problems.
## If you need functions from both plyr and dplyr, please load plyr first, then dplyr:
## library(plyr); library(dplyr)

## ------------------------------------------------------------------------------

## 
## Attaching package: 'plyr'

## The following objects are masked from 'package:dplyr':
## 
##     arrange, count, desc, failwith, id, mutate, rename, summarise,
##     summarize

## The following object is masked from 'package:purrr':
## 
##     compact

#Load the dataframe
caps <- as.data.frame(read.csv('SEA_Activity_dataset_for_community_guild-level_analyses_20230306.csv'))

#Inspect the dataframe
head(caps)

##   camera_id     survey_id           Species time.rad FLII_status
## 1 02_sorted KhaoChong2018        Sus_scrofa 4.673671    Degraded
## 2 02_sorted KhaoChong2018        Sus_scrofa 3.762784    Degraded
## 3 02_sorted KhaoChong2018 Macaca_nemestrina 1.750001    Degraded
## 4 02_sorted KhaoChong2018 Macaca_nemestrina 2.206759    Degraded
## 5 02_sorted KhaoChong2018 Macaca_nemestrina 1.979037    Degraded
## 6 02_sorted KhaoChong2018 Macaca_nemestrina 2.682890    Degraded
##     trophic_guild
## 1  large_omnivore
## 2  large_omnivore
## 3 medium_omnivore
## 4 medium_omnivore
## 5 medium_omnivore
## 6 medium_omnivore

str(caps)

## 'data.frame':    31138 obs. of  6 variables:
##  $ camera_id    : chr  "02_sorted" "02_sorted" "02_sorted" "02_sorted" ...
##  $ survey_id    : chr  "KhaoChong2018" "KhaoChong2018" "KhaoChong2018" "KhaoChong2018" ...
##  $ Species      : chr  "Sus_scrofa" "Sus_scrofa" "Macaca_nemestrina" "Macaca_nemestrina" ...
##  $ time.rad     : num  4.67 3.76 1.75 2.21 1.98 ...
##  $ FLII_status  : chr  "Degraded" "Degraded" "Degraded" "Degraded" ...
##  $ trophic_guild: chr  "large_omnivore" "large_omnivore" "medium_omnivore" "medium_omnivore" ...

names(caps)

## [1] "camera_id"     "survey_id"     "Species"       "time.rad"     
## [5] "FLII_status"   "trophic_guild"

dim(caps)

## [1] 31138     6

anyNA(caps)

## [1] FALSE

Here, we will be extensively using for() loops to carry out our analyses. In general, ‘Loops’ are great at repeating the same functions over and over again for a given dataset.

#Loop to split dataframe per guild

#Create a guild and status vector
sort(unique(caps$trophic_guild))

## [1] "large_carnivore"  "large_herbivore"  "large_omnivore"   "medium_carnivore"
## [5] "medium_herbivore" "medium_omnivore"  "small_carnivore"  "small_herbivore" 
## [9] "small_omnivore"

guilds <- c('large_carnivore', 'large_herbivore', 'large_omnivore', 'medium_carnivore', 'medium_herbivore',
            'medium_omnivore', 'small_carnivore', 'small_herbivore', 'small_omnivore')
status <- c('Degraded', 'Intact')

#Store the dataframes for each guild in this list
guild_caps = list() 

#Test out the loop with specific variables
i=1

for(i in 1:length(guilds)){ #repeat for each guild
  
  #Specify guild and subset caps for it
  a = guilds[i]
  b = caps[caps$trophic_guild == a,]
  
  #Save it!
  guild_caps[[i]] = b
  names(guild_caps)[i]= a
  
}

## keep enviro clean
rm(a,b,i)

Loop to split guild data frames into specific status data frames stored in a nested list

We will further split each of the guild dataframes by the FLII status (i.e., degraded or intact)

## store the split dataframes into this list 
split_guild = list()

## variables to practice with 
i=1;l=1

for(i in 1:length(guild_caps)){ # repeat for each guild 
  
  # Subset data for a single guild
  a = guild_caps[[i]] 
  
  # store results for each value per status
  temp = list()

  for(l in 1:length(status)){ # repeat for each status
    
    #Select a status
    b = status[l]
    
    # Subset the dataframe for each status
    c = a[a$FLII_status == b,]
    
      
      if(nrow(c)>0){ # add a conditional statement to avoid saving data w/ zero detections
        
        # save this! 
        temp[[l]] = c
        names(temp)[l] = b
        
      }else{
        
        # Make it NA if were missing data! 
        temp[[l]] = NA
        names(temp)[l] = b
        
      } # end conditional statement

    
  } # end loop per status
  
  # Save the guild name 
  split_guild[[i]] = temp
  names(split_guild)[i] = unique(a$trophic_guild)
  
  
} # end loop per guild

#keep environment clean
rm(temp,i,l,a,b,c)

Loop to generate Actmod objects for each status per guild

Here, we will be using the fitact() function to create Activity Model Class (Actmod) objects or simple terms, circular kernel density estimates to observe the activity pattern of each guild. We will be using 10,000 bootstrap samples to meet current literature criteria, however, for testing purposes, it will be wise to use a lower number (e.g., 10 reps) as it can take awhile to finish.

## store actmod objects in this list 
actmod.list = list()

## variables to practice the loop with 
i=1;l=1

for(i in 1:length(split_guild)){ #repeat for each guild 
  
  #subset for a specific guild and save the guild name
  a = split_guild[[i]]
  s = names(split_guild)[i] 
  
  #save results from next loop in this temporary list
  temp = list()
  
  for(l in 1:length(a)){ #repeat for each status
    
    #subset for a specific status
    b = a[[l]]
    v = names(a)[l] #save that status name 
    
    
      if(nrow(b) <= 100){
        
        act = fitact(b$time.rad, sample = "model", adj = 1, reps = 10000) 
        
      }else{
        
        act = fitact(b$time.rad, sample = "data", adj = 1, reps = 10000) 
        
      } #end conditional 
      
      
      #Save it
      temp[[l]] = act
      names(temp)[l] = v
      
    
  } # end loop per status 
  
  ## THE FINAL SAVE
  actmod.list[[i]] = temp
  names(actmod.list)[i] = s
  
} # end loop per guild

#keep environment clean
rm(i,l,a,b,s,v,temp,act)

#Save actmods in teh form of a RDS file
saveRDS(actmod.list, 'SEA_Activity_guild-level_actmods_20230309.RDS')

Determining Temporal Shifts

Now that we are done in generating our circular kernel density distributions (“activity curves”), we can now begin to determine whether there is a shift in activity pattern between intact and degraded forests. We will be using three indicators, namely p-values, overlap estimates and peak activity times to determine whether a shift is occurring. I will discuss each indicator at length below, but for now let’s define a temporal shift. A temporal shift has occurred when:

P < 0.05
Peak activity changes between intact and degraded forests

We also used a overlap estimates to determine the magnitude of difference in activity patterns between both types of forest:

Magnitude of Difference (1-overlap) > 0.25 = “strong” (Roughly interpreted as more than 25% change in activity)
Magnitude of Difference (1-overlap) <= 0.25 = “weak”

Using CompareCkern() fucntion to calculate p-value

In the ‘activity’ package in r, there are various statistical significance test that we can use to calculate p-values. However, for the purposes of our research question, the more approprite test to use is the compareCkern() test as it calculates the significant difference between two circular kernel density curves. Other statistcal significance test included in the package are compareAct() (‘Wald test’) and the compareTime () tests. You can read more about it here

#Create an empty list to save results
p_value.list <- list()

i = 1

for (i in 1:length(actmod.list)) { #repeat for each guild
  
  a = actmod.list[[i]] #Select a single guild
  b = names(actmod.list)[i] #Save the name of the guild
  
  #Compare activity patterns 
  c = as.data.frame(compareCkern(a[[1]], a[[2]]))
  
  #Add guild and outputs column
  c$guild = b
  c$outputs = rownames(c)
  
  #Save it 
  p_value.list[[i]] = c
  names(p_value.list)[i] = b
  
  
}

#Keep environment clean!
rm(a,b,c,i)

#Extract outputs and covert it into a dataframe
df = do.call(rbind, p_value.list)
rownames(df)= NULL
#rm(res)

#Filter out the p-values and rename the column
df <- df %>% 
  filter(outputs == "pNull") %>% 
  select(-outputs)

colnames(df) <- c('pNull', 'guild')

#Keep environment clean!
rm(p_value.list, split_guild, guild_caps)

Using the overlapEST() function to calculate overlap estimate

Here, we will be calculating the overlap estimate using the overlapEST() fucntion from the ‘overlap’ package. Overlap is basically the overlapping area under the two activity curves where the overlap estimate ranges from 0 to 1. We will also be using bootstrapping to calculate the 95% CI of each overlap estimate and thus can take some time to finish.

#Create an empty list to store results
overlap.list = list()

i=1;l=1

for (i in 1:length(actmod.list)) { #repeat for each guild
  
  a = actmod.list[[i]]
  b = names(actmod.list)[i]
  
  c = min(length(a[[1]]@data), length(a[[2]]@data))
  
  if(c <= 75){
    
    overlap.coef = overlapEst(a[[1]]@data, a[[2]]@data, adjust = 0.8, type = "Dhat1")
    
  }else{
    
    overlap.coef = overlapEst(a[[1]]@data, a[[2]]@data, adjust = 1, type = "Dhat4")
    
  }
  
  
  if(c <= 75){ #calculate overlap estimate
    
    overlap.boot = bootstrap(a[[1]]@data, a[[2]]@data, nb = 10000, adjust = 0.8, type = "Dhat1")
    
    
  }else{
    
    overlap.boot = bootstrap(a[[1]]@data, a[[2]]@data, nb = 10000, adjust = 1, type = "Dhat4")
    
    
  }
  
  overlap.CI = bootCI(overlap.coef, overlap.boot, conf = 0.95) #calculate 95% CI of overlap estimate
  
  d = as.data.frame(overlap.CI)
  
  d = d["norm0",]
  
  e = as.data.frame(overlap.coef)
  
  f = cbind(e,d)
  
  f$guild = b
  
  overlap.list[[i]] = f
  names(overlap.list)[i] = b
  
}


#Keep environment clean!
rm(a,b,c,d,e,f,i,l,overlap.boot,overlap.CI,overlap.coef)

#Merge it with df
a = do.call(rbind, overlap.list)
df <- merge(df, a, by = 'guild')
rm(a, overlap.list)

Extract peak activity within intact and degraded forests

The peak activity refers to the time associated to maximum temporal activity density or in more simple terms, the time when a species/guild/community is most active. We first define a peak activity to be ‘nocturnal’, ‘diurnal’ and ‘crepuscular’ when the peak activity occurred within the night (1931 – 0429 hours; 9 hours total), day (0731 – 1629 hrs; 9 hours total) and dawn and/or dusk (0430 – 0730 hrs and/or 1630 – 1930 hrs; 6 hours total) respectively. A change of peak activity has occurred when there is a shift between ‘diurnal’, ‘nocturnal’ and ‘crepuscular’ hours. For instance, when a species has a peak activity at 0500 hours in intact forests while having a peak activity at 0800 hours in degraded forests, this shows that the species has shifted from crepuscular to diurnal hours, which is referred to a diurnal change in peak activities.

Firstly, we will need to ‘unlist’ actmod.list and create to a dataframe before extracting.

#Unlist actmod.list
act <- unlist(actmod.list)

#Create a vector for our column names
colnamestoextract = c("guild", "peak_activity_radians")

#Create a dataframe to fill
empty = as.data.frame(matrix(NA,nrow = length(act),ncol = 2))

#Apply the column names
colnames(empty) = colnamestoextract

Here, we will use a loop to extract the peak activities in radians from each of the actmods. This is usually called a S4 model extraction.

i=1

for(i in 1:length(act)){
  
  a = act[[i]] #Subset a term from the list called act
  
  b = names(act)[i] #Save the names of the term
  
  empty$guild[i] = b #Save the names of the term
  
  c = a@pdf #Extract the probability density function values
  
  d = as.data.frame(c) #Convert it into a dataframe
  
  e = filter(d, y == max(y)) # Remove other rows and now only contains maximum density values 
  
  empty$peak_activity_radians[i] = e$x # X will be the peak activity where most of our species detections (density) are found
  
}

#Keep environment clean
rm(a,b,c,d,e,i,colnamestoextract)

Now, we will convert radian times into our normal time format in hours: minutes: seconds and separate them by FLII status.

# Convert peak_activity in radians to seconds
empty <- empty %>% mutate(peak_activity_seconds = (peak_activity_radians*86400)/(2*pi))

#Convert seconds into time format
str(empty)

## 'data.frame':    18 obs. of  3 variables:
##  $ guild                : chr  "large_carnivore.Degraded" "large_carnivore.Intact" "large_herbivore.Degraded" "large_herbivore.Intact" ...
##  $ peak_activity_radians: num  4.57 1.73 5.04 4.88 1.82 ...
##  $ peak_activity_seconds: num  62775 23794 69356 67163 24975 ...

empty$peak_activity_seconds <- as.integer(empty$peak_activity_seconds)
empty <- empty %>% mutate(peak_activity = seconds_to_period(peak_activity_seconds))

#Select columns that we need
empty <- select(empty, guild, peak_activity)

#Create a dataframe with only degraded peak activities
degraded_peak <- empty[!grepl(".Intact", empty$guild),]
colnames(degraded_peak) <- c("guild", "peak_activity_degraded")

#Create a dataframe with only pristine peak actvities
intact_peak <- empty[!grepl(".Degraded", empty$guild),]
colnames(intact_peak) <- c("guild", "peak_activity_intact")

#Combine both of them!
intact_peak <- intact_peak %>% select(-guild)
peak_activity <- cbind(degraded_peak, intact_peak)

#Remove ".Degraded" to combine with p-values and overlaps later
peak_activity = peak_activity %>% 
  mutate(guild = str_remove_all(guild, ".Degraded"))

#keep environment clean
rm(act, degraded_peak, empty, intact_peak)

#Merge it with df
df <- merge(df, peak_activity, by = 'guild')

#Save the overall results!
write.csv(df, 'SEA_Activity_guild-level_results_20230310.csv', row.names = F)

#Keep environment clean
rm(peak_activity, df, caps)

Visualisation of Activity Patterns

Here, we will begin the process of visualizing activity curves using ggplot2(). But first, we nned to prepare the data before hand

Data preparation for visualisation

We need to extract the probability distribution function (pdf) from each actmod to plot the data. As usual, we will be using loops to do this.

#Create a empty list to store prepared data
pdf_cov = list()

i=1;k=1 #Change here to select different variables

for (i in 1:length(actmod.list)) {#repeat for each guild
  
  #Select a single guild and save the name
  a = actmod.list[[i]]
  b = names(actmod.list)[i]
  
  #Create an empty dataframe store multiple activity distributions here by matching the format of the pdf 
  c = data.frame(a[[1]]@pdf)
  c = c[0,]
  
  for (k in 1:length(a)) { #repeat for each status
    
    #Select a single status and save the name
    d = a[[k]]
    e = names(a)[k]
    
    #Extract the probability density function 
    f = data.frame(d@pdf)
    f$guild = b
    f$status = e
    
    #save this!
    c = rbind(c, f)
    
  }
  
  #save it!
  pdf_cov[[i]] = c
  names(pdf_cov)[i] = b
}

#Keep environment clean!
rm(a,b,c,d,e,f,i,k)

Visualisation

Feel free to adjust the themes, colours and fonts in ggplot2() to suit your taste.

#Save the plots here
cov_plot = list()

i=1 #Change here to select a different variable

for (i in 1:length(pdf_cov)) { #repeat for each guild
  
  #Select a single guild
  a = pdf_cov[[i]]
  b = names(pdf_cov)[i]
  
  #Visualise activity using ggplot
  plot =
    ggplot(a, aes(x=x, y=y, fill = status))+
    geom_ribbon(aes(ymin = lcl, ymax = ucl), alpha = 0.6)+
    scale_x_continuous(breaks = c(0, 3.14, 6.3), 
                       labels = c("Midnight", "Noon", "Midnight"))+
    coord_cartesian(ylim = c(0, 0.8))+ 
    annotate("rect", xmin = 0, xmax = 1.17, ymin = 0, ymax= c(0,0.8), color = "#333333", alpha = .4)+
    annotate("rect", xmin = 1.18, xmax = 1.96, ymin = 0, ymax= c(0,0.8), color = "grey", alpha = .1)+
    annotate("rect", xmin = 4.32, xmax = 5.1, ymin = 0, ymax= c(0,0.8), color = "grey", alpha = .1)+
    annotate("rect", xmin = 5.11, xmax = 6.3, ymin = 0, ymax= c(0,0.8), color = "#333333", alpha = .4)+
    theme_test()+
    scale_fill_manual(name = a$status, values = c("#FC6600", "#4169e1"))+
    theme(axis.title = element_blank(), axis.text = element_text(size = 24),
          legend.position  = 'none', panel.grid.major = element_blank(), 
          panel.grid.minor = element_blank(), panel.background = element_blank(), 
          axis.line = element_line(colour = "black"))
  
  #Save the plots
  cov_plot[[i]] = plot
  names(cov_plot)[i] = b
  
}

#Keep environment clean
#rm(a,b,i,plot)

Save the activity plots

#Save all the plots!

i=1

for(i in 1:length(cov_plot)){ #repeat for each guild
  
  # select a single plot from a guild
  a = cov_plot[[i]]
  b = names(cov_plot)[i] #save guild name
  
  path = paste0(b, "_20230310.PDF", sep = "")
  
  ggsave(path, a, height = 8, width = 14, units = "in")
  
  
} 

#Keep environment clean
rm(a,b,path,i)

Guild-level Temporal Shift Analysis

Samuel Xin Tham Lee

2023-03-08