Install Packages
# Packages needed for graph construction, plotting and date handling.
packages <- c(
  "igraph", "tidygraph", "ggraph", "ggrepel",
  "visNetwork", "lubridate", "tidyverse"
)

# Install any package that is not yet available, then attach it.
for (p in packages) {
  # requireNamespace() only checks availability; library() below does the
  # attaching and stops with an error if the installation did not succeed.
  if (!requireNamespace(p, quietly = TRUE)) {
    install.packages(p)
  }
  library(p, character.only = TRUE)
}
Data Import
# Read the node table from CSV (columns reported by readr: id, label,
# Department, Title).
GAStech_nodes <- read_csv(file = "data/GAStech_email_node.csv")
Parsed with column specification:
cols(
  id = col_double(),
  label = col_character(),
  Department = col_character(),
  Title = col_character()
)
# Read the email edge table from CSV (columns reported by readr: source,
# target, SentDate, SentTime, Subject, MainSubject, sourceLabel, targetLabel).
GAStech_edges <- read_csv(file = "data/GAStech_email_edge-v2.csv")
Parsed with column specification:
cols(
  source = col_double(),
  target = col_double(),
  SentDate = col_character(),
  SentTime = col_time(format = ""),
  Subject = col_character(),
  MainSubject = col_character(),
  sourceLabel = col_character(),
  targetLabel = col_character()
)
Data Wrangling
# Parse the day-month-year date strings, then derive the full (unabbreviated)
# weekday name of each email as an additional column.
GAStech_edges <- GAStech_edges %>%
  mutate(
    SentDate = dmy(SentDate),
    Weekday = wday(SentDate, label = TRUE, abbr = FALSE)
  )

# Count work-related emails per (source, target, Weekday) combination, then
# drop self-addressed emails and combinations that occur only once.
GAStech_edges_aggregated <- GAStech_edges %>%
  filter(MainSubject == "Work related") %>%
  group_by(source, target, Weekday) %>%
  summarise(Weight = n()) %>%
  filter(source != target, Weight > 1) %>%
  ungroup()

GAStech_edges_aggregated

# Combine the node table and the aggregated edge table into a directed graph.
GAStech_graph <- tbl_graph(
  nodes = GAStech_nodes,
  edges = GAStech_edges_aggregated,
  directed = TRUE
)

GAStech_graph
# A tbl_graph: 54 nodes and 1456 edges
#
# A directed multigraph with 1 component
#
# Node Data: 54 x 4 (active)
     id label            Department    Title
  <dbl> <chr>            <chr>         <chr>
1     1 Mat.Bramar       Administrati~ Assistant to CEO
2     2 Anda.Ribera      Administrati~ Assistant to CFO
3     3 Rachel.Pantanal  Administrati~ Assistant to CIO
4     4 Linda.Lagos      Administrati~ Assistant to COO
5     5 Ruscella.Mies.H~ Administrati~ Assistant to Engineering Gro~
6     6 Carla.Forluniau  Administrati~ Assistant to IT Group Manager
# ... with 48 more rows
#
# Edge Data: 1,456 x 4
   from    to Weekday   Weight
  <int> <int> <ord>      <int>
1     1     2 Monday         4
2     1     2 Tuesday        3
3     1     2 Wednesday      5
# ... with 1,453 more rows
# Make the edge table the active one and list it from heaviest to lightest
# Weight.
arrange(
  activate(GAStech_graph, edges),
  desc(Weight)
)
# A tbl_graph: 54 nodes and 1456 edges
#
# A directed multigraph with 1 component
#
# Edge Data: 1,456 x 4 (active)
   from    to Weekday Weight
  <int> <int> <ord>    <int>
1    40    41 Tuesday     23
2    40    43 Tuesday     19
3    41    43 Tuesday     15
4    41    40 Tuesday     14
5    42    41 Tuesday     13
6    42    40 Tuesday     12
# ... with 1,450 more rows
#
# Node Data: 54 x 4
     id label           Department     Title
  <dbl> <chr>           <chr>          <chr>
1     1 Mat.Bramar      Administration Assistant to CEO
2     2 Anda.Ribera     Administration Assistant to CFO
3     3 Rachel.Pantanal Administration Assistant to CIO
# ... with 51 more rows
Task 1: Static Organisation Graph
1.1 Original Network Graph
The original network graph from section 6.1 of Hands-on-Exercise 10 is as follows:
# Compute both centrality indices on the nodes in a single mutate(), then draw
# the baseline plot: plain edges, nodes coloured by closeness centrality and
# sized by betweenness centrality.
g <- GAStech_graph %>%
  mutate(
    betweenness_centrality = centrality_betweenness(),
    closeness_centrality = centrality_closeness()
  ) %>%
  ggraph(layout = "nicely") +
  geom_edge_link(aes()) +
  geom_node_point(
    aes(colour = closeness_centrality, size = betweenness_centrality)
  )

g + theme_graph()

The graph above shows the network of employees, with nodes encoded by closeness centrality and betweenness centrality. However, the aesthetics and clarity of the graph are still not satisfactory. It still relies on ggraph 1.0.
Negative remarks on clarity:
- It is not clear which employees have higher closeness centrality or betweenness centrality.
- Because all the edges look alike, it is not clear which connections carry more weight, i.e. which employees are more strongly connected with each other.
- At a glance, the graph conveys little information. For example, when do the employees interact? Which departments are they from?
Negative remarks on aesthetics:
- The nodes overlap one another, which makes some nodes hard to see.
- Not all nodes can be seen clearly because their colours blend with the black edges.
1.2 Sketch for Task 1
I have sketched the desired design to improve the aesthetics and clarity of the graph. The sketch contains two graphs: the first focuses on improving the aesthetics of the current design, while the second focuses on improving its clarity.

1.3 Final Design for Task 1
Graph 1
In the first graph, the following improvements were made:
1. The opacity of the nodes is reduced.
2. Labels are added for employees whose closeness centrality is very high.
3. A colour gradient is added: nodes with higher closeness centrality are shown in red, while nodes with lower closeness centrality are shown in yellow.
4. `width = Weight` is assigned in the edge aesthetic to show how much interaction takes place between employees.
# Graph 1: same centrality measures as the baseline plot, restyled for
# readability.
g <- GAStech_graph %>%
  mutate(
    betweenness_centrality = centrality_betweenness(),
    closeness_centrality = centrality_closeness()
  ) %>%
  ggraph(layout = "nicely") +
  # Faint edges whose width follows the email count between two employees.
  geom_edge_link(
    aes(width = Weight),
    colour = "black",
    alpha = 0.1,
    show.legend = FALSE
  ) +
  # Semi-transparent nodes so that overlapping ones remain visible.
  geom_node_point(
    aes(colour = closeness_centrality, size = betweenness_centrality),
    alpha = 0.7
  ) +
  scale_color_gradient(low = "yellow", high = "red") +
  # Label only the nodes whose closeness centrality exceeds 0.015.
  geom_node_label(
    aes(filter = closeness_centrality > 0.015, label = label),
    family = "serif",
    repel = TRUE,
    label.size = 0.25
  )

g + theme_graph()

Graph 2
Although the first graph has improved the overall aesthetics, it still does not tell us much about the network. Hence, I made a second graph to reveal more information. The second graph is faceted by department and weekday, so we can see when the most interaction occurs and which departments interact most with each other. Here are my findings from the second graph:
1. Based on the graph below, Hideki Cocinaro from the Security department has the highest number of interactions on Tuesday.
2. People from the Executive department do not interact with each other.
3. The interactions in the Administration and Information Technology departments do not vary much throughout the week.
# Graph 2: the centrality plot laid out with "fr", later faceted by weekday
# (rows) and department (columns).
g1 <- GAStech_graph %>%
  mutate(
    betweenness_centrality = centrality_betweenness(),
    closeness_centrality = centrality_closeness()
  ) %>%
  ggraph(layout = "fr") +
  # Edge width follows the email count between two employees.
  geom_edge_link(
    aes(width = Weight),
    colour = "black",
    alpha = 0.6,
    show.legend = FALSE
  ) +
  geom_node_point(
    aes(colour = closeness_centrality, size = betweenness_centrality),
    alpha = 0.5
  ) +
  scale_color_gradient(low = "yellow", high = "red") +
  # Every node keeps its true position; nodes at or below the 0.015 closeness
  # threshold get an empty label. ggrepel hides empty labels but still uses
  # those points to repel the visible ones, so labels avoid covering real
  # nodes instead of being pushed away from a phantom pile at (0, 0).
  geom_label_repel(
    aes(
      x = x,
      y = y,
      label = ifelse(closeness_centrality > 0.015, label, "")
    ),
    fontface = "bold",
    color = "black",
    size = 3,
    box.padding = 0.80,
    point.padding = 0.5,
    segment.colour = "white",
    na.rm = TRUE
  )

g1 + facet_graph(Weekday ~ Department, labeller = label_wrap_gen(width = 10))

Task 2: Interactive Organisation Graph
2.1 Further data preparation
# data prep
# Look up the node id of the sender and of the recipient through their labels,
# naming the two id columns `from` and `to`. Then count work-related emails
# per (from, to) pair, dropping self-addressed emails and pairs that occur
# only once.
GAStech_edges_aggregated <- GAStech_edges %>%
  left_join(GAStech_nodes, by = c("sourceLabel" = "label")) %>%
  rename(from = id) %>%
  left_join(GAStech_nodes, by = c("targetLabel" = "label")) %>%
  rename(to = id) %>%
  filter(MainSubject == "Work related") %>%
  group_by(from, to) %>%
  summarise(weight = n()) %>%
  filter(from != to, weight > 1) %>%
  ungroup()

# Rename Department to `group` on the node table.
# NOTE(review): presumably so visNetwork colours nodes by department; confirm
# against the visNetwork documentation.
GAStech_nodes <- rename(GAStech_nodes, group = Department)
2.2 Original Network Graph
The original network graph from section 7.4 of Hands-on-Exercise 10 is as follows:
# interactivity
# Baseline interactive network: "layout_with_fr" igraph layout, with
# nearest-neighbour highlighting and a node-id selection list enabled.
visNetwork(nodes = GAStech_nodes, edges = GAStech_edges_aggregated) %>%
  visIgraphLayout(layout = "layout_with_fr") %>%
  visOptions(highlightNearest = TRUE, nodesIdSelection = TRUE)
The graph above adds an interactivity element. The user can choose the name of an employee, and the connections related to that employee are then highlighted. Besides using the drop-down list, the user can also trigger the highlight by clicking on a node directly. However, there are a few problems with this graph:
1. Nodes are highlighted without showing exactly who the employees are. In order to see the label (name), the user has to zoom in.
2. Even after zooming in, the labels cannot be seen clearly because they are mixed in with the edges.
3. The colours of the nodes are not explained. What do red, green, blue, yellow and purple refer to?
2.3 Sketch for Task 2
For the following sketch, I have improved the aesthetics and the clarity of the previous graph.
2.4 Final Design for Task 2
In the improved graph, the following changes were made:
1. A legend is added to show clearly which department each employee belongs to. The departments are also differentiated by colour.
2. Instead of a circle, the shape of each node is changed to a box. This way, the labels can be seen clearly without overlapping the edges.
3. A tooltip is added for more interactivity when the user hovers over a node. The tooltip shows the name of the employee clearly in case nodes overlap each other.
4. Arrows are added to the edges to show the direction of each link.
5. A title is added to show clearly what the graph is about, and the description of the drop-down list is changed.
# Copy each employee's name into `title`, the column this notebook uses as the
# hover tooltip text. as.character() keeps the coercion that the original
# single-argument paste0() call performed.
GAStech_nodes$title <- as.character(GAStech_nodes$label)

# Improved interactive network: titled widget, directed straight edges, box
# nodes with large labels, neighbour highlighting on click, a relabelled
# selection list and a legend.
visNetwork(
  GAStech_nodes,
  GAStech_edges_aggregated,
  main = "Task 2: Interactive Network Graph"
) %>%
  visIgraphLayout(layout = "layout_with_fr") %>%
  visEdges(arrows = "to", smooth = FALSE) %>%
  visPhysics(stabilization = FALSE) %>%
  visInteraction(dragNodes = TRUE, dragView = TRUE, zoomView = FALSE) %>%
  visNodes(shape = "box", labelHighlightBold = TRUE, font = list(size = 30)) %>%
  visOptions(
    # Spelled-out TRUE/FALSE: the T/F shorthands are ordinary variables that
    # can be reassigned.
    highlightNearest = list(
      enabled = TRUE,
      degree = list(from = 1, to = 1),
      hover = FALSE,
      algorithm = "hierarchical"
    ),
    nodesIdSelection = list(enabled = TRUE, main = "Employees' name")
  ) %>%
  visLegend(zoom = FALSE) %>%
  addFontAwesome()
