This template is based in this paper
https://revistas.ucm.es/index.php/REVE/article/view/75566/4564456557467
For a detail explanation of how to use it, please watch this video
wos_scopus_tos <-
tosr::tosr_load("Scopus_2000.bib",
"WoS_1.txt",
"WoS_2.txt",
"WoS_3.txt")
[1] 4
Converting your scopus collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
735 duplicated documents have been removed
tree_of_science <-
tosr::tosR("Scopus_2000.bib",
"WoS_1.txt",
"WoS_2.txt",
"WoS_3.txt")
[1] 4
Converting your scopus collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
735 duplicated documents have been removed
Computing TOS SAP
Computing TOS subfields
wos <-
bibliometrix::convert2df(c("WoS_1.txt",
"WoS_2.txt",
"WoS_3.txt")) # create dataframe from wos file
Converting your wos collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
scopus <-
bibliometrix::convert2df("Scopus_2000.bib", # Create dataframe from scopus file
dbsource = "scopus",
format = "bibtex")
Converting your scopus collection into a bibliographic dataframe
Done!
Generating affiliation field tag AU_UN from C1: Done!
table_1 <-
tibble(wos = length(wos$SR), # Create a dataframe with the values.
scopus = length(scopus$SR),
total = length(wos_scopus_tos$df$SR))
table_1
main_languages <-
wos_scopus_tos$df |>
select(LA) |>
separate_rows(LA, sep = "; ") |>
count(LA, sort = TRUE) |>
slice(1:5)
other_languages <-
wos_scopus_tos$df |>
separate_rows(LA, sep = "; ") |>
select(LA) |>
count(LA, sort = TRUE) |>
slice(6:n) |>
summarise(n = sum(n)) |>
mutate(LA = "OTHERS") |>
select(LA, n)
Warning in 6:n :
numerical expression has 25 elements: only the first used
languages <-
main_languages |>
bind_rows(other_languages) |>
mutate(percentage = n / sum(n),
percentage = round(percentage,
digits = 2) ) |>
rename(language = LA) |>
select(language, percentage, count = n)
languages
df <- languages |>
rename(value = percentage, group = language) |>
mutate(value = value * 100) |>
select(value, group)
df2 <- df %>%
mutate(csum = rev(cumsum(rev(value))),
pos = value/2 + lead(csum, 1),
pos = if_else(is.na(pos), value/2, pos))
ggplot(df, aes(x = 2 , y = value, fill = fct_inorder(group))) +
geom_col(width = 1, color = 1) +
coord_polar(theta = "y") +
geom_label_repel(data = df2,
aes(y = pos, label = paste0(value, "%")),
size = 4.5, nudge_x = 1, show.legend = FALSE) +
theme(panel.background = element_blank(),
axis.line = element_blank(),
axis.text = element_blank(),
axis.ticks = element_blank(),
axis.title = element_blank(),
plot.title = element_text(hjust = 0.5, size = 18)) +
labs(title = "Languages") +
guides(fill = guide_legend(title = "")) +
theme_void() +
xlim(0.5, 2.5)
wos_anual_production <-
wos |>
select(PY) |>
count(PY, sort = TRUE) |>
na.omit() |>
filter(PY >= 2000,
PY < year(today())) |>
mutate(ref_type = "wos")
scopus_anual_production <-
scopus |>
select(PY) |>
count(PY, sort = TRUE) |>
na.omit() |>
filter(PY >= 2000,
PY < year(today())) |>
mutate(ref_type = "scopus")
total_anual_production <-
wos_scopus_tos$df |>
select(PY) |>
count(PY, sort = TRUE) |>
na.omit() |>
filter(PY >= 2000,
PY < year(today())) |>
mutate(ref_type = "total")
wos_scopus_total_annual_production <-
wos_anual_production |>
bind_rows(scopus_anual_production,
total_anual_production)
figure_2_data <-
wos_scopus_total_annual_production |>
mutate(PY = replace_na(PY, replace = 0)) |>
pivot_wider(names_from = ref_type,
values_from = n) |>
arrange(desc(PY))
figure_2_data
```r
wos_scopus_total_annual_production |>
ggplot(aes(x = PY, y = n, color = ref_type)) +
geom_line() +
labs(title = \Annual Scientific Production\,
x = \years\,
y = \papers\) +
theme(plot.title = element_text(hjust = 0.5))
<!-- rnb-source-end -->
<!-- rnb-plot-begin -->
<img src="" />
<!-- rnb-plot-end -->
<!-- rnb-chunk-end -->
<!-- rnb-text-begin -->
## Table 2. Country production
<!-- rnb-text-end -->
<!-- rnb-chunk-begin -->
<!-- rnb-source-begin eyJkYXRhIjoiYGBgclxuZGF0YV9iaWJsaW9fd29zIDwtIGJpYmxpb0FuYWx5c2lzKHdvcylcblxud29zX2NvdW50cnkgPC0gXG4gIGRhdGFfYmlibGlvX3dvcyRDb3VudHJpZXMgfD4gXG4gIGRhdGEuZnJhbWUoKSB8PiBcbiAgbXV0YXRlKGRhdGFiYXNlID0gXCJ3b3NcIikgfD4gXG4gIHNlbGVjdChjb3VudHJ5ID0gVGFiLCBwYXBlcnMgPSBGcmVxLCBkYXRhYmFzZSApIHw+IFxuICBhcnJhbmdlKGRlc2MocGFwZXJzKSkgXG5cbmRhdGFfYmlibGlvX3Njb3B1cyA8LSBiaWJsaW9BbmFseXNpcyhzY29wdXMpXG5cbnNjb3B1c19jb3VudHJ5IDwtIFxuICBkYXRhX2JpYmxpb19zY29wdXMkQ291bnRyaWVzIHw+IFxuICBkYXRhLmZyYW1lKCkgfD4gXG4gIG11dGF0ZShkYXRhYmFzZSA9IFwic2NvcHVzXCIpIHw+IFxuICBzZWxlY3QoY291bnRyeSA9IFRhYiwgcGFwZXJzID0gRnJlcSwgZGF0YWJhc2UgKSB8PiBcbiAgYXJyYW5nZShkZXNjKHBhcGVycykpIFxuXG5kYXRhX2JpYmxpb190b3RhbCA8LSBiaWJsaW9BbmFseXNpcyh3b3Nfc2NvcHVzX3RvcyRkZilcblxudG90YWxfY291bnRyeSA8LSBcbiAgZGF0YV9iaWJsaW9fdG90YWwkQ291bnRyaWVzIHw+IFxuICBkYXRhLmZyYW1lKCkgfD4gXG4gIG11dGF0ZShkYXRhYmFzZSA9IFwidG90YWxcIikgfD4gXG4gIHNlbGVjdChjb3VudHJ5ID0gVGFiLCBwYXBlcnMgPSBGcmVxLCBkYXRhYmFzZSApIHw+IFxuICBhcnJhbmdlKGRlc2MocGFwZXJzKSkgXG5cbndvc19zY29wdXNfdG90YWxfY291bnRyeSA8LSBcbiAgd29zX2NvdW50cnkgfD4gXG4gIGJpbmRfcm93cyhzY29wdXNfY291bnRyeSwgXG4gICAgICAgICAgICB0b3RhbF9jb3VudHJ5KSB8PiBcbiAgbXV0YXRlKGNvdW50cnkgPSBhcy5jaGFyYWN0ZXIoY291bnRyeSkpIHw+IFxuICBwaXZvdF93aWRlcihuYW1lc19mcm9tID0gZGF0YWJhc2UsIFxuICAgICAgICAgICAgICB2YWx1ZXNfZnJvbSA9IHBhcGVycykgfD4gXG4gIGFycmFuZ2UoZGVzYyh0b3RhbCkpIHw+IFxuICBzbGljZSgxOjEwKSB8PiBcbiAgbXV0YXRlKHBlcmNlbnRhZ2UgPSB0b3RhbCAvICh0YWJsZV8xIHw+IHB1bGwodG90YWwpKSxcbiAgICAgICAgIHBlcmNlbnRhZ2UgPSByb3VuZChwZXJjZW50YWdlLCBkaWdpdHMgPSAyKSlcblxud29zX3Njb3B1c190b3RhbF9jb3VudHJ5XG5gYGAifQ== -->
```r
data_biblio_wos <- biblioAnalysis(wos)
wos_country <-
data_biblio_wos$Countries |>
data.frame() |>
mutate(database = "wos") |>
select(country = Tab, papers = Freq, database ) |>
arrange(desc(papers))
data_biblio_scopus <- biblioAnalysis(scopus)
scopus_country <-
data_biblio_scopus$Countries |>
data.frame() |>
mutate(database = "scopus") |>
select(country = Tab, papers = Freq, database ) |>
arrange(desc(papers))
data_biblio_total <- biblioAnalysis(wos_scopus_tos$df)
total_country <-
data_biblio_total$Countries |>
data.frame() |>
mutate(database = "total") |>
select(country = Tab, papers = Freq, database ) |>
arrange(desc(papers))
wos_scopus_total_country <-
wos_country |>
bind_rows(scopus_country,
total_country) |>
mutate(country = as.character(country)) |>
pivot_wider(names_from = database,
values_from = papers) |>
arrange(desc(total)) |>
slice(1:10) |>
mutate(percentage = total / (table_1 |> pull(total)),
percentage = round(percentage, digits = 2))
wos_scopus_total_country
wos_journal <-
wos |>
select(journal = SO) |>
na.omit() |>
count(journal, sort = TRUE) |>
slice(1:20) |>
rename(publications = n) |>
mutate(database = "wos")
scopus_journal <-
scopus |>
select(journal = SO) |>
na.omit() |>
count(journal, sort = TRUE) |>
slice(1:20) |>
rename(publications = n) |>
mutate(database = "scopus")
total_journal <-
wos_scopus_tos$df |>
select(journal = SO) |>
na.omit() |>
count(journal, sort = TRUE) |>
slice(1:20) |>
rename(publications = n) |>
mutate(database = "total")
wos_scopus_total_journal <-
wos_journal |>
bind_rows(scopus_journal,
total_journal) |>
pivot_wider(names_from = database,
values_from = publications) |>
arrange(desc(total)) |>
slice(1:10) |>
mutate(percentage = total / table_1 |> pull(total),
percentage = round(percentage, digits = 2))
wos_scopus_total_journal
wos_scopus_country_collab_matrix <-
biblioNetwork(M = wos_scopus_tos$df,
analysis = "collaboration",
network = "countries")
plot_country_collab <-
networkPlot(wos_scopus_country_collab_matrix,
weighted=T, n = 30,
Title = "Country Collaboration Network",
type = "fruchterman",
size=T,
edgesize = 5,
labelsize=0.7)
country_collab_tbl_graph <-
graph_from_adjacency_matrix(wos_scopus_country_collab_matrix ,
mode = "undirected",
weighted = TRUE,
diag = FALSE) |>
as_tbl_graph(aca_igraph, directed = FALSE ) |>
activate(nodes) |>
mutate(degree = centrality_degree()) |>
arrange(desc(degree)) |>
slice(1:30)
country_collab_tbl_graph_filtered <-
country_collab_tbl_graph |>
activate(nodes) |>
mutate(components = group_components(type = "weak")) |>
filter(components == 1) |>
mutate(degree = centrality_degree(),
community = as.factor(group_louvain()) )
country_collab_tbl_graph_filtered |>
ggraph(layout = "kk") +
geom_edge_link(alpha = .25,
aes(width = weight)) +
geom_node_point(aes(colour = community,
size = degree)) +
geom_node_text(aes(label = name), repel = TRUE) +
theme_graph()
wos_scopus_keyword_co_occurrence_matrix <-
biblioNetwork(M = wos_scopus_tos$df,
analysis = "co-occurrences",
network = "keywords",
sep = ";")
plot_net_co_occurrence <-
networkPlot(wos_scopus_keyword_co_occurrence_matrix,
weighted=T, n = 30,
Title = "Keyword Co-occurrence Network",
type = "fruchterman",
size=T,
edgesize = 5,
labelsize=0.7)
keyword_co_occurrence_tbl_graph <-
graph_from_adjacency_matrix(wos_scopus_keyword_co_occurrence_matrix ,
mode = "undirected",
weighted = TRUE,
diag = FALSE) |>
as_tbl_graph(aca_igraph, directed = FALSE ) |>
activate(nodes) |>
mutate(degree = centrality_degree()) |>
arrange(desc(degree)) |>
slice(1:30)
keyword_co_occurrence_weight_tbl <-
keyword_co_occurrence_tbl_graph |>
activate(edges) |>
select(weight) |>
as.data.frame()
threshold <-
quantile(keyword_co_occurrence_weight_tbl |>
select(weight) |>
pull(),
probs = 0.80)
keyword_co_occurrence_tbl_graph_filtered <-
keyword_co_occurrence_tbl_graph |>
activate(edges) |>
filter(weight >= threshold) |>
activate(nodes) |>
mutate(components = group_components(type = "weak")) |>
filter(components == 1) |>
mutate(degree = centrality_degree(),
community = as.factor(group_louvain()) )
keyword_co_occurrence_tbl_graph_filtered |>
ggraph(layout = "kk") +
geom_edge_link(alpha = .25,
aes(width = weight)) +
geom_node_point(aes(colour = community,
size = degree)) +
geom_node_text(aes(label = name), repel = TRUE) +
theme_graph()
tree_of_science
Finding the clusters
nodes <- # Create a dataframe with the fullname of articles
tibble(name = V(wos_scopus_tos$graph)$name) |>
left_join(wos_scopus_tos$nodes,
by = c("name" = "ID_TOS"))
wos_scopus_citation_network_1 <- # Add the article names to the citation network
wos_scopus_tos$graph |>
igraph::set.vertex.attribute(name = "full_name",
index = V(wos_scopus_tos$graph)$name,
value = nodes$CITE)
nodes_1 <- # Create a dataframe with subfields (clusters)
tibble(name = V(wos_scopus_citation_network_1)$name,
cluster = V(wos_scopus_citation_network_1)$subfield,
full_name = V(wos_scopus_citation_network_1)$full_name)
nodes_2 <- # Count the number of articles per cluster
nodes_1 |>
count(cluster, sort = TRUE) |>
mutate(cluster_1 = row_number()) |>
select(cluster, cluster_1)
nodes_3 <-
nodes_1 |>
left_join(nodes_2) |>
rename(subfield = cluster_1) |>
select(name, full_name, subfield)
Joining, by = "cluster"
edge_list <-
get.edgelist(wos_scopus_citation_network_1) |>
data.frame() |>
rename(Source = X1, Target = X2)
wos_scopus_citation_network <-
graph.data.frame(d = edge_list,
directed = TRUE,
vertices = nodes_3)
wos_scopus_citation_network |>
summary()
IGRAPH 51794e1 DN-- 7356 16320 --
+ attr: name (v/c), full_name (v/c), subfield (v/n)
Choosing clusters
We proposed the tipping point option to choose the number of clusters. See this paper:
https://www.nature.com/articles/s41598-021-85041-8
clusters <-
tibble(cluster = V(wos_scopus_citation_network)$subfield) |>
count(cluster, sort = TRUE)
clusters |>
ggplot(aes(x = reorder(cluster, n), y = n)) +
geom_point(size = 3) +
labs(x = "Clusters", y = "Number of papers") +
theme(axis.title.x = element_text(size = 16 ,
family = "Arial"),
axis.title.y = element_text(size = 16, family = "Arial"),
axis.text.x = element_text(size = 12, family = "Arial"),
axis.text.y = element_text(size = 12, family = "Arial"))
Removing not chosen clusters
wos_scopus_citation_network_clusters <-
wos_scopus_citation_network |>
delete.vertices(which(V(wos_scopus_citation_network)$subfield != 1 & # filter clusters
V(wos_scopus_citation_network)$subfield != 2 &
V(wos_scopus_citation_network)$subfield != 3 &
V(wos_scopus_citation_network)$subfield != 4))
wos_scopus_citation_network_clusters |>
summary()
IGRAPH 6e3a93b DN-- 3521 7905 --
+ attr: name (v/c), full_name (v/c), subfield (v/n)
pal <- brewer.pal(8,"Dark2")
nodes_full_data <-
tibble(name = V(wos_scopus_citation_network)$name,
cluster = V(wos_scopus_citation_network)$subfield,
full_name = V(wos_scopus_citation_network)$full_name)
cluster_1 <-
wos_scopus_citation_network |>
delete.vertices(which(V(wos_scopus_citation_network)$subfield != 1))
cluster_1_page_rank <-
cluster_1 |>
set.vertex.attribute(name = "page_rank",
value = page_rank(cluster_1)$vector)
cluster_1_df <-
tibble(name = V(cluster_1_page_rank)$name,
full_name = V(cluster_1_page_rank)$full_name,
page_rank = V(cluster_1_page_rank)$page_rank,
cluster = V(cluster_1_page_rank)$subfield,)
nodes_full_data |>
filter(cluster == 1) |>
select(full_name) |>
mutate(full_name = str_extract(full_name, SPC %R% # Regular expressions
one_or_more(WRD) %R%
SPC %R%
one_or_more(or(WRD, ANY_CHAR))),
full_name = str_remove(full_name, OPEN_PAREN %R%
repeated(DGT, 4) %R%
CLOSE_PAREN %R%
one_or_more(or(WRD,ANY_CHAR))),
full_name = str_trim(full_name)) |>
unnest_tokens(output = word, input = full_name) |> # Tokenization
anti_join(stop_words) |> # Removing stop words
filter(word != "doi",
!str_detect(word, "[0-9]")) |> # WoS data
filter(word == str_remove(word, pattern = "citation"),
word == str_remove(word, pattern = "research"), # Words removed
word == str_remove(word, pattern = "analysis"),
word == str_remove(word, pattern = "science"),
word == str_remove(word, pattern = "scientometric"),
word == str_remove(word, pattern = "management"),
word == str_remove(word, pattern = "bibliometric"),
word == str_remove(word, pattern = "review"),
word == str_remove(word, pattern = "journal")) |>
count(word, sort = TRUE) |>
with(wordcloud(word,
n,
random.order = FALSE,
max.words = 50,
colors=pal))
Joining, by = "word"
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
performance could not be fit on page. It will not be plotted.
cluster_2 <-
wos_scopus_citation_network |>
delete.vertices(which(V(wos_scopus_citation_network)$subfield != 2))
cluster_2_page_rank <-
cluster_2 |>
set.vertex.attribute(name = "page_rank",
value = page_rank(cluster_2)$vector)
cluster_2_df <-
tibble(name = V(cluster_2_page_rank)$name,
full_name = V(cluster_2_page_rank)$full_name,
page_rank = V(cluster_2_page_rank)$page_rank,
cluster = V(cluster_2_page_rank)$subfield,)
nodes_full_data |>
filter(cluster == 2) |>
select(full_name) |>
mutate(full_name = str_extract(full_name, SPC %R% # Regular expressions
one_or_more(WRD) %R%
SPC %R%
one_or_more(or(WRD, ANY_CHAR))),
full_name = str_remove(full_name, OPEN_PAREN %R%
repeated(DGT, 4) %R%
CLOSE_PAREN %R%
one_or_more(or(WRD,ANY_CHAR))),
full_name = str_trim(full_name)) |>
unnest_tokens(output = word, input = full_name) |>
anti_join(stop_words) |>
filter(word != "doi",
!str_detect(word, "[0-9]")) |> # WoS data
filter(word == str_remove(word, pattern = "citation"),
word == str_remove(word, pattern = "research"),
word == str_remove(word, pattern = "analysis"),
word == str_remove(word, pattern = "science"),
word == str_remove(word, pattern = "scientometric"),
word == str_remove(word, pattern = "vulnerability")) |>
count(word, sort = TRUE) |>
with(wordcloud(word,
n,
random.order = FALSE,
max.words = 50,
colors=pal))
Joining, by = "word"
cluster_3 <-
wos_scopus_citation_network |>
delete.vertices(which(V(wos_scopus_citation_network)$subfield != 3))
cluster_3_page_rank <-
cluster_3 |>
set.vertex.attribute(name = "page_rank",
value = page_rank(cluster_3)$vector)
cluster_3_df <-
tibble(name = V(cluster_3_page_rank)$name,
full_name = V(cluster_3_page_rank)$full_name,
page_rank = V(cluster_3_page_rank)$page_rank,
cluster = V(cluster_3_page_rank)$subfield,)
nodes_full_data |>
filter(cluster == 3) |>
select(full_name) |>
mutate(full_name = str_extract(full_name, SPC %R% # Regular expressions
one_or_more(WRD) %R%
SPC %R%
one_or_more(or(WRD, ANY_CHAR))),
full_name = str_remove(full_name, OPEN_PAREN %R%
repeated(DGT, 4) %R%
CLOSE_PAREN %R%
one_or_more(or(WRD,ANY_CHAR))),
full_name = str_trim(full_name)) |>
unnest_tokens(output = word, input = full_name) |>
anti_join(stop_words) |>
filter(word != "doi",
!str_detect(word, "[0-9]")) |> # WoS data
filter(word == str_remove(word, pattern = "citation"),
word == str_remove(word, pattern = "research"),
word == str_remove(word, pattern = "analysis"),
word == str_remove(word, pattern = "science"),
word == str_remove(word, pattern = "scientometric"),
word == str_remove(word, pattern = "vulnerability"),
word == str_remove(word, pattern = "journal"),
word == str_remove(word, pattern = "information")) |>
count(word, sort = TRUE) |>
with(wordcloud(word,
n,
random.order = FALSE,
max.words = 50,
colors=pal))
Joining, by = "word"
cluster_4 <-
wos_scopus_citation_network |>
delete.vertices(which(V(wos_scopus_citation_network)$subfield != 4))
cluster_4_page_rank <-
cluster_4 |>
set.vertex.attribute(name = "page_rank",
value = page_rank(cluster_4)$vector)
cluster_4_df <-
tibble(name = V(cluster_4_page_rank)$name,
full_name = V(cluster_4_page_rank)$full_name,
page_rank = V(cluster_4_page_rank)$page_rank,
cluster = V(cluster_4_page_rank)$subfield,)
nodes_full_data |>
filter(cluster == 4) |>
select(full_name) |>
mutate(full_name = str_extract(full_name, SPC %R% # Regular expressions
one_or_more(WRD) %R%
SPC %R%
one_or_more(or(WRD, ANY_CHAR))),
full_name = str_remove(full_name, OPEN_PAREN %R%
repeated(DGT, 4) %R%
CLOSE_PAREN %R%
one_or_more(or(WRD,ANY_CHAR))),
full_name = str_trim(full_name)) |>
unnest_tokens(output = word, input = full_name) |>
anti_join(stop_words) |>
filter(word != "doi",
!str_detect(word, "[0-9]")) |> # WoS data
filter(word == str_remove(word, pattern = "citation"),
word == str_remove(word, pattern = "research"),
word == str_remove(word, pattern = "analysis"),
word == str_remove(word, pattern = "science"),
word == str_remove(word, pattern = "scientometric"),
word == str_remove(word, pattern = "vulnerability")) |>
count(word, sort = TRUE) |>
with(wordcloud(word,
n,
random.order = FALSE,
max.words = 50,
colors=pal))
Joining, by = "word"
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
university could not be fit on page. It will not be plotted.
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
academic could not be fit on page. It will not be plotted.
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
universities could not be fit on page. It will not be plotted.
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
education could not be fit on page. It will not be plotted.
Warning in wordcloud(word, n, random.order = FALSE, max.words = 50, colors = pal) :
performance could not be fit on page. It will not be plotted.
write_csv(wos_scopus_tos$df, "wos_scopus_tos.csv") # Exporting all data merged
write_csv(table_1, "table_1.csv") # Exporting table 1
write_csv(wos_scopus_total_country, "table_2_.csv") # Exporting table 2
write_csv(wos_scopus_authors, "table_3.csv") # Exporting table 3
write_csv(wos_scopus_total_journal, "table_4.csv") # Exporting table 4
write_csv(languages, "figure_1.csv") # Exporting data figure 1
write_csv(figure_2_data, "figure_2.csv") # Exporting data figure 2
write.graph(wos_scopus_citation_network, "citation_network_full.graphml", "graphml") # Exporting graph
write.graph(wos_scopus_citation_network_clusters,
"wos_scopus_citation_network_clusters.graphml",
"graphml")
aca_graphml_nodes <-
aca_tbl_graph_filtered |>
activate(nodes) |>
as_tibble() |>
rename(author = name) |>
rownames_to_column("name")
aca_graphml_edges <-
aca_tbl_graph_filtered |>
activate(edges) |>
as_tibble()
aca_graphml <-
graph_from_data_frame(d = aca_graphml_edges,
directed = FALSE,
vertices = aca_graphml_nodes)
write_graph(aca_graphml, "aca_graph.graphml", "graphml") # Export author co-citation graph
author_collab_graphml_nodes <-
author_collab_tbl_graph_filtered |>
activate(nodes) |>
as_tibble() |>
rename(author = name) |>
rownames_to_column("name")
author_collab_graphml_edges <-
author_collab_tbl_graph_filtered |>
activate(edges) |>
as_tibble()
author_collab_graphml <-
graph_from_data_frame(d = author_collab_graphml_edges,
directed = FALSE,
vertices = author_collab_graphml_nodes)
write_graph(author_collab_graphml, "author_collab_graphml.graphml", "graphml") # Export author co-citation graph
country_collab_graphml_nodes <-
country_collab_tbl_graph_filtered |>
activate(nodes) |>
as_tibble() |>
rename(author = name) |>
rownames_to_column("name")
country_collab_graphml_edges <-
country_collab_tbl_graph_filtered |>
activate(edges) |>
as_tibble()
country_collab_graphml <-
graph_from_data_frame(d = country_collab_graphml_edges,
directed = FALSE,
vertices = country_collab_graphml_nodes)
write_graph(country_collab_graphml, "country_collab_graphml.graphml", "graphml") # Export author co-citation graph
keyword_co_occurrence_graphml_nodes <-
keyword_co_occurrence_tbl_graph_filtered |>
activate(nodes) |>
as_tibble() |>
rename(author = name) |>
rownames_to_column("name")
keyword_co_occurrence_graphml_edges <-
keyword_co_occurrence_tbl_graph_filtered |>
activate(edges) |>
as_tibble()
keyword_co_occurrence_graphml <-
graph_from_data_frame(d = keyword_co_occurrence_graphml_edges,
directed = FALSE,
vertices = keyword_co_occurrence_graphml_nodes)
write_graph(keyword_co_occurrence_graphml, "keyword_co_occurrence_graphml.graphml", "graphml") # Export author co-citation graph
write.csv(tree_of_science, "tree_of_science.csv") # Exporting Tree of Science
write.csv(cluster_1_df, "cluster_1.csv") # Exporting cluster 1
write.csv(cluster_2_df, "cluster_2.csv") # Exporting cluster 2
write.csv(cluster_3_df, "cluster_3.csv") # Exporting cluster 3
write.csv(cluster_4_df, "cluster_4.csv") # Exporting cluster 4
write.csv(nodes_full_data, "nodes_full_data.csv") # Exporting all nodes