Spaces:
Running
Running
#' Build the node table for an author-publication network
#'
#' Searches OpenAlex works by title keyword (only works with more than 50
#' citations, published inside the given date window, sorted by citation
#' count descending) and returns one node per distinct author name followed
#' by one node per distinct publication title.
#'
#' Side effects (kept from the original implementation): attaches
#' `openalexR` and `tidyverse`, and sets the `openalexR.mailto` option.
#'
#' @param keywords Search terms forwarded to `title.search`.
#' @param pub_start_date Forwarded to `from_publication_date`.
#' @param pub_end_date Forwarded to `to_publication_date`.
#' @return A data frame with columns `Id` (1..n), `Nodes` and `Label`
#'   (`Label` duplicates `Nodes`). Author nodes come first, then publication
#'   nodes. Zero rows when the search yields no works.
authorPubNodes <- function(keywords, pub_start_date, pub_end_date) {
  # Thin wrapper around the OpenAlex query.
  search_engine <- function(keywords, pub_start_date, pub_end_date) {
    suppressPackageStartupMessages(library(openalexR))
    suppressPackageStartupMessages(library(tidyverse))
    # NOTE(review): this address looks like a redacted placeholder --
    # confirm the real contact e-mail before deploying.
    options(openalexR.mailto = "[email protected]")
    oa_fetch(
      entity = "works",
      title.search = keywords,
      cited_by_count = ">50",
      from_publication_date = pub_start_date,
      to_publication_date = pub_end_date,
      options = list(sort = "cited_by_count:desc"),
      verbose = FALSE
    )
  }
  search_data <- search_engine(keywords, pub_start_date, pub_end_date)

  # An empty search (NULL or zero rows) yields an empty node table instead
  # of the subscript error the old `1:nrow()` loops produced.
  if (NROW(search_data) == 0L) {
    return(data.frame(
      Id = integer(0),
      Nodes = character(0),
      Label = character(0)
    ))
  }

  missing_cols <- setdiff(c("author", "display_name"), names(search_data))
  if (length(missing_cols) > 0L) {
    stop(
      "Search result is missing expected column(s): ",
      paste(missing_cols, collapse = ", "),
      call. = FALSE
    )
  }

  # Author names for each work. The name is read from the 2nd column of the
  # per-work author table, exactly as before (presumably the author display
  # name -- confirm against the installed openalexR version). Works without
  # an author table contribute no authors, so the per-work counts always
  # stay aligned with the rows of `search_data`.
  author_names <- lapply(search_data$author, function(author_tbl) {
    if (is.data.frame(author_tbl) && ncol(author_tbl) >= 2L) {
      as.character(author_tbl[[2]])
    } else {
      character(0)
    }
  })
  all_authors <- unlist(author_names, use.names = FALSE)

  # Repeat each title once per author of that work, so a work without
  # authors adds no publication node either.
  all_publications <- rep(
    as.character(search_data$display_name),
    times = lengths(author_names)
  )

  # De-duplicate authors and publications separately (an author whose name
  # equals a title still gets its own node), authors first.
  node_values <- c(unique(all_authors), unique(all_publications))

  data.frame(
    Id = seq_along(node_values),
    Nodes = node_values,
    Label = node_values
  )
}