OpenAlex4Gephi

Running

App Files Files Community

OpenAlex4Gephi / OpenAlexNodes.R

Ifeanyi

Upload 3 files

5fd4781 almost 2 years ago

raw

history blame

2.46 kB

	authorPubNodes <- function(keywords,pub_start_date,pub_end_date){

	keywords <- keywords
	pub_start_date <- pub_start_date
	pub_end_date <- pub_end_date

	# create search engine function
	search_engine <- function(keywords,pub_start_date,pub_end_date){
	suppressPackageStartupMessages(library(openalexR))
	suppressPackageStartupMessages(library(tidyverse))

	options(openalexR.mailto = "[email protected]")

	# search engine
	works_search <- oa_fetch(
	entity = "works",
	title.search = keywords,
	cited_by_count = ">50",
	from_publication_date = pub_start_date,
	to_publication_date = pub_end_date,
	options = list(sort = "cited_by_count:desc"),
	verbose = FALSE
	)

	return(works_search)

	}

	search_data <- search_engine(keywords,pub_start_date,pub_end_date)


	# grab authors and group them according to collaboration
	authors_collaboration_groups <- list()
	for (i in 1:nrow(search_data)){
	authors_collaboration_groups[[i]] <- search_data$author[[i]][2]
	}

	# grab all authors
	all_authors <- c()
	for (i in 1:length(authors_collaboration_groups)) {
	all_authors <- c(all_authors,authors_collaboration_groups[[i]][[1]])
	}

	# get length of each authors collaboration
	authors_length <- c()
	for(authors in 1:length(authors_collaboration_groups)){
	authors_length <- c(authors_length,authors_collaboration_groups[[authors]] \|> nrow())
	}

	# grab all publications
	publications <- list()
	for (i in 1:nrow(search_data)){
	publications[[i]] <- rep(search_data$display_name[i], each = authors_length[i])
	}

	# place all publications in a vector
	all_publications <- c()
	for(i in 1:length(publications)){
	all_publications <- c(all_publications,publications[[i]])
	}

	# create author_to_publication data frame
	authors_to_publications <- data.frame(
	Authors = all_authors,
	Publications = all_publications
	)

	# stack the df so that authors and publications
	# are together as one column
	stacked_df <- stack(authors_to_publications)
	stacked_df <- unique.data.frame(stacked_df) # remove duplicate rows
	stacked_df <- stacked_df[-2] # delete second column in df

	# create author_publications_nodes df
	author_publication_nodes <- data.frame(
	Id = 1:nrow(stacked_df),
	Nodes = stacked_df$values,
	Label = stacked_df$values
	)


	return(author_publication_nodes)


	}