updating for classification tasks
This commit is contained in:
parent
747ddf8ee9
commit
57151a3618
13362
auto-dedup-cites.csv
Normal file
13362
auto-dedup-cites.csv
Normal file
File diff suppressed because one or more lines are too long
140208
auto_dedup_results.bib
Normal file
140208
auto_dedup_results.bib
Normal file
File diff suppressed because one or more lines are too long
25
lit-dedup.R
25
lit-dedup.R
@ -1,2 +1,25 @@
|
||||
# One-time setup: install the tooling only when it is missing, so re-running
# the script does not reinstall devtools or re-download ASySD from GitHub on
# every execution. To upgrade ASySD deliberately, run
# devtools::install_github("camaradesuk/ASySD") by hand.
if (!requireNamespace("devtools", quietly = TRUE)) {
  install.packages("devtools")
}
if (!requireNamespace("ASySD", quietly = TRUE)) {
  devtools::install_github("camaradesuk/ASySD")
}
|
||||
library(ASySD)
|
||||
library(tidyverse)
|
||||
|
||||
#sv_files <- list.files("/Users/mgone/Desktop/SLR_references_total/both_waves_references", pattern = "*.bib", full.names = TRUE)
|
||||
|
||||
# Combine the two search waves, de-duplicate them with ASySD, and export the
# unique records as BibTeX ("auto_dedup_results.bib" in the working directory).

# Root folder holding the exported searches. Set the SLR_REFS_DIR environment
# variable to run on another machine; when it is unset or empty the original
# hard-coded location is used.
refs_dir <- Sys.getenv("SLR_REFS_DIR", unset = "")
if (!nzchar(refs_dir)) {
  refs_dir <- "/Users/mgone/Desktop/SLR_references_total"
}
t1_path <- file.path(refs_dir, "SLR_references_1", "t1all.bib")
t2_path <- file.path(refs_dir, "SLR_references_2", "t2all.bib")

# Fail early with a readable message instead of an error from inside the
# BibTeX reader.
input_paths <- c(t1_path, t2_path)
missing_inputs <- input_paths[!file.exists(input_paths)]
if (length(missing_inputs) > 0) {
  stop(
    "Input file(s) not found: ", paste(missing_inputs, collapse = ", "),
    call. = FALSE
  )
}

t1all <- ASySD::load_search(t1_path, method = "bib")
t2all <- ASySD::load_search(t2_path, method = "bib")

# rbind() needs identical columns, so keep only those present in both waves.
common_columns <- intersect(names(t1all), names(t2all))
if (length(common_columns) == 0) {
  stop(
    "The two searches share no column names; cannot combine them.",
    call. = FALSE
  )
}
t1_common <- t1all[, common_columns, drop = FALSE]
t2_common <- t2all[, common_columns, drop = FALSE]

all_citations <- rbind(t1_common, t2_common)

# De-duplicate in batches of 1000 records, ordering by the listed fields.
dedup_results <- ASySD::batch_dedup(
  all_citations,
  batch_n = 1000,
  sort_by = c("year", "title", "abstract", "author")
)
unique_dedup_results <- dedup_results$unique

ASySD::write_citations(
  unique_dedup_results,
  type = "bib",
  filename = "auto_dedup_results.bib"
)
|
||||
#dedup
|
||||
#results <- batch_dedup(citations, batch_n=2000, sort_by = c("year", "title","author"))
|
||||
#unique_r2 <- results$unique
|
||||
|
||||
#write_citations(citations, type = c("ris", "txt", "csv", "bib"), filename)
|
||||
|
Loading…
Reference in New Issue
Block a user