汇总与主要出版物相关的共同出版物
Aggregate copublications associated with a primary publication
每个 primary_citation 可能有多个共同出版物。我想汇总与每个主要引用相关的 citation_id。以下代码有效,但创建了必须随后删除的重复行。我正在寻找一种避免创建重复行的方法。
# Attach to every row a comma-separated string of all citation_ids that share
# its primary_citation. mutate() keeps one output row per input row, so a
# primary_citation with several co-publications still appears several times.
dat %>%
  mutate(
    copublications = toString(citation_id),
    .by = primary_citation
  ) %>%
  select(!citation_id)
# Example data: 15 rows pairing a primary_citation with one citation_id each.
# Both columns are character vectors; the object carries the tibble classes.
dat <- structure(
  list(
    primary_citation = c(
      "29967037", "32439388", "32439388", "28475431", "29967037",
      "29703800", "29967037", "23899372", "28125624", "35304745",
      "12057549", "12057549", "12057549", "12057549", "12057549"
    ),
    citation_id = c(
      "34176288", "34470135", "149786406", "32119129", "32517785",
      "31121137", "L621236193", "28125624", "23899372", "31641005",
      "19366459", "17166220", "17166221", "16411990", "15113445"
    )
  ),
  row.names = c(NA, -15L),
  class = c("tbl_df", "tbl", "data.frame")
)
如果这正是您需要的结果,请告诉我:
# Number the co-publications within each primary_citation
# ("copublication_1", "copublication_2", ...), then spread citation_id into one
# column per number so that each primary_citation occupies a single row.
# Cells with no matching co-publication are left as NA.
dat %>%
  mutate(
    N = paste0("copublication_", row_number()),
    .by = primary_citation
  ) %>%
  pivot_wider(
    id_cols = primary_citation,
    names_from = N,
    values_from = citation_id
  )
每个 primary_citation 可能有多个共同出版物。我想汇总与每个主要引用相关的 citation_id。以下代码有效,但创建了必须随后删除的重复行。我正在寻找一种避免创建重复行的方法。
# Attach to every row a comma-separated string of all citation_ids that share
# its primary_citation. mutate() keeps one output row per input row, so a
# primary_citation with several co-publications still appears several times.
dat %>%
  mutate(
    copublications = toString(citation_id),
    .by = primary_citation
  ) %>%
  select(!citation_id)
# Example data: 15 rows pairing a primary_citation with one citation_id each.
# Both columns are character vectors; the object carries the tibble classes.
dat <- structure(
  list(
    primary_citation = c(
      "29967037", "32439388", "32439388", "28475431", "29967037",
      "29703800", "29967037", "23899372", "28125624", "35304745",
      "12057549", "12057549", "12057549", "12057549", "12057549"
    ),
    citation_id = c(
      "34176288", "34470135", "149786406", "32119129", "32517785",
      "31121137", "L621236193", "28125624", "23899372", "31641005",
      "19366459", "17166220", "17166221", "16411990", "15113445"
    )
  ),
  row.names = c(NA, -15L),
  class = c("tbl_df", "tbl", "data.frame")
)
如果这正是您需要的结果,请告诉我:
# Number the co-publications within each primary_citation
# ("copublication_1", "copublication_2", ...), then spread citation_id into one
# column per number so that each primary_citation occupies a single row.
# Cells with no matching co-publication are left as NA.
dat %>%
  mutate(
    N = paste0("copublication_", row_number()),
    .by = primary_citation
  ) %>%
  pivot_wider(
    id_cols = primary_citation,
    names_from = N,
    values_from = citation_id
  )