如何在 R 中重塑这个宽 table 以允许成对比较?
How do I reshape this wide table in R to allow pairwise comparisons?
我有以下数据:
structure(list(id = c(174L, 187L, 188L, 190L, 213L, 234L), p7 = c(1L,
1L, NA, 1L, 0L, 1L), p4 = c(1L, NA, NA, 1L, 1L, 1L), p3 = c(1L,
1L, 1L, 1L, NA, 1L), p6 = c(1L, NA, NA, 1L, 1L, 1L), p1 = c(1L,
1L, 1L, 1L, NA, 1L), p2 = c(1L, 1L, 1L, 1L, 1L, 1L), p5 = c(1L,
0L, NA, 1L, NA, 1L), p8 = c(1L, NA, NA, 1L, 1L, 1L), q1 = c(1L,
1L, NA, NA, NA, NA), q2 = c(NA, NA, 0L, NA, NA, NA), q3 = c(1L,
1L, 1L, NA, 0L, 0L), q4 = c(NA, NA, NA, 0L, 0L, 0L), q5 = c(NA,
1L, 0L, 1L, 0L, 1L), q6 = c(1L, NA, 1L, 1L, 0L, NA), q7 = c(0L,
NA, 0L, 0L, NA, 1L), q8 = c(1L, NA, 0L, 0L, 0L, 0L)), .Names = c("id",
"p7", "p4", "p3", "p6", "p1", "p2", "p5", "p8", "q1", "q2", "q3",
"q4", "q5", "q6", "q7", "q8"), row.names = c(NA, 6L), class = "data.frame")
我需要一个数据框,其中第一列包含 id
重复 8 次,第二列包含所有标有 p
的值(按此顺序),第三列包含标有 q
的所有值(按此顺序)。我需要这个,所以我可以在相应的 p
s 和 q
s 数据点之间进行成对比较。
有什么提示吗?
library(reshape2)
df = structure(list(id=c(174L,187L,188L,190L,213L,234L),p7=c(1L,
1L,NA,1L,0L,1L),p4=c(1L,NA,NA,1L,1L,1L),p3=c(1L,
1L,1L,1L,NA,1L),p6=c(1L,NA,NA,1L,1L,1L),p1=c(1L,
1L,1L,1L,NA,1L),p2=c(1L,1L,1L,1L,1L,1L),p5=c(1L,
0L,NA,1L,NA,1L),p8=c(1L,NA,NA,1L,1L,1L),q1=c(1L,
1L,NA,NA,NA,NA),q2=c(NA,NA,0L,NA,NA,NA),q3=c(1L,
1L,1L,NA,0L,0L),q4=c(NA,NA,NA,0L,0L,0L),q5=c(NA,
1L,0L,1L,0L,1L),q6=c(1L,NA,1L,1L,0L,NA),q7=c(0L,
NA,0L,0L,NA,1L),q8=c(1L,NA,0L,0L,0L,0L)),.Names=c("id",
"p7","p4","p3","p6","p1","p2","p5","p8","q1","q2","q3",
"q4","q5","q6","q7","q8"),row.names=c(NA,6L),class="data.frame")
p = melt(df, id.vars=c("id"),measure.vars=c("p7", "p4", "p3", "p6","p1", "p2", "p5", "p8"), variable.name="p")
q = melt(df, id.vars=c("id"),measure.vars=c("q1", "q2", "q3", "q4","q5", "q6", "q7", "q8"), variable.name="q")
both = cbind(p, q)
我们可以使用 data.table
中的 melt
轻松做到这一点,它可以占用多个 measure
patterns
library(data.table)
melt(setDT(df), measure = patterns("^p\d+", "^q\d+"),
value.name = c("p", "q"), variable.name = "grp")
我有以下数据:
structure(list(id = c(174L, 187L, 188L, 190L, 213L, 234L), p7 = c(1L,
1L, NA, 1L, 0L, 1L), p4 = c(1L, NA, NA, 1L, 1L, 1L), p3 = c(1L,
1L, 1L, 1L, NA, 1L), p6 = c(1L, NA, NA, 1L, 1L, 1L), p1 = c(1L,
1L, 1L, 1L, NA, 1L), p2 = c(1L, 1L, 1L, 1L, 1L, 1L), p5 = c(1L,
0L, NA, 1L, NA, 1L), p8 = c(1L, NA, NA, 1L, 1L, 1L), q1 = c(1L,
1L, NA, NA, NA, NA), q2 = c(NA, NA, 0L, NA, NA, NA), q3 = c(1L,
1L, 1L, NA, 0L, 0L), q4 = c(NA, NA, NA, 0L, 0L, 0L), q5 = c(NA,
1L, 0L, 1L, 0L, 1L), q6 = c(1L, NA, 1L, 1L, 0L, NA), q7 = c(0L,
NA, 0L, 0L, NA, 1L), q8 = c(1L, NA, 0L, 0L, 0L, 0L)), .Names = c("id",
"p7", "p4", "p3", "p6", "p1", "p2", "p5", "p8", "q1", "q2", "q3",
"q4", "q5", "q6", "q7", "q8"), row.names = c(NA, 6L), class = "data.frame")
我需要一个数据框,其中第一列包含 id
重复 8 次,第二列包含所有标有 p
的值(按此顺序),第三列包含标有 q
的所有值(按此顺序)。我需要这个,所以我可以在相应的 p
s 和 q
s 数据点之间进行成对比较。
有什么提示吗?
library(reshape2)
df = structure(list(id=c(174L,187L,188L,190L,213L,234L),p7=c(1L,
1L,NA,1L,0L,1L),p4=c(1L,NA,NA,1L,1L,1L),p3=c(1L,
1L,1L,1L,NA,1L),p6=c(1L,NA,NA,1L,1L,1L),p1=c(1L,
1L,1L,1L,NA,1L),p2=c(1L,1L,1L,1L,1L,1L),p5=c(1L,
0L,NA,1L,NA,1L),p8=c(1L,NA,NA,1L,1L,1L),q1=c(1L,
1L,NA,NA,NA,NA),q2=c(NA,NA,0L,NA,NA,NA),q3=c(1L,
1L,1L,NA,0L,0L),q4=c(NA,NA,NA,0L,0L,0L),q5=c(NA,
1L,0L,1L,0L,1L),q6=c(1L,NA,1L,1L,0L,NA),q7=c(0L,
NA,0L,0L,NA,1L),q8=c(1L,NA,0L,0L,0L,0L)),.Names=c("id",
"p7","p4","p3","p6","p1","p2","p5","p8","q1","q2","q3",
"q4","q5","q6","q7","q8"),row.names=c(NA,6L),class="data.frame")
p = melt(df, id.vars=c("id"),measure.vars=c("p7", "p4", "p3", "p6","p1", "p2", "p5", "p8"), variable.name="p")
q = melt(df, id.vars=c("id"),measure.vars=c("q1", "q2", "q3", "q4","q5", "q6", "q7", "q8"), variable.name="q")
both = cbind(p, q)
我们可以使用 data.table
中的 melt
轻松做到这一点,它可以占用多个 measure
patterns
library(data.table)
melt(setDT(df), measure = patterns("^p\d+", "^q\d+"),
value.name = c("p", "q"), variable.name = "grp")