下面先给出一种可读性较差的 base R 写法。如果想借助 dplyr 管道让代码更易读,可以改用 group_by()/summarise()。
# Collapse exdf to one row per id, keeping all dv values of an id together in
# a single list-column cell. Wrapped in local() so the helper variables do not
# leak into the calling environment; the resulting data frame is still the
# value of the expression.
local({
  # One element per id, named after the id. drop = TRUE skips factor levels
  # of id that have no rows, which would otherwise yield empty groups.
  dv_by_id <- lapply(
    split(exdf, exdf$id, drop = TRUE),
    function(x) unlist(x$dv)
  )

  # split() orders its groups by the factor levels of id, whereas unique()
  # keeps first-appearance order. Look the ids up by group name so that every
  # id is paired with its own dv values even when exdf is not sorted by id.
  ids <- unique(exdf$id)
  ids <- ids[match(names(dv_by_id), as.character(ids))]

  # cbind() turns the list into a one-column list matrix, which data.frame()
  # stores as a list column. deparse.level = 0 stops cbind() from labelling
  # that column after the variable, so the result column is still named dv.
  data.frame(id = ids, dv = cbind(dv_by_id, deparse.level = 0))
})
id dv
1 1 3, 5, 6, 4, 7, 4, 2, 1, 6, 5, 5, 8, 5
2 2 2, 8, 8, 6, 6, 1, 1, 7, 7, 4, 4, 7, 5, 5, 2, 3, 6, 4
3 3 2, 6, 5, 6, 3, 3, 8, 6, 6, 1
4 4 7, 4, 6, 8, 3, 4, 2, 4, 5, 5, 3, 4, 5, 2
5 5 4, 7, 8, 2, 6, 2, 6, 3, 5, 8, 6, 3, 4, 2, 1, 3, 2, 3
6 6 4, 1, 7, 1, 8, 6, 4, 7, 8, 4, 1, 3
7 7 7, 3, 4, 7, 3, 3, 4, 3, 6, 7, 7, 4
8 8 4, 2, 7, 6, 8, 7, 4, 8, 4, 4, 2, 8, 6, 6
9 9 1, 6, 4, 7, 6, 8, 4, 6, 4, 3, 4, 5, 2, 2, 5, 8, 3, 2, 8
10 10 5, 5, 7, 1, 4, 2, 6, 1, 2, 2, 1, 1, 6, 8, 8, 2, 7, 6
如果一定要使用 aggregate(),可以先把数值列 dv 转换为字符型,再用正则表达式把这些数字提取出来,如下所示。
# Store dv as text so that the values belonging to one id can be pasted into a
# single string and pulled back out with a regular expression.
# Note: this overwrites the dv column of exdf in place.
exdf$dv <- as.character(exdf$dv)

# The formula is passed positionally: the first argument of aggregate()'s
# formula method is called `formula` in older R and `x` from R 4.2.0 on, so
# naming it is not portable across versions.
aggregate(
  dv ~ id,
  data = exdf,
  FUN = function(x) {
    # Join with a space and match whole runs of digits so that multi-digit
    # values stay intact instead of being split into single digits or fused
    # with their neighbours.
    joined <- paste(x, collapse = " ")
    # regmatches() returns a list of length one holding the character vector
    # of matches, so each id yields a single list element.
    regmatches(joined, gregexpr("[0-9]+", joined))
  }
)
id dv
1 1 3, 5, 6, 4, 7, 4, 2, 1, 6, 5, 5, 8, 5
2 2 2, 8, 8, 6, 6, 1, 1, 7, 7, 4, 4, 7, 5, 5, 2, 3, 6, 4
3 3 2, 6, 5, 6, 3, 3, 8, 6, 6, 1
4 4 7, 4, 6, 8, 3, 4, 2, 4, 5, 5, 3, 4, 5, 2
5 5 4, 7, 8, 2, 6, 2, 6, 3, 5, 8, 6, 3, 4, 2, 1, 3, 2, 3
6 6 4, 1, 7, 1, 8, 6, 4, 7, 8, 4, 1, 3
7 7 7, 3, 4, 7, 3, 3, 4, 3, 6, 7, 7, 4
8 8 4, 2, 7, 6, 8, 7, 4, 8, 4, 4, 2, 8, 6, 6
9 9 1, 6, 4, 7, 6, 8, 4, 6, 4, 3, 4, 5, 2, 2, 5, 8, 3, 2, 8
10 10 5, 5, 7, 1, 4, 2, 6, 1, 2, 2, 1, 1, 6, 8, 8, 2, 7, 6