从数据框中提取带有条件的列名

多维尼·贾亚辛格(Dovini jayasinghe)
dput(new)
structure(list(ID = c(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 
13, 14, 15, 16, 17, 18, 19, 20, 21, 22), A1 = c(1, 1, 1, 1, 0, 
0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0), A2 = c(1, 
1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
), A3 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0), A4 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 0, 0), A5 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0), A6 = c(0, 0, 0, 0, 0, 
0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0), A7 = c(0, 
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0
), A8 = c(0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1, 
1, 1, 1, 0, 0), A9 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 0, 0)), row.names = c(NA, -22L), class = c("tbl_df", 
"tbl", "data.frame"))

我有以下数据框。我需要提取并打印出现1的ID和逗号分隔的列名。例如:

1 A1,A2
2 A1,A2
3 A1
4 A1
6 A2,A8
7 A6,A8

等等...

如何进行?

这是我的尝试:

vec_ID <- c()
vec_JOB <- c()
job <- 0
for(i in 1 : length(ID)){
  for(j in 2:10){
    if(new[i,j]==1){
      vec_ID[i] <- ID[i] 
    }
  }
}
print(vec_ID)
vec_ID <- vec_ID[!is.na(vec_ID)]
#vec_ID <- as.data.frame(vec_ID)
print(vec_ID)

new_df <- new[ID[vec_ID],]
View(new_df)

for (i in 1:nrow(vec_ID)) {

}
索托斯

下面是使用经由基础R一个衬垫stackaggregate

aggregate(ind ~ ID, 
          subset(cbind(ID = new$ID, stack(replace(new, new == 0, '')[-1])), values == 1), 
          toString)

这使,

   ID    ind
1   1 A1, A2
2   2 A1, A2
3   3     A1
4   4     A1
5   6 A2, A8
6   7 A6, A8
7   8 A1, A8
8   9 A6, A8
9  10     A8
10 11 A1, A8
11 12     A6
12 13 A5, A8
13 15     A8
14 16     A8
15 17     A8
16 18     A8
17 19     A8
18 20     A8
19 21     A7

本文收集自互联网,转载请注明来源。

如有侵权,请联系 [email protected] 删除。

编辑于
0

我来说两句

0 条评论
登录 后参与评论

相关文章