dput(new)
structure(list(ID = c(1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12,
13, 14, 15, 16, 17, 18, 19, 20, 21, 22), A1 = c(1, 1, 1, 1, 0,
0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0), A2 = c(1,
1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
), A3 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0), A4 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0), A5 = c(0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0), A6 = c(0, 0, 0, 0, 0,
0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0), A7 = c(0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0
), A8 = c(0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 1, 1, 1,
1, 1, 1, 0, 0), A9 = c(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0)), row.names = c(NA, -22L), class = c("tbl_df",
"tbl", "data.frame"))
Run Code Online (Sandbox Code Playgroud)
我有以下数据框。我需要提取并打印出现 1 的 id 和逗号分隔的列名。例如:
1 A1,A2
2 A1,A2
3 A1
4 A1
6 A2,A8
7 A6,A8
Run Code Online (Sandbox Code Playgroud)
等等...
如何进行?
这是我的尝试:
vec_ID <- c()
vec_JOB <- c()
job <- 0
for(i in 1 : length(ID)){
for(j in 2:10){
if(new[i,j]==1){
vec_ID[i] <- ID[i]
}
}
}
print(vec_ID)
vec_ID <- vec_ID[!is.na(vec_ID)]
#vec_ID <- as.data.frame(vec_ID)
print(vec_ID)
new_df <- new[ID[vec_ID],]
View(new_df)
for (i in 1:nrow(vec_ID)) {
}
Run Code Online (Sandbox Code Playgroud)
你可以做:
apply(df[-1], 1, function(x) toString(names(df[-1])[as.logical(x)]))
[1] "A1, A2" "A1, A2" "A1" "A1" "" "A2, A8" "A6, A8" "A1, A8" "A6, A8" "A8" "A1, A8" "A6"
[13] "A5, A8" "" "A8" "A8" "A8" "A8" "A8" "A8" "A7" ""
Run Code Online (Sandbox Code Playgroud)
这是一个通过底座 R 的单行,使用stack和aggregate,
aggregate(ind ~ ID,
subset(cbind(ID = new$ID, stack(replace(new, new == 0, '')[-1])), values == 1),
toString)
Run Code Online (Sandbox Code Playgroud)
这使,
Run Code Online (Sandbox Code Playgroud)ID ind 1 1 A1, A2 2 2 A1, A2 3 3 A1 4 4 A1 5 6 A2, A8 6 7 A6, A8 7 8 A1, A8 8 9 A6, A8 9 10 A8 10 11 A1, A8 11 12 A6 12 13 A5, A8 13 15 A8 14 16 A8 15 17 A8 16 18 A8 17 19 A8 18 20 A8 19 21 A7