首页 > 解决方案 > 通过考虑 r (2) 中的分组 Q 矩阵来操作字符向量

问题描述

我正在尝试基于一个Group变量编写代码,该变量item.map具有项目信息,其中包括一个 q 矩阵,显示哪个项目与哪个组相关联。

    Group <- c(1,2,3,4)
item.map <- data.frame(
  item.id = c(21,41,61,72),
  group.1 = c(1,1,1,0),
  group.2 = c(0,1,0,1),
  group.3 = c(1,1,1,0),
  group.4 = c(0,0,0,1))

> item.map
  item.id group.1 group.2 group.3 group.4
1      21       1       0       1       0
2      41       1       1       1       0
3      61       1       0       1       0
4      72       0       1       0       1

在这个item.mapgroup.1 中有 3 个项目,而 group.2 有两个项目,group.3有三个项目和group.41 个项目。使用这个 item.map 我想在下面的代码块中分配这些项目,但我无法插入item.map信息.

   OUTPUT <- as.data.frame(c())
for(i in 1:length(item.map$item.id)) {
 
  for(k in 0:(length(Group))) { # here with the length(State) I gained the sequqnece of 0,1,2,3
    output <- paste0("Equal = ",paste0(paste("(", "G1, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),", ",
                                        paste( "(", "G2, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),
                                        ";"))
    OUTPUT <- c(OUTPUT, output)
    
  }
}


[1] "Equal = (G1, 21, Slope[0]), (G2, 21, Slope[0]), (G3, 21, Slope[0]), (G4, 21, Slope[0]);"
[1] "Equal = (G1, 21, Slope[1]), (G2, 21, Slope[1]), (G3, 21, Slope[1]), (G4, 21, Slope[1]);"
[1] "Equal = (G1, 21, Slope[2]), (G2, 21, Slope[2]), (G3, 21, Slope[2]), (G4, 21, Slope[2]);"
[1] "Equal = (G1, 21, Slope[3]), (G2, 21, Slope[3]), (G3, 21, Slope[3]), (G4, 21, Slope[3]);"
[1] "Equal = (G1, 21, Slope[4]), (G2, 21, Slope[4]), (G3, 21, Slope[4]), (G4, 21, Slope[4]);"
[1] "Equal = (G1, 41, Slope[0]), (G2, 41, Slope[0]), (G3, 41, Slope[0]), (G4, 41, Slope[0]);"
[1] "Equal = (G1, 41, Slope[1]), (G2, 41, Slope[1]), (G3, 41, Slope[1]), (G4, 41, Slope[1]);"
[1] "Equal = (G1, 41, Slope[2]), (G2, 41, Slope[2]), (G3, 41, Slope[2]), (G4, 41, Slope[2]);"
[1] "Equal = (G1, 41, Slope[3]), (G2, 41, Slope[3]), (G3, 41, Slope[3]), (G4, 41, Slope[3]);"
[1] "Equal = (G1, 41, Slope[4]), (G2, 41, Slope[4]), (G3, 41, Slope[4]), (G4, 41, Slope[4]);"
[1] "Equal = (G1, 61, Slope[0]), (G2, 61, Slope[0]), (G3, 61, Slope[0]), (G4, 61, Slope[0]);"
[1] "Equal = (G1, 61, Slope[1]), (G2, 61, Slope[1]), (G3, 61, Slope[1]), (G4, 61, Slope[1]);"
[1] "Equal = (G1, 61, Slope[2]), (G2, 61, Slope[2]), (G3, 61, Slope[2]), (G4, 61, Slope[2]);"
[1] "Equal = (G1, 61, Slope[3]), (G2, 61, Slope[3]), (G3, 61, Slope[3]), (G4, 61, Slope[3]);"
[1] "Equal = (G1, 61, Slope[4]), (G2, 61, Slope[4]), (G3, 61, Slope[4]), (G4, 61, Slope[4]);"
[1] "Equal = (G1, 72, Slope[0]), (G2, 72, Slope[0]), (G3, 72, Slope[0]), (G4, 72, Slope[0]);"
[1] "Equal = (G1, 72, Slope[1]), (G2, 72, Slope[1]), (G3, 72, Slope[1]), (G4, 72, Slope[1]);"
[1] "Equal = (G1, 72, Slope[2]), (G2, 72, Slope[2]), (G3, 72, Slope[2]), (G4, 72, Slope[2]);"
[1] "Equal = (G1, 72, Slope[3]), (G2, 72, Slope[3]), (G3, 72, Slope[3]), (G4, 72, Slope[3]);"
[1] "Equal = (G1, 72, Slope[4]), (G2, 72, Slope[4]), (G3, 72, Slope[4]), (G4, 72, Slope[4]);"

因此,在所需的输出中,分组块中不G1应该有项目72和 G2 不应该有项目2161信息。此外,我无法在我的代码中对“G1”和“G2”进行排序。G1考虑到,和G2,有没有办法将这两条线组合成一条线?G3G4

output <- paste0("Equal = ",paste0(paste("(", "G1, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),", ",
                                       paste("(", "G2, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),", ",
                                       paste("(", "G3, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),", ",
                                       paste( "(", "G4, ",item.map$item.id[i], ","," Slope[",k,"])",collapse=", ", sep=""),
                                       
                                       ";"))

所需的输出是:

[1] "Equal = (G1, 21, Slope[0]), (G3, 21, Slope[0]);"
[1] "Equal = (G1, 21, Slope[1]), (G3, 21, Slope[1]);"
[1] "Equal = (G1, 21, Slope[2]), (G3, 21, Slope[2]);"
[1] "Equal = (G1, 21, Slope[3]), (G3, 21, Slope[3]);"
[1] "Equal = (G1, 21, Slope[4]), (G3, 21, Slope[4]);"
[1] "Equal = (G1, 41, Slope[0]), (G2, 41, Slope[0]), (G3, 41, Slope[0]);"
[1] "Equal = (G1, 41, Slope[1]), (G2, 41, Slope[1]), (G3, 41, Slope[1]);"
[1] "Equal = (G1, 41, Slope[2]), (G2, 41, Slope[2]), (G3, 41, Slope[2]);"
[1] "Equal = (G1, 41, Slope[3]), (G2, 41, Slope[3]), (G3, 41, Slope[3]);"
[1] "Equal = (G1, 41, Slope[4]), (G2, 41, Slope[4]), (G3, 41, Slope[4]);"
[1] "Equal = (G1, 61, Slope[0]), (G3, 61, Slope[0]);"
[1] "Equal = (G1, 61, Slope[1]), (G3, 61, Slope[1]);"
[1] "Equal = (G1, 61, Slope[2]), (G3, 61, Slope[2]);"
[1] "Equal = (G1, 61, Slope[3]), (G3, 61, Slope[3]);"
[1] "Equal = (G1, 61, Slope[4]), (G3, 61, Slope[4]);"
[1] "Equal = (G2, 72, Slope[0]), (G4, 72, Slope[0]);"
[1] "Equal = (G2, 72, Slope[1]), (G4, 72, Slope[1]);"
[1] "Equal = (G2, 72, Slope[2]), (G4, 72, Slope[2]);"
[1] "Equal = (G2, 72, Slope[3]), (G4, 72, Slope[3]);"
[1] "Equal = (G2, 72, Slope[4]), (G4, 72, Slope[4]);"

有没有人有任何想法?谢谢

标签: rcharacter

解决方案


这是一个选项tidyverse,我们循环遍历“组”列名,select从“item.map”listrename“G1”、“G2”,然后根据逻辑组列crossing扩展数据集,创建带有(from ) 和to a的filter表达式glue_datagrlueflattenlistvector

library(dplyr)
library(purrr)
library(stringr)
out <- map(c('group.1', 'group.2'), 
      ~ item.map %>% 
          select(item.id, .x) %>% 
          rename_at(.x, ~ str_c('G', str_remove(., "\\D+"))) %>% 
          crossing(k = 0:2) %>%
          filter(across(starts_with('G'), as.logical)) %>% 
          glue::glue_data("Equal = ({names(.)[2]}, {item.id}, Slope[{k}]);")%>%
          as.character) %>%
    flatten_chr

-输出

out
#[1] "Equal = (G1, 21, Slope[0]);" "Equal = (G1, 21, Slope[1]);" "Equal = (G1, 21, Slope[2]);" "Equal = (G1, 41, Slope[0]);"
#[5] "Equal = (G1, 41, Slope[1]);" "Equal = (G1, 41, Slope[2]);" "Equal = (G1, 61, Slope[0]);" "Equal = (G1, 61, Slope[1]);"
#[9] "Equal = (G1, 61, Slope[2]);" "Equal = (G2, 41, Slope[0]);" "Equal = (G2, 41, Slope[1]);" "Equal = (G2, 41, Slope[2]);"
#[13] "Equal = (G2, 72, Slope[0]);" "Equal = (G2, 72, Slope[1]);" "Equal = (G2, 72, Slope[2]);"

如果我们想将两个组中都为 1 的那些分组,

i1 <- ave(seq_along(out), sub("G\\d+", "", out), FUN = length)

 out[i1 > 1] <- ave(out[i1 > 1], sub("Equal = \\(G\\d+", "", out[i1 > 1]), 
      FUN = function(x) {
          x[1] <- sub(";", "", x[1])
          paste(x[1], sub("Equal = ", "", x[2]), sep =", ")
  })
out1 <- unique(out)
out1

#[1] "Equal = (G1, 21, Slope[0]);"                     "Equal = (G1, 21, Slope[1]);"                    
#[3] "Equal = (G1, 21, Slope[2]);"                     "Equal = (G1, 41, Slope[0]), (G2, 41, Slope[0]);"
#[5] "Equal = (G1, 41, Slope[1]), (G2, 41, Slope[1]);" "Equal = (G1, 41, Slope[2]), (G2, 41, Slope[2]);"
#[7] "Equal = (G1, 61, Slope[0]);"                     "Equal = (G1, 61, Slope[1]);"                    
#[9] "Equal = (G1, 61, Slope[2]);"                     "Equal = (G2, 72, Slope[0]);"                    
#[11] "Equal = (G2, 72, Slope[1]);"                     "Equal = (G2, 72, Slope[2]);"  

更新

使用更新的数据集

out <- map(c('group.1', 'group.2', 'group.3', 'group.4'), 
       ~ item.map %>% 
            select(item.id, .x) %>% 
            rename_at(.x, ~ str_c('G', str_remove(., "\\D+"))) %>% 
            crossing(k = 0:4) %>%
            filter(across(starts_with('G'), as.logical)) %>% 
            glue::glue_data("Equal = ({names(.)[2]}, {item.id}, Slope[{k}]);")%>%
            as.character) %>%
      flatten_chr
 
out[i1 > 1] <- ave(out[i1 > 1], sub("Equal = \\(G\\d+", "", out[i1 > 1]),
     FUN = function(x) {
      x[-length(x)] <- sub(";", "", x[-length(x)])
      paste(x[1], paste(sub("Equal = ", "", x[-1]), collapse = ", "), sep=", ") 
   })
   
unique(out)
 [1] "Equal = (G1, 21, Slope[0]), (G3, 21, Slope[0]);"                    
 [2] "Equal = (G1, 21, Slope[1]), (G3, 21, Slope[1]);"                    
 [3] "Equal = (G1, 21, Slope[2]), (G3, 21, Slope[2]);"                    
 [4] "Equal = (G1, 21, Slope[3]), (G3, 21, Slope[3]);"                    
 [5] "Equal = (G1, 21, Slope[4]), (G3, 21, Slope[4]);"                    
 [6] "Equal = (G1, 41, Slope[0]), (G2, 41, Slope[0]), (G3, 41, Slope[0]);"
 [7] "Equal = (G1, 41, Slope[1]), (G2, 41, Slope[1]), (G3, 41, Slope[1]);"
 [8] "Equal = (G1, 41, Slope[2]), (G2, 41, Slope[2]), (G3, 41, Slope[2]);"
 [9] "Equal = (G1, 41, Slope[3]), (G2, 41, Slope[3]), (G3, 41, Slope[3]);"
[10] "Equal = (G1, 41, Slope[4]), (G2, 41, Slope[4]), (G3, 41, Slope[4]);"
[11] "Equal = (G1, 61, Slope[0]), (G3, 61, Slope[0]);"                    
[12] "Equal = (G1, 61, Slope[1]), (G3, 61, Slope[1]);"                    
[13] "Equal = (G1, 61, Slope[2]), (G3, 61, Slope[2]);"                    
[14] "Equal = (G1, 61, Slope[3]), (G3, 61, Slope[3]);"                    
[15] "Equal = (G1, 61, Slope[4]), (G3, 61, Slope[4]);"                    
[16] "Equal = (G2, 72, Slope[0]), (G4, 72, Slope[0]);"                    
[17] "Equal = (G2, 72, Slope[1]), (G4, 72, Slope[1]);"                    
[18] "Equal = (G2, 72, Slope[2]), (G4, 72, Slope[2]);"                    
[19] "Equal = (G2, 72, Slope[3]), (G4, 72, Slope[3]);"                    
[20] "Equal = (G2, 72, Slope[4]), (G4, 72, Slope[4]);"       

或者使用嵌套for循环

OUTPUT <- c()
# // loop over the sequence of rows
for(i in seq_len(nrow(item.map))) {
    # // nested loop to expand on a sequence
    for(k in  0:2) {  
        # // do a second nest based on the 'Group'  
         for(j in seq_along(Group)) {
              # // create a logical expression based on the 'group' column
              i1 <- as.logical(item.map[[paste0("group.", j)]][i])
              # // if it is TRUE, then only do the below
              if(i1) {
                  # // create the expression with paste
                  output <- paste0("Equal = ", paste("(", "G", j, 
                     ", ", item.map$item.id[i], ", Slope[", k, "])", 
                         collapse=", ", sep=""))
                 
              # // concatenate the NULL vector with the temporary output
              OUTPUT <- c(OUTPUT, output)
              }
         
         }
    
    }

}

推荐阅读