如何在循环中使用mutate和ifelse?

问题描述

要做的是创建虚拟变量,以指示连续变量是超过某个阈值(1)还是低于该阈值(0)。我通过几个重复的mutations实现了这一点,我想用一个循环代替。

# load tidyverse
library(tidyverse)

# create data
data <- data.frame(x = runif(1:100,min=0,max=100))

# What I do
data <- data %>%
  mutate(x20 = ifelse(x >= 20,1,0)) %>%
  mutate(x40 = ifelse(x >= 40,0)) %>%
  mutate(x60 = ifelse(x >= 60,0)) %>%
  mutate(x80 = ifelse(x >= 80,0)) 
  
# What I would like to do
for (i in seq(from=0,to=100,by=20)){
  data %>% mutate(paste(x,i) = ifelse(x >= i,0))
}

谢谢。

解决方法

您可以在此处使用map_dfc

library(dplyr)
library(purrr)
breaks <- seq(from=0,to=100,by=20)
bind_cols(data,map_dfc(breaks,~
          data %>% transmute(!!paste0('x',.x) := as.integer(x > .x))))

#             x x0 x20 x40 x60 x80 x100
#1    6.2772517  1   0   0   0   0    0
#2   16.3520358  1   0   0   0   0    0
#3   25.8958212  1   1   0   0   0    0
#4   78.9354970  1   1   1   1   0    0
#5   35.7731737  1   1   0   0   0    0
#6    5.7395139  1   0   0   0   0    0
#7   49.7069551  1   1   1   0   0    0
#8   53.5134559  1   1   1   0   0    0
#...
#....     

尽管如此,我认为在R的基础上要简单得多:

data[paste0('x',breaks)] <- lapply(breaks,function(x) as.integer(data$x > x))
,

Ronak的基数R可能是最好的,但是为了完整起见,这是与您最初使用dplyr时类似的另一种方式:

  <!-- REQUIRED SCRIPTS -->

  <!-- jQuery -->
  <script src="./AdminLTE-3.0.5/plugins/jquery/jquery.min.js"></script>
  <!-- Bootstrap 4 -->
  <script src="./AdminLTE-3.0.5/plugins/bootstrap/js/bootstrap.bundle.min.js"></script>
  <!-- AdminLTE App -->
  <script src="./AdminLTE-3.0.5/dist/js/adminlte.min.js"></script>
,

您可以在reduce()中使用purrr

library(dplyr)
library(purrr)

reduce(seq(0,100,by = 20),.init = data,~ mutate(.x,!!paste0('x',.y) := as.integer(x >= .y)))

#             x x0 x20 x40 x60 x80 x100
# 1   61.080545  1   1   1   1   0    0
# 2   63.036673  1   1   1   1   0    0
# 3   71.064322  1   1   1   1   0    0
# 4    1.821416  1   0   0   0   0    0
# 5   24.721454  1   1   0   0   0    0

base对应的Reduce()方式:

Reduce(function(df,y){ df[paste0('x',y)] <- as.integer(df$x >= y); df },seq(0,data)