# NOT RUN {
# Given
library(data.table)
# Build 1000 uniform draws plus one artificial point placed six standard
# deviations above their mean, so it is far outside the 3-sigma band used below.
samples <- runif(1000)
extreme_val <- mean(samples) + 6 * sd(samples)
dataSet <- data.table(num_col = c(samples, extreme_val))

# When: filter the table with a 3-sigma threshold; cols = "auto" leaves the
# column selection to the function itself.
dataSet <- remove_sd_outlier(
  dataSet,
  cols = "auto",
  n_sigmas = 3,
  verbose = TRUE
)

# Then: the artificial extreme value should no longer be present.
extreme_val %in% dataSet[["num_col"]] # Expected: FALSE
# }
# Run the code above in your browser using DataLab