# Example data: five rows, five numeric columns (x1-x5).
# Rows 1 and 2 hold identical values in every column.
dat <- data.frame(
  x1 = c(1, 1, 2, 1, 4),
  x2 = c(1, 1, 2, 1, 6),
  x3 = c(2, 2, 3, 2, 6),
  x4 = c(1, 1, 2, 2, 4),
  x5 = c(1, 1, 4, 4, 3)
)
# df.duplicated() ----
# NOTE(review): df.duplicated() is not defined in this script; presumably it
# is supplied by an attached package -- confirm before running.

# No variables named: duplicated rows are extracted based on all variables
df.duplicated(dat)

# One variable named: duplicated rows are extracted based on x4
df.duplicated(dat, x4)

# Two variables named: duplicated rows are extracted based on x2 and x3
df.duplicated(dat, x2, x3)

# first = FALSE: based on all variables, excluding the first of identical rows
df.duplicated(dat, first = FALSE)

# keep.all = FALSE: based on x2 and x3, without returning all variables
df.duplicated(dat, x2, x3, keep.all = FALSE)

# from.last = TRUE: based on x4, considering duplication from the reversed side
df.duplicated(dat, x4, first = FALSE, from.last = TRUE)

# keep.row.names = FALSE: based on x2 and x3, with row names set to NULL
df.duplicated(dat, x2, x3, keep.row.names = FALSE)
#--------------------------------------
# df.unique() function
# NOTE(review): df.unique() is not defined in this script; presumably it is
# supplied by an attached package -- confirm before running.

# Extract unique rows based on all variables
# (called without variable names, mirroring df.duplicated(dat) above, so the
# example exercises df.unique() rather than base unique())
df.unique(dat)

# Extract unique rows based on x4
df.unique(dat, x4)

# Extract unique rows based on x1, x2, and x3
df.unique(dat, x1, x2, x3)

# Extract unique rows based on x2 and x3
# keep.all = FALSE: do not return all variables
df.unique(dat, x2, x3, keep.all = FALSE)

# Extract unique rows based on x4
# from.last = TRUE: consider duplication from the reversed side
df.unique(dat, x4, from.last = TRUE)

# Extract unique rows based on x2 and x3
# keep.row.names = FALSE: set row names to NULL
df.unique(dat, x2, x3, keep.row.names = FALSE)
# Run the code above in your browser using DataLab