if (FALSE) {
  # Guarded by `if (FALSE)`: nothing below runs when this file is sourced.
  # `split()` here is the package's splitting function (called with the
  # arguments `p`, `Dataset` and `class`), not `base::split()`.

  # ---- Example 1: proportional split of a real dataset ----
  data(iris)
  # Split dataset into train (75%) and test (25%) subsets.
  # NOTE(review): `class = 5` presumably is the index of the class column
  # (column 5 of iris is Species) -- confirm against the function's help page.
  set.seed(5)
  Iris <- split(p = 0.75, Dataset = iris, class = 5)
  Iris

  # ---- Example 2: proportional split of a simulated dataset ----
  # Pool of N class labels with unequal class frequencies
  # (A 40%, B 20%, C 10%, D 5%, E 25%), and a pool of N "train"/"test" tags
  # (75% / 25%). Observations are drawn from these pools without replacement.
  N <- 1000
  class_pool <- rep(
    c("A", "B", "C", "D", "E"),
    times = c(0.4, 0.2, 0.1, 0.05, 0.25) * N
  )
  type_pool <- rep(c("train", "test"), times = c(0.75, 0.25) * N)

  # Simulated dataset: n rows, a running index `y` and a sampled class label.
  n <- 300
  Dataset <- data.frame(y = seq_len(n), class = sample(class_pool, n))
  # Split dataset into train (60%) and test (40%) subsets.
  simulated <- split(p = 0.6, Dataset = Dataset, class = 2)
  simulated

  # ---- Example 3: split driven by an existing column ----
  # Same simulated layout plus a third column `type` holding "train"/"test".
  Dataset <- data.frame(
    y = seq_len(n),
    class = sample(class_pool, n),
    type = sample(type_pool, n)
  )
  # Split dataset into train and test subsets.
  # NOTE(review): `type = 3` presumably is the index of the column holding the
  # subset tag, with `train`/`test` naming the tag values -- confirm.
  simulated <- split(
    p = list(type = 3, train = "train", test = "test"),
    Dataset = Dataset,
    class = 2
  )
  simulated
}
# Run the code above in your browser using DataLab