library(testthat) library(recipes) skip_if_not_installed("modeldata") data(biomass, package = "modeldata") biomass_tr <- biomass[biomass$dataset == "Training", ] biomass_te <- biomass[biomass$dataset == "Testing", ][1:5, ] rec <- recipe(HHV ~ carbon + hydrogen + oxygen + nitrogen + sulfur, data = biomass_tr ) %>% step_normalize(all_predictors()) # From directly calling fastICA exp_comp <- structure(c( 0.129863464905676, 0.0759034631963958, 0.345979256585598, 0.126579800253201, 0.156772622077837, 0.397465725824992, 0.697584509101097, 0.783403578028365, 0.838717872383214, -1.22958413032623, 0.274166588383082, -0.429295233592478 ), .Dim = c(6L, 2L), .Dimnames = list(NULL, c("IC1", "IC2")) ) exp_load <- structure(c( -0.41723456724402, 0.364056809629112, 0.406544129493068, 0.132202024893928, -0.0815957464153714, 0.192529689854096, -0.0343644772231862, 0.139740384225697, -0.656590943491334, -0.519748239614668 ), .Dim = c(5L, 2L) ) colnames(exp_load) <- c("IC1", "IC2") test_that("correct ICA values", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") ica_extract <- rec %>% step_ica(carbon, hydrogen, oxygen, nitrogen, sulfur, num_comp = 2, seed = 1, id = "") set.seed(12) ica_extract_trained <- prep(ica_extract, training = biomass_tr, verbose = FALSE) ica_pred <- bake(ica_extract_trained, new_data = NULL, all_predictors()) ica_pred <- head(as.matrix(ica_pred)) rownames(ica_pred) <- NULL expect_equal(ica_pred, exp_comp) vars <- c("carbon", "hydrogen", "oxygen", "nitrogen", "sulfur") tidy_exp_un <- tibble( terms = rep(vars, 2), component = rep(c("IC1", "IC2"), 5), value = rep(NA_real_, 2 * 5), id = "" ) %>% arrange(terms, component) expect_equal(tidy_exp_un, tidy(ica_extract, number = 2)) loadings <- stack(as.data.frame(exp_load)) tidy_exp_tr <- tibble( terms = rep(vars, 2), component = as.character(loadings$ind), value = loadings$values, id = "" ) %>% arrange(terms, component) expect_equal(tidy_exp_tr, tidy(ica_extract_trained, number = 2)) }) test_that("No ICA comps", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") ica_extract <- rec %>% step_ica(carbon, hydrogen, oxygen, nitrogen, sulfur, num_comp = 0) ica_extract_trained <- prep(ica_extract, training = biomass_tr) expect_equal( names(bake(ica_extract_trained, new_data = NULL)), names(biomass_tr)[-(1:2)] ) expect_true(all(names(ica_extract_trained$steps[[1]]$res) == "x_vars")) expect_snapshot(print(ica_extract_trained)) expect_true(all(is.na(tidy(ica_extract_trained, 2)$value))) }) test_that("check_name() is used", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") dat <- mtcars dat$IC1 <- dat$mpg rec <- recipe(~., data = dat) |> step_ica(mpg, disp) expect_snapshot( error = TRUE, prep(rec, training = dat) ) }) test_that("tunable", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(~., data = iris) %>% step_ica(all_predictors()) rec_param <- tunable.step_ica(rec$steps[[1]]) expect_equal(rec_param$name, c("num_comp")) expect_true(all(rec_param$source == "recipe")) expect_true(is.list(rec_param$call_info)) expect_equal(nrow(rec_param), 1) expect_equal( names(rec_param), c("name", "call_info", "source", "component", "component_id") ) }) test_that("Do nothing for num_comps = 0 and keep_original_cols = FALSE (#1152)", { rec <- recipe(~ ., data = mtcars) %>% step_ica(all_predictors(), num_comp = 0, keep_original_cols = FALSE) %>% prep() res <- bake(rec, new_data = NULL) expect_identical(res, tibble::as_tibble(mtcars)) }) # Infrastructure --------------------------------------------------------------- test_that("bake method errors when needed non-standard role columns are missing", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") ica_extract <- recipe(HHV ~ carbon + hydrogen + oxygen + nitrogen + sulfur, data = biomass_tr ) %>% step_ica(carbon, hydrogen, num_comp = 2, seed = 1) %>% update_role(carbon, hydrogen, new_role = "potato") %>% update_role_requirements(role = "potato", bake = FALSE) ica_extract_trained <- prep(ica_extract, training = biomass_tr, verbose = FALSE) expect_error(bake(ica_extract_trained, new_data = biomass_tr[, c(-3)]), class = "new_data_missing_column") }) test_that("empty printing", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(mpg ~ ., mtcars) rec <- step_ica(rec) expect_snapshot(rec) rec <- prep(rec, mtcars) expect_snapshot(rec) }) test_that("empty selection prep/bake is a no-op", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec1 <- recipe(mpg ~ ., mtcars) rec2 <- step_ica(rec1) rec1 <- prep(rec1, mtcars) rec2 <- prep(rec2, mtcars) baked1 <- bake(rec1, mtcars) baked2 <- bake(rec2, mtcars) expect_identical(baked1, baked2) }) test_that("empty selection tidy method works", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(mpg ~ ., mtcars) rec <- step_ica(rec) expect <- tibble( terms = character(), component = character(), value = double(), id = character() ) expect_identical(tidy(rec, number = 1), expect) rec <- prep(rec, mtcars) expect_identical(tidy(rec, number = 1), expect) }) test_that("keep_original_cols works", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") new_names <- c("IC1", "IC2", "IC3", "IC4", "IC5") rec <- recipe(~ ., mtcars) %>% step_ica(all_predictors(), keep_original_cols = FALSE) rec <- prep(rec) res <- bake(rec, new_data = NULL) expect_equal( colnames(res), new_names ) rec <- recipe(~ ., mtcars) %>% step_ica(all_predictors(), keep_original_cols = TRUE) rec <- prep(rec) res <- bake(rec, new_data = NULL) expect_equal( colnames(res), c(colnames(mtcars), new_names) ) }) test_that("keep_original_cols - can prep recipes with it missing", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(~ ., mtcars) %>% step_ica(all_predictors()) rec$steps[[1]]$keep_original_cols <- NULL expect_snapshot( rec <- prep(rec) ) expect_error( bake(rec, new_data = mtcars), NA ) }) test_that("printing", { skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(HHV ~ carbon + hydrogen + oxygen + nitrogen + sulfur, data = biomass_tr) %>% step_normalize(all_predictors()) %>% step_ica(carbon, hydrogen, num_comp = 2) expect_snapshot(print(rec)) expect_snapshot(prep(rec)) }) test_that("tunable is setup to work with extract_parameter_set_dials", { skip_if_not_installed("dials") skip_if_not_installed("dimRed") skip_if_not_installed("fastICA") skip_if_not_installed("RSpectra") rec <- recipe(~., data = mtcars) %>% step_ica( all_predictors(), num_comp = hardhat::tune() ) params <- extract_parameter_set_dials(rec) expect_s3_class(params, "parameters") expect_identical(nrow(params), 1L) })