Commit abd3e85

Adding tests
1 parent 81b4193 commit abd3e85

File tree

9 files changed: +484 -5 lines changed

tests/testthat.R

Lines changed: 2 additions & 2 deletions
@@ -7,6 +7,6 @@
 # * https://testthat.r-lib.org/articles/special-files.html
 
 library(testthat)
-library(dpl)
+library(kerasnip)
 
-test_check("dpl")
+test_check("kerasnip")

tests/testthat/helper-keras.R

Lines changed: 19 additions & 0 deletions
@@ -0,0 +1,19 @@
# Helper to skip tests if Keras is not configured
library(parsnip)
library(recipes)
library(workflows)
library(modeldata)
library(rsample)
library(dials)
library(tune)

skip_if_no_keras <- function() {
  testthat::skip_if_not_installed("keras3")

  # is_keras_available() checks for the python 'keras' module and a backend.
  # This is the most reliable way to check for a working installation.
  # testthat::skip_if_not(
  #   keras3::is_keras_available(),
  #   "Keras 3 and a backend (e.g., tensorflow) are not available for testing"
  # )
}
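
Note: testthat sources tests/testthat/helper-*.R files before any test file runs, so skip_if_no_keras() and the attached packages are available throughout the suite. A minimal usage sketch (hypothetical test, mirroring the pattern used by the suites in this commit):

test_that("sketch: guard a Keras-dependent test", {
  # Skips on machines where keras3 is not installed, instead of failing.
  skip_if_no_keras()
  expect_true(TRUE)
})
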
Lines changed: 93 additions & 0 deletions
@@ -0,0 +1,93 @@
test_that("E2E: Classification spec generation, fitting, and prediction works", {
  skip_if_no_keras()

  input_block_class <- function(model, input_shape) {
    keras3::keras_model_sequential(input_shape = input_shape)
  }
  dense_block_class <- function(model, units = 16) {
    model |>
      keras3::layer_dense(units = units, activation = "relu")
  }
  output_block_class <- function(model, num_classes) {
    model |> keras3::layer_dense(units = num_classes, activation = "softmax")
  }

  create_keras_spec(
    model_name = "e2e_mlp_class",
    layer_blocks = list(
      input = input_block_class,
      dense = dense_block_class,
      output = output_block_class
    ),
    mode = "classification"
  )

  spec <- e2e_mlp_class(
    num_dense = 2,
    dense_units = 8,
    epochs = 2
  ) |>
    set_engine("keras")

  # --- Multiclass test ---
  multi_data <- iris
  rec_multi <- recipe(Species ~ ., data = multi_data)
  wf_multi <- workflow(rec_multi, spec)

  expect_no_error(fit_multi <- fit(wf_multi, data = multi_data))
  expect_s3_class(fit_multi, "workflow")

  preds_class_multi <- predict(
    fit_multi,
    new_data = multi_data[1:5, ],
    type = "class"
  )
  expect_s3_class(preds_class_multi, "tbl_df")
  expect_equal(names(preds_class_multi), ".pred_class")
  expect_equal(nrow(preds_class_multi), 5)
  expect_equal(
    levels(preds_class_multi$.pred_class),
    levels(multi_data$Species)
  )

  preds_prob_multi <- predict(
    fit_multi,
    new_data = multi_data[1:5, ],
    type = "prob"
  )
  expect_s3_class(preds_prob_multi, "tbl_df")
  expect_equal(
    names(preds_prob_multi),
    paste0(".pred_", levels(multi_data$Species))
  )
  expect_equal(nrow(preds_prob_multi), 5)
  expect_true(all(abs(rowSums(preds_prob_multi) - 1) < 1e-5))

  # --- Binary test ---
  binary_data <- modeldata::two_class_dat
  rec_bin <- recipe(Class ~ ., data = binary_data)
  wf_bin <- workflow(rec_bin, spec)

  expect_no_error(fit_bin <- fit(wf_bin, data = binary_data))
  expect_s3_class(fit_bin, "workflow")

  preds_class_bin <- predict(
    fit_bin,
    new_data = binary_data[1:5, ],
    type = "class"
  )
  expect_s3_class(preds_class_bin, "tbl_df")
  expect_equal(names(preds_class_bin), ".pred_class")
  expect_equal(nrow(preds_class_bin), 5)
  expect_equal(levels(preds_class_bin$.pred_class), levels(binary_data$Class))

  preds_prob_bin <- predict(
    fit_bin,
    new_data = binary_data[1:5, ],
    type = "prob"
  )
  expect_s3_class(preds_prob_bin, "tbl_df")
  expect_equal(names(preds_prob_bin), c(".pred_Class1", ".pred_Class2"))
  expect_equal(nrow(preds_prob_bin), 5)
  expect_true(all(abs(rowSums(preds_prob_bin) - 1) < 1e-5))
})
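
Note: the convention this test exercises is that create_keras_spec() generates a spec function named after model_name, where each block contributes a num_<block> argument (how many times the block repeats) and <block>_<arg> arguments (the block's own parameters), hence num_dense and dense_units above. A condensed sketch of the same flow (demo_mlp is a hypothetical name; assumes kerasnip is attached and a keras3 backend is installed):

create_keras_spec(
  model_name = "demo_mlp",
  layer_blocks = list(
    input = function(model, input_shape) {
      keras3::keras_model_sequential(input_shape = input_shape)
    },
    dense = function(model, units = 16) {
      model |> keras3::layer_dense(units = units, activation = "relu")
    },
    output = function(model, num_classes) {
      model |> keras3::layer_dense(units = num_classes, activation = "softmax")
    }
  ),
  mode = "classification"
)

# demo_mlp() now exists: num_dense repeats the dense block, and
# dense_units maps to its units argument.
fit_obj <- demo_mlp(num_dense = 1, dense_units = 4, epochs = 1) |>
  set_engine("keras") |>
  fit(Species ~ ., data = iris)

predict(fit_obj, new_data = head(iris), type = "prob")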

tests/testthat/test-e2e-features.R

Lines changed: 137 additions & 0 deletions
@@ -0,0 +1,137 @@
test_that("E2E: Customizing main arguments works", {
  skip_if_no_keras()

  input_block_feat <- function(model, input_shape) {
    keras3::keras_model_sequential(input_shape = input_shape)
  }
  dense_block_feat <- function(model, units = 16) {
    model |> keras3::layer_dense(units = units, activation = "relu")
  }
  output_block_feat <- function(model) {
    model |> keras3::layer_dense(units = 1)
  }

  create_keras_spec(
    model_name = "e2e_mlp_feat",
    layer_blocks = list(
      input = input_block_feat,
      dense = dense_block_feat,
      output = output_block_feat
    ),
    mode = "regression"
  )

  # Main arguments (like compile_*) should be set in the spec function,
  # not in set_engine().
  spec <- e2e_mlp_feat(
    epochs = 2,
    compile_optimizer = "sgd",
    compile_loss = "mae",
    compile_metrics = c("mean_squared_error")
  ) |>
    parsnip::set_engine("keras")

  # This should now run without the parsnip warning about removing arguments
  fit_obj <- NULL
  expect_no_warning(
    fit_obj <- parsnip::fit(spec, mpg ~ ., data = mtcars)
  )

  # Also verify the arguments were correctly used during compilation
  keras_model <- fit_obj$fit$fit
  compiled_loss <- keras_model$loss
  compiled_optimizer <- tolower(keras_model$optimizer$name)
  compiled_metrics <- sapply(
    keras_model$metrics[[2]]$metrics,
    function(m) m$name
  )

  # Keras might add suffixes or use different casings, so check flexibly
  expect_true(grepl("mae", compiled_loss))
  expect_true(grepl("sgd", compiled_optimizer))
  expect_true("mean_squared_error" %in% compiled_metrics)
})
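
Note: for contrast, a sketch of the discouraged pattern the comment in the test refers to (hypothetical spec_bad, reusing e2e_mlp_feat). Per that comment, routing compile_* arguments through set_engine() rather than the generated spec function is what previously triggered parsnip's warning about removing arguments:

# Discouraged (sketch): per the test comment, passing compile_* here
# instead of in e2e_mlp_feat() produced parsnip's removed-arguments warning.
spec_bad <- e2e_mlp_feat(epochs = 2) |>
  parsnip::set_engine("keras", compile_loss = "mae", compile_optimizer = "sgd")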

test_that("E2E: Customizing fit arguments works", {
  skip_if_no_keras()

  input_block_fit <- function(model, input_shape) {
    keras3::keras_model_sequential(input_shape = input_shape)
  }
  dense_block_fit <- function(model, units = 16) {
    model |> keras3::layer_dense(units = units, activation = "relu")
  }
  output_block_fit <- function(model) {
    model |> keras3::layer_dense(units = 1)
  }

  create_keras_spec(
    model_name = "e2e_mlp_fit",
    layer_blocks = list(
      input = input_block_fit,
      dense = dense_block_fit,
      output = output_block_fit
    ),
    mode = "regression"
  )

  # Fit arguments (like validation_split, callbacks) should be set in the
  # spec function, not in set_engine().
  spec <- e2e_mlp_fit(
    fit_validation_split = 0.2,
    fit_callbacks = list(keras3::callback_early_stopping(patience = 1)),
    fit_epochs = 3,
    compile_metrics = "mean_squared_error"
  ) |>
    parsnip::set_engine("keras")

  # This will run without error if the arguments are passed correctly
  fit_obj <- NULL
  expect_no_error(fit_obj <- parsnip::fit(spec, mpg ~ ., data = mtcars))

  # Check that the callback was used (model should stop early)
  expect_lt(length(fit_obj$fit$history$metrics$loss), 5)
})

test_that("E2E: Setting num_blocks = 0 works", {
  skip_if_no_keras()

  input_block_zero <- function(model, input_shape) {
    keras3::keras_model_sequential(input_shape = input_shape)
  }
  dense_block_zero <- function(model, units = 16) {
    model |> keras3::layer_dense(units = units, activation = "relu")
  }
  output_block_zero <- function(model) {
    model |> keras3::layer_dense(units = 1)
  }

  create_keras_spec(
    model_name = "e2e_mlp_zero",
    layer_blocks = list(
      input = input_block_zero,
      dense = dense_block_zero,
      output = output_block_zero
    ),
    mode = "regression"
  )

  spec <- e2e_mlp_zero(num_dense = 0, epochs = 2) |>
    parsnip::set_engine("keras")
  # This should fit a model with only an input and output layer
  expect_no_error(parsnip::fit(spec, mpg ~ ., data = mtcars))
})

test_that("E2E: Error handling for reserved names works", {
  bad_blocks <- list(
    compile = function(model) model, # "compile" is a reserved name
    dense = function(model, u = 1) model |> keras3::layer_dense(units = u)
  )

  expect_error(
    create_keras_spec("bad_spec", bad_blocks),
    regexp = "`compile` and `optimizer` are protected names"
  )
})
Lines changed: 93 additions & 0 deletions
@@ -0,0 +1,93 @@
test_that("E2E: Multi-block model tuning works", {
  skip_if_no_keras()

  input_block_mb <- function(model, input_shape) {
    keras3::keras_model_sequential(input_shape = input_shape)
  }

  starting_layers <- function(model, layer1_units = 16, layer2_units = 32) {
    model |>
      keras3::layer_dense(units = layer1_units, activation = "relu") |>
      keras3::layer_dense(units = layer2_units, activation = "relu")
  }

  ending_layers <- function(model, units = 32, dropout = 0.2) {
    model |>
      keras3::layer_dense(units = units, activation = "relu") |>
      keras3::layer_dropout(rate = dropout)
  }

  output_block_mb <- function(model, num_classes) {
    model |> keras3::layer_dense(units = num_classes, activation = "softmax")
  }

  create_keras_spec(
    model_name = "mb_mt",
    layer_blocks = list(
      input = input_block_mb,
      start = starting_layers,
      end = ending_layers,
      output = output_block_mb
    ),
    mode = "classification"
  )

  tune_spec <- mb_mt(
    num_start = tune(),
    start_layer1_units = tune(),
    start_layer2_units = tune(),
    end_units = tune(),
    epochs = 1
  ) |>
    set_engine("keras")

  rec <- recipe(Species ~ ., data = iris)
  wf <- workflow(rec) |>
    add_model(tune_spec)

  folds <- rsample::vfold_cv(iris, v = 2)

  params <- extract_parameter_set_dials(wf) |>
    update(
      num_start = dials::num_terms(c(1, 2)),
      start_layer1_units = dials::hidden_units(c(4, 8)),
      start_layer2_units = dials::hidden_units(c(8, 16)),
      end_units = dials::hidden_units(c(4, 8))
    )

  grid <- grid_regular(params, levels = 2)
  control <- control_grid(
    save_pred = FALSE,
    verbose = FALSE,
    save_workflow = TRUE
  )

  # Use try() because tuning can sometimes fail for non-package reasons
  tune_res <- try(
    tune_grid(
      wf,
      resamples = folds,
      grid = grid,
      control = control
    ),
    silent = TRUE
  )

  if (inherits(tune_res, "try-error")) {
    testthat::skip(paste("Tuning failed with error:", as.character(tune_res)))
  }

  expect_s3_class(tune_res, "tune_results")

  metrics <- collect_metrics(tune_res)
  expect_s3_class(metrics, "tbl_df")
  expect_true(all(
    c("num_start", "start_layer1_units", "start_layer2_units", "end_units") %in%
      names(metrics)
  ))

  expect_no_error(
    best_fit <- tune::fit_best(tune_res)
  )
  expect_s3_class(best_fit, "workflow")
})
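
Note: fit_best() is the shortcut used above. An equivalent sketch via the longer tidymodels route, assuming tune's default classification metrics (accuracy among them) were computed during tuning:

# Pick the winning parameters, finalize the workflow, and refit on the
# full training data.
best_params <- tune::select_best(tune_res, metric = "accuracy")
final_wf <- tune::finalize_workflow(wf, best_params)
final_fit <- fit(final_wf, data = iris)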
