Implement luz_callback_validation_check #56

Draft · wants to merge 2 commits into base: main
1 change: 1 addition & 0 deletions DESCRIPTION
@@ -47,6 +47,7 @@ Collate:
'accelerator.R'
'utils.R'
'callbacks.R'
'callback-validation-check.R'
'callbacks-interrupt.R'
'callbacks-profile.R'
'context.R'
1 change: 1 addition & 0 deletions NAMESPACE
@@ -19,6 +19,7 @@ export(luz_callback_model_checkpoint)
export(luz_callback_profile)
export(luz_callback_progress)
export(luz_callback_train_valid)
export(luz_callback_validation_check)
export(luz_load)
export(luz_load_model_weights)
export(luz_metric)
74 changes: 74 additions & 0 deletions R/callback-validation-check.R
@@ -0,0 +1,74 @@
#' @include callbacks.R
NULL

#' Validation Check
#'
#' Checks the validation loop before fitting the model.
#'
#' @param batches Number of validation batches to check. Default is 2.
#'
#' @note The training loop is usually much longer than the validation
#' loop, so issues in the validation loop may not surface until after a
#' long training runtime. This callback runs the validation loop on the
#' first `batches` batches before training begins, then proceeds with the
#' standard training process.
#'
#' @note Printing can be disabled by passing `verbose = FALSE` to
#' [fit.luz_module_generator()].
#'
#' @family luz_callbacks
#'
#' @returns
#' A `luz_callback`.
#'
#' @export
luz_callback_validation_check <- luz_callback(
"validation_check_callback",
initialize = function(batches = 2) {
if (!rlang::is_scalar_integerish(batches)) {
rlang::abort("`batches` must be a single integer value.")
}
self$batches <- batches
},
on_fit_begin = function() {
if (is.null(ctx$valid_data)) return()
if (self$batches <= 0) return()

ctx$model$eval()
Member:

We might want to extract this out into a function:

From luz/R/callbacks.R, lines 298 to 300 at 6e0bb77:

ctx$model$eval()
ctx$training <- FALSE
ctx$loss <- list()

And reuse it here, so we make sure the same state changes are always applied?
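
A minimal sketch of that extraction (hypothetical; `ctx_prepare_validation()` is an assumed name, not part of luz):

# Hypothetical helper: centralizes the state changes needed before a
# validation pass, so this callback and R/callbacks.R stay in sync.
ctx_prepare_validation <- function(ctx) {
  ctx$model$eval()       # put the torch module in eval mode
  ctx$training <- FALSE  # mark the context as not training
  ctx$loss <- list()     # reset accumulated losses
}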

    ctx$training <- FALSE

    self$initialize_progress_bar()

    i <- 0
    torch::with_no_grad({
      coro::loop(for (batch in ctx$valid_data) {
        self$validate_one_batch(batch)
        self$tick_progress_bar(self$loss)
        i <- i + 1
        if (i >= self$batches) break # only check the first `batches` batches
      })
    })
  },
  validate_one_batch = function(batch) {
    input <- list(batch[[1]]) # wrap the single input; multi-input models are not handled here
    target <- batch[[2]]
    pred <- do.call(ctx$model, input)
    self$loss <- ctx$model$loss(pred, target)
Member:

I think in general we would want to do the full validation step, because the errors could be in any of the callbacks, etc. But we would need to take care of the side effects that this might cause.

We would need to call valid_one_step() and then make sure we can reset the state. I'm not sure yet what the best way to do that would be.
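
For illustration, a hedged sketch of one possible reset strategy (the snapshotted fields and the `valid_one_step()` call are assumptions about luz internals):

# Hypothetical sketch: snapshot the mutable ctx fields, run the full
# validation step (callbacks included), then restore the snapshot so the
# check leaves no trace in the real fitting state.
snapshot <- list(loss = ctx$loss, metrics = ctx$metrics, pred = ctx$pred)
valid_one_step(batch)  # assumed internal: runs the full validation step
ctx$loss <- snapshot$loss
ctx$metrics <- snapshot$metrics
ctx$pred <- snapshot$pred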

Member:

I was thinking about this problem. It feels to me that the safest way would be, in on_fit_begin(), to call fit again and add a callback that breaks the training loop after `batches` steps, for both training and validation. This way no side effects would interfere with the actual training loop, but we would still run the full loop, which would detect the other possible bugs.

I think this is possible if the first thing we do in the ctx object is save a list with all the arguments that were passed to fit, before we do any kind of manipulation (like we do for callbacks). To avoid infinite recursion we could check ctx$callbacks for the presence of the callback that breaks the loop.
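
A minimal sketch of such a loop-breaking callback (hypothetical: the condition class is made up, and fit() would need a handler, perhaps via ctx$handlers, that catches it and exits the loop cleanly):

# Hypothetical sketch, not part of this PR: counts batches in each phase
# and signals a classed condition after `batches` steps.
luz_callback_break_loop <- luz_callback(
  "break_loop_callback",
  initialize = function(batches = 2) {
    self$batches <- batches
  },
  on_train_begin = function() self$seen <- 0,
  on_valid_begin = function() self$seen <- 0,
  on_train_batch_end = function() {
    self$seen <- self$seen + 1
    if (self$seen >= self$batches) rlang::abort("break", class = "luz_break_loop")
  },
  on_valid_batch_end = function() {
    self$seen <- self$seen + 1
    if (self$seen >= self$batches) rlang::abort("break", class = "luz_break_loop")
  }
)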

Contributor Author:

Yeah, I've kind of gone in circles here. We want to call the validation callbacks so it's a complete check of the validation loop, but I was worried about any changes in state this might cause. I did consider using valid_one_batch(), but at the time decided against it for the reasons above.

Contributor Author (@mattwarkentin, Jul 30, 2021):

Somewhat related question: when ctx$call_callbacks("on_..._...") is called and multiple callbacks have methods for that breakpoint, in what order are they called? Default callbacks first, user-supplied callbacks second?

Member:

Yes, they are called in that order: default callbacks, then user callbacks.

I think that if we call fit again there would be no interference; the only difference is that it would also test the training loop. But we could also skip that anyway...

Contributor Author:

I did actually think about calling fit() again inside on_fit_begin(), but decided against it. You're right, though: it would be a good way to check both the training and validation loops before committing to a full fit.

Member (@dfalbel, Jul 30, 2021):

Thinking again, there could still be some side effects, e.g. callbacks passed by the user can have side effects outside of the R session (maybe writing to a file or something like that). So maybe we want to call fit again with only the default callbacks plus the one that breaks the training loop.

This is not completely ideal, because there would still be callbacks that could fail in the 'real' pass. But it sounds like enough, I guess.

Contributor Author:

I agree with only calling the default callbacks. My original reason for avoiding callbacks was loggers and other things being written to disk. But if we only run the default callbacks, we avoid this issue. The function docs can just point out that user callbacks aren't validated.
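
For illustration, a hedged sketch of that final shape (`ctx$fit_args` as saved fit arguments and `default_callbacks()` are assumptions, and `luz_callback_break_loop()` is the sketch from the earlier comment):

# Hypothetical on_fit_begin(): re-run fit() with only luz's default
# callbacks plus the loop breaker, so user-supplied callbacks (loggers,
# checkpointers, ...) cause no side effects during the check.
on_fit_begin = function() {
  # recursion guard: skip if the loop breaker is already installed
  if (any(sapply(ctx$callbacks, inherits, "break_loop_callback"))) return()
  args <- ctx$fit_args                     # assumed: args saved at the top of fit()
  args$callbacks <- c(default_callbacks(), # assumed helper returning luz's defaults
                      list(luz_callback_break_loop(self$batches)))
  do.call(fit, c(list(ctx$module), args))  # dry-run both loops on a few batches
}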

  },
  initialize_progress_bar = function() {
    format <- "Validation check: :current/:total [:bar] - Loss: :loss"
    self$pb <- progress::progress_bar$new(
      force = getOption("luz.force_progress_bar", FALSE),
      show_after = 0,
      format = format,
      total = self$batches,
      clear = FALSE
    )
  },
  tick_progress_bar = function(token) {
    if (ctx$verbose) {
      loss <- format(round(as.numeric(token), digits = 4), nsmall = 4)
      self$pb$tick(tokens = list(loss = loss))
    }
  }
)
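
For context, a usage sketch of the new callback (illustrative only: `net`, `train_dl`, and `valid_dl` are assumed to be a luz module and torch dataloaders):

# Illustrative usage: check 2 validation batches before training starts.
library(luz)
library(magrittr) # for %>%

fitted <- net %>%
  setup(
    loss = torch::nn_cross_entropy_loss(),
    optimizer = torch::optim_adam
  ) %>%
  fit(
    train_dl,
    epochs = 10,
    valid_data = valid_dl,
    callbacks = list(luz_callback_validation_check(batches = 2))
  )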
3 changes: 2 additions & 1 deletion R/module.R
@@ -413,8 +413,9 @@ clean_context <- function(ctx) {
"pred",
"opt",
"opt_name",
"data",
"handlers",
"data",
"train_data",
"valid_data",
"loss",
"input",
The following generated .Rd files are not rendered by default on GitHub:

3 changes: 2 additions & 1 deletion man/ctx.Rd
3 changes: 2 additions & 1 deletion man/luz_callback.Rd
1 change: 1 addition & 0 deletions man/luz_callback_csv_logger.Rd
1 change: 1 addition & 0 deletions man/luz_callback_early_stopping.Rd
1 change: 1 addition & 0 deletions man/luz_callback_interrupt.Rd
1 change: 1 addition & 0 deletions man/luz_callback_lr_scheduler.Rd
1 change: 1 addition & 0 deletions man/luz_callback_metrics.Rd
1 change: 1 addition & 0 deletions man/luz_callback_model_checkpoint.Rd
1 change: 1 addition & 0 deletions man/luz_callback_profile.Rd
1 change: 1 addition & 0 deletions man/luz_callback_progress.Rd
1 change: 1 addition & 0 deletions man/luz_callback_train_valid.Rd
41 changes: 41 additions & 0 deletions man/luz_callback_validation_check.Rd