Check early stopping metric in the beginning of the training #542

Merged
5 changes: 3 additions & 2 deletions pytorch_lightning/callbacks/pt_callbacks.py
@@ -124,9 +124,10 @@ def on_epoch_end(self, epoch, logs=None):
         if current is None:
             warnings.warn(
                 f'Early stopping conditioned on metric `{self.monitor}`'
-                f' which is not available. Available metrics are: {",".join(list(logs.keys()))}',
+                f' which is not available, so early stopping will not work.'
+                f' Available metrics are: {",".join(list(logs.keys()))}',
                 RuntimeWarning)
+            stop_training = True

Member:

then you should return True

Contributor Author:

Not exactly. Returning True was the previous behavior, and it interrupted the training if the required metric was not found. Now it just gives a warning and training proceeds as though early stopping were not enabled. The point is that the callback should not stop the training if it can't find the metric.

Actually, in the current implementation this branch is not reachable, because we check for the availability of the metric during trainer initialization. But my idea was that if we decide to set early_stopping to True by default, this branch can be used to give a warning without stopping the training.

You can also look at #524 for more context.
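For illustration, here is a minimal standalone sketch of the warn-but-continue behavior described above (a hypothetical helper, not the actual EarlyStopping callback; only the warning message mirrors the diff):

import warnings

# Hypothetical standalone version of the missing-metric branch (illustration only).
def check_monitor(logs, monitor='val_loss'):
    current = logs.get(monitor)
    if current is None:
        warnings.warn(
            f'Early stopping conditioned on metric `{monitor}`'
            f' which is not available, so early stopping will not work.'
            f' Available metrics are: {",".join(list(logs.keys()))}',
            RuntimeWarning)
        return True  # flag the missing metric; the trainer decides how to react
    return False

check_monitor({'val_acc': 0.9})  # emits a RuntimeWarning and returns True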

             return stop_training
 
         if self.monitor_op(current - self.min_delta, self.best):
14 changes: 13 additions & 1 deletion pytorch_lightning/trainer/trainer.py
@@ -185,6 +185,8 @@ def __init__(self,
         # creates a default one if none passed in
         self.early_stop_callback = None
         self.configure_early_stopping(early_stop_callback, logger)
+        if self.enable_early_stop:
+            self.nb_sanity_val_steps = max(1, self.nb_sanity_val_steps)
Member:

maybe max(1, nb_sanity_val_steps) since earlier you have

if self.fast_dev_run:
    self.nb_sanity_val_steps = 1

Contributor Author:

But for exactly that reason it should be max(1, self.nb_sanity_val_steps) :)

We just take the previously determined final self.nb_sanity_val_steps and bump it to 1 if it is less than 1.

If we did it as you suggested, self.nb_sanity_val_steps would end up equal to the user-defined value in fast dev run mode, but it should be 1.
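As a rough standalone sketch of the ordering being argued here (the helper and variable names are made up for illustration; this is not the actual Trainer code):

# Illustrative sketch of the ordering discussed above (made-up helper, not Trainer code).
def resolve_sanity_steps(nb_sanity_val_steps, fast_dev_run, enable_early_stop):
    resolved = nb_sanity_val_steps
    if fast_dev_run:
        resolved = 1  # fast dev run forces a single sanity step

    if enable_early_stop:
        # max(1, resolved) only bumps values below 1 and keeps the fast_dev_run
        # override; max(1, nb_sanity_val_steps) on the raw argument would restore
        # the user-defined value instead.
        resolved = max(1, resolved)
    return resolved

print(resolve_sanity_steps(5, fast_dev_run=True, enable_early_stop=True))   # -> 1, not 5
print(resolve_sanity_steps(0, fast_dev_run=False, enable_early_stop=True))  # -> 1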

Contributor:

Let's not do this. People need to have the option of turning sanity_val_check off.

Contributor Author:

But how then will we check that early stopping will work correctly? (Note that we force this check only if early stopping is turned on.)

Contributor (@williamFalcon, Nov 30, 2019):

I understand what you're saying, but forcing the sanity check on EVERYONE will certainly block some esoteric research or production cases, so we can't do this.

But I think this is on the user at that point. If they turn the sanity check off, it's on them and they are willingly exposing themselves to these kinds of issues... but for people who keep it on, we use what you suggest.

Contributor Author:

Done


         # configure checkpoint callback
         self.checkpoint_callback = checkpoint_callback
@@ -444,6 +446,7 @@ def run_pretrain_routine(self, model):
         # run tiny validation (if validation defined)
         # to make sure program won't crash during val
         ref_model.on_sanity_check_start()
+        callback_metrics = {}
         if self.get_val_dataloaders() is not None and self.nb_sanity_val_steps > 0:
             # init progress bars for validation sanity check
             pbar = tqdm.tqdm(desc='Validation sanity check', total=self.nb_sanity_val_steps,
@@ -453,12 +456,21 @@
             # dummy validation progress bar
             self.val_progress_bar = tqdm.tqdm(disable=True)
 
-        self.evaluate(model, self.get_val_dataloaders(), self.nb_sanity_val_steps, self.testing)
+        eval_results = self.evaluate(model, self.get_val_dataloaders(),
+                                     self.nb_sanity_val_steps, False)
+        _, _, _, callback_metrics, _ = self.process_output(eval_results)
 
         # close progress bars
         self.main_progress_bar.close()
         self.val_progress_bar.close()
 
+        if (self.enable_early_stop and
+                callback_metrics.get(self.early_stop_callback.monitor) is None):
+            raise RuntimeError(f"Early stopping was configured to monitor "
+                               f"{self.early_stop_callback.monitor} but it is not available "
+                               f"after validation_end. Available metrics are: "
+                               f"{','.join(list(callback_metrics.keys()))}")
 
         # init progress bar
         pbar = tqdm.tqdm(leave=True, position=2 * self.process_position,
                          disable=not self.show_progress_bar, dynamic_ncols=True, unit='batch',
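For context, a minimal user-side sketch of the situation this new check guards against (assumes the circa-0.5.x EarlyStopping callback and Trainer arguments referenced in this PR; `model` stands in for a user-defined LightningModule and is not shown):

# Illustrative user-side sketch (circa-0.5.x API; not part of this PR's diff).
from pytorch_lightning import Trainer
from pytorch_lightning.callbacks import EarlyStopping

# Early stopping is told to watch 'val_loss' ...
early_stop = EarlyStopping(monitor='val_loss', patience=3)
trainer = Trainer(early_stop_callback=early_stop, nb_sanity_val_steps=2)

# ... but if the LightningModule's validation_end only returns, say, {'val_acc': ...}
# and never 'val_loss', the sanity validation run now raises a RuntimeError before
# training starts, instead of silently training without early stopping.
# trainer.fit(model)  # `model`: a user-defined LightningModule (not shown here)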