2019-11-05 15:41:59 +00:00
|
|
|
import os
|
2020-02-27 21:21:14 +00:00
|
|
|
from abc import ABC, abstractmethod
|
2020-06-12 15:23:18 +00:00
|
|
|
from typing import List, Callable, Optional
|
2019-11-05 15:41:59 +00:00
|
|
|
|
2020-04-24 00:46:18 +00:00
|
|
|
|
|
|
|
from pytorch_lightning.callbacks import Callback, ModelCheckpoint, EarlyStopping, ProgressBarBase, ProgressBar
|
2020-02-27 21:21:14 +00:00
|
|
|
from pytorch_lightning.loggers import LightningLoggerBase
|
2020-04-24 00:46:18 +00:00
|
|
|
from pytorch_lightning.utilities.exceptions import MisconfigurationException
|
2019-10-22 01:16:51 +00:00
|
|
|
|
|
|
|
|
2019-12-04 15:57:32 +00:00
|
|
|
class TrainerCallbackConfigMixin(ABC):
    """Mixin that turns user-supplied callback options into callback objects.

    Each ``configure_*`` method receives the value given for one option
    (a boolean flag or a ready-made callback) and returns the callback to use,
    or ``None`` when that feature ends up disabled.
    """

    # this is just a summary on variables used in this abstract class,
    #  the proper values/initialisation should be done in child class
    callbacks: List[Callback]
    default_root_dir: str
    logger: LightningLoggerBase
    weights_save_path: Optional[str]
    ckpt_path: str
    checkpoint_callback: Optional[ModelCheckpoint]

    @property
    @abstractmethod
    def slurm_job_id(self) -> int:
        """Warning: this is just empty shell for code implemented in other class."""

    @abstractmethod
    def save_checkpoint(self, *args):
        """Warning: this is just empty shell for code implemented in other class."""

    @abstractmethod
    def is_overridden(self, *args):
        """Warning: this is just empty shell for code implemented in other class."""

    def configure_checkpoint_callback(self, checkpoint_callback) -> Optional[ModelCheckpoint]:
        """Resolve the ``checkpoint_callback`` option into a callback or ``None``.

        Args:
            checkpoint_callback: ``True`` builds a default ``ModelCheckpoint``
                (``filepath=None``) that monitors ``'loss'`` when
                ``validation_step`` is not overridden and ``'val_loss'``
                otherwise. ``False`` disables checkpointing. Any other value
                is used as given.

        Returns:
            The resolved callback, or ``None`` when checkpointing is disabled.
            A truthy result has its ``save_function`` attribute set to
            ``self.save_checkpoint`` before being returned.

        Side effects:
            When ``self.weights_save_path`` is ``None`` it is replaced by
            ``self.default_root_dir``.
        """
        if checkpoint_callback is True:
            # when no val step is defined, use 'loss' otherwise 'val_loss'
            train_step_only = not self.is_overridden('validation_step')
            monitor_key = 'loss' if train_step_only else 'val_loss'
            checkpoint_callback = ModelCheckpoint(
                filepath=None,
                monitor=monitor_key
            )
        elif checkpoint_callback is False:
            checkpoint_callback = None

        if checkpoint_callback:
            checkpoint_callback.save_function = self.save_checkpoint

        # if weights_save_path is still none here, fall back to default_root_dir
        if self.weights_save_path is None:
            self.weights_save_path = self.default_root_dir

        return checkpoint_callback

    def configure_early_stopping(self, early_stop_callback) -> Optional[EarlyStopping]:
        """Resolve the ``early_stop_callback`` option into a callback or ``None``.

        Args:
            early_stop_callback: ``True`` builds a default ``EarlyStopping``
                (``monitor='val_loss'``, ``patience=3``, ``strict=True``,
                ``verbose=True``, ``mode='min'``). Any falsy value, including
                ``False`` and ``None``, disables early stopping. Any other
                value is returned unchanged.

        Returns:
            The resolved callback, or ``None`` when early stopping is disabled.
        """
        # NOTE: this test used to read ``early_stop_callback is True or None``,
        # which parses as ``(early_stop_callback is True) or None``. The
        # ``or None`` operand never had any effect, so ``None`` has always
        # meant "disabled"; the condition now states that explicitly.
        if early_stop_callback is True:
            return EarlyStopping(
                monitor='val_loss',
                patience=3,
                strict=True,
                verbose=True,
                mode='min'
            )

        if not early_stop_callback:
            return None

        # a user-provided callback is used as given
        return early_stop_callback

    def configure_progress_bar(self, refresh_rate: int = 1,
                               process_position: int = 0) -> Optional[ProgressBarBase]:
        """Select the progress bar callback, creating a default one if needed.

        Args:
            refresh_rate: forwarded to the default ``ProgressBar``; a value
                that is not greater than 0 means no default bar is created.
            process_position: forwarded to the default ``ProgressBar``.

        Returns:
            The single ``ProgressBarBase`` instance already present in
            ``self.callbacks``; otherwise a newly created ``ProgressBar``
            (which is also appended to ``self.callbacks``) when
            ``refresh_rate > 0``; otherwise ``None``.

        Raises:
            MisconfigurationException: if ``self.callbacks`` holds more than
                one ``ProgressBarBase`` instance.
        """
        progress_bars = [c for c in self.callbacks if isinstance(c, ProgressBarBase)]
        if len(progress_bars) > 1:
            raise MisconfigurationException(
                'You added multiple progress bar callbacks to the Trainer, but currently only one'
                ' progress bar is supported.'
            )
        elif len(progress_bars) == 1:
            # the user supplied their own bar: use it and do not register another
            progress_bar_callback = progress_bars[0]
        elif refresh_rate > 0:
            progress_bar_callback = ProgressBar(
                refresh_rate=refresh_rate,
                process_position=process_position,
            )
            self.callbacks.append(progress_bar_callback)
        else:
            progress_bar_callback = None

        return progress_bar_callback
|