Source code for zensols.deeplearn.cli

"""Command line entry point to the application using the application CLI.

"""
from __future__ import annotations
__author__ = 'Paul Landes'
from typing import (
    List, Dict, Any, Type, Callable, Union, ClassVar, TYPE_CHECKING
)
if TYPE_CHECKING:
    from .result.manager import ModelResultManager, ModelResult
    from .result.report import ModelResultReporter
    from zensols.datdesc import DataDescriber
from dataclasses import dataclass, field
from enum import Enum, auto
import logging
import gc
import sys
import itertools as it
import copy as cp
from io import TextIOBase
from pathlib import Path
import pandas as pd
from zensols.util.std import stdout
from zensols.persist import (
    dealloc, Deallocatable, PersistedWork, persisted, Stash
)
from zensols.config import (
    Writable, Configurable, ImportConfigFactory, DictionaryConfig
)
from zensols.cli import (
    ApplicationError, Application, ApplicationFactory,
    ActionCliManager, Invokable, CliHarness,
)
from zensols.deeplearn import DeepLearnError, TorchConfig
from zensols.deeplearn.model import ModelFacade, ModelError, ModelPacker

logger = logging.getLogger(__name__)



[docs]
class InfoItem(Enum):
    """Selects which piece of information
    :meth:`.FacadeInfoApplication.print_information` dumps.

    """
    # the batch metadata
    meta = auto()
    # the executor settings
    param = auto()
    # the executor's model
    model = auto()
    # the model (or application) configuration
    config = auto()
    # the configured feature stash
    feature = auto()
    # a small sample of batches
    batch = auto()




[docs]
class ClearType(Enum):
    """Selects which data is deleted (cleared) before batches are created.

    """
    # delete nothing
    none = auto()
    # delete only the batches
    batch = auto()
    # delete the batches and the data they were created from
    source = auto()




[docs]
class Format(Enum):
    """The output format used when writing results and reports.

    """
    # human readable text
    txt = auto()
    # JSON
    json = auto()
    # YAML
    yaml = auto()
    # comma separated values
    csv = auto()
    # LaTeX files written to a directory
    latex = auto()
    # rendered in a browser
    render = auto()




[docs]
class BatchReport(Enum):
    """The kind of report :meth:`.FacadeBatchApplication.batch` generates.

    """
    # no report: only prime the batch stash
    none = auto()
    # write the dataset splits
    split = auto()
    # write the labels to a CSV file
    labels = auto()
    # print the label variance
    stats = auto()




[docs]
class ReportType(Enum):
    """The kind of performance report :meth:`.FacadeResultApplication.run`
    creates.

    """
    # summary of the results
    combined = auto()
    # metrics by label
    label = auto()
    # majority label metrics
    majority = auto()




[docs]
@dataclass
class FacadeApplication(Deallocatable):
    """Base class for applications that use :class:`.ModelFacade`.

    """
    CLI_META = {'mnemonic_excludes': {'get_cached_facade', 'create_facade',
                                      'deallocate', 'clear_cached_facade'},
                'option_overrides': {'model_path': {'long_name': 'model',
                                                    'short_name': None},
                                     'out_format': {'long_name': 'format',
                                                    'short_name': 'f'}}}
    """Tell the command line app API to igonore subclass and client specific use
    case methods.

    """
    config: Configurable = field()
    """The config used to create facade instances."""

    facade_name: str = field(default='facade')
    """The client facade."""

    # simply copy this field and documentation to the implementation class to
    # add model path location (for those subclasses that don't have the
    # ``CLASS_INSPECTOR`` class level attribute set (see
    # :obj:`~zensols.introspect.insp.ClassInspector.INSPECT_META`);
    # this can also be set as a parameter such as with
    # :meth:`.FacadeModelApplication.test`
    model_path: Path = field(default=None)
    """The path to the model or use the last trained model if not provided.

    """
    config_factory_args: Dict[str, Any] = field(default_factory=dict)
    """The arguments given to the :class:`~zensols.config.ImportConfigFactory`,
    which could be useful for reloading all classes while debugingg.

    """
    config_overwrites: Configurable = field(default=None)
    """A configurable that clobbers any configuration in :obj:`config` for those
    sections/options set.

    """
    cache_global_facade: bool = field(default=True)
    """Whether to globally cache the facade returned by
    :meth:`get_cached_facade`.

    """
    model_config_overwrites: Configurable = field(default=None)
    """Configuration that is injected into the model loaded by the
    :class:`..model.ModelManager`.

    """
    def __post_init__(self):
        """Initialize the deallocation bookkeeping and the facade cache."""
        # everything created by :meth:`create_facade` is collected here and
        # released in :meth:`deallocate`
        self.dealloc_resources = []
        # storage behind the ``persisted`` decorator of
        # :meth:`get_cached_facade`
        facade_cache = PersistedWork(
            '_cached_facade', self, cache_global=self.cache_global_facade)
        self._cached_facade = facade_cache

    def _enable_cli_logging(self, facade: ModelFacade = None):
        """Turn off the progress bar and configure command line logging on a
        facade.

        :param facade: the facade to configure; if ``None``, a temporary facade
                       is created with :meth:`create_facade` and configured
                       inside a ``dealloc`` context

        """
        if facade is not None:
            facade.progress_bar = False
            facade.configure_cli_logging()
            return
        with dealloc(self.create_facade()) as tmp_facade:
            self._enable_cli_logging(tmp_facade)

    def _get_model_path(self) -> Path:
        """Return the model path used by :meth:`create_facade`, which is
        :obj:`model_path` in this implementation.

        """
        path: Path = self.model_path
        return path

    def _get_batch_stash(self, facade: ModelFacade) -> Stash:
        """Return the batch stash of ``facade``."""
        stash: Stash = facade.batch_stash
        return stash

    def _get_dataset_stash(self, facade: ModelFacade) -> Stash:
        """Return the dataset (split) stash of ``facade``.

        This is intentionally a different stash than the one returned by
        :meth:`_get_batch_stash`.

        :param facade: the facade from which to get the stash

        :return: the facade's ``dataset_stash``

        """
        return facade.dataset_stash

    def _get_batch_metrics(self, facade: ModelFacade) -> Stash:
        """Return the batch metrics obtained from ``facade``."""
        metrics = facade.get_batch_metrics()
        return metrics

    def _get_result_reporter(self, facade: ModelFacade) -> ModelResultReporter:
        """Return the (non cross-fold) result reporter of ``facade``."""
        reporter: ModelResultReporter = facade.get_result_reporter(
            cross_fold=False)
        return reporter


[docs]
    def create_facade(self) -> ModelFacade:
        """Create a new (non-shared) instance of the facade.

        When :meth:`_get_model_path` gives no path, the facade is instantiated
        from the :obj:`facade_name` section of the configuration.  Otherwise,
        only the facade class is looked up in the configuration and the facade
        is loaded from the model path.

        :return: the new facade, which is also added to
                 ``dealloc_resources``

        """
        # a fresh instance is created on every call since callers deallocate
        # the facade when they are finished with it
        config = self.config
        model_path = self._get_model_path()
        if self.config_overwrites is not None:
            # merge into a copy so that :obj:`config` is left untouched
            config = cp.deepcopy(config)
            config.merge(self.config_overwrites)
        factory_kwargs: Dict[str, Any] = self.config_factory_args
        if model_path is not None:
            if logger.isEnabledFor(logging.INFO):
                logger.info(f'loading model from {model_path}')
            # the factory is needed only long enough to resolve the class
            with dealloc(ImportConfigFactory(config, **factory_kwargs)) as cf:
                facade_cls: Type[ModelFacade] = cf.get_class(self.facade_name)
            loaded: ModelFacade = facade_cls.load_from_path(
                path=model_path,
                model_config_overwrites=self.model_config_overwrites)
            if logger.isEnabledFor(logging.DEBUG):
                logger.debug(
                    f'created facade: {type(loaded)} from path: {model_path}')
            self.dealloc_resources.append(loaded)
            return loaded
        cf = ImportConfigFactory(config, **factory_kwargs)
        created: ModelFacade = cf.instance(self.facade_name)
        if logger.isEnabledFor(logging.DEBUG):
            logger.debug(f'created facade: {created}')
        # the factory stays alive with the facade and is released with it
        self.dealloc_resources.extend((cf, created))
        return created


    @persisted('_cached_facade')
    def get_cached_facade(self) -> ModelFacade:
        """Return a facade created with :meth:`create_facade`; the result is
        stored by the ``persisted`` decorator under ``_cached_facade``.

        """
        facade: ModelFacade = self.create_facade()
        return facade


[docs]
    def clear_cached_facade(self):
        """Deallocate the cached facade of this application instance, if one
        was created, and clear the cache.

        """
        cache: PersistedWork = self._cached_facade
        if cache.is_set():
            # calling the persisted work returns the cached facade
            cache().deallocate()
        cache.clear()



[docs]
    def deallocate(self):
        """Deallocate this application, the resources collected by
        :meth:`create_facade` and the facade cache.

        """
        super().deallocate()
        resources = self.dealloc_resources
        self._try_deallocate(resources, recursive=True)
        self._cached_facade.deallocate()





[docs]
@dataclass
class FacadeInfoApplication(FacadeApplication):
    """Contains methods that provide information about the model via the facade.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'mnemonic_overrides': {'print_information': 'info'},
         'option_excludes': {'feature_stash_name'},
         'option_overrides': {'info_item': {'long_name': 'item',
                                            'short_name': 'i'},
                              'debug_value': {'long_name': 'execlevel',
                                              'short_name': None}}})

    feature_stash_name: str = field(default='feature_stash')
    """The section name of the stash to write for :obj:`.InfoItem.feature`."""


[docs]
    def print_information(self, info_item: InfoItem = None,
                          model_path: Path = None):
        """Output facade data set, vectorizer and other configuration
        information.

        :param info_item: what to print; if ``None`` the facade itself is
                          written

        :param model_path: the path to the model or use the last trained model
                           if not provided

        :raises DeepLearnError: if there is no output for ``info_item``

        """
        def dump_feature_stash():
            section: str = self.feature_stash_name
            if section not in facade.config.sections:
                return
            stash: Any = facade.config_factory(section)
            if isinstance(stash, Writable):
                stash.write()

        def dump_batches():
            # only the first two batches are written as a sample
            for batch in it.islice(facade.batch_stash.values(), 2):
                batch.write()

        def dump_config():
            if self.model_path is None:
                # no model was loaded: use the configuration of this app
                facade.config.write()
            else:
                # a model path was given, so write the model's configuration
                facade.model_config.write()

        # inspect a model specified by a path
        self.model_path = model_path

        # NOTE(review): ``_no_op`` is not set anywhere in the visible code;
        # presumably it is set externally to suppress output (see
        # :class:`.FacadeApplicationFactory`) -- confirm
        if hasattr(self, '_no_op'):
            return
        with dealloc(self.create_facade()) as facade:
            print(f'{facade.model_settings.model_name}:')
            writers = {
                None: facade.write,
                InfoItem.meta: facade.batch_metadata.write,
                InfoItem.param: facade.executor.write_settings,
                InfoItem.model: facade.executor.write_model,
                InfoItem.config: dump_config,
                InfoItem.feature: dump_feature_stash,
                InfoItem.batch: dump_batches,
            }
            writer = writers.get(info_item)
            if writer is None:
                raise DeepLearnError(f'No such info item: {info_item}')
            writer()



[docs]
    def debug(self, debug_value: int = None):
        """Debug the model.

        :param debug_value: the executor debugging level; ``True`` is used when
                            not given

        """
        if debug_value is None:
            debug_value = True
        with dealloc(self.create_facade()) as facade:
            facade.debug(debug_value)




@dataclass
class _DataDescriberProcessor(object):
    """A mixin that writes a data describer in one of the :class:`.Format`
    output formats.

    The class this is mixed in with must provide an ``_enable_cli_logging``
    method that accepts the facade.

    """
    # the directory used for LaTeX output when no output path is given
    _DEFAULT_LATEX_DIR: ClassVar[str] = 'model-results'
    # ``out_file`` sentinel that turns off all output
    NO_WRITE: ClassVar[str] = '_nowrite_'

    def _process_data_describer(self, out_file: Path, out_format: Format,
                                facade: ModelFacade, dd: DataDescriber,
                                res: ModelResult = None):
        """Write a data describer, or the result it was created from.

        :param out_file: the output path; nothing is written when this is
                         :obj:`NO_WRITE`

        :param out_format: the output format

        :param facade: passed to ``_enable_cli_logging`` before writing

        :param dd: the data to write; its first describer provides the CSV
                   data and the recommended file name

        :param res: the result written for the ``txt``, ``json`` and ``yaml``
                    formats, which are unsupported without it

        :raises ApplicationError: if ``out_format`` is not supported

        """
        def write_csv(writer: TextIOBase):
            dd.describers[0].df.to_csv(writer)

        def write_latex():
            dd.output_dir = \
                Path(self._DEFAULT_LATEX_DIR) if out_file is None else out_file
            logging.getLogger('zensols.datdesc').setLevel(logging.INFO)
            dd.save(include_excel=False)

        def render():
            from zensols.rend import ApplicationFactory
            ApplicationFactory.get_browser_manager()(dd)

        if out_file == self.NO_WRITE:
            return

        recommend_name: str = dd.describers[0].name.lower()
        writers: Dict[Format, Callable] = {
            Format.csv: write_csv,
            Format.latex: write_latex,
            Format.render: render,
        }
        if res:
            # these formats serialize the result rather than the describer
            writers.update({
                Format.txt: lambda w: res.write(writer=w),
                Format.json: lambda w: res.asjson(w, indent=4),
                Format.yaml: res.asyaml,
            })
        fn: Callable = writers.get(out_format)
        if fn is None:
            raise ApplicationError(
                f'Format not supported: {out_format.name}')
        self._enable_cli_logging(facade)
        if out_format in (Format.latex, Format.render):
            # these manage their own output rather than write to a stream
            fn()
        else:
            with stdout(out_file, recommend_name=recommend_name,
                        extension=out_format.name, logger=logger) as f:
                fn(f)



[docs]
@dataclass
class FacadeResultApplication(FacadeApplication, _DataDescriberProcessor):
    """Contains methods that dump previous results.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'mnemonic_overrides': {'result_ids': 'resids',
                                'run': 'resrun',
                                'summary': 'ressum',
                                'compare_results': 'rescmp'},
         'option_overrides': {'include_validation': {'long_name': 'validation',
                                                     'short_name': None},
                              'report_type': {'long_name': 'report'},
                              'describe': {'short_name': None},
                              'sort': {'short_name': 's'},
                              'out_file': {'long_name': 'outfile',
                                           'short_name': 'o'}}})


[docs]
    def result_ids(self):
        """Print the IDs of all archived results, one per line."""
        from zensols.deeplearn.result import ModelResultManager
        with dealloc(self.create_facade()) as facade:
            reporter = self._get_result_reporter(facade)
            manager: ModelResultManager = reporter.result_manager
            res_ids = manager.results_stash.keys()
            print('\n'.join(res_ids))


    def _run_combined(self, res_id: str = None, out_file: Path = None,
                      out_format: Format = None):
        """Report the performance results as a summary.

        :param res_id: the result ID or use the last if not given

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format, which defaults to text

        :return: the data describer with the summary

        """
        from zensols.datdesc import DataFrameDescriber, DataDescriber
        from zensols.deeplearn.result import \
            ModelResult, ModelResultReporter, PredictionsDataFrameFactory

        if out_format is None:
            out_format = Format.txt
        with dealloc(self.create_facade()) as facade:
            pred_factory: PredictionsDataFrameFactory = \
                facade.get_predictions_factory(name=res_id)
            result: ModelResult = pred_factory.result
            reporter = ModelResultReporter(
                facade.result_manager, include_validation=True)
            dfd: DataFrameDescriber = reporter.dataframe_describer
            dfd.name = 'run'
            if res_id is not None:
                # keep only the row of the requested result
                frame = dfd.df
                dfd.df = frame[frame['resid'] == res_id]
            dfd = dfd.transpose().derive_with_index_meta()
            dd = DataDescriber(
                name=f'{facade.model_settings.model_name} Model Results',
                describers=(dfd,))
            self._process_data_describer(
                out_file, out_format, facade, dd, result)
            return dd

    def _run_label(self, res_id: str = None, out_file: Path = None,
                   out_format: Format = None):
        """Report the performance results by label.

        :param res_id: the result ID or use the last if not given

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format, which defaults to CSV

        :return: the data describer with the label metrics

        """
        from zensols.datdesc import DataFrameDescriber, DataDescriber

        if out_format is None:
            out_format = Format.csv
        with dealloc(self.create_facade()) as facade:
            pred_factory = facade.get_predictions_factory(name=res_id)
            dfd: DataFrameDescriber = pred_factory.metrics_dataframe_describer
            dfd.df = dfd.df.reset_index(drop=True)
            # the container is named with the describer's name before the
            # describer is renamed
            dd = DataDescriber(name=dfd.name, describers=(dfd,))
            dfd.name = 'label'
            self._process_data_describer(out_file, out_format, facade, dd)
            return dd

    def _run_majority_label(self, res_id: str = None, out_file: Path = None,
                            out_format: Format = None):
        """Report the majority label metrics of a previous result set.

        :param res_id: the result ID or use the last if not given

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format, which defaults to CSV

        :return: the data describer with the majority label metrics

        """
        from zensols.datdesc import DataFrameDescriber, DataDescriber
        from zensols.deeplearn.result import PredictionsDataFrameFactory

        if out_format is None:
            out_format = Format.csv
        with dealloc(self.create_facade()) as facade:
            pred_factory: PredictionsDataFrameFactory = \
                facade.get_predictions_factory(name=res_id)
            metrics = pred_factory.majority_label_metrics_describer
            dfd: DataFrameDescriber = metrics.transpose()
            # the container is named with the describer's name before the
            # describer is renamed
            dd = DataDescriber(name=dfd.name, describers=(dfd,))
            dfd.name = 'majority-label'
            self._process_data_describer(out_file, out_format, facade, dd)
            return dd


[docs]
    def run(self, report_type: ReportType, res_id: str = None,
            out_file: Path = None, out_format: Format = None):
        """Report performance results.

        :param report_type: the kind of report to create

        :param res_id: the result ID or use the last if not given

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format

        :return: whatever the selected report method returns

        """
        reports: Dict[ReportType, Callable] = {
            ReportType.combined: self._run_combined,
            ReportType.label: self._run_label,
            ReportType.majority: self._run_majority_label,
        }
        report: Callable = reports[report_type]
        return report(res_id=res_id, out_file=out_file, out_format=out_format)



[docs]
    def summary(self, out_file: Path = None, out_format: Format = None,
                include_validation: bool = False):
        """Create a summary of all archived results.

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format, which defaults to CSV

        :param include_validation: whether to include validation results

        :return: the data describer with the summary

        """
        from zensols.datdesc import DataFrameDescriber, DataDescriber
        from zensols.deeplearn.result import ModelResultReporter

        if out_format is None:
            out_format = Format.csv
        with dealloc(self.create_facade()) as facade:
            reporter: ModelResultReporter = self._get_result_reporter(facade)
            reporter.include_validation = include_validation
            dfd: DataFrameDescriber = reporter.dataframe_describer
            # the container is named with the describer's name before the
            # describer is renamed
            dd = DataDescriber(name=dfd.name, describers=(dfd,))
            dfd.name = 'summary'
            self._process_data_describer(out_file, out_format, facade, dd)
            return dd



[docs]
    def compare_results(self, res_id_a: str, res_id_b: str):
        """Compare two previous archived result sets and write the
        comparison.

        :param res_id_a: the first result ID to compare

        :param res_id_b: the second result ID to compare

        """
        from zensols.deeplearn.result import ModelResultComparer
        with dealloc(self.create_facade()) as facade:
            comparer = ModelResultComparer(
                facade.result_manager, res_id_a, res_id_b)
            comparer.write()





[docs]
@dataclass
class FacadePackageApplication(FacadeApplication):
    """Contains methods that package models.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'option_overrides':
         {'archive_model_dir': {'long_name': 'archdir', 'metavar': 'DIR'},
          'train_model_dir': {'long_name': 'modeldir', 'metavar': 'DIR'}},
         'option_excludes': {'packer'}})

    packer: ModelPacker = field(default=None)
    """The model packer used to create the model distributions from this app."""


[docs]
    def pack(self, res_id: str = None, archive_model_dir: Path = Path('.')):
        """Package a distribution model.

        :param res_id: the result ID or use the last if not given

        :param archive_model_dir: the directory where the packaged model is
                                 written

        """
        if res_id is None:
            # ask a temporary facade for the ID of the last result
            with dealloc(self.create_facade()) as facade:
                self._enable_cli_logging(facade)
                manager = facade.result_manager
                res_id = manager.get_last_id()
        self._enable_cli_logging()
        packer: ModelPacker = self.packer
        packer.pack(res_id, archive_model_dir)



[docs]
    def update_config(self, res_id: str = None, train_model_dir: Path = None):
        """Update a model's configuration.

        :param res_id: the result ID or use the last if not given; only used
                       when ``train_model_dir`` is not given

        :param train_model_dir: the trained model directory, which has the
                                weight and state files; if not given, the
                                model path of the archived result is used

        """
        from zensols.deeplearn.result import ModelResultManager, ArchivedResult
        with dealloc(self.create_facade()) as facade:
            mng: ModelResultManager = facade.result_manager
            if train_model_dir is None:
                if res_id is None:
                    res_id = mng.get_last_id()
                res: ArchivedResult = mng.results_stash[res_id]
                train_model_dir = res.model_path
            facade.update_model_config_factory(train_model_dir)
            if logger.isEnabledFor(logging.INFO):
                # log the directory that was actually updated; the archived
                # result is not available when the directory was passed in
                logger.info(f'updated model: {train_model_dir}')





[docs]
@dataclass
class FacadeBatchApplication(FacadeApplication):
    """Create and analyze batches.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'option_overrides':
         {'clear_type': {'long_name': 'ctype',
                         'short_name': None},
          'clear': {'short_name': None},
          'report': {'short_name': None},
          'limit': {'short_name': None}},
         'mnemonic_overrides':
         {'batch': {'option_includes': {'limit', 'clear_type', 'report'}}}})

    def _write_batch_splits(self, facade: ModelFacade):
        """Write the stratified splits of the batch stash's split container.
        Nothing is written when the container is not a
        :class:`~zensols.dataset.StratifiedStashSplitKeyContainer`.

        """
        from zensols.dataset import \
            SplitStashContainer, StratifiedStashSplitKeyContainer
        batch_stash: Stash = self._get_batch_stash(facade)
        scont: SplitStashContainer = batch_stash.split_stash_container
        key_cont = getattr(scont, 'split_container', None)
        if not isinstance(key_cont, StratifiedStashSplitKeyContainer):
            return
        key_cont.stratified_write = True
        key_cont.write()

    def _write_batch_labels(self, facade: ModelFacade):
        """Write the label data frame of the batch metrics as a CSV file named
        after the model in the current directory.

        """
        metrics = self._get_batch_metrics(facade)
        df: pd.DataFrame = metrics.get_label_dataframe()
        model_name: str = facade.model_settings.normal_model_name
        csv_path = Path(f'{model_name}-split-labels.csv')
        df.to_csv(csv_path, index=False)
        if logger.isEnabledFor(logging.INFO):
            logger.info(f'wrote batch labels: {csv_path}')

    def _write_batch_stats(self, facade: ModelFacade):
        """Print the label variance of the batch metrics."""
        metrics = self._get_batch_metrics(facade)
        print(metrics.get_label_variance())

    def _prime(self, facade: ModelFacade):
        """Prime the batch stash of ``facade``."""
        stash = facade.batch_stash
        stash.prime()


[docs]
    def batch(self, limit: int = None, clear_type: ClearType = ClearType.none,
              report: BatchReport = BatchReport.none):
        """Create batches if not already, print statistics on the dataset.

        :param limit: the number of batches to create

        :param clear_type: what to delete to force recreate

        :param report: the type of report to generate

        """
        with dealloc(self.create_facade()) as facade:
            self._enable_cli_logging(facade)
            batch_stash: Stash = self._get_batch_stash(facade)
            dataset_stash: Stash = self._get_dataset_stash(facade)
            if clear_type == ClearType.source:
                batch_stash.clear_all()
                batch_stash.clear()
            elif clear_type == ClearType.batch:
                logger.info('clearing batches')
                batch_stash.clear()
            if limit is not None:
                batch_stash.batch_limit = limit
                if limit == 1:
                    # a single batch is created with a single worker
                    batch_stash.workers = 1
            dataset_stash.write()
            reporters: Dict[BatchReport, Callable] = {
                BatchReport.none: self._prime,
                BatchReport.split: self._write_batch_splits,
                BatchReport.labels: self._write_batch_labels,
                BatchReport.stats: self._write_batch_stats,
            }
            reporter: Callable = reporters[report]
            reporter(facade)





[docs]
@dataclass
class FacadeModelApplication(FacadeApplication):
    """Test, train and validate models.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'option_overrides': {'use_progress_bar': {'long_name': 'progress',
                                                   'short_name': 'p'},
                              'result_name': {'long_name': 'desc',
                                              'short_name': None}},
         'mnemonic_overrides': {'train_production': 'trainprod',
                                'early_stop': {'option_includes': {},
                                               'name': 'stop'}}})

    use_progress_bar: bool = field(default=False)
    """Display the progress bar."""


[docs]
    def create_facade(self) -> ModelFacade:
        """Create a new instance of the facade with the progress bar set per
        :obj:`use_progress_bar` and command line logging configured.

        """
        new_facade: ModelFacade = super().create_facade()
        new_facade.progress_bar = self.use_progress_bar
        new_facade.configure_cli_logging()
        return new_facade



[docs]
    def train(self, result_name: str = None):
        """Train the model and persist the results.

        :param result_name: a descriptor used in the results

        """
        with dealloc(self.create_facade()) as facade:
            if result_name is not None:
                facade.result_name = result_name
            for step in (facade.train, facade.persist_result):
                step()



[docs]
    def test(self, model_path: Path = None, result_name: str = None):
        """Test an existing model.

        :param model_path: the path to the model or use the last trained model
                           if not provided

        :param result_name: a descriptor used in the results

        """
        # NOTE(review): the ``model_path`` argument is not read here; the path
        # comes from :meth:`_get_model_path` -- confirm the caller sets
        # :obj:`model_path` on this instance
        resolved_path: Path = self._get_model_path()
        self.model_path = resolved_path
        with dealloc(self.create_facade()) as facade:
            if result_name is not None:
                facade.result_name = result_name
            facade.test()



[docs]
    def train_test(self, result_name: str = None):
        """Train and then test the model, then persist the results.

        :param result_name: a descriptor used in the results

        """
        with dealloc(self.create_facade()) as facade:
            if result_name is not None:
                facade.result_name = result_name
            for step in (facade.train, facade.test, facade.persist_result):
                step()



[docs]
    def train_production(self):
        """Train the production model with the facade's ``train_production``,
        then persist the results.

        """
        with dealloc(self.create_facade()) as facade:
            for step in (facade.train_production, facade.persist_result):
                step()



[docs]
    def early_stop(self):
        """Stop the training of the model by asking a newly created facade to
        stop training.

        """
        with dealloc(self.create_facade()) as stopper:
            stopper.stop_training()





[docs]
@dataclass
class FacadePredictApplication(FacadeApplication, _DataDescriberProcessor):
    """An application that provides prediction functionality.

    """
    CLI_META = ActionCliManager.combine_meta(
        FacadeApplication,
        {'mnemonic_overrides': {'predictions': 'respreds'}})

    def predictions(self, res_id: str = None, out_file: Path = None,
                    out_format: Format = None):
        """Write labels and predictions from the test set to a file (defaults to
        CSV).

        :param res_id: the result ID or use the last if not given

        :param out_file: the output path or ``-`` for standard out

        :param out_format: the output format

        :return: the data describer with the predictions

        :raises ApplicationError: if the predictions can not be created
                                  because of a model error

        """
        from zensols.datdesc import DataFrameDescriber, DataDescriber
        from zensols.deeplearn.result import PredictionsDataFrameFactory

        out_format = Format.csv if out_format is None else out_format
        with dealloc(self.create_facade()) as facade:
            # log from where the results are read and output file message
            facade.configure_cli_logging()
            logging.getLogger('zensols.deeplearn.result').setLevel(logging.INFO)
            logger.setLevel(logging.INFO)
            try:
                pred_factory: PredictionsDataFrameFactory = \
                    facade.get_predictions_factory(name=res_id)
                dfd: DataFrameDescriber = pred_factory.dataframe_describer
                # the container is named with the describer's name before the
                # describer is renamed
                dd = DataDescriber(name=dfd.name, describers=(dfd,))
                dfd.name = 'predictions'
                self._process_data_describer(
                    out_file, out_format, facade, dd)
                return dd
            except ModelError as e:
                raise ApplicationError(
                    'Could not predict, probably need to train a model ' +
                    f'first: {e}') from e





[docs]
@dataclass
class FacadeApplicationFactory(ApplicationFactory):
    """This is a utility class that creates instances of
    :class:`.FacadeApplication`.  It's only needed if you need to create a
    facade without wanting to invoke the command line attached to the
    applications.

    It does this by only invoking the first pass applications so all the
    correct initialization happens before returning factory artifacts.

    There must be a :obj:`.FacadeApplication.facade_name` entry in the
    configuration tied to an instance of :class:`.FacadeApplication`.

    :see: :meth:`create_facade`

    """
    def create_facade(self, args: List[str] = None,
                      app_args: Dict[str, Any] = None) -> ModelFacade:
        """Create the facade tied to the application without invoking the
        command line.

        :param args: the (would be) command line arguments used to create the
                     application

        :param app_args: the arguments to set on the facade application after
                         it is created and before it creates the facade

        :return: the facade created by the facade application

        """
        # the ``info`` action is always the first argument
        create_args: List[str] = ['info'] if args is None else ['info', *args]
        app: Application = self.create(create_args)
        invokables = app.invoke_but_second_pass()
        inv: Invokable = invokables[1]
        fac_app: FacadeApplication = inv.instance
        for attr_name, attr_value in (app_args or {}).items():
            setattr(fac_app, attr_name, attr_value)
        return fac_app.create_facade()





[docs]
@dataclass
class FacadeApplicationManager(Writable):
    """A very high level client interface making it easy to configure and run
    models from an interactive environment such as a Python REPL or a Jupyter
    notebook (see :class:`.JupyterManager`).

    """
    cli_harness: CliHarness = field()
    """The CLI harness used to create the facade application."""

    cli_args_fn: Callable[..., List[str]] = field(default=lambda: [])
    """A callable that creates the arguments used to create the facade from
    the application factory.  It is called with the arguments given to
    :meth:`create_facade`.  The default takes no arguments and returns an
    empty list.

    """
    reset_torch: bool = field(default=True)
    """Reset random state for consistency for each new created facade."""

    allocation_tracking: Union[bool, str] = field(default=False)
    """Whether or not to track resource/memory leaks.  If set to ``stack``, the
    stack traces of the unallocated objects will be printed.  If set to
    ``counts`` only the counts will be printed.  If set to ``True`` only the
    unallocated objects without the stack will be printed.

    """
    logger_name: str = field(default='notebook')
    """The name of the logger to use for logging in the notebook itself."""

    default_logging_level: str = field(default='WARNING')
    """If set, then initialize the logging system using this as the default
    logging level.  This is the upper case logging name such as ``WARNING``.

    """
    progress_bar_cols: int = field(default=120)
    """The number of columns to use for the progress bar."""

    config_overwrites: Dict[str, Dict[str, str]] = field(default_factory=dict)
    """Clobbers any configuration set by :meth:`config` for those
    sections/options set.

    """
    def __post_init__(self):
        """Turn on allocation tracking if configured, choose the logger and
        start with no facade.

        """
        self._facade = None
        # any truthy setting (``True``, ``stack`` or ``counts``) enables the
        # class level tracking flag
        if self.allocation_tracking:
            Deallocatable.ALLOCATION_TRACKING = True
        # fall back to this module's logger when no logger name is given
        self.logger = (logger if self.logger_name is None
                       else logging.getLogger(self.logger_name))

    def _create_facade(self, args: List[str] = None,
                       app_args: Dict[str, Any] = None) -> ModelFacade:
        """Build the facade tied to the application, using the CLI harness,
        without running the command line.

        :param args: the (would be) command line arguments used to create the
                     application; they are appended after the ``info`` action

        :param app_args: attribute name/value pairs set on the facade
                         application after it is created and before it
                         creates the facade

        :return: the facade created by the facade application

        """
        # the ``info`` action always comes first, then any caller arguments
        cli_args: List[str] = ['info', *(args or ())]
        facade_app: FacadeApplication = self.cli_harness.get_instance(cli_args)
        assert isinstance(facade_app, FacadeApplication)
        for attr, value in (app_args or {}).items():
            setattr(facade_app, attr, value)
        return facade_app.create_facade()


[docs]
    def cleanup(self, include_cuda: bool = True, quiet: bool = False):
        """Report memory leaks, run the Python garbage collector and optionally
        empty the CUDA cache.

        :param include_cuda: if ``True`` clear the GPU cache

        :param quiet: do not report unallocated objects, regardless of the
                      setting of :obj:`allocation_tracking`

        """
        tracking = self.allocation_tracking
        if tracking and not quiet:
            # ``True`` equals neither mode string, so both flags stay off for
            # it; ``stack`` and ``counts`` each switch on their own flag
            Deallocatable._print_undeallocated(
                tracking == 'stack', tracking == 'counts')
        # report first, then release the current facade and anything else
        # still tracked before collecting garbage
        self.deallocate()
        Deallocatable._deallocate_all()
        gc.collect()
        if include_cuda:
            # free up memory in the GPU
            TorchConfig.empty_cache()



[docs]
    def deallocate(self):
        """Deallocate the current facade, if one exists, and forget it."""
        facade = self._facade
        if facade is None:
            # nothing was created (or it was already released)
            return
        if self.logger.isEnabledFor(logging.INFO):
            self.logger.info('deallocating old factory')
        facade.deallocate()
        self._facade = None



[docs]
    def config(self, section: str, **kwargs):
        """Record configuration that overwrites (or adds to) a section when
        the facade is created.  Repeated calls for the same section are
        merged, with later values replacing earlier ones.

        :param section: the section to be overwritten (or added)

        :param kwargs: the key/value pairs used as the section data to
                       overwrite

        :see: :meth:`create_facade`

        """
        # create the section on first use, then merge in the new options
        self.config_overwrites.setdefault(section, {}).update(kwargs)



[docs]
    def clear(self):
        """Remove every configuration overwrite added with :meth:`config`."""
        # empty the existing dictionary in place rather than replacing it
        overwrites = self.config_overwrites
        overwrites.clear()



[docs]
    def create_facade(self, *args, **kwargs) -> ModelFacade:
        """Create and return a new facade, which becomes the current one.
        This deallocates and cleans up state from any previous facade
        creation as a side effect.

        :param args: given to the :obj:`cli_args_fn` function to create
                     arguments passed to the CLI

        :param kwargs: given to the :obj:`cli_args_fn` function as keyword
                       arguments

        :return: the newly created facade

        :raises DeepLearnError: if resetting the torch state, creating the
                                CLI arguments or creating the facade fails

        """
        app_args: Dict[str, Any] = None
        if len(self.config_overwrites) > 0:
            # pass the overwrites added with :meth:`config` to the application
            overwrites = DictionaryConfig(self.config_overwrites)
            app_args = {'config_overwrites': overwrites}
        # release the previous facade before the clean up below
        self.deallocate()
        # reclaim memory running GC and GPU cache clear
        self.cleanup()
        try:
            # reset random state for consistency of each new test
            if self.reset_torch:
                TorchConfig.init()
            # the configured function turns the caller's arguments into the
            # (would be) command line arguments
            cli_args: List[str] = self.cli_args_fn(*args, **kwargs)
            # create the facade used for this instance
            facade: ModelFacade = self._create_facade(cli_args, app_args)
            self._facade = facade
            return facade
        except Exception as e:
            try:
                # recover the best we can
                self.cleanup(quiet=True)
                self._facade = None
            except Exception:
                # best effort only: the original error is the one reported
                pass
            raise DeepLearnError(f'Could not create facade: {e}') from e


    @property
    def facade(self) -> ModelFacade:
        """The current facade for this manager.

        :return: the existing facade, or that created by :meth:`create_facade`
                 if it doesn't already exist

        """
        if self._facade is None:
            # lazily create it; the new facade is stored on this instance
            self.create_facade()
        current: ModelFacade = self._facade
        # NOTE(review): the writer is cleared on every access; the reason is
        # not visible from this class
        current.writer = None
        return current


[docs]
    def run(self, display_results: bool = True):
        """Train and test the model, then optionally show the results.

        :param display_results: if ``True``, write and plot the results

        :raises DeepLearnError: if any step fails; the original error is
                                chained as the cause

        """
        try:
            model = self.facade
            model.train()
            model.test()
            if display_results:
                model.write_result()
                model.plot_result()
        except Exception as e:
            try:
                # drop the local reference before cleaning up
                model = None
                # recover the best we can
                self.cleanup(quiet=True)
            except Exception:
                # best effort only: the original error is the one reported
                pass
            raise DeepLearnError('Could not run the model') from e



[docs]
    def show_leaks(self, output: str = 'counts', fail: bool = True):
        """Show all resources/memory leaks in the current facade.  First, this
        deallocates the facade, then prints any lingering objects using
        :class:`~zensols.persist.Deallocatable`.  The facade is forgotten
        afterward, even when the report raises an error, so a deallocated
        facade is never kept as the current one.

        **Important**: :obj:`allocation_tracking` must be set for this to
        work; when it is not, nothing is done.

        :param output: one of ``stack``, ``counts``, or ``tensors``

        :param fail: if ``True``, raise an exception if there are any
                     unallocated references found

        :raises DeepLearnError: if no facade has been created yet, or if
                                ``output`` is not one of the supported values

        """
        if self._facade is None:
            raise DeepLearnError('No facade created yet')
        if not self.allocation_tracking:
            return
        # reject a bad argument before anything is deallocated
        if output not in ('counts', 'stack', 'tensors'):
            raise DeepLearnError(f'Unknown output type: {output}')
        try:
            self._facade.deallocate()
            if output == 'counts':
                Deallocatable._print_undeallocated(
                    only_counts=True, fail=fail)
            elif output == 'stack':
                Deallocatable._print_undeallocated(
                    include_stack=True, fail=fail)
            else:
                TorchConfig.write_in_memory_tensors()
        finally:
            # never keep a reference to the facade deallocated above, even if
            # the report raised
            self._facade = None



[docs]
    def write(self, depth: int = 0, writer: TextIOBase = sys.stdout,
              include_model=False, include_metadata=False,
              include_settings=False, **kwargs):
        """Write the current facade by delegating to its ``write`` method.
        The facade is created first if it does not exist yet.

        :param depth: passed through as the first positional argument

        :param writer: passed through as the second positional argument

        :param include_model: passed through as the keyword argument of the
                              same name

        :param include_metadata: passed through as the keyword argument of
                                 the same name

        :param include_settings: passed through as the keyword argument of
                                 the same name

        :param kwargs: any additional keyword arguments to pass through

        """
        include_flags = dict(
            include_model=include_model,
            include_metadata=include_metadata,
            include_settings=include_settings)
        self.facade.write(depth, writer, **include_flags, **kwargs)





[docs]
@dataclass
class JupyterManager(FacadeApplicationManager):
    """A facade application manager that provides additional convenience
    functionality for notebooks.  When constructed, it sets the notebook
    browser width (unless :obj:`browser_width` is ``None``), and it
    initializes the notebook each time a facade is created with
    :meth:`create_facade`.

    """
    reduce_logging: bool = field(default=False)
    """Whether to disable most information logging so the progress bar is more
    prevalent.

    """
    browser_width: int = field(default=95)
    """The width of the browser windows as a percentage."""
    def __post_init__(self):
        """Run the parent initialization, then apply the configured browser
        width unless it is ``None``.

        """
        super().__post_init__()
        width = self.browser_width
        if width is None:
            return
        self.set_browser_width(width)


[docs]
    @staticmethod
    def set_browser_width(width: int = 95):
        """Use the entire width of the browser to create more real estate.

        :param width: the width as a percent (``[0, 100]``) to use as the width
                      in the notebook

        """
        # ``IPython.display`` is the public API; importing ``display`` from
        # ``IPython.core.display`` is deprecated
        from IPython.display import display, HTML
        # the doubled braces emit literal CSS braces from the f-string
        html = f'<style>.container {{ width:{width}% !important; }}</style>'
        display(HTML(html))


    def _init_jupyter(self):
        """Initialize the Jupyter notebook: either quiet the model executor
        status logger, or configure logging and the progress bar on the
        facade.

        """
        if self.reduce_logging:
            # only raise the threshold of the status logger and stop here
            status_logger = logging.getLogger(
                'zensols.deeplearn.model.executor.status')
            status_logger.setLevel(logging.WARNING)
            return
        # translate the level name (i.e. ``WARNING``) into the ``logging``
        # module constant of the same name; ``None`` means no default level
        level_name = self.default_logging_level
        log_level = None if level_name is None else getattr(logging, level_name)
        # set console based logging
        self.facade.configure_jupyter(
            log_level=log_level,
            progress_bar_cols=self.progress_bar_cols)


[docs]
    def create_facade(self, *args, **kwargs) -> ModelFacade:
        """Create the facade as the parent class does, then initialize the
        notebook for it.

        :param args: passed to the parent's implementation

        :param kwargs: passed to the parent's implementation

        :return: the newly created facade

        """
        created: ModelFacade = super().create_facade(*args, **kwargs)
        # initialize jupyter
        self._init_jupyter()
        return created