Source code for zoo.chronos.autots.model.base_automodel

#
# Copyright 2018 Analytics Zoo Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

import os
import json
DEFAULT_BEST_MODEL_DIR = "best_model.ckpt"
DEFAULT_BEST_CONFIG_DIR = "best_config.json"


class BasePytorchAutomodel:
    def __init__(self, **kwargs):
        self.best_model = None
    def fit(self,
            data,
            epochs=1,
            batch_size=32,
            validation_data=None,
            metric_threshold=None,
            n_sampling=1,
            search_alg=None,
            search_alg_params=None,
            scheduler=None,
            scheduler_params=None,
            ):
        """
        Automatically fit the model and search for the best hyperparameters.

        :param data: train data.
               data can be a tuple of ndarrays, a PyTorch DataLoader, or a
               function that takes a config dictionary as parameter and returns
               a PyTorch DataLoader.
        :param epochs: Max number of epochs to train in each trial. Defaults to 1.
               If you have also set metric_threshold, a trial will stop once it
               has either been optimized to the metric_threshold or been trained
               for {epochs} epochs.
        :param batch_size: Int or hp sampling function from an integer space.
               Training batch size. Defaults to 32.
        :param validation_data: Validation data. It should be of the same type
               as data.
        :param metric_threshold: a trial will be terminated when the metric
               threshold is met.
        :param n_sampling: Number of times to sample from the search_space.
               Defaults to 1. If hp.grid_search is in the search_space, the grid
               will be repeated n_sampling times. If this is -1, (virtually)
               infinite samples are generated until a stopping condition is met.
        :param search_alg: str, any searcher supported by ray tune
               (i.e. "variant_generator", "random", "ax", "dragonfly", "skopt",
               "hyperopt", "bayesopt", "bohb", "nevergrad", "optuna", "zoopt"
               and "sigopt").
        :param search_alg_params: extra parameters for the searcher algorithm
               besides search_space, metric and searcher mode.
        :param scheduler: str, any scheduler supported by ray tune.
        :param scheduler_params: parameters for the scheduler.
        """
        self.search_space["batch_size"] = batch_size
        self.auto_est.fit(
            data=data,
            epochs=epochs,
            validation_data=validation_data,
            metric=self.metric,
            metric_threshold=metric_threshold,
            n_sampling=n_sampling,
            search_space=self.search_space,
            search_alg=search_alg,
            search_alg_params=search_alg_params,
            scheduler=scheduler,
            scheduler_params=scheduler_params,
        )
        self.best_model = self.auto_est._get_best_automl_model()
        self.best_config = self.auto_est.get_best_config()
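    # A minimal usage sketch for fit(). Assumptions are hedged: `automodel` is an
    # already-constructed instance of a concrete subclass (e.g. one of the auto
    # models in zoo.chronos.autots.model), and the array shapes below are purely
    # illustrative.
    #
    # >>> import numpy as np
    # >>> x = np.random.randn(100, 20, 4)  # (num_samples, past_seq_len, input_feature_num)
    # >>> y = np.random.randn(100, 1, 1)   # (num_samples, future_seq_len, output_target_num)
    # >>> automodel.fit(data=(x, y),
    # ...               validation_data=(x, y),
    # ...               epochs=5,
    # ...               n_sampling=4,
    # ...               search_alg="random")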
    def predict(self, data, batch_size=32):
        '''
        Predict using the trained model after HPO (Hyper Parameter Optimization).

        :param data: a numpy ndarray x, whose shape is
               (num_samples, lookback, feature_dim), where lookback and
               feature_dim should be the same as past_seq_len and
               input_feature_num.
        :param batch_size: predict batch size. The value will not affect the
               prediction result but will affect resource cost (e.g. memory and
               time). Defaults to 32.

        :return: A numpy array with shape (num_samples, horizon, target_dim).
        '''
        if self.best_model is None:
            raise RuntimeError("You must call fit or load first before calling predict!")
        return self.best_model.predict(data, batch_size=batch_size)
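    # Hypothetical follow-up to the fit() sketch above: predict on new samples
    # whose lookback and feature_dim match those used during fit.
    #
    # >>> x_test = np.random.randn(10, 20, 4)
    # >>> y_pred = automodel.predict(x_test)  # shape: (10, future_seq_len, output_target_num)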
    def predict_with_onnx(self, data, batch_size=32, dirname=None):
        '''
        Predict using the trained model after HPO (Hyper Parameter Optimization).
        Be sure to install onnx and onnxruntime to enable this function. The
        method will give exactly the same result as .predict() but with higher
        throughput and lower latency.

        :param data: a numpy ndarray x, whose shape is
               (num_samples, lookback, feature_dim), where lookback and
               feature_dim should be the same as past_seq_len and
               input_feature_num.
        :param batch_size: predict batch size. The value will not affect the
               prediction result but will affect resource cost (e.g. memory and
               time). Defaults to 32.
        :param dirname: The directory to save the onnx model file. Defaults to
               None, which means no file is saved.

        :return: A numpy array with shape (num_samples, horizon, target_dim).
        '''
        if self.best_model is None:
            raise RuntimeError("You must call fit or load first"
                               " before calling predict_with_onnx!")
        return self.best_model.predict_with_onnx(data,
                                                 batch_size=batch_size,
                                                 dirname=dirname)
    def evaluate(self, data, batch_size=32, metrics=["mse"], multioutput="raw_values"):
        '''
        Evaluate using the trained model after HPO (Hyper Parameter Optimization).

        Please note that the evaluation result is calculated on scaled y and
        yhat. If you scaled your data (e.g. used .scale() on the TSDataset),
        follow the code snippet below if you need to evaluate on unscaled data.

        >>> from zoo.automl.metrics import Evaluator
        >>> y_hat = automodel.predict(x)
        >>> y_hat_unscaled = tsdata.unscale_numpy(y_hat)  # or other customized unscale methods
        >>> y_unscaled = tsdata.unscale_numpy(y)  # or other customized unscale methods
        >>> Evaluator.evaluate(metric, y_unscaled, y_hat_unscaled, multioutput=...)  # metric name str, e.g. "mse"

        :param data: a numpy ndarray tuple (x, y).
               x's shape is (num_samples, lookback, feature_dim), where lookback
               and feature_dim should be the same as past_seq_len and
               input_feature_num.
               y's shape is (num_samples, horizon, target_dim), where horizon
               and target_dim should be the same as future_seq_len and
               output_target_num.
        :param batch_size: evaluate batch size. The value will not affect the
               evaluation result but will affect resource cost (e.g. memory and
               time).
        :param metrics: a list of metric names to be evaluated.
        :param multioutput: Defines the aggregation of multiple output values.
               String in ['raw_values', 'uniform_average']. Defaults to
               'raw_values'.

        :return: A list of evaluation results. Each item represents a metric.
        '''
        if self.best_model is None:
            raise RuntimeError("You must call fit or load first before calling evaluate!")
        return self.best_model.evaluate(data[0], data[1], metrics=metrics,
                                        multioutput=multioutput, batch_size=batch_size)
    def evaluate_with_onnx(self, data, batch_size=32, metrics=["mse"],
                           dirname=None, multioutput="raw_values"):
        '''
        Evaluate using the trained model after HPO (Hyper Parameter Optimization).
        Be sure to install onnx and onnxruntime to enable this function. The
        method will give exactly the same result as .evaluate() but with higher
        throughput and lower latency.

        Please note that the evaluation result is calculated on scaled y and
        yhat. If you scaled your data (e.g. used .scale() on the TSDataset),
        follow the code snippet below if you need to evaluate on unscaled data.

        >>> from zoo.automl.metrics import Evaluator
        >>> y_hat = automodel.predict_with_onnx(x)
        >>> y_hat_unscaled = tsdata.unscale_numpy(y_hat)  # or other customized unscale methods
        >>> y_unscaled = tsdata.unscale_numpy(y)  # or other customized unscale methods
        >>> Evaluator.evaluate(metric, y_unscaled, y_hat_unscaled, multioutput=...)  # metric name str, e.g. "mse"

        :param data: a numpy ndarray tuple (x, y).
               x's shape is (num_samples, lookback, feature_dim), where lookback
               and feature_dim should be the same as past_seq_len and
               input_feature_num.
               y's shape is (num_samples, horizon, target_dim), where horizon
               and target_dim should be the same as future_seq_len and
               output_target_num.
        :param batch_size: evaluate batch size. The value will not affect the
               evaluation result but will affect resource cost (e.g. memory and
               time).
        :param metrics: a list of metric names to be evaluated.
        :param dirname: The directory to save the onnx model file. Defaults to
               None, which means no file is saved.
        :param multioutput: Defines the aggregation of multiple output values.
               String in ['raw_values', 'uniform_average']. Defaults to
               'raw_values'.

        :return: A list of evaluation results. Each item represents a metric.
        '''
        if self.best_model is None:
            raise RuntimeError("You must call fit or load first"
                               " before calling evaluate_with_onnx!")
        return self.best_model.evaluate_with_onnx(data[0], data[1],
                                                  metrics=metrics,
                                                  dirname=dirname,
                                                  multioutput=multioutput,
                                                  batch_size=batch_size)
    def save(self, checkpoint_path):
        """
        Save the best model.

        Please note that if you only want the pytorch model or onnx model file,
        you can call .get_best_model() or .export_onnx_file(). The checkpoint
        file generated by the .save() method can only be used by .load() in
        automodel.

        :param checkpoint_path: The location where you want to save the best model.
        """
        if self.best_model is None:
            raise RuntimeError("You must call fit or load first before calling save!")
        if not os.path.isdir(checkpoint_path):
            os.mkdir(checkpoint_path)
        model_path = os.path.join(checkpoint_path, DEFAULT_BEST_MODEL_DIR)
        best_config_path = os.path.join(checkpoint_path, DEFAULT_BEST_CONFIG_DIR)
        self.best_model.save(model_path)
        with open(best_config_path, "w") as f:
            json.dump(self.best_config, f)
    def load(self, checkpoint_path):
        """
        Restore the best model.

        :param checkpoint_path: The checkpoint location from which you want to
               load the best model.
        """
        model_path = os.path.join(checkpoint_path, DEFAULT_BEST_MODEL_DIR)
        best_config_path = os.path.join(checkpoint_path, DEFAULT_BEST_CONFIG_DIR)
        self.best_model.restore(model_path)
        with open(best_config_path, "r") as f:
            self.best_config = json.load(f)
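    # A save/load round trip on a fitted instance (sketch; the checkpoint
    # directory is an arbitrary example path). save() writes best_model.ckpt and
    # best_config.json under checkpoint_path, and load() restores both.
    #
    # >>> automodel.save("/tmp/automodel_ckpt")
    # >>> automodel.load("/tmp/automodel_ckpt")  # restores best model weights and best_config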
    def build_onnx(self, thread_num=None, sess_options=None):
        '''
        Build the onnx model to speed up inference and reduce latency. Calling
        this method is not required before predict_with_onnx, evaluate_with_onnx
        or export_onnx_file. It is recommended when you want to:

        | 1. Strictly control the threads to be used during inference.
        | 2. Alleviate the cold-start problem when you call predict_with_onnx
        |    for the first time.

        :param thread_num: int, the thread limit. Defaults to None, which means
               no limit is set.
        :param sess_options: an onnxruntime.SessionOptions instance. If set to a
               value other than None, a new onnxruntime session will be built on
               this setting and the other settings you assigned (e.g.
               thread_num...) will be ignored.

        Example:
            >>> # to pre-build the onnx sess
            >>> automodel.build_onnx(thread_num=1)  # build an onnxruntime sess for a single thread
            >>> pred = automodel.predict_with_onnx(data)
            >>> # ------------------------------------------------------
            >>> # calling onnx related methods directly is also supported
            >>> pred = automodel.predict_with_onnx(data)
        '''
        import onnxruntime
        if sess_options is not None and not isinstance(sess_options, onnxruntime.SessionOptions):
            raise RuntimeError("sess_options should be an onnxruntime.SessionOptions instance"
                               f", but found {type(sess_options)}")
        if self.distributed:
            raise NotImplementedError("build_onnx has not been supported for distributed "
                                      "forecaster. You can call .to_local() to transform the "
                                      "forecaster to a non-distributed version.")
        import torch
        dummy_input = torch.rand(1, self.best_config["past_seq_len"],
                                 self.best_config["input_feature_num"])
        self.best_model._build_onnx(dummy_input,
                                    dirname=None,
                                    thread_num=thread_num,
                                    sess_options=sess_options)  # forward the user-provided sess_options
    def export_onnx_file(self, dirname):
        """
        Save the onnx model file to disk.

        :param dirname: The directory where you want to save the onnx file.
        """
        if self.distributed:
            raise NotImplementedError("export_onnx_file has not been supported for distributed "
                                      "forecaster. You can call .to_local() to transform the "
                                      "forecaster to a non-distributed version.")
        import torch
        dummy_input = torch.rand(1, self.best_config["past_seq_len"],
                                 self.best_config["input_feature_num"])
        self.best_model._build_onnx(dummy_input, dirname)
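    # Deployment sketch for the exported file: serve it with a plain onnxruntime
    # session outside this class. The exact file name written under `dirname` is
    # determined by the underlying model's _build_onnx implementation, so it is
    # located here by globbing; this is an assumption, not a documented contract.
    #
    # >>> import glob
    # >>> import onnxruntime
    # >>> automodel.export_onnx_file("/tmp/automodel_onnx")
    # >>> onnx_path = glob.glob("/tmp/automodel_onnx/*.onnx")[0]
    # >>> sess = onnxruntime.InferenceSession(onnx_path)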
    def get_best_model(self):
        """
        Get the best pytorch model.
        """
        return self.auto_est.get_best_model()
    def get_best_config(self):
        """
        Get the best configuration.

        :return: A dictionary of the best hyperparameters.
        """
        return self.best_config
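    # The returned config contains the searched hyperparameters; for example,
    # build_onnx above reads best_config["past_seq_len"] and
    # best_config["input_feature_num"] from it.
    #
    # >>> best_config = automodel.get_best_config()
    # >>> best_config["past_seq_len"], best_config["input_feature_num"]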
    def _get_best_automl_model(self):
        return self.best_model