validation_strategy.py

#!/usr/bin/env python
# -*- coding: utf-8 -*-
#
# Copyright 2019 The FATE Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
################################################################################
#
#
################################################################################
import copy

from federatedml.util import LOGGER
from federatedml.util import consts
from federatedml.param.evaluation_param import EvaluateParam
from federatedml.evaluation.performance_recorder import PerformanceRecorder
from federatedml.transfer_variable.transfer_class.validation_strategy_transfer_variable import \
    ValidationStrategyVariable
from federatedml.callbacks.callback_base import CallbackBase
from federatedml.feature.instance import Instance


class ValidationStrategy(CallbackBase):
  32. """
  33. This module is used for evaluating the performance of model during training process.
  34. it will be called only in fit process of models.
  35. Attributes
  36. ----------
  37. validation_freqs: None or positive integer or container object in python. Do validation in training process or Not.
  38. if equals None, will not do validation in train process;
  39. if equals positive integer, will validate data every validation_freqs epochs passes;
  40. if container object in python, will validate data if epochs belong to this container.
  41. e.g. validation_freqs = [10, 15], will validate data when epoch equals to 10 and 15.
  42. Default: None
  43. train_data: None or Table,
  44. if train_data not equal to None, and judge need to validate data according to validation_freqs,
  45. training data will be used for evaluating
  46. validate_data: None or Table,
  47. if validate_data not equal to None, and judge need to validate data according to validation_freqs,
  48. validate data will be used for evaluating
  49. """

    def __init__(self, role=None, mode=None, validation_freqs=None, early_stopping_rounds=None,
                 use_first_metric_only=False, arbiter_comm=True):

        self.validation_freqs = validation_freqs
        self.role = role
        self.mode = mode
        self.flowid = ''
        self.train_data = None
        self.validate_data = None

        # early stopping related vars
        self.arbiter_comm = arbiter_comm
        self.sync_status = False
        self.early_stopping_rounds = early_stopping_rounds
        self.use_first_metric_only = use_first_metric_only
        self.first_metric = None
        self._evaluation_summary = {}

        # precompute scores
        self.cached_train_scores = None
        self.cached_validate_scores = None
        self.use_precompute_train_scores = False
        self.use_precompute_validate_scores = False

        if early_stopping_rounds is not None:
            if early_stopping_rounds <= 0:
                raise ValueError('early_stopping_rounds should be larger than 0')
            if self.mode == consts.HOMO:
                raise ValueError('early stopping is not supported for homo algorithms')

            self.sync_status = True
            LOGGER.debug("early stopping round is {}".format(self.early_stopping_rounds))

        self.cur_best_model = None
        self.best_iteration = -1
        self.metric_best_model = {}  # best model of a certain metric
        self.metric_best_iter = {}  # best iter of a certain metric
        self.performance_recorder = PerformanceRecorder()  # recorder to record performances
        self.transfer_inst = ValidationStrategyVariable()

    def set_train_data(self, train_data):
        self.train_data = train_data

    def set_validate_data(self, validate_data):
        self.validate_data = validate_data
        if self.early_stopping_rounds and self.validate_data is None:
            raise ValueError('validate data is needed when early stopping is enabled')

    def set_flowid(self, flowid):
        self.flowid = flowid

    def need_run_validation(self, epoch):
        LOGGER.debug("validation_freqs is {}".format(self.validation_freqs))
        if not self.validation_freqs:
            return False

        if isinstance(self.validation_freqs, int):
            return (epoch + 1) % self.validation_freqs == 0

        return epoch in self.validation_freqs
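
    # Scheduling semantics of need_run_validation, with hypothetical values:
    # an integer frequency fires when (epoch + 1) % validation_freqs == 0, so
    # validation_freqs=3 validates at epochs 2, 5, 8, ...; a container such as
    # [10, 15] is a plain membership test on the zero-based epoch index.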

    @staticmethod
    def generate_flowid(prefix, epoch, keywords="iteration", data_type="train"):
        return "_".join([prefix, keywords, str(epoch), data_type])

    @staticmethod
    def make_data_set_name(need_cv, need_run_ovr, model_flowid, epoch):
        data_iteration_name = "_".join(["iteration", str(epoch)])
        if not need_cv and not need_run_ovr:
            return data_iteration_name

        if need_cv:
            if not need_run_ovr:
                prefix = "_".join(["fold", model_flowid.split(".", -1)[-1]])
            else:
                prefix = "_".join(["fold", model_flowid.split(".", -1)[-2]])
                prefix = ".".join([prefix, model_flowid.split(".", -1)[-1]])
        else:
            prefix = model_flowid.split(".", -1)[-1]

        return ".".join([prefix, data_iteration_name])

    @staticmethod
    def extract_best_model(model):
        best_model = model.export_model()
        return {'model': {'best_model': best_model}} if best_model is not None else None

    def is_best_performance_updated(self, use_first_metric_only=False):
        if len(self.performance_recorder.no_improvement_round.items()) == 0:
            return False
        for metric, no_improve_val in self.performance_recorder.no_improvement_round.items():
            if no_improve_val != 0:
                return False
            if use_first_metric_only:
                break
        return True

    def update_early_stopping_status(self, iteration, model):

        first_metric = True
        if self.role == consts.GUEST:
            LOGGER.info('showing early stopping status, {} shows cur best performances: {}'.format(
                self.role, self.performance_recorder.cur_best_performance))

        LOGGER.info('showing early stopping status, {} shows early stopping no improve rounds: {}'.format(
            self.role, self.performance_recorder.no_improvement_round))

        for metric, no_improve_round in self.performance_recorder.no_improvement_round.items():
            if no_improve_round == 0:
                self.metric_best_iter[metric] = iteration
                self.metric_best_model[metric] = self.extract_best_model(model)
                LOGGER.info('best model of metric {} is now updated to {}'.format(metric, iteration))
                # if early stopping is not triggered, return best model of first metric by default
                if first_metric:
                    LOGGER.info('default best model: metric {}, iter {}'.format(metric, iteration))
                    self.cur_best_model = self.metric_best_model[metric]
                    self.best_iteration = iteration
            first_metric = False

    def check_early_stopping(self):
        """
        Check whether the early stopping condition (early_stopping_rounds) is met.
        Returns bool
        """
        LOGGER.info('checking early stopping')

        no_improvement_dict = self.performance_recorder.no_improvement_round
        for metric in no_improvement_dict:
            if no_improvement_dict[metric] >= self.early_stopping_rounds:
                self.best_iteration = self.metric_best_iter[metric]
                self.cur_best_model = self.metric_best_model[metric]
                LOGGER.info('early stopping triggered, model of iter {} is chosen because metric {} satisfied '
                            'stop condition'.format(self.best_iteration, metric))
                return True

        return False
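
    # Illustration of the trigger above, with a hypothetical recorder state:
    # given early_stopping_rounds=3 and no_improvement_round={'auc': 3},
    # check_early_stopping() returns True and selects the model cached at the
    # last epoch where 'auc' improved (metric_best_iter['auc']).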

    def sync_performance_recorder(self, epoch):
        """
        Synchronize self.performance_recorder across parties.
        """
        if self.mode == consts.HETERO and self.role == consts.GUEST:
            recorder_to_send = copy.deepcopy(self.performance_recorder)
            recorder_to_send.cur_best_performance = None
            if self.arbiter_comm:
                self.transfer_inst.validation_status.remote(recorder_to_send, idx=-1, suffix=(epoch,))
            else:
                self.transfer_inst.validation_status.remote(recorder_to_send, idx=-1, suffix=(epoch,),
                                                            role=consts.HOST)

        elif self.mode == consts.HETERO:
            self.performance_recorder = self.transfer_inst.validation_status.get(idx=-1, suffix=(epoch,))[0]

        else:
            return
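
    # Sync direction implemented above: in hetero mode the guest deep-copies the
    # recorder, blanks cur_best_performance, and sends it to all parties (or to
    # hosts only when arbiter_comm is False); the non-guest parties replace
    # their local recorder with the received copy.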

    def need_stop(self):
        return False if not self.early_stopping_rounds else self.check_early_stopping()

    def has_saved_best_model(self):
        return (self.early_stopping_rounds is not None) and (self.cur_best_model is not None)

    def export_best_model(self):
        if self.has_saved_best_model():
            return self.cur_best_model
        else:
            return None

    def summary(self):
        return self._evaluation_summary

    def update_metric_summary(self, metric_dict):

        iter_name = list(metric_dict.keys())[0]
        metric_dict = metric_dict[iter_name]

        if len(self._evaluation_summary) == 0:
            self._evaluation_summary = {namespace: {} for namespace in metric_dict}

        for namespace in metric_dict:
            for metric_name in metric_dict[namespace]:
                epoch_metric = metric_dict[namespace][metric_name]
                if metric_name not in self._evaluation_summary[namespace]:
                    self._evaluation_summary[namespace][metric_name] = []
                self._evaluation_summary[namespace][metric_name].append(epoch_metric)

    def evaluate(self, predicts, model, epoch):

        evaluate_param: EvaluateParam = model.get_metrics_param()
        evaluate_param.check_single_value_default_metric()

        from federatedml.evaluation.evaluation import Evaluation
        eval_obj = Evaluation()

        eval_type = evaluate_param.eval_type
        metric_list = evaluate_param.metrics

        if self.early_stopping_rounds and self.use_first_metric_only and len(metric_list) != 0:

            # empty default keeps the membership test below safe for unexpected eval types
            single_metric_list = []
            if eval_type == consts.BINARY:
                single_metric_list = consts.BINARY_SINGLE_VALUE_METRIC
            elif eval_type == consts.REGRESSION:
                single_metric_list = consts.REGRESSION_SINGLE_VALUE_METRICS
            elif eval_type == consts.MULTY:
                single_metric_list = consts.MULTI_SINGLE_VALUE_METRIC

            for metric in metric_list:
                if metric in single_metric_list:
                    self.first_metric = metric
                    LOGGER.debug('use {} as first metric'.format(self.first_metric))
                    break

        eval_obj._init_model(evaluate_param)
        eval_obj.set_tracker(model.tracker)
        data_set_name = self.make_data_set_name(model.need_cv, model.callback_one_vs_rest, model.flowid, epoch)
        eval_data = {data_set_name: predicts}
        eval_result_dict = eval_obj.fit(eval_data, return_result=True)
        epoch_summary = eval_obj.summary()
        self.update_metric_summary(epoch_summary)
        eval_obj.save_data()
        LOGGER.debug("end of eval")
        return eval_result_dict
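
    # First-metric selection in evaluate(), with hypothetical parameters: for a
    # binary task with metrics=['ks', 'auc'], the first entry found in
    # consts.BINARY_SINGLE_VALUE_METRIC becomes self.first_metric, and early
    # stopping then tracks only that metric when use_first_metric_only is set.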

    @staticmethod
    def _add_data_type_map_func(value, data_type):
        new_pred_rs = Instance(features=value.features + [data_type], inst_id=value.inst_id)
        return new_pred_rs

    @staticmethod
    def add_data_type(predicts, data_type: str):
        """
        Append data_type to the features of every predict Instance.
        """
        predicts = predicts.mapValues(lambda value: ValidationStrategy._add_data_type_map_func(value, data_type))
        return predicts
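
    # Tagging sketch for add_data_type, with a hypothetical prediction row: an
    # Instance whose features are [label, predict_label, score] becomes
    # [label, predict_label, score, 'train'] (or 'validate'), so the Evaluation
    # module can split the merged train/validate table back apart.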

    def handle_precompute_scores(self, precompute_scores, data_type):

        if self.mode == consts.HETERO and self.role == consts.HOST:
            return None
        if self.role == consts.ARBITER:
            return None

        LOGGER.debug('using precompute scores')

        return self.add_data_type(precompute_scores, data_type)

    def get_predict_result(self, model, epoch, data, data_type: str):

        if not data:
            return

        LOGGER.debug("start to evaluate data {}".format(data_type))
        model_flowid = model.flowid
        # model_flowid = ".".join(model.flowid.split(".", -1)[1:])
        flowid = self.generate_flowid(model_flowid, epoch, "iteration", data_type)
        model.set_flowid(flowid)
        predicts = model.predict(data)
        model.set_flowid(model_flowid)

        if self.mode == consts.HOMO and self.role == consts.ARBITER:
            pass
        elif self.mode == consts.HETERO and self.role == consts.HOST:
            pass
        else:
            predicts = self.add_data_type(predicts, data_type)

        return predicts

    def set_precomputed_train_scores(self, train_scores):
        self.use_precompute_train_scores = True
        self.cached_train_scores = train_scores

    def set_precomputed_validate_scores(self, validate_scores):
        self.use_precompute_validate_scores = True
        self.cached_validate_scores = validate_scores

    def validate(self, model, epoch):
        """
        :param model: model instance, which has a predict function
        :param epoch: int, epoch index, used to generate the flow id
        """

        LOGGER.debug(
            "begin to check validate status, need_run_validation is {}".format(
                self.need_run_validation(epoch)))

        if not self.need_run_validation(epoch):
            return

        if self.mode == consts.HOMO and self.role == consts.ARBITER:
            return

        if not self.use_precompute_train_scores:  # call model.predict()
            train_predicts = self.get_predict_result(model, epoch, self.train_data, "train")
        else:  # use precomputed scores
            train_predicts = self.handle_precompute_scores(self.cached_train_scores, 'train')

        if not self.use_precompute_validate_scores:  # call model.predict()
            validate_predicts = self.get_predict_result(model, epoch, self.validate_data, "validate")
        else:  # use precomputed scores
            validate_predicts = self.handle_precompute_scores(self.cached_validate_scores, 'validate')

        if train_predicts is not None or validate_predicts is not None:

            predicts = train_predicts
            if validate_predicts is not None:
                # train predictions may be absent; fall back to validate-only results
                predicts = validate_predicts if predicts is None else predicts.union(validate_predicts)

            # running evaluation
            eval_result_dict = self.evaluate(predicts, model, epoch)
            LOGGER.debug('showing eval_result_dict here')
            LOGGER.debug(eval_result_dict)

            if self.early_stopping_rounds:

                if len(eval_result_dict) == 0:
                    raise ValueError(
                        "eval_result len is 0, no single value metric detected for early stopping checking")

                if self.use_first_metric_only:
                    if self.first_metric:
                        eval_result_dict = {self.first_metric: eval_result_dict[self.first_metric]}
                    else:
                        LOGGER.warning('use first metric only but no single metric found in metric list')

                self.performance_recorder.update(eval_result_dict)

        if self.sync_status:
            self.sync_performance_recorder(epoch)

        if self.early_stopping_rounds and self.mode == consts.HETERO:
            self.update_early_stopping_status(epoch, model)

    def on_train_begin(self, train_data=None, validate_data=None):
        if self.role != consts.ARBITER:
            self.set_train_data(train_data)
            self.set_validate_data(validate_data)

    def on_epoch_end(self, model, epoch):
        LOGGER.debug('running validation')
        self.validate(model, epoch)
        if self.need_stop():
            LOGGER.debug('early stopping triggered')
            model.callback_variables.stop_training = True

    def on_train_end(self, model):
        if self.has_saved_best_model():
            model.load_model(self.cur_best_model)
            model.callback_variables.best_iteration = self.best_iteration

        model.callback_variables.validation_summary = self.summary()
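
# Precomputed-score path, a minimal sketch: a model that already holds predict
# scores for the current epoch (boosting models, for instance, maintain running
# scores) can skip the extra predict() pass inside validate():
#
#   vs.set_precomputed_train_scores(train_scores)        # Table of Instances
#   vs.set_precomputed_validate_scores(validate_scores)
#   vs.validate(model, epoch)  # routes through handle_precompute_scores()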