callback.py 6.53 KB
Newer Older
wxchan's avatar
wxchan committed
1
# coding: utf-8
wxchan's avatar
wxchan committed
2
# pylint: disable = invalid-name, W0105, C0301
wxchan's avatar
wxchan committed
3
from __future__ import absolute_import
4

wxchan's avatar
wxchan committed
5
6
import collections

wxchan's avatar
wxchan committed
7

wxchan's avatar
wxchan committed
8
9
10
11
12
13
14
15
16
17
18
class EarlyStopException(Exception):
    """Signal that training should stop early.

    Parameters
    ----------
    best_iteration : int
        Iteration index to report as the best one; stored unchanged on the
        instance as ``best_iteration``.
    """
    def __init__(self, best_iteration):
        # No message is forwarded to the base class, so ``args`` stays empty.
        Exception.__init__(self)
        self.best_iteration = best_iteration

wxchan's avatar
wxchan committed
19

wxchan's avatar
wxchan committed
20
21
22
23
# Callback environment: the record the callbacks in this module receive as
# ``env``. It bundles the model, its parameters, the current iteration and
# iteration bounds, and the list of evaluation results.
CallbackEnv = collections.namedtuple(
    "LightGBMCallbackEnv",
    ["model",
     "params",
     "iteration",
     "begin_iteration",
     "end_iteration",
     "evaluation_result_list"])

wxchan's avatar
wxchan committed
30

wxchan's avatar
wxchan committed
31
32
33
def _format_eval_result(value, show_stdv=True):
    """format metric string"""
    if len(value) == 4:
34
        return '%s\'s %s: %g' % (value[0], value[1], value[2])
wxchan's avatar
wxchan committed
35
36
    elif len(value) == 5:
        if show_stdv:
37
            return '%s\'s %s: %g + %g' % (value[0], value[1], value[2], value[4])
wxchan's avatar
wxchan committed
38
        else:
39
            return '%s\'s %s: %g' % (value[0], value[1], value[2])
wxchan's avatar
wxchan committed
40
    else:
41
        raise ValueError("Wrong metric value")
wxchan's avatar
wxchan committed
42
43
44
45
46
47
48
49
50
51
52


def print_evaluation(period=1, show_stdv=True):
    """Create a callback that prints the evaluation results.

    Parameters
    ----------
    period : int
        Print on every ``period``-th iteration, counting iterations from 1.
        A value that is not positive disables printing.

    show_stdv : bool, optional
        Whether to show the standard deviation when a result provides one.

    Returns
    -------
    callback : function
        A callback that prints the evaluation results every ``period``
        iterations.
    """
    def callback(env):
        """Print the current results if this iteration is due."""
        if not (period > 0 and env.evaluation_result_list):
            return
        # Iterations are reported 1-based.
        round_number = env.iteration + 1
        if round_number % period != 0:
            return
        result = '\t'.join(
            [_format_eval_result(x, show_stdv) for x in env.evaluation_result_list])
        print('[%d]\t%s' % (round_number, result))
    # NOTE(review): presumably the caller sorts callbacks by ``order`` -- confirm.
    callback.order = 10
    return callback


def record_evaluation(eval_result):
    """Create a callback that records the evaluation history into eval_result.

    Parameters
    ----------
    eval_result : dict
        Dictionary that receives the history. It is emptied when the callback
        is created and then filled as
        ``eval_result[data_name][metric_name] -> list of scores``, with one
        score appended per metric on every call.

    Returns
    -------
    callback : function
        The requested callback function.

    Raises
    ------
    TypeError
        If ``eval_result`` is not a dict.
    """
    if not isinstance(eval_result, dict):
        raise TypeError('Eval_result should be a dictionary')
    eval_result.clear()

    def callback(env):
        """Append the current score of every metric to the history."""
        for item in env.evaluation_result_list:
            # Only the first three fields are needed. Slicing, rather than
            # unpacking exactly four items, also accepts 5-item results
            # that carry a trailing standard deviation.
            data_name, eval_name, result = item[:3]
            if data_name not in eval_result:
                eval_result[data_name] = collections.defaultdict(list)
            eval_result[data_name][eval_name].append(result)
    # NOTE(review): presumably the caller sorts callbacks by ``order`` -- confirm.
    callback.order = 20
    return callback


101
102
def reset_parameter(**kwargs):
    """Create a callback that resets parameters before each iteration.

    NOTE: the initial parameter will still take in-effect on first iteration.

    Parameters
    ----------
    **kwargs: value should be list or function
        Keyword name is the parameter to reset; the value supplies its
        setting for each boosting round (e.g. to decay the learning rate):
        - list l: parameter = l[current_round]
        - function f: parameter = f(current_round)
        ``current_round`` is ``env.iteration - env.begin_iteration``.

    Returns
    -------
    callback : function
        The requested callback function.

    Raises
    ------
    RuntimeError
        When called, if 'num_class', 'boosting_type' or 'metric' is among
        the parameters to reset.
    ValueError
        When called, if a list's length differs from
        ``env.end_iteration - env.begin_iteration``.
    TypeError
        When called, if a value is neither a list nor a callable.
    """
    def callback(env):
        """Compute this round's values and push the changed ones to the model."""
        round_index = env.iteration - env.begin_iteration
        new_parameters = {}
        for key, value in kwargs.items():
            if key in ('num_class', 'boosting_type', 'metric'):
                raise RuntimeError("cannot reset {} during training".format(repr(key)))
            if isinstance(value, list):
                if len(value) != env.end_iteration - env.begin_iteration:
                    raise ValueError("Length of list {} has to equal to 'num_boost_round'.".format(repr(key)))
                new_param = value[round_index]
            elif callable(value):
                new_param = value(round_index)
            else:
                # Calling a non-callable would also raise TypeError, but
                # with a message that does not name the offending parameter.
                raise TypeError("Value of {} has to be a list or a function.".format(repr(key)))
            # Only forward parameters whose value actually changed.
            if new_param != env.params.get(key, None):
                new_parameters[key] = new_param
        if new_parameters:
            env.model.reset_parameter(new_parameters)
            env.params.update(new_parameters)
    callback.before_iteration = True
    # NOTE(review): presumably the caller sorts callbacks by ``order`` -- confirm.
    callback.order = 10
    return callback


141
def early_stopping(stopping_rounds, verbose=True):
    """Create a callback that activates early stopping.

    Requires at least one validation data and one metric.
    If there's more than one, all of them are checked and training stops as
    soon as any one of them has failed to improve for ``stopping_rounds``
    iterations.

    Parameters
    ----------
    stopping_rounds : int
        Number of iterations a score may go without improving before
        training is stopped.

    verbose : optional, bool
        Whether to print message about early stopping information.

    Returns
    -------
    callback : function
        The requested callback function. When called it raises ``ValueError``
        if there are no evaluation results, and ``EarlyStopException``
        (carrying the best iteration) when stopping is triggered.
    """
    # Per-metric state, keyed by the metric's position in
    # ``env.evaluation_result_list``.
    factor_to_bigger_better = {}
    best_score = {}
    best_iter = {}
    best_msg = {}

    def init(env):
        """Reset the per-metric state for a new run."""
        if not env.evaluation_result_list:
            raise ValueError('For early stopping, at least one dataset or eval metric is required for evaluation')

        # Drop anything left over from a previous run of the same callback.
        for state in (factor_to_bigger_better, best_score, best_iter, best_msg):
            state.clear()

        if verbose:
            msg = "Train until valid scores didn't improve in {} rounds."
            print(msg.format(stopping_rounds))

        for i, item in enumerate(env.evaluation_result_list):
            best_score[i] = float('-inf')
            best_iter[i] = 0
            if verbose:
                best_msg[i] = ""
            # Item 3 flags "higher is better"; scores are multiplied by this
            # factor so that a larger value always means an improvement.
            factor_to_bigger_better[i] = 1.0 if item[3] else -1.0

    def callback(env):
        """Track the best score per metric and stop once one stalls."""
        # Re-initialise on the first iteration of every run, so a callback
        # reused for a second run does not compare against stale best scores.
        if not best_score or env.iteration == env.begin_iteration:
            init(env)
        for i, item in enumerate(env.evaluation_result_list):
            score = item[2] * factor_to_bigger_better[i]
            if score > best_score[i]:
                best_score[i] = score
                best_iter[i] = env.iteration
                if verbose:
                    best_msg[i] = '[%d]\t%s' % (
                        env.iteration + 1, '\t'.join(
                            [_format_eval_result(x) for x in env.evaluation_result_list]
                        )
                    )
            elif env.iteration - best_iter[i] >= stopping_rounds:
                env.model.set_attr(best_iteration=str(best_iter[i]))
                if verbose:
                    print('Early stopping, best iteration is:')
                    print(best_msg[i])
                raise EarlyStopException(best_iter[i])
    # NOTE(review): presumably the caller sorts callbacks by ``order`` -- confirm.
    callback.order = 30
    return callback