hooks_helper.py 5.32 KB
Newer Older
Yanhui Liang's avatar
Yanhui Liang committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# Copyright 2017 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

"""Hooks helper to return a list of TensorFlow hooks for training by name.

More hooks can be added to this set. To add a new hook, 1) add the new hook to
the registry in HOOKS, 2) add a corresponding function that parses out necessary
parameters.
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

Karmel Allison's avatar
Karmel Allison committed
27
import tensorflow as tf  # pylint: disable=g-bad-import-order
Yanhui Liang's avatar
Yanhui Liang committed
28

29
from official.utils.logs import hooks
Qianli Scott Zhu's avatar
Qianli Scott Zhu committed
30
from official.utils.logs import logger
31
from official.utils.logs import metric_hook
Yanhui Liang's avatar
Yanhui Liang committed
32
33
34
35
36
37
38
39
40
41
42
43
44

_TENSORS_TO_LOG = dict((x, x) for x in ['learning_rate',
                                        'cross_entropy',
                                        'train_accuracy'])


def get_train_hooks(name_list, **kwargs):
  """Factory for getting a list of TensorFlow hooks for training by name.

  Args:
    name_list: a list of strings to name desired hook classes. Allowed:
      LoggingTensorHook, ProfilerHook, ExamplesPerSecondHook, which are defined
      as keys in HOOKS
Karmel Allison's avatar
Karmel Allison committed
45
    **kwargs: a dictionary of arguments to the hooks.
Yanhui Liang's avatar
Yanhui Liang committed
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67

  Returns:
    list of instantiated hooks, ready to be used in a classifier.train call.

  Raises:
    ValueError: if an unrecognized name is passed.
  """

  if not name_list:
    return []

  train_hooks = []
  for name in name_list:
    hook_name = HOOKS.get(name.strip().lower())
    if hook_name is None:
      raise ValueError('Unrecognized training hook requested: {}'.format(name))
    else:
      train_hooks.append(hook_name(**kwargs))

  return train_hooks


68
def get_logging_tensor_hook(every_n_iter=100, tensors_to_log=None, **kwargs):  # pylint: disable=unused-argument
Yanhui Liang's avatar
Yanhui Liang committed
69
70
71
72
73
  """Function to get LoggingTensorHook.

  Args:
    every_n_iter: `int`, print the values of `tensors` once every N local
      steps taken on the current worker.
74
75
    tensors_to_log: List of tensor names or dictionary mapping labels to tensor
      names. If not set, log _TENSORS_TO_LOG by default.
Karmel Allison's avatar
Karmel Allison committed
76
    **kwargs: a dictionary of arguments to LoggingTensorHook.
Yanhui Liang's avatar
Yanhui Liang committed
77
78
79
80
81

  Returns:
    Returns a LoggingTensorHook with a standard set of tensors that will be
    printed to stdout.
  """
82
83
84
  if tensors_to_log is None:
    tensors_to_log = _TENSORS_TO_LOG

Yanhui Liang's avatar
Yanhui Liang committed
85
  return tf.train.LoggingTensorHook(
86
      tensors=tensors_to_log,
Yanhui Liang's avatar
Yanhui Liang committed
87
88
89
90
91
92
93
94
      every_n_iter=every_n_iter)


def get_profiler_hook(save_steps=1000, **kwargs):  # pylint: disable=unused-argument
  """Function to get ProfilerHook.

  Args:
    save_steps: `int`, print profile traces every N steps.
Karmel Allison's avatar
Karmel Allison committed
95
    **kwargs: a dictionary of arguments to ProfilerHook.
Yanhui Liang's avatar
Yanhui Liang committed
96
97
98
99
100
101
102
103
104
105

  Returns:
    Returns a ProfilerHook that writes out timelines that can be loaded into
    profiling tools like chrome://tracing.
  """
  return tf.train.ProfilerHook(save_steps=save_steps)


def get_examples_per_second_hook(every_n_steps=100,
                                 batch_size=128,
106
                                 warm_steps=5,
Yanhui Liang's avatar
Yanhui Liang committed
107
108
109
110
111
112
113
114
115
                                 **kwargs):  # pylint: disable=unused-argument
  """Function to get ExamplesPerSecondHook.

  Args:
    every_n_steps: `int`, print current and average examples per second every
      N steps.
    batch_size: `int`, total batch size used to calculate examples/second from
      global time.
    warm_steps: skip this number of steps before logging and running average.
Karmel Allison's avatar
Karmel Allison committed
116
    **kwargs: a dictionary of arguments to ExamplesPerSecondHook.
Yanhui Liang's avatar
Yanhui Liang committed
117
118
119
120
121

  Returns:
    Returns a ProfilerHook that writes out timelines that can be loaded into
    profiling tools like chrome://tracing.
  """
Karmel Allison's avatar
Karmel Allison committed
122
123
124
  return hooks.ExamplesPerSecondHook(
      batch_size=batch_size, every_n_steps=every_n_steps,
      warm_steps=warm_steps, metric_logger=logger.get_benchmark_logger())
Yanhui Liang's avatar
Yanhui Liang committed
125
126


127
def get_logging_metric_hook(tensors_to_log=None,
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
                            every_n_secs=600,
                            **kwargs):  # pylint: disable=unused-argument
  """Function to get LoggingMetricHook.

  Args:
    tensors_to_log: List of tensor names or dictionary mapping labels to tensor
      names. If not set, log _TENSORS_TO_LOG by default.
    every_n_secs: `int`, the frequency for logging the metric. Default to every
      10 mins.

  Returns:
    Returns a ProfilerHook that writes out timelines that can be loaded into
    profiling tools like chrome://tracing.
  """
  if tensors_to_log is None:
    tensors_to_log = _TENSORS_TO_LOG
  return metric_hook.LoggingMetricHook(
      tensors=tensors_to_log,
Qianli Scott Zhu's avatar
Qianli Scott Zhu committed
146
      metric_logger=logger.get_benchmark_logger(),
147
148
149
      every_n_secs=every_n_secs)


Yanhui Liang's avatar
Yanhui Liang committed
150
151
152
153
154
# A dictionary to map one hook name and its corresponding function
HOOKS = {
    'loggingtensorhook': get_logging_tensor_hook,
    'profilerhook': get_profiler_hook,
    'examplespersecondhook': get_examples_per_second_hook,
155
    'loggingmetrichook': get_logging_metric_hook,
Yanhui Liang's avatar
Yanhui Liang committed
156
}