# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Executes Keras benchmarks and accuracy tests."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import os
import time
from absl import flags
import tensorflow as tf  # pylint: disable=g-bad-import-order

from official.resnet import cifar10_main as cifar_main
from official.resnet.keras import keras_benchmark
from official.resnet.keras import keras_cifar_main
from official.resnet.keras import keras_common

# Top-1 accuracy bounds handed to _report_benchmark (as top_1_min / top_1_max)
# by the Resnet56KerasAccuracy tests below.
MIN_TOP_1_ACCURACY = 0.925
MAX_TOP_1_ACCURACY = 0.938

FLAGS = flags.FLAGS
# Sub-directory joined onto root_data_dir to build the CIFAR-10 data_dir.
CIFAR_DATA_DIR_NAME = 'cifar-10-batches-bin'


class Resnet56KerasAccuracy(keras_benchmark.KerasBenchmark):
  """Accuracy tests for ResNet56 Keras CIFAR-10."""

  def __init__(self, output_dir=None, root_data_dir=None, **kwargs):
    """A benchmark class.

    Args:
      output_dir: directory where to output e.g. log files
      root_data_dir: directory under which to look for dataset. When omitted
                     (None) the dataset directory name is used as a relative
                     path instead of failing inside os.path.join.
      **kwargs: arbitrary named arguments. This is needed to make the
                constructor forward compatible in case PerfZero provides more
                named arguments before updating the constructor.
    """

    # os.path.join() rejects None, which is this parameter's default, so
    # substitute an empty root; the join then yields CIFAR_DATA_DIR_NAME alone.
    self.data_dir = os.path.join(root_data_dir or '', CIFAR_DATA_DIR_NAME)
    flag_methods = [keras_cifar_main.define_cifar_flags]

    super(Resnet56KerasAccuracy, self).__init__(
        output_dir=output_dir, flag_methods=flag_methods)

  def benchmark_graph_1_gpu(self):
    """Test keras based model with Keras fit and distribution strategies."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_1_gpu')
    FLAGS.dtype = 'fp32'
    self._run_and_report_benchmark()

  def benchmark_1_gpu(self):
    """Test keras based model with eager and distribution strategies."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu')
    FLAGS.dtype = 'fp32'
    FLAGS.enable_eager = True
    self._run_and_report_benchmark()

  def benchmark_1_gpu_no_dist_strat(self):
    """Test keras based model with eager and no dist strat."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.explicit_gpu_placement = True
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_no_dist_strat')
    FLAGS.dtype = 'fp32'
    FLAGS.enable_eager = True
    FLAGS.distribution_strategy = 'off'
    self._run_and_report_benchmark()

  def benchmark_1_gpu_no_dist_strat_run_eagerly(self):
    """Test keras based model with forced eager and no dist_strat."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir(
        'benchmark_1_gpu_no_dist_strat_run_eagerly')
    FLAGS.dtype = 'fp32'
    FLAGS.enable_eager = True
    FLAGS.run_eagerly = True
    FLAGS.distribution_strategy = 'off'
    self._run_and_report_benchmark()

  def benchmark_2_gpu(self):
    """Test keras based model with eager and distribution strategies."""
    self._setup()
    FLAGS.num_gpus = 2
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_2_gpu')
    FLAGS.dtype = 'fp32'
    FLAGS.enable_eager = True
    self._run_and_report_benchmark()

  def benchmark_graph_2_gpu(self):
    """Test keras based model with Keras fit and distribution strategies."""
    self._setup()
    FLAGS.num_gpus = 2
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_2_gpu')
    FLAGS.dtype = 'fp32'
    self._run_and_report_benchmark()

  def benchmark_graph_1_gpu_no_dist_strat(self):
    """Test keras based model with Keras fit but not distribution strategies."""
    self._setup()
    FLAGS.distribution_strategy = 'off'
    FLAGS.num_gpus = 1
    FLAGS.data_dir = self.data_dir
    FLAGS.batch_size = 128
    FLAGS.train_epochs = 182
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_1_gpu_no_dist_strat')
    FLAGS.dtype = 'fp32'
    self._run_and_report_benchmark()

  def _run_and_report_benchmark(self):
    """Runs keras_cifar_main with the current FLAGS and reports the result.

    The wall time of the run is measured here and passed, together with the
    returned stats and the module-level top-1 accuracy bounds, to the base
    class _report_benchmark.
    """
    start_time_sec = time.time()
    stats = keras_cifar_main.run(FLAGS)
    wall_time_sec = time.time() - start_time_sec

    super(Resnet56KerasAccuracy, self)._report_benchmark(
        stats,
        wall_time_sec,
        top_1_min=MIN_TOP_1_ACCURACY,
        top_1_max=MAX_TOP_1_ACCURACY,
        total_batch_size=FLAGS.batch_size,
        log_steps=100)


class Resnet56KerasBenchmarkBase(keras_benchmark.KerasBenchmark):
  """Short performance tests for ResNet56 via Keras and CIFAR-10."""

  def __init__(self, output_dir=None, default_flags=None):
    """Registers the CIFAR flag definitions and defers to KerasBenchmark.

    Args:
      output_dir: directory where to output e.g. log files
      default_flags: passed through unchanged to the base class constructor.
    """
    flag_methods = [keras_cifar_main.define_cifar_flags]

    super(Resnet56KerasBenchmarkBase, self).__init__(
        output_dir=output_dir,
        flag_methods=flag_methods,
        default_flags=default_flags)

  def _run_and_report_benchmark(self):
    """Runs keras_cifar_main with the current FLAGS and reports the result.

    The wall time of the run is measured here and passed, together with the
    returned stats, FLAGS.batch_size and FLAGS.log_steps, to the base class
    _report_benchmark.
    """
    start_time_sec = time.time()
    stats = keras_cifar_main.run(FLAGS)
    wall_time_sec = time.time() - start_time_sec

    super(Resnet56KerasBenchmarkBase, self)._report_benchmark(
        stats,
        wall_time_sec,
        total_batch_size=FLAGS.batch_size,
        log_steps=FLAGS.log_steps)

  def benchmark_1_gpu_no_dist_strat(self):
    """Test 1 GPU with eager enabled and distribution strategy off."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.enable_eager = True
    FLAGS.distribution_strategy = 'off'
    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_no_dist_strat')
    FLAGS.batch_size = 128
    self._run_and_report_benchmark()

  def benchmark_1_gpu_no_dist_strat_tweaked(self):
    """Test no distribution strategy with manual config."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.enable_eager = True
    FLAGS.explicit_gpu_placement = True
    FLAGS.distribution_strategy = 'off'
    FLAGS.set_learning_phase_to_train = False
    FLAGS.model_dir = self._get_model_dir(
        'benchmark_1_gpu_no_dist_strat_tweaked')
    FLAGS.batch_size = 128
    self._run_and_report_benchmark()

  def benchmark_graph_1_gpu_no_dist_strat(self):
    """Test 1 GPU with eager disabled and distribution strategy off."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.enable_eager = False
    FLAGS.distribution_strategy = 'off'
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_1_gpu_no_dist_strat')
    FLAGS.batch_size = 128
    self._run_and_report_benchmark()

  def benchmark_1_gpu(self):
    """Test 1 GPU with eager enabled and the 'default' distribution strategy."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.enable_eager = True
    FLAGS.distribution_strategy = 'default'
    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu')
    FLAGS.batch_size = 128
    self._run_and_report_benchmark()

  def benchmark_graph_1_gpu(self):
    """Test 1 GPU with eager disabled and the 'default' distribution strategy."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.enable_eager = False
    FLAGS.distribution_strategy = 'default'
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_1_gpu')
    FLAGS.batch_size = 128
    self._run_and_report_benchmark()

  def benchmark_1_gpu_no_dist_strat_run_eagerly(self):
    """Test keras based model with forced eager."""
    self._setup()
    FLAGS.num_gpus = 1
    FLAGS.batch_size = 128
    FLAGS.model_dir = self._get_model_dir(
        'benchmark_1_gpu_no_dist_strat_run_eagerly')
    FLAGS.dtype = 'fp32'
    FLAGS.enable_eager = True
    FLAGS.run_eagerly = True
    FLAGS.distribution_strategy = 'off'
    self._run_and_report_benchmark()

  def benchmark_2_gpu(self):
    """Test 2 GPUs with eager enabled and the 'default' distribution strategy."""
    self._setup()
    FLAGS.num_gpus = 2
    FLAGS.enable_eager = True
    FLAGS.distribution_strategy = 'default'
    FLAGS.model_dir = self._get_model_dir('benchmark_2_gpu')
    FLAGS.batch_size = 128 * 2  # 2 GPUs
    self._run_and_report_benchmark()

  def benchmark_graph_2_gpu(self):
    """Test 2 GPUs with eager disabled and 'default' distribution strategy."""
    self._setup()
    FLAGS.num_gpus = 2
    FLAGS.enable_eager = False
    FLAGS.distribution_strategy = 'default'
    FLAGS.model_dir = self._get_model_dir('benchmark_graph_2_gpu')
    FLAGS.batch_size = 128 * 2  # 2 GPUs
    self._run_and_report_benchmark()


class Resnet56KerasBenchmarkSynth(Resnet56KerasBenchmarkBase):
  """Synthetic benchmarks for ResNet56 and Keras."""

  def __init__(self, output_dir=None, root_data_dir=None, **kwargs):
    """Builds the synthetic-data default flags and defers to the base class.

    Args:
      output_dir: directory where to output e.g. log files
      root_data_dir: accepted but not used by this class.
      **kwargs: accepted and ignored; they are not forwarded to the base class.
    """
    default_flags = {
        'skip_eval': True,
        'use_synthetic_data': True,
        'train_steps': 110,
        'log_steps': 10,
    }

    super(Resnet56KerasBenchmarkSynth, self).__init__(
        output_dir=output_dir, default_flags=default_flags)


class Resnet56KerasBenchmarkReal(Resnet56KerasBenchmarkBase):
  """Real data benchmarks for ResNet56 and Keras."""

  def __init__(self, output_dir=None, root_data_dir=None, **kwargs):
    """Builds the real-data default flags and defers to the base class.

    Args:
      output_dir: directory where to output e.g. log files
      root_data_dir: directory under which to look for dataset. When omitted
                     (None) the dataset directory name is used as a relative
                     path instead of failing inside os.path.join.
      **kwargs: accepted and ignored; they are not forwarded to the base class.
    """
    # os.path.join() rejects None, which is this parameter's default, so
    # substitute an empty root; the join then yields CIFAR_DATA_DIR_NAME alone.
    data_dir = os.path.join(root_data_dir or '', CIFAR_DATA_DIR_NAME)

    default_flags = {
        'skip_eval': True,
        'data_dir': data_dir,
        'train_steps': 110,
        'log_steps': 10,
    }

    super(Resnet56KerasBenchmarkReal, self).__init__(
        output_dir=output_dir, default_flags=default_flags)


# When executed as a script, hand control to tf.test.main().
if __name__ == '__main__':
  tf.test.main()