Commit f4147e22 authored by Zongwei Zhou, committed by A. Unique TensorFlower
Browse files

Enable Resnet50 and BERT 1GPU pure eager throughput test

PiperOrigin-RevId: 292671694
parent c7ad20a3
...@@ -185,6 +185,17 @@ class BertSquadBenchmarkReal(BertSquadBenchmarkBase): ...@@ -185,6 +185,17 @@ class BertSquadBenchmarkReal(BertSquadBenchmarkBase):
self._run_and_report_benchmark() self._run_and_report_benchmark()
def benchmark_1_gpu_eager(self):
    """Benchmarks BERT SQuAD on 1 GPU with eager execution requested.

    Configures a single-GPU run with ``FLAGS.run_eagerly`` turned on and a
    train batch size of 2, then hands off to the shared run-and-report
    helper.
    """
    self._setup()

    # Single-GPU configuration.
    self.num_gpus = 1

    # Ask for eager execution through the run_eagerly flag.
    FLAGS.run_eagerly = True

    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_squad_eager')
    FLAGS.train_batch_size = 2

    self._run_and_report_benchmark()
def benchmark_1_gpu_xla(self): def benchmark_1_gpu_xla(self):
"""Tests BERT SQuAD model performance with 1 GPU with XLA.""" """Tests BERT SQuAD model performance with 1 GPU with XLA."""
...@@ -249,6 +260,19 @@ class BertSquadBenchmarkReal(BertSquadBenchmarkBase): ...@@ -249,6 +260,19 @@ class BertSquadBenchmarkReal(BertSquadBenchmarkBase):
self._run_and_report_benchmark() self._run_and_report_benchmark()
def benchmark_1_gpu_fp16_eager(self):
    """Benchmarks BERT SQuAD on 1 GPU with FP16 and eager execution requested.

    Configures a single-GPU run with ``FLAGS.run_eagerly`` turned on, the
    ``fp16`` dtype, dynamic loss scaling and a train batch size of 4, then
    hands off to the shared run-and-report helper.
    """
    self._setup()

    # Single-GPU configuration.
    self.num_gpus = 1

    # Ask for eager execution through the run_eagerly flag.
    FLAGS.run_eagerly = True

    FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_squad_fp16_eager')
    FLAGS.train_batch_size = 4

    # Half-precision settings: fp16 dtype paired with dynamic loss scaling.
    FLAGS.dtype = 'fp16'
    FLAGS.loss_scale = 'dynamic'

    self._run_and_report_benchmark()
def benchmark_1_gpu_fp16(self): def benchmark_1_gpu_fp16(self):
"""Tests BERT SQuAD model performance with 1 GPU and FP16.""" """Tests BERT SQuAD model performance with 1 GPU and FP16."""
......
...@@ -279,7 +279,7 @@ class Resnet50CtlBenchmarkBase(CtlBenchmark): ...@@ -279,7 +279,7 @@ class Resnet50CtlBenchmarkBase(CtlBenchmark):
FLAGS.num_gpus = 1 FLAGS.num_gpus = 1
FLAGS.distribution_strategy = 'one_device' FLAGS.distribution_strategy = 'one_device'
FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_eager') FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_eager')
FLAGS.batch_size = 64 FLAGS.batch_size = 108
FLAGS.use_tf_function = False FLAGS.use_tf_function = False
FLAGS.single_l2_loss_op = True FLAGS.single_l2_loss_op = True
self._run_and_report_benchmark() self._run_and_report_benchmark()
...@@ -291,7 +291,7 @@ class Resnet50CtlBenchmarkBase(CtlBenchmark): ...@@ -291,7 +291,7 @@ class Resnet50CtlBenchmarkBase(CtlBenchmark):
FLAGS.num_gpus = 1 FLAGS.num_gpus = 1
FLAGS.distribution_strategy = 'one_device' FLAGS.distribution_strategy = 'one_device'
FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_fp16_eager') FLAGS.model_dir = self._get_model_dir('benchmark_1_gpu_fp16_eager')
FLAGS.batch_size = 128 FLAGS.batch_size = 216
FLAGS.dtype = 'fp16' FLAGS.dtype = 'fp16'
FLAGS.use_tf_function = False FLAGS.use_tf_function = False
FLAGS.single_l2_loss_op = True FLAGS.single_l2_loss_op = True
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment