Unverified Commit 74ba9649 authored by Paul Fultz II, committed by GitHub

Add fp16 flag to test runner to check models quantized to fp16 (#2182)

parent f149b619
@@ -39,6 +39,15 @@ def parse_args():
                         type=str,
                         default='gpu',
                         help='Specify where the tests execute (ref, gpu)')
+    parser.add_argument('--fp16', action='store_true', help='Quantize to fp16')
+    parser.add_argument('--atol',
+                        type=float,
+                        default=1e-3,
+                        help='The absolute tolerance parameter')
+    parser.add_argument('--rtol',
+                        type=float,
+                        default=1e-3,
+                        help='The relative tolerance parameter')
     args = parser.parse_args()
     return args
@@ -257,6 +266,8 @@ def main():
     # read and compile model
     model = migraphx.parse_onnx(model_path_name, map_input_dims=param_shapes)
+    if args.fp16:
+        migraphx.quantize_fp16(model)
     model.compile(migraphx.get_target(target))

     # get test cases
@@ -279,7 +290,10 @@ def main():
         output_data = run_one_case(model, input_data)

         # check output correctness
-        ret = check_correctness(gold_outputs, output_data)
+        ret = check_correctness(gold_outputs,
+                                output_data,
+                                atol=args.atol,
+                                rtol=args.rtol)
         if ret:
             correct_num += 1
...
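
For context, a minimal sketch of the path this change adds: the ONNX model is parsed, optionally quantized to fp16 with migraphx.quantize_fp16 before compilation, and outputs are later compared using the requested absolute/relative tolerances. The model path, input name and shape, and the numpy.allclose comparison are illustrative assumptions; parse_onnx, quantize_fp16, get_target, and compile are the calls shown in the diff above, while run comes from the MIGraphX Python API used inside the runner's run_one_case helper.

import argparse

import migraphx
import numpy as np

parser = argparse.ArgumentParser()
parser.add_argument('--fp16', action='store_true', help='Quantize to fp16')
parser.add_argument('--atol', type=float, default=1e-3)
parser.add_argument('--rtol', type=float, default=1e-3)
args = parser.parse_args()

# Parse the ONNX model (path, input name, and dims are placeholders).
model = migraphx.parse_onnx('model.onnx',
                            map_input_dims={'data': [1, 3, 224, 224]})

if args.fp16:
    # Quantize the program to fp16 in place before compiling, as in the diff above.
    migraphx.quantize_fp16(model)

model.compile(migraphx.get_target('gpu'))

# Run with random input; a reference result would then be compared with the
# requested tolerances, analogous to the runner's check_correctness call:
# np.allclose(np.array(outputs[0]), reference_output, atol=args.atol, rtol=args.rtol)
data = np.random.rand(1, 3, 224, 224).astype(np.float32)
outputs = model.run({'data': data})

An example invocation of the runner with the new flags (script name and test directory are assumptions): python test_runner.py ./models --fp16 --atol 1e-2 --rtol 1e-2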