Format

ff878ce6 · Paul · 93a5de9f · ff878ce6 · ff878ce6
Commit ff878ce6 authored Oct 09, 2022 by Paul
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 10 additions and 7 deletions

src/targets/gpu/jit/ck_gemm.cpp +5 -6

tools/tune_ck.py +5 -1

No files found.
--- a/src/targets/gpu/jit/ck_gemm.cpp
+++ b/src/targets/gpu/jit/ck_gemm.cpp
@@ -113,7 +113,7 @@ auto action_decorate(F f, Action action)
 using tuning_entry = std::pair<std::vector<shape>, size_t>;
 static std::vector<tuning_entry> read_tuning(const std::string& s)
 {
-    if (not fs::exists(s))
+    if(not fs::exists(s))
        return {};
    return from_value<std::vector<tuning_entry>>(from_json_string(read_string(s)));
 }
@@ -121,10 +121,9 @@ static std::vector<tuning_entry> read_tuning(const std::string& s)
 static std::size_t get_tuning_for(const std::vector<shape>& inputs)
 {
    static auto tuning = read_tuning(string_value_of(MIGRAPHX_CK_TUNING{}, ""));
-    auto it = std::find_if(tuning.begin(), tuning.end(), [&](const auto& p) {
+    auto it            = std::find_if(
-        return p.first == inputs;
+        tuning.begin(), tuning.end(), [&](const auto& p) { return p.first == inputs; });
-    });
+    if(it == tuning.end())
-    if (it == tuning.end())
        return 4;
    return it->second;
 }
@@ -159,7 +158,7 @@ struct ck_gemm_compiler : compiler<ck_gemm_compiler>
        auto sb = b_shape.strides().front();
        auto sc = c_shape.strides().front();
-        auto i                = v.get("tuning_val", get_tuning_for(inputs));
+        auto i               = v.get("tuning_val", get_tuning_for(inputs));
        const auto& instance = get_instance(i, [&](const auto& x) -> bool {
            return get_layout(a_shape) == x[0] and get_layout(b_shape) == x[1] and
                   get_layout(c_shape) == x[2] and get_type(a_shape) == x[3] and

--- a/tools/tune_ck.py
+++ b/tools/tune_ck.py
 import os, json, subprocess, tempfile, sys, argparse, contextlib
 @contextlib.contextmanager
 def tmp_file(dump=None):
    tmp_name = None
@@ -12,9 +13,11 @@ def tmp_file(dump=None):
    finally:
        os.unlink(tmp_name)
 def pretty_print(obj):
    print(json.dumps(obj, indent=2))
 def benchmark_one(config, tuning):
    b = {
        'settings': {
@@ -29,7 +32,8 @@ def benchmark_one(config, tuning):
    print(b)
    with tmp_file(lambda tf: json.dump(b, tf)) as tf:
        cp = subprocess.run('./bin/gpu-driver {}'.format(tf),
-                            capture_output=True, shell=True)
+                            capture_output=True,
+                            shell=True)
        for line in cp.stdout.decode().split("\n"):
            s = line.strip()
            if not s: