From 41faabf8adf9596e0514c18df8834257b5a04a9d Mon Sep 17 00:00:00 2001 From: Yutao Xu Date: Mon, 8 Jun 2026 17:56:37 +0800 Subject: [PATCH 1/2] Update tuned_gemm.py --- aiter/tuned_gemm.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/aiter/tuned_gemm.py b/aiter/tuned_gemm.py index ffb81dff63..f01193b411 100644 --- a/aiter/tuned_gemm.py +++ b/aiter/tuned_gemm.py @@ -117,11 +117,12 @@ def get_GEMM_A16W16_config( cu_num = get_cu_num() padded_M = M config = None - + gfx = get_gfx() for gl in [None, 0, 1]: padded_M = M if gl is None else get_padded_m(M, N, K, gl) config = cfg.get( ( + gfx, cu_num, padded_M, N, @@ -161,7 +162,6 @@ def get_GEMM_A16W16_config( if config is None: default_config = {} - gfx = get_gfx() # gfx12: no ASM/skinny/hipblaslt kernels, use torch if gfx.startswith("gfx12"): default_config["libtype"] = "torch" From eb37d58446838cf92a6585f20b4018eb7ef022c3 Mon Sep 17 00:00:00 2001 From: Yutao Xu Date: Mon, 8 Jun 2026 18:05:06 +0800 Subject: [PATCH 2/2] Update tuned_gemm.py --- aiter/tuned_gemm.py | 1 + 1 file changed, 1 insertion(+) diff --git a/aiter/tuned_gemm.py b/aiter/tuned_gemm.py index f01193b411..9c04e17508 100644 --- a/aiter/tuned_gemm.py +++ b/aiter/tuned_gemm.py @@ -64,6 +64,7 @@ def get_GEMM_A16W16_config_(): gemm_dict = pd.read_csv(f"{tuned_file}").drop_duplicates() gemm_dict = gemm_dict.set_index( [ + "gfx", "cu_num", "M", "N",