File tree Expand file tree Collapse file tree 1 file changed +2
-5
lines changed
Expand file tree Collapse file tree 1 file changed +2
-5
lines changed Original file line number Diff line number Diff line change 5454from ..jit .gemm import gen_trtllm_gen_gemm_module
5555from ..jit .gemm import gen_tgv_gemm_sm10x_module
5656from ..jit .gemm import gen_deepgemm_sm100_module
57+ from ..jit .cpp_ext import get_cuda_version
5758
5859
5960CUDNN_AVAILABLE = False
@@ -93,10 +94,6 @@ def _match_sm_version(device: torch.device, sm_version: list[str]):
9394 return device_arch in sm_version
9495
9596
96- def get_cuda_version ():
97- return tuple (map (int , torch .version .cuda .split ("." ))) # (major, minor)
98-
99-
10097@functools .cache
10198def get_gemm_module ():
10299 module = gen_gemm_module ().build_and_load ()
@@ -2004,7 +2001,7 @@ def _heuristic_func_mm_fp4(
20042001 - If cuda version is 13 and cudnn version is 9.15 or greater - use cudnn.
20052002
20062003 """
2007- cuda_major , _ = get_cuda_version ()
2004+ cuda_major = get_cuda_version (). major
20082005 # If cuda version is 13 or greater:
20092006 # cudnn is more performant if cudnn version is 9.15 or greater.
20102007 if CUDNN_AVAILABLE and cuda_major >= 13 and cudnn .backend_version () >= 91500 :
You can’t perform that action at this time.
0 commit comments