File tree Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Original file line number Diff line number Diff line change 14
14
VLLM_ROCM_PREFER_TORCH : bool = False
15
15
VLLM_ROCM_PREFER_TRITON : bool = True
16
16
VLLM_USE_SDPA_ATTENTION : bool = False
17
- VLLM_USE_TRITON_FLASH_ATTN : bool = True
17
+ VLLM_USE_TRITON_FLASH_ATTN : bool = False
18
18
VLLM_USE_ROCM_SKINNY_GEMM : bool = True
19
19
VLLM_USE_ROCM_CUSTOM_PAGED_ATTN : bool = True
20
20
VLLM_USE_ROCM_CUSTOM_PAGED_ATTN_FP8_OUT : bool = True
@@ -227,7 +227,7 @@ def get_default_config_root():
227
227
228
228
# Flag to control whether vLLM should use Triton flash attention
229
229
"VLLM_USE_TRITON_FLASH_ATTN" :
230
- lambda : (os .environ .get ("VLLM_USE_TRITON_FLASH_ATTN" , "True " ).lower () in
230
+ lambda : (os .environ .get ("VLLM_USE_TRITON_FLASH_ATTN" , "False " ).lower () in
231
231
("true" , "1" )),
232
232
233
233
# Internal flag to enable Dynamo fullgraph capture
You can’t perform that action at this time.
0 commit comments