Skip to content

Commit d5e35a9

Browse files
committed
Merge remote-tracking branch 'origin/main' into upstream_merge_2025_05_21
2 parents 1c450a5 + 91a5600 commit d5e35a9

File tree

1 file changed

+1
-0
lines changed

1 file changed

+1
-0
lines changed

vllm/model_executor/models/llama.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -203,6 +203,7 @@ def __init__(
203 203               quant_config, Fp8Config) or (isinstance(quant_config, QuarkConfig)
204 204                                            and quant_config.is_fp8_w8a8())
205 205           self.attn_fp8_out = (envs.VLLM_USE_ROCM_CUSTOM_PAGED_ATTN_FP8_OUT
    206 +                              and envs.VLLM_USE_TRITON_FLASH_ATTN
206 207                                and current_platform.is_fp8_fnuz() and use_fp8)
207 208           if envs.VLLM_USE_V1 and not envs.VLLM_V1_USE_PREFILL_DECODE_ATTENTION:
208 209               self.attn_fp8_out = False

0 commit comments

Comments
 (0)