From 44874a0bf970ae55c487a1dc09b25bd308872f7c Mon Sep 17 00:00:00 2001 From: DefTruth <31974251+DefTruth@users.noreply.github.com> Date: Mon, 15 Jul 2024 12:16:51 +0800 Subject: [PATCH] [Doc] add env docs for flashinfer backend (#6437) --- vllm/envs.py | 1 + 1 file changed, 1 insertion(+) diff --git a/vllm/envs.py b/vllm/envs.py index 5b4a2010d12e6..85d60f3242526 100644 --- a/vllm/envs.py +++ b/vllm/envs.py @@ -206,6 +206,7 @@ # - "FLASH_ATTN": use FlashAttention # - "XFORMERS": use XFormers # - "ROCM_FLASH": use ROCmFlashAttention + # - "FLASHINFER": use flashinfer "VLLM_ATTENTION_BACKEND": lambda: os.getenv("VLLM_ATTENTION_BACKEND", None),