From fcce742db4435a145bec8d95e77ec650361e3f1c Mon Sep 17 00:00:00 2001
From: mzusman
Date: Tue, 10 Dec 2024 14:22:34 +0200
Subject: [PATCH] Small fix to logic

Signed-off-by: mzusman
---
 vllm/config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/config.py b/vllm/config.py
index 60a32fb182dbb..e8475efcb56e1 100644
--- a/vllm/config.py
+++ b/vllm/config.py
@@ -701,7 +701,7 @@ def get_num_layers_by_block_type(
         if self.is_attention_free and attn_block_type:
             return 0
 
-        if is_full_attn_model and attn_block_type:
+        if is_full_attn_model and not attn_block_type:
             return 0
 
         start, end = self.get_layers_start_end_indices(parallel_config)