diff --git a/vllm/attention/backends/flashinfer.py b/vllm/attention/backends/flashinfer.py index 06031929f6849..b059569d446a8 100644 --- a/vllm/attention/backends/flashinfer.py +++ b/vllm/attention/backends/flashinfer.py @@ -250,7 +250,7 @@ def begin_forward(self, model_input, model): state = self try: - scale = getattr(model.model.begs[0].self_attn.attn.impl, "scale", + scale = getattr(model.model.layers[0].self_attn.attn.impl, "scale", None) except AttributeError as e: raise AttributeError("Failed to retrieve 'scale'. \