Commit: remove last line
Signed-off-by: charlifu <[email protected]>
charlifu committed Dec 2, 2024
1 parent b412bd6 commit f441c65
Showing 1 changed file with 0 additions and 3 deletions: vllm/model_executor/layers/quantization/utils/w8a8_utils.py
@@ -146,9 +146,6 @@ def apply_fp8_linear(
 
         return output[0:input_2d.shape[0], ...].view(*output_shape)
 
-        return torch.narrow(output, 0, 0,
-                            input_2d.shape[0]).view(*output_shape)
-
     else:
         # Fallback for channelwise case, where we use unfused DQ
         # due to limitations with scaled_mm

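The deleted `torch.narrow` return was unreachable dead code: the slicing-based return above it already exits the branch, and the two expressions select the same rows. A minimal sketch of that equivalence, using NumPy with a hypothetical 4×2 `output` array standing in for the padded GEMM result (not the vLLM code itself):

```python
import numpy as np

# Hypothetical stand-in for the padded matmul output in apply_fp8_linear:
# 4 rows were produced, but the original input_2d only had 3 rows.
output = np.arange(8, dtype=np.float32).reshape(4, 2)
n = 3  # plays the role of input_2d.shape[0]

# The surviving return uses basic slicing; torch.narrow(output, 0, 0, n)
# would select exactly the same leading n rows along dim 0.
trimmed = output[0:n, ...]

print(trimmed.shape)                         # (3, 2)
print(np.array_equal(trimmed, output[:n]))   # True
```

In PyTorch both forms return a view rather than a copy, so dropping the duplicate return changes neither behavior nor performance.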