diff --git a/vllm/model_executor/kernels/linear/mixed_precision/xpu.py b/vllm/model_executor/kernels/linear/mixed_precision/xpu.py index 68528bbd488..17900c75058 100644 --- a/vllm/model_executor/kernels/linear/mixed_precision/xpu.py +++ b/vllm/model_executor/kernels/linear/mixed_precision/xpu.py @@ -51,13 +51,6 @@ class XPUwNa16LinearKernel(MPLinearKernel): "XPUwNa16, supported sizes are multiples of 32", ) - if c.partition_weight_shape[1] % 32 != 0: - return ( - False, - f"Output size ({c.partition_weight_shape[1]}) not supported by " - "XPUWNA16, supported sizes are multiples of 32", - ) - return True, None def process_weights_after_loading(self, layer: torch.nn.Module):