We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9ae2e4c, commit 225d9a5. Copy full SHA for 225d9a5
vllm/model_executor/layers/quantization/utils/fp8_utils.py
@@ -472,7 +472,7 @@ def w8a8_block_fp8_matmul(
472
assert triton.cdiv(A.shape[-1], block_k) == As.shape[-1]
473
M = A.numel() // A.shape[-1]
474
475
- assert B.ndim == 2 and B.is_contiguous() and Bs.ndim == 2
+ assert B.ndim == 2 and Bs.ndim == 2
476
N, K = B.shape
477
assert triton.cdiv(N, block_n) == Bs.shape[0]
478
assert triton.cdiv(K, block_k) == Bs.shape[1]
0 commit comments