Skip to content

Commit a6b6383

Browse files
Skip fp8 blockwise quant on AMD
1 parent eeeeab8 commit a6b6383

1 file changed

Lines changed: 8 additions & 0 deletions

File tree

tests/quantize_blockwise_test.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -155,6 +155,14 @@ def test_quantize_blockwise(blocksize: int, size_multiplier: float, dtype: torch
155155
"""Test blockwise quantization method."""
156156
assert blocksize in SUPPORTED_BLOCKSIZES
157157

158+
# TODO(jmanning):
159+
# Seeing odd AMD compiler error for this kernel for FP8 cases
160+
# E RuntimeError: PassManager::run failed
161+
# .direnv/python-3.10.12/lib/python3.10/site-packages/triton/backends/amd/compiler.py:243: RuntimeError
162+
# loc("/home/$USER/conch/conch/kernels/quantization/bitsandbytes/quantize_blockwise.py":114:21): error: operand #1 does not dominate this use
163+
if current_platform.is_amd() and quant_type == "fp8":
164+
pytest.skip()
165+
158166
# There are some small rounding discrepancies between Triton and PyTorch, and it's tough to adjust tolerances
159167
# to account for them because we compare bitpacked results (so if there's a rounding discrepancy in what becomes
160168
# the higher-bits of the result, the tolerance would need to be much higher to account for it). Consider changing

0 commit comments

Comments
 (0)