Skip to content

Commit 10ba659

Browse files
authored
Skip QAT tests using quantize_fp8_row in fbcode (#2963)
Just skipping for now to unblock:

```
triton.compiler.errors.CompilationError: at 1:0:
def _kernel_quantize_fp8_row(
^
ValueError("type fp8e4nv not supported in this architecture. The supported fp8 dtypes are ('fp8e4b15', 'fp8e5')")
```
1 parent ecb6c4b commit 10ba659

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

test/quantization/test_qat.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2053,6 +2053,7 @@ def test_qat_nvfp4(self, use_per_tensor_scale: bool):
20532053
@unittest.skipIf(
20542054
not _is_fbgemm_genai_gpu_available(), "Requires fbgemm-gpu-genai >= 1.2.0"
20552055
)
2056+
@unittest.skipIf(is_fbcode(), "triton compilation error")
20562057
def test_fbgemm_fp8_primitives(self):
20572058
"""
20582059
Compare numerics between:
@@ -2092,6 +2093,7 @@ def test_fbgemm_fp8_primitives(self):
20922093
@unittest.skipIf(
20932094
not _is_fbgemm_genai_gpu_available(), "Requires fbgemm-gpu-genai >= 1.2.0"
20942095
)
2096+
@unittest.skipIf(is_fbcode(), "triton compilation error")
20952097
def test_fbgemm_int4_preshuffled_primitives(self):
20962098
"""
20972099
Compare numerics between:

0 commit comments

Comments
 (0)