@@ -430,6 +430,15 @@ def test_approx_igemm(self, dim1, dim2, quant_methods, batched):
430430 @pytest .mark .parametrize ("seq_dim" , [16 , 256 ], ids = id_formatter ("seq_dim" ))
431431 @pytest .mark .parametrize ("transpose" , BOOLEAN_TUPLES , ids = id_formatter ("transpose" ))
432432 def test_igemm (self , hidden_dim , batch_dim , transpose , seq_dim ):
433+ if (
434+ torch .version .cuda == "13.0"
435+ and torch .__version__ >= (2 , 10 )
436+ and not any (transpose )
437+ and batch_dim == 256
438+ and seq_dim == 256
439+ ):
440+ pytest .xfail ("Failure due to regression in cuBLAS for CUDA Toolkit 13.0.2." )
441+
433442 hidden_dim = hidden_dim - (hidden_dim % 32 )
434443 batch_dim = batch_dim - (batch_dim % 16 )
435444 seq_dim = seq_dim - (seq_dim % 16 )
@@ -570,6 +579,9 @@ def min_max(x):
570579 @pytest .mark .parametrize ("dim4" , [32 , 256 ], ids = id_formatter ("dim4" ))
571580 @pytest .mark .parametrize ("transpose" , BOOLEAN_TUPLES , ids = id_formatter ("transpose" ))
572581 def test_ibmm (self , dim1 , dim2 , dim3 , dim4 , transpose ):
582+ if torch .version .cuda == "13.0" and torch .__version__ >= (2 , 10 ) and dim1 == 64 :
583+ pytest .xfail ("Failure due to regression in cuBLAS for CUDA Toolkit 13.0.2." )
584+
573585 dim2 = dim2 - (dim2 % 16 )
574586 dim3 = dim3 - (dim3 % 16 )
575587 dim4 = dim4 - (dim4 % 16 )
0 commit comments