diff --git a/test/transformers/test_cross_entropy.py b/test/transformers/test_cross_entropy.py
index 4714aeabb..090989c8b 100644
--- a/test/transformers/test_cross_entropy.py
+++ b/test/transformers/test_cross_entropy.py
@@ -722,6 +722,7 @@ def test_correctness_not_last_layer(B, T, V, reduction, scalar, dtype, atol, rto
     )
 
 
+@pytest.mark.skip(reason="temporary skip to validate CI pipeline.")
 def test_float32_internal():
     """
     This test validates that the internal softmax calculations occur in float32,
@@ -763,7 +764,7 @@ def test_float32_internal():
         RETURN_Z_LOSS=0,  # False
         HAS_SOFTCAPPING=False,
         BLOCK_SIZE=BLOCK_SIZE,
-        num_warps=32 if device == "cuda" else 16,
+        num_warps=32,
     )
 
     # Run kernel for float32
@@ -787,7 +788,7 @@ def test_float32_internal():
         RETURN_Z_LOSS=0,  # False
         HAS_SOFTCAPPING=False,
         BLOCK_SIZE=BLOCK_SIZE,
-        num_warps=32 if device == "cuda" else 16,
+        num_warps=32,
     )
 
     torch.allclose(X_bf16, X_fp32.bfloat16())