Fix and re-enable cudnn_fusion_test.

Disable XLA autotuning fallback to cuBLAS so that the tested fusion
always executes through cuDNN.
This commit is contained in:
Ilia Sergachev 2024-09-09 12:19:35 +00:00
parent 15024baabf
commit b320dc2e5e
2 changed files with 5 additions and 6 deletions

View File

@@ -1501,10 +1501,7 @@ jax_multiplatform_test(
"gpu_a100",
"gpu_h100",
],
tags = [
"multiaccelerator",
"notap", # TODO(phawkins): this test fails in our internal CI.
],
tags = ["multiaccelerator"],
)
exports_files(

View File

@@ -58,11 +58,13 @@ class CudnnFusionTest(jtu.JaxTestCase):
self.assertIn('custom_call_target="__cudnn$fusion"', hlo)
self.assertIn("called_computations=", hlo)
hlo_after_opt = lowered.compile().as_text()
compiled = lowered.compile({"xla_gpu_cublas_fallback": False})
hlo_after_opt = compiled.as_text()
self.assertIn("kind=kCustom", hlo_after_opt)
self.assertIn("plan_id", hlo_after_opt)
self.assertAllClose(jitted(x, y, z), fn(x, y, z))
self.assertAllClose(compiled(x, y, z), fn(x, y, z))
if __name__ == '__main__':