diff --git a/jax/_src/export/_export.py b/jax/_src/export/_export.py
index 8b33e64e81db..63329da1d211 100644
--- a/jax/_src/export/_export.py
+++ b/jax/_src/export/_export.py
@@ -1086,7 +1086,7 @@ def _check_lowering(lowering) -> None:
     "cusolver_syevd_ffi", "hipsolver_syevd_ffi",
     # svd on GPU
     "cusolver_gesvd_ffi", "cusolver_gesvdj_ffi",
-    "hipsolver_gesvd_ffi", "hipsolver_gesvdj_ffi",
+    "hipsolver_gesvd_ffi", "hipsolver_gesvdj_ffi", "hipsolver_gesdd_ffi",
     # tridiagonal on GPU
     "cusolver_sytrd_ffi",
     # tridiagonal_solve on GPU
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_cholesky_solver_potrf.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_cholesky_solver_potrf.py
new file mode 100644
index 000000000000..1f7158bde4a1
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_cholesky_solver_potrf.py
@@ -0,0 +1,322 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# pyrefly: ignore-errors
+# ruff: noqa
+
+import datetime
+import numpy as np
+
+array = np.array
+float32 = np.float32
+float64 = np.float64
+complex64 = np.complex64
+complex128 = np.complex128
+
+data_2026_02_05 = {}
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_05["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_potrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 5),
+    inputs=(array([[34.812286  , -2.1484861 , 11.958679  , 12.6090975 ],
+       [-2.1484861 ,  0.73191243, -2.3005815 ,  0.6536075 ],
+       [11.958679  , -2.3005815 , 18.171919  , 12.823325  ],
+       [12.6090975 ,  0.6536075 , 12.823325  , 33.237614  ]],
+      dtype=float32),),
+    expected_outputs=(array([[ 5.9001937 ,  0.        ,  0.        ,  0.        ],
+       [-0.36413825,  0.77415484,  0.        ,  0.        ],
+       [ 2.0268283 , -2.0183764 ,  3.160703  ,  0.        ],
+       [ 2.137065  ,  1.8494937 ,  3.8677585 ,  3.2078629 ]],
+      dtype=float32),),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_cholesky attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<4x4xf32> loc("x")) -> (tensor<4x4xf32> {jax.result_info = "result"}) {
+    %cst = stablehlo.constant dense<0.000000e+00> : tensor<f32> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc)
+    %cst_1 = stablehlo.constant dense<2.000000e+00> : tensor<f32> loc(#loc)
+    %0 = stablehlo.transpose %arg0, dims = [1, 0] : (tensor<4x4xf32>) -> tensor<4x4xf32> loc(#loc5)
+    %1 = stablehlo.add %arg0, %0 : tensor<4x4xf32> loc(#loc6)
+    %2 = stablehlo.broadcast_in_dim %cst_1, dims = [] : (tensor<f32>) -> tensor<4x4xf32> loc(#loc7)
+    %3 = stablehlo.divide %1, %2 : tensor<4x4xf32> loc(#loc7)
+    %4:2 = stablehlo.custom_call @hipsolver_potrf_ffi(%3) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], []) {i=4, j=4, k=4, l=4}, custom>} : (tensor<4x4xf32>) -> (tensor<4x4xf32>, tensor<i32>) loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc4)
+    %6 = stablehlo.compare  EQ, %4#1, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f32>) -> tensor<4x4xf32> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %4#0, %8 : tensor<4x4xi1>, tensor<4x4xf32> loc(#loc4)
+    %11 = stablehlo.iota dim = 0 : tensor<4x4xi32> loc(#loc8)
+    %12 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<4x4xi32> loc(#loc6)
+    %13 = stablehlo.add %11, %12 : tensor<4x4xi32> loc(#loc6)
+    %14 = stablehlo.iota dim = 1 : tensor<4x4xi32> loc(#loc8)
+    %15 = stablehlo.compare  GE, %13, %14,  SIGNED : (tensor<4x4xi32>, tensor<4x4xi32>) -> tensor<4x4xi1> loc(#loc9)
+    %16 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<4x4xf32> loc(#loc10)
+    %17 = stablehlo.select %15, %10, %16 : tensor<4x4xi1>, tensor<4x4xf32> loc(#loc11)
+    return %17 : tensor<4x4xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":825:6)
+#loc3 = loc("jit(cholesky)"(#loc2))
+#loc4 = loc("cholesky"(#loc3))
+#loc5 = loc("transpose"(#loc3))
+#loc6 = loc("add"(#loc3))
+#loc7 = loc("div"(#loc3))
+#loc8 = loc("iota"(#loc3))
+#loc9 = loc("ge"(#loc3))
+#loc10 = loc("broadcast_in_dim"(#loc3))
+#loc11 = loc("select_n"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xdf\xa1'\x01E\x0f\x0f\x07\x0f\x0f\x0f\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x17\x0b\x0f\x0b\x0b\x0b#\x0b\x0b\x0b\x0b\x0f\x0b\x0f\x0b\x0f\x0b\x03M\x0fO\x0b\x0f\x0b\x0b\x0f\x13\x0b\x0b\x0b\x0b\x1f\x1f\x1f\x1fO\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x13\x0f\x0bO\x0f\x0f\x0b\x05\x11C\x13\x0f\x0f\x13\x0f\x0f\x0b\x01\x05\x0b\x0f\x03#\x17\x0f\x0f\x07\x17\x07\x07\x07\x13\x07\x17\x17\x13\x13\x13\x0f\x17\x02\x9a\x05\x1d\x1f\x03\x1d!#\x1f\x1d+\x03\x11\x03\x05\x1d-\x03\x1d7\x03\x03\x07\x11\x13\x15\t\x17\t\x05\x1f\x11\x01\x00\x05!\x05#\x05%\x1d\x1d\x05\x05'\x05)\x05+\x17%\xe6\x0c\r\x05-\x1d)\x03\x05/\x051\x053\x03\x071g3m5\x91\x055\x057\x059\x05;\x1d;\x03\x05=\x1d?\x03\x05?\x1dC\x03\x05A\x1f\x1d\x01\x1f\x1f!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x03\x03M\r\x01#\x1b\x03\x03S\r\x03UW\x1dC\x1dE\x1dG\x1dI\x1f\x07\t\x00\x00\x00\x00\x1f\x07\t\x00\x00\xc0\x7f\x1f\t\t\x00\x00\x00\x00\x1f\x07\t\x00\x00\x00@\x1f\x15!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\r\x03ik\x1dK\x05\x03\r\x03oq\x1dM\x1dO\x0b\x03\x1dQ\x1dS\x03\x01\x05\x01\x03\x03G\x03\x03\x81\x15\x03\x01\x01\x01\x03\x05G\x85\x1f!\x01\x07\x01\x1f\x15!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x13\x0b\x01\x13\x0b\x05\x07\x05\x15\t\x11\x11\x11\x11\x03\x93\x05\x99\x9f\x01\x01\x01\x01\x01\x13\x05\x95\x97\x11\x03\x01\x11\x03\x05\x13\x05\x9b\x9d\x11\x03\t\x11\x03\r\x13\x01\x01\t\x01\x02\x02)\x05\x11\x11\x11)\x01\x11)\x01\x13\x1d)\x05\x11\x11\x13\x01\t\x1b)\x03\t\x0b\x13)\x05\x11\x11\x0f\x11\x03\x05\x03\x05)\x03\x01\x0b)\x03\t\x17)\x03\x01\x17)\x01\x0f)\x05\x05\x05\x0f\x04.\x03\x05\x01Q\x05\x0f\x01\x07\x04\x06\x03\x03\x01\x05\x0fP\x05\x03\x07\x04\xda\x02\x031_\x03\x0b\x1b\x00\x05B\x05\x05\x03\x07\x05B\x01\x07\x03\x07\x05B\x05\t\x03\t\x05B\x05\x0b\x03\x07\x11F'\r\x03\x05\x03\x01\x07\x06\x07\x03\x05\x05\x01\x0b\x03F\x0b\x0f\x03\x05\x03\t\x13\x06\x0b\x03\x05\x05\r\x0f\x15G\x01/\x11\x05\x05\t\x03\x11\x03F\x01\x0f\x03\t\x03\x07\tF\x01\x13\x03#\x05\x15\x17\x03F\x01\x0f\x03%\x03\x19\x03F\x01\x0f\x03\x05\x03\x05\x03F\x01\x15\x03\x19\x03\x1b\x0b\x06\x01\x03\x05\x07\x1f\x13\x1d\rB\r\x17\x03\r\x03F\x07\x0f\x03\r\x03\x07\x07\x06\x07\x03\r\x05#%\rB\r\x19\x03\r\tF9\x1b\x03\x19\x05')\x03F=\x0f\x03\x05\x03\x03\x0b\x06A\x03\x05\x07+!-\x17\x04\x05\x03/\x06\x03\x01\x05\x01\x00b\x08U)\x03\x05\x1f\r\x0f\x0b\x0f!\x13#\x07\x0b%3)\t\t\x15_\x1d\x13\x05\x1b%)9\x15\x1f\x15\x1b\x11\x11\x15\x17\x0f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00add_v1\x00compare_v1\x00select_v1\x00iota_v1\x00func_v1\x00transpose_v1\x00divide_v1\x00custom_call_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_cholesky\x00x\x00cholesky\x00jit(cholesky)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00transpose\x00add\x00div\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00iota\x00ge\x00broadcast_in_dim\x00select_n\x00jax.result_info\x00result\x00main\x00public\x00lower\x00num_batch_dims\x000\x00\x00hipsolver_potrf_ffi\x00\x08W\x1d\x053\x01\x0bKOQY[\x03]\x03_\x03a\x03c\x03e\x03E\x11suwy{}\x7f\x83\x05I\x87\x03\x89\x03\x8b\x03\x8d\x05I\x8f",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_05["f64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_potrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 5),
+    inputs=(array([[ 22.512951744778434 ,  -1.5384549502899474,  -0.7079098803209338,
+         -7.513422195751226 ],
+       [ -1.5384549502899474,  20.359325409167592 , -11.28730444363775  ,
+        -16.410921233814605 ],
+       [ -0.7079098803209338, -11.28730444363775  ,   9.98412985373178  ,
+         16.396557441992236 ],
+       [ -7.513422195751226 , -16.410921233814605 ,  16.396557441992236 ,
+         30.554293874957157 ]]),),
+    expected_outputs=(array([[ 4.7447815276130925 ,  0.                 ,  0.                 ,
+         0.                 ],
+       [-0.3242414727288575 ,  4.500465851057001  ,  0.                 ,
+         0.                 ],
+       [-0.14919757131095024, -2.5187793573024955 ,  1.9020043342940942 ,
+         0.                 ],
+       [-1.5835127817846915 , -3.7605799733577596 ,  3.5164115306360086 ,
+         1.2408341372126808 ]]),),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_cholesky attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<4x4xf64> loc("x")) -> (tensor<4x4xf64> {jax.result_info = "result"}) {
+    %cst = stablehlo.constant dense<0.000000e+00> : tensor<f64> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i64> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc4)
+    %c_1 = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %cst_2 = stablehlo.constant dense<2.000000e+00> : tensor<f64> loc(#loc)
+    %0 = stablehlo.transpose %arg0, dims = [1, 0] : (tensor<4x4xf64>) -> tensor<4x4xf64> loc(#loc5)
+    %1 = stablehlo.add %arg0, %0 : tensor<4x4xf64> loc(#loc6)
+    %2 = stablehlo.broadcast_in_dim %cst_2, dims = [] : (tensor<f64>) -> tensor<4x4xf64> loc(#loc7)
+    %3 = stablehlo.divide %1, %2 : tensor<4x4xf64> loc(#loc7)
+    %4:2 = stablehlo.custom_call @hipsolver_potrf_ffi(%3) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], []) {i=4, j=4, k=4, l=4}, custom>} : (tensor<4x4xf64>) -> (tensor<4x4xf64>, tensor<i32>) loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %c_1, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc4)
+    %6 = stablehlo.compare  EQ, %4#1, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f64>) -> tensor<4x4xf64> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %4#0, %8 : tensor<4x4xi1>, tensor<4x4xf64> loc(#loc4)
+    %11 = stablehlo.iota dim = 0 : tensor<4x4xi64> loc(#loc8)
+    %12 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i64>) -> tensor<4x4xi64> loc(#loc6)
+    %13 = stablehlo.add %11, %12 : tensor<4x4xi64> loc(#loc6)
+    %14 = stablehlo.iota dim = 1 : tensor<4x4xi64> loc(#loc8)
+    %15 = stablehlo.compare  GE, %13, %14,  SIGNED : (tensor<4x4xi64>, tensor<4x4xi64>) -> tensor<4x4xi1> loc(#loc9)
+    %16 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<4x4xf64> loc(#loc10)
+    %17 = stablehlo.select %15, %10, %16 : tensor<4x4xi1>, tensor<4x4xf64> loc(#loc11)
+    return %17 : tensor<4x4xf64> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":825:6)
+#loc3 = loc("jit(cholesky)"(#loc2))
+#loc4 = loc("cholesky"(#loc3))
+#loc5 = loc("transpose"(#loc3))
+#loc6 = loc("add"(#loc3))
+#loc7 = loc("div"(#loc3))
+#loc8 = loc("iota"(#loc3))
+#loc9 = loc("ge"(#loc3))
+#loc10 = loc("broadcast_in_dim"(#loc3))
+#loc11 = loc("select_n"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xe3\xa3)\x01E\x0f\x0f\x07\x0f\x0f\x0f\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x17\x0b\x0f\x0b\x0b\x0b#\x0b\x0b\x0b\x0b\x0f\x0b\x0f\x0b\x0f\x0b\x03O\x0fO\x0b\x0f\x0b\x0b\x0f\x13\x0b\x0b\x0b\x0b///\x1f/O\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x13\x0f\x0bO\x0f\x0f\x0b\x05\x11C\x13\x0f\x0f\x13\x0f\x0f\x0b\x01\x05\x0b\x0f\x03%\x17\x0f\x07\x0f\x17\x07\x07\x0f\x13\x07\x17\x17\x07\x13\x13\x13\x0f\x17\x02\x02\x06\x1d\x1f\x03\x1d!#\x1f\x1d+\x03\x11\x03\x05\x1d-\x03\x1d7\x03\x03\x07\x11\x13\x15\t\x17\t\x05\x1f\x11\x01\x00\x05!\x05#\x05%\x1d\x1d\x05\x05'\x05)\x05+\x17%\xe6\x0c\r\x05-\x1d)\x03\x05/\x051\x053\x03\x071i3o5\x93\x055\x057\x059\x05;\x1d;\x03\x05=\x1d?\x03\x05?\x1dC\x03\x05A\x1f\x1f\x01\x1f!!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x03\x03M\r\x01#\x1b\x03\x03S\r\x03UW\x1dC\x1dE\x1dG\x1dI\x1f\x07\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x13\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x07\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x0b\t\x00\x00\x00\x00\x1f\x07\x11\x00\x00\x00\x00\x00\x00\x00@\x1f\x15!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\r\x03km\x1dK\x05\x03\r\x03qs\x1dM\x1dO\x0b\x03\x1dQ\x1dS\x03\x01\x05\x01\x03\x03G\x03\x03\x83\x15\x03\x01\x01\x01\x03\x05G\x87\x1f#\x01\x07\x01\x1f\x15!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x13\t\x01\x13\t\x05\x07\x05\x15\t\x11\x11\x11\x11\x03\x95\x05\x9b\xa1\x01\x01\x01\x01\x01\x13\x05\x97\x99\x11\x03\x01\x11\x03\x05\x13\x05\x9d\x9f\x11\x03\t\x11\x03\r\x13\x01\x01\t\x01\x02\x02)\x05\x11\x11\x11)\x01\x11\x1d)\x01\x1d)\x05\x11\x11\t\x01\x0b)\x01\t)\x03\t\t\x13)\x05\x11\x11\x0f\x11\x03\x05\x03\x05\x1b)\x03\x01\t)\x03\t\x17)\x03\x01\x17)\x01\x0f)\x05\x05\x05\x0f\x04F\x03\x05\x01Q\x05\x0f\x01\x07\x04\x1e\x03\x03\x01\x05\x0fP\x05\x03\x07\x04\xf2\x02\x033c\x03\x0b\x1b\x00\x05B\x05\x05\x03\x07\x05B\x05\x07\x03\x13\x05B\x01\t\x03\x07\x05B\x01\x0b\x03\x0b\x05B\x05\r\x03\x07\x11F'\x0f\x03\x05\x03\x01\x07\x06\x07\x03\x05\x05\x01\r\x03F\x0b\x11\x03\x05\x03\x0b\x13\x06\x0b\x03\x05\x05\x0f\x11\x15G\x01/\x13\x05\x05\x0b\x03\x13\x03F\x01\x11\x03\x0b\x03\t\tF\x01\x15\x03%\x05\x17\x19\x03F\x01\x11\x03'\x03\x1b\x03F\x01\x11\x03\x05\x03\x07\x03F\x01\x17\x03\x19\x03\x1d\x0b\x06\x01\x03\x05\x07!\x15\x1f\rB\r\x19\x03\r\x03F\x07\x11\x03\r\x03\x05\x07\x06\x07\x03\r\x05%'\rB\r\x1b\x03\r\tF9\x1d\x03\x19\x05)+\x03F=\x11\x03\x05\x03\x03\x0b\x06A\x03\x05\x07-#/\x17\x04\x05\x031\x06\x03\x01\x05\x01\x00b\x08U)\x03\x05\x1f\r\x0f\x0b\x0f!\x13#\x07\x0b%3)\t\t\x15_\x1d\x13\x05\x1b%)9\x15\x1f\x15\x1b\x11\x11\x15\x17\x0f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00add_v1\x00compare_v1\x00select_v1\x00iota_v1\x00func_v1\x00transpose_v1\x00divide_v1\x00custom_call_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_cholesky\x00x\x00cholesky\x00jit(cholesky)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00transpose\x00add\x00div\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00iota\x00ge\x00broadcast_in_dim\x00select_n\x00jax.result_info\x00result\x00main\x00public\x00lower\x00num_batch_dims\x000\x00\x00hipsolver_potrf_ffi\x00\x08[\x1f\x053\x01\x0bKOQY[\x03]\x03_\x03a\x03c\x03e\x03g\x03E\x11uwy{}\x7f\x81\x85\x05I\x89\x03\x8b\x03\x8d\x03\x8f\x05I\x91",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_05["c64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_potrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 5),
+    inputs=(array([[ 62.221153 -6.4815424e-08j, -22.13242  -1.0246023e+01j,
+          2.020702 +2.5961372e+01j, -10.631899 -4.9574718e+01j],
+       [-22.13242  +1.0246025e+01j,  78.902084 +1.7114758e-07j,
+          1.8615259+1.0474155e+01j,  24.668098 +1.4437879e+00j],
+       [  2.020702 -2.5961372e+01j,   1.8615259-1.0474156e+01j,
+         48.52617  +5.4661250e-08j, -31.667604 -9.3938026e+00j],
+       [-10.631899 +4.9574718e+01j,  24.668098 -1.4437873e+00j,
+        -31.667604 +9.3938026e+00j,  52.51258  +4.5532943e-08j]],
+      dtype=complex64),),
+    expected_outputs=(array([[ 7.8880386+0.j       ,  0.       +0.j       ,
+         0.       +0.j       ,  0.       +0.j       ],
+       [-2.8058202+1.2989317j,  8.327198 +0.j       ,
+         0.       +0.j       ,  0.       +0.j       ],
+       [ 0.2561729-3.2912328j,  0.8232526-2.3268344j,
+         5.6157303+0.j       ,  0.       +0.j       ],
+       [-1.3478507+6.284796j ,  1.5278549+1.7340113j,
+        -1.3997552+1.2887555j,  1.4952842+0.j       ]], dtype=complex64),),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_cholesky attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<4x4xcomplex<f32>> loc("x")) -> (tensor<4x4xcomplex<f32>> {jax.result_info = "result"}) {
+    %cst = stablehlo.constant dense<(0.000000e+00,0.000000e+00)> : tensor<complex<f32>> loc(#loc)
+    %cst_0 = stablehlo.constant dense<(0x7FC00000,0x7FC00000)> : tensor<complex<f32>> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc)
+    %cst_1 = stablehlo.constant dense<(2.000000e+00,0.000000e+00)> : tensor<complex<f32>> loc(#loc)
+    %0 = stablehlo.transpose %arg0, dims = [1, 0] : (tensor<4x4xcomplex<f32>>) -> tensor<4x4xcomplex<f32>> loc(#loc5)
+    %1 = stablehlo.real %0 : (tensor<4x4xcomplex<f32>>) -> tensor<4x4xf32> loc(#loc6)
+    %2 = stablehlo.imag %0 : (tensor<4x4xcomplex<f32>>) -> tensor<4x4xf32> loc(#loc6)
+    %3 = stablehlo.negate %2 : tensor<4x4xf32> loc(#loc6)
+    %4 = stablehlo.complex %1, %3 : tensor<4x4xcomplex<f32>> loc(#loc6)
+    %5 = stablehlo.add %arg0, %4 : tensor<4x4xcomplex<f32>> loc(#loc7)
+    %6 = stablehlo.broadcast_in_dim %cst_1, dims = [] : (tensor<complex<f32>>) -> tensor<4x4xcomplex<f32>> loc(#loc8)
+    %7 = stablehlo.divide %5, %6 : tensor<4x4xcomplex<f32>> loc(#loc8)
+    %8:2 = stablehlo.custom_call @hipsolver_potrf_ffi(%7) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], []) {i=4, j=4, k=4, l=4}, custom>} : (tensor<4x4xcomplex<f32>>) -> (tensor<4x4xcomplex<f32>>, tensor<i32>) loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc4)
+    %10 = stablehlo.compare  EQ, %8#1, %9,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %10, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f32>>) -> tensor<4x4xcomplex<f32>> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %8#0, %12 : tensor<4x4xi1>, tensor<4x4xcomplex<f32>> loc(#loc4)
+    %15 = stablehlo.iota dim = 0 : tensor<4x4xi32> loc(#loc9)
+    %16 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<4x4xi32> loc(#loc7)
+    %17 = stablehlo.add %15, %16 : tensor<4x4xi32> loc(#loc7)
+    %18 = stablehlo.iota dim = 1 : tensor<4x4xi32> loc(#loc9)
+    %19 = stablehlo.compare  GE, %17, %18,  SIGNED : (tensor<4x4xi32>, tensor<4x4xi32>) -> tensor<4x4xi1> loc(#loc10)
+    %20 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<4x4xcomplex<f32>> loc(#loc11)
+    %21 = stablehlo.select %19, %14, %20 : tensor<4x4xi1>, tensor<4x4xcomplex<f32>> loc(#loc12)
+    return %21 : tensor<4x4xcomplex<f32>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":825:6)
+#loc3 = loc("jit(cholesky)"(#loc2))
+#loc4 = loc("cholesky"(#loc3))
+#loc5 = loc("transpose"(#loc3))
+#loc6 = loc(""(#loc3))
+#loc7 = loc("add"(#loc3))
+#loc8 = loc("div"(#loc3))
+#loc9 = loc("iota"(#loc3))
+#loc10 = loc("ge"(#loc3))
+#loc11 = loc("broadcast_in_dim"(#loc3))
+#loc12 = loc("select_n"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x013\x07\x01\x05\t!\x01\x03\x0f\x03\x1f\x13\x17\x1b\x1f#'+/37;?CGK\x03\xe7\xa5+\x01I\x0f\x0f\x07\x0f\x0f\x0f\x0f\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x17\x0b\x0f\x0b\x0b\x0b\x0b#\x0b\x0b\x0b\x0b\x0f\x0b\x0f\x0b\x0f\x0b\x03M\x0fO\x0b\x0f\x0b\x0b\x0f\x13\x0b\x0b\x0b\x0b//\x1f/O\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x13\x0f\x0bO\x0f\x0f\x0b\x05\x11C\x13\x0f\x0f\x13\x0f\x0f\x0b\x01\x05\x0b\x0f\x03'\x17\x0f\x0f\x07\x17\x17\x07\x0b\x07\x07\x13\x07\x17\x17\x13\x13\x13\x0f\x17\x02\xfa\x05\x1d#%\x1d!\x01\x1f\x1d-\x01\x1d/\x01\x11\x03\x05\x1d1\x01\x1d;\x01\x03\x07\x13\x15\x17\x0b\x19\x0b\x05'\x11\x01\x00\x05)\x05+\x05-\x1d\x1f\x05\x05/\x051\x053\x17'\xe6\x0c\r\x055\x1d+\x01\x057\x059\x05;\x05=\x03\x075k7q9\x95\x05?\x05A\x05C\x05E\x1d?\x01\x05G\x1dC\x01\x05I\x1dG\x01\x05K\x1f!\x01\x1f#!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x03\x03Q\r\x01#\x1f\x03\x03W\r\x03Y[\x1dM\x1dO\x1dQ\x1dS\x1f\x07\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x07\x11\x00\x00\xc0\x7f\x00\x00\xc0\x7f\x1f\t\t\x00\x00\x00\x00\x1f\x07\x11\x00\x00\x00@\x00\x00\x00\x00\x1f\x19!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\r\x03mo\x1dU\x05\x03\r\x03su\x1dW\x1dY\x0b\x03\x1d9\x1d[\x03\x01\x05\x01\x03\x03K\x03\x03\x85\x15\x03\x01\x01\x01\x03\x05K\x89\x1f%\x01\x07\x01\x1f\x19!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x13\x0b\x01\x13\x0b\x05\x07\x05\x15\t\x11\x11\x11\x11\x03\x97\x05\x9d\xa3\x01\x01\x01\x01\x01\x13\x05\x99\x9b\x11\x03\x01\x11\x03\x05\x13\x05\x9f\xa1\x11\x03\t\x11\x03\r\x13\x01\x01\t\x01\x02\x02)\x05\x11\x11\x13)\x01\x13)\x01\x17\x1d)\x05\x11\x11\x17)\x05\x11\x11\x15\x01\x03\x15\t\x1b)\x03\t\x0b\x13)\x05\x11\x11\x11\x11\x03\x05\x03\x05)\x03\x01\x0b)\x03\t\x1b)\x03\x01\x1b)\x01\x11)\x05\x05\x05\x11\x04\xa2\x03\x05\x01Q\x05\x11\x01\x07\x04z\x03\x03\x01\x05\x0fP\x05\x03\x07\x04N\x03\x039o\x03\x0b\x1d\x00\x05B\x05\x05\x03\x07\x05B\x03\x07\x03\x07\x05B\x05\t\x03\t\x05B\x05\x0b\x03\x07\x11F)\r\x03\x05\x03\x01\x13\x06\x07\x03\x0f\x03\x0b\x15\x06\x07\x03\x0f\x03\x0b\x17\x06\x07\x03\x0f\x03\x0f\x19\x06\x07\x03\x05\x05\r\x11\x07\x06\t\x03\x05\x05\x01\x13\x03F\r\x0f\x03\x05\x03\t\x1b\x06\r\x03\x05\x05\x15\x17\x1dG\x033\x11\x05\x05\t\x03\x19\x03F\x03\x0f\x03\t\x03\x07\tF\x03\x13\x03'\x05\x1d\x1f\x03F\x03\x0f\x03)\x03!\x03F\x03\x0f\x03\x05\x03\x05\x03F\x03\x15\x03\x1d\x03#\x0b\x06\x03\x03\x05\x07'\x1b%\rB\x0f\x17\x03\r\x03F\t\x0f\x03\r\x03\x07\x07\x06\t\x03\r\x05+-\rB\x0f\x19\x03\r\tF=\x1b\x03\x1d\x05/1\x03FA\x0f\x03\x05\x03\x03\x0b\x06E\x03\x05\x073)5\x1f\x04\x05\x037\x06\x03\x01\x05\x01\x00\x06\t])\x05\x1f\r\x0f\x0b\x0f!\x13#\x07\x0b%3)\t\t\x03\x15_\x1d\x13\x05\x1b%)9\x15\x1f\x15\x17\x15\x11\x11\x1b\x11\x11\x15\x17\x0f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00add_v1\x00compare_v1\x00select_v1\x00iota_v1\x00func_v1\x00transpose_v1\x00real_v1\x00imag_v1\x00negate_v1\x00complex_v1\x00divide_v1\x00custom_call_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_cholesky\x00x\x00cholesky\x00jit(cholesky)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00transpose\x00\x00add\x00div\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00iota\x00ge\x00broadcast_in_dim\x00select_n\x00jax.result_info\x00result\x00main\x00public\x00lower\x00num_batch_dims\x000\x00hipsolver_potrf_ffi\x00\x08W\x1d\x057\x01\x0bOSU]_\x03a\x03c\x03e\x03g\x03i\x03I\x11wy{}\x7f\x81\x83\x87\x05M\x8b\x03\x8d\x03\x8f\x03\x91\x05M\x93",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_05["c128"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_potrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 12),
+    inputs=(array([[ 89.87952196174669   +0.j                ,
+             21.172589387233007  -0.5065005061603287j,
+             26.675332736174525 -21.04249820574197j  ,
+            -22.454631781241247  -0.2825311262043684j],
+           [ 21.172589387233007  +0.5065005061603287j,
+            124.54705989631825   +0.j                ,
+             19.85813796022367  -18.26763890302077j  ,
+              0.8537948497861074+40.151936454090915j ],
+           [ 26.675332736174525 +21.04249820574197j  ,
+             19.85813796022367  +18.26763890302077j  ,
+             80.50543748874053   +0.j                ,
+            -27.820142802134686 -26.403643030508185j ],
+           [-22.454631781241247  +0.2825311262043684j,
+              0.8537948497861074-40.151936454090915j ,
+            -27.820142802134686 +26.403643030508185j ,
+             68.7846809105664    +0.j                ]]),),
+    expected_outputs=(array([[ 9.480481103918022 +0.j                  ,
+             0.                +0.j                  ,
+             0.                +0.j                  ,
+             0.                +0.j                  ],
+           [ 2.233282167345174 +0.05342561211909446j ,
+            10.934196649105319 +0.j                  ,
+             0.                +0.j                  ,
+             0.                +0.j                  ],
+           [ 2.813710870131933 +2.219560165258458j   ,
+             1.2306113307857565+1.2310972103527822j  ,
+             8.03940400229041  +0.j                  ,
+             0.                +0.j                  ],
+           [-2.3685118439781885+0.029801349014619737j,
+             0.561701801775981 -3.689802896839719j   ,
+            -2.1606964535715916+3.270759732680002j   ,
+             5.820421952921915 +0.j                  ]]),),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_cholesky attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<4x4xcomplex<f64>> loc("x")) -> (tensor<4x4xcomplex<f64>> {jax.result_info = "result"}) {
+    %cst = stablehlo.constant dense<(0.000000e+00,0.000000e+00)> : tensor<complex<f64>> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i64> loc(#loc)
+    %cst_0 = stablehlo.constant dense<(0x7FF8000000000000,0x7FF8000000000000)> : tensor<complex<f64>> loc(#loc4)
+    %c_1 = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %cst_2 = stablehlo.constant dense<(2.000000e+00,0.000000e+00)> : tensor<complex<f64>> loc(#loc)
+    %0 = stablehlo.transpose %arg0, dims = [1, 0] : (tensor<4x4xcomplex<f64>>) -> tensor<4x4xcomplex<f64>> loc(#loc5)
+    %1 = stablehlo.real %0 : (tensor<4x4xcomplex<f64>>) -> tensor<4x4xf64> loc(#loc6)
+    %2 = stablehlo.imag %0 : (tensor<4x4xcomplex<f64>>) -> tensor<4x4xf64> loc(#loc6)
+    %3 = stablehlo.negate %2 : tensor<4x4xf64> loc(#loc6)
+    %4 = stablehlo.complex %1, %3 : tensor<4x4xcomplex<f64>> loc(#loc6)
+    %5 = stablehlo.add %arg0, %4 : tensor<4x4xcomplex<f64>> loc(#loc7)
+    %6 = stablehlo.broadcast_in_dim %cst_2, dims = [] : (tensor<complex<f64>>) -> tensor<4x4xcomplex<f64>> loc(#loc8)
+    %7 = stablehlo.divide %5, %6 : tensor<4x4xcomplex<f64>> loc(#loc8)
+    %8:2 = stablehlo.custom_call @hipsolver_potrf_ffi(%7) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], []) {i=4, j=4, k=4, l=4}, custom>} : (tensor<4x4xcomplex<f64>>) -> (tensor<4x4xcomplex<f64>>, tensor<i32>) loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %c_1, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc4)
+    %10 = stablehlo.compare  EQ, %8#1, %9,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %10, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f64>>) -> tensor<4x4xcomplex<f64>> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %8#0, %12 : tensor<4x4xi1>, tensor<4x4xcomplex<f64>> loc(#loc4)
+    %15 = stablehlo.iota dim = 0 : tensor<4x4xi64> loc(#loc9)
+    %16 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i64>) -> tensor<4x4xi64> loc(#loc7)
+    %17 = stablehlo.add %15, %16 : tensor<4x4xi64> loc(#loc7)
+    %18 = stablehlo.iota dim = 1 : tensor<4x4xi64> loc(#loc9)
+    %19 = stablehlo.compare  GE, %17, %18,  SIGNED : (tensor<4x4xi64>, tensor<4x4xi64>) -> tensor<4x4xi1> loc(#loc10)
+    %20 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<4x4xcomplex<f64>> loc(#loc11)
+    %21 = stablehlo.select %19, %14, %20 : tensor<4x4xi1>, tensor<4x4xcomplex<f64>> loc(#loc12)
+    return %21 : tensor<4x4xcomplex<f64>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":235:6)
+#loc3 = loc("jit(cholesky)"(#loc2))
+#loc4 = loc("cholesky"(#loc3))
+#loc5 = loc("transpose"(#loc3))
+#loc6 = loc(""(#loc3))
+#loc7 = loc("add"(#loc3))
+#loc8 = loc("div"(#loc3))
+#loc9 = loc("iota"(#loc3))
+#loc10 = loc("ge"(#loc3))
+#loc11 = loc("broadcast_in_dim"(#loc3))
+#loc12 = loc("select_n"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x013\x07\x01\x05\t!\x01\x03\x0f\x03\x1f\x13\x17\x1b\x1f#'+/37;?CGK\x03\xeb\xa7-\x01I\x0f\x0f\x07\x0f\x0f\x0f\x0f\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x17\x0b\x0f\x0b\x0b\x0b\x0b#\x0b\x0b\x0b\x0b\x0f\x0b\x0f\x0b\x0f\x0b\x03O\x0fO\x0b\x0f\x0b\x0b\x0f\x13\x0b\x0b\x0b\x0bO/O\x1fOO\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x13\x0f\x0bO\x0f\x0f\x0b\x05\x11C\x13\x0f\x0f\x13\x0f\x0f\x0b\x01\x05\x0b\x0f\x03)\x17\x0f\x07\x0f\x17\x17\x07\x0b\x07\x0f\x13\x07\x17\x17\x07\x13\x13\x13\x0f\x17\x02\x92\x06\x1d!\x03\x1d#%\x1f\x1d-\x03\x1d/\x03\x11\x03\x05\x1d1\x03\x1d;\x03\x03\x07\x13\x15\x17\x0b\x19\x0b\x05'\x11\x01\x00\x05)\x05+\x05-\x1d\x1f\x05\x05/\x051\x053\x17'\xae\x03\r\x055\x1d+\x03\x057\x059\x05;\x05=\x03\x075m7s9\x97\x05?\x05A\x05C\x05E\x1d?\x03\x05G\x1dC\x03\x05I\x1dG\x03\x05K\x1f#\x01\x1f%!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x03\x03Q\r\x01#\x1f\x03\x03W\r\x03Y[\x1dM\x1dO\x1dQ\x1dS\x1f\x07!\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x17\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x07!\x00\x00\x00\x00\x00\x00\xf8\x7f\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x0b\t\x00\x00\x00\x00\x1f\x07!\x00\x00\x00\x00\x00\x00\x00@\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x19!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\r\x03oq\x1dU\x05\x03\r\x03uw\x1dW\x1dY\x0b\x03\x1d9\x1d[\x03\x01\x05\x01\x03\x03K\x03\x03\x87\x15\x03\x01\x01\x01\x03\x05K\x8b\x1f'\x01\x07\x01\x1f\x19!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x13\t\x01\x13\t\x05\x07\x05\x15\t\x11\x11\x11\x11\x03\x99\x05\x9f\xa5\x01\x01\x01\x01\x01\x13\x05\x9b\x9d\x11\x03\x01\x11\x03\x05\x13\x05\xa1\xa3\x11\x03\t\x11\x03\r\x13\x01\x01\t\x01\x02\x02)\x05\x11\x11\x13)\x01\x13\x1d)\x01!)\x05\x11\x11\t)\x05\x11\x11\x15\x01\x03\x15\x0b)\x01\t)\x03\t\t\x13)\x05\x11\x11\x11\x11\x03\x05\x03\x05\x1b)\x03\x01\t)\x03\t\x1b)\x03\x01\x1b)\x01\x11)\x05\x05\x05\x11\x04\xba\x03\x05\x01Q\x05\x11\x01\x07\x04\x92\x03\x03\x01\x05\x0fP\x05\x03\x07\x04f\x03\x03;s\x03\x0b\x1d\x00\x05B\x05\x05\x03\x07\x05B\x05\x07\x03\x17\x05B\x01\t\x03\x07\x05B\x01\x0b\x03\x0b\x05B\x05\r\x03\x07\x11F)\x0f\x03\x05\x03\x01\x13\x06\x07\x03\x0f\x03\r\x15\x06\x07\x03\x0f\x03\r\x17\x06\x07\x03\x0f\x03\x11\x19\x06\x07\x03\x05\x05\x0f\x13\x07\x06\t\x03\x05\x05\x01\x15\x03F\r\x11\x03\x05\x03\x0b\x1b\x06\r\x03\x05\x05\x17\x19\x1dG\x013\x13\x05\x05\x0b\x03\x1b\x03F\x01\x11\x03\x0b\x03\t\tF\x01\x15\x03)\x05\x1f!\x03F\x01\x11\x03+\x03#\x03F\x01\x11\x03\x05\x03\x07\x03F\x01\x17\x03\x1d\x03%\x0b\x06\x01\x03\x05\x07)\x1d'\rB\x0f\x19\x03\r\x03F\t\x11\x03\r\x03\x05\x07\x06\t\x03\r\x05-/\rB\x0f\x1b\x03\r\tF=\x1d\x03\x1d\x0513\x03FA\x11\x03\x05\x03\x03\x0b\x06E\x03\x05\x075+7\x1f\x04\x05\x039\x06\x03\x01\x05\x01\x00\x06\t])\x05\x1f\r\x0f\x0b\x0f!\x13#\x07\x0b%3)\t\t\x03\x15_\x1d\x13\x05\x1b%)9\x15\x1f\x15\x17\x15\x11\x11\x1b\x11\x11\x15\x17\x0f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00add_v1\x00compare_v1\x00select_v1\x00iota_v1\x00func_v1\x00transpose_v1\x00real_v1\x00imag_v1\x00negate_v1\x00complex_v1\x00divide_v1\x00custom_call_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_cholesky\x00x\x00cholesky\x00jit(cholesky)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00transpose\x00\x00add\x00div\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00iota\x00ge\x00broadcast_in_dim\x00select_n\x00jax.result_info\x00result\x00main\x00public\x00lower\x00num_batch_dims\x000\x00hipsolver_potrf_ffi\x00\x08[\x1f\x057\x01\x0bOSU]_\x03a\x03c\x03e\x03g\x03i\x03k\x03I\x11y{}\x7f\x81\x83\x85\x89\x05M\x8d\x03\x8f\x03\x91\x03\x93\x05M\x95",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_pivots_to_permutation.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_pivots_to_permutation.py
new file mode 100644
index 000000000000..4be8bffe9356
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_pivots_to_permutation.py
@@ -0,0 +1,57 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import datetime
+import numpy as np
+array = np.array
+int32 = np.int32
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04 = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_lu_pivots_to_permutation'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[[0, 1, 2, 3, 4, 5, 6, 7],
+        [4, 5, 6, 7, 0, 1, 2, 3],
+        [0, 1, 2, 3, 4, 5, 6, 7]],
+
+       [[0, 1, 2, 3, 4, 5, 6, 7],
+        [0, 1, 2, 3, 4, 5, 6, 7],
+        [0, 1, 2, 3, 4, 5, 6, 7]]], dtype=int32),),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<2x3x8xi32> {jax.result_info = "result"}) {
+    %0 = stablehlo.iota dim = 0 : tensor<24xi32> loc(#loc7)
+    %1 = stablehlo.reshape %0 : (tensor<24xi32>) -> tensor<2x3x4xi32> loc(#loc8)
+    %2 = stablehlo.custom_call @hip_lu_pivots_to_permutation(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "2"}, operand_layouts = [dense<[2, 1, 0]> : tensor<3xindex>], result_layouts = [dense<[2, 1, 0]> : tensor<3xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, j, l]) {i=2, j=3, k=4, l=8}, custom>} : (tensor<2x3x4xi32>) -> tensor<2x3x8xi32> loc(#loc9)
+    return %2 : tensor<2x3x8xi32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":382:26)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":382:14)
+#loc3 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":383:11)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("iota"(#loc4))
+#loc8 = loc("reshape"(#loc5))
+#loc9 = loc("lu_pivots_to_permutation"(#loc6))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01\x1f\x07\x01\x05\t\r\x01\x03\x0f\x03\x0b\x13\x17\x1b\x1f#\x03\x95i\x15\x015\x07\x0b\x0b\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17#\x0b\x0b\x0b\x0f\x0b\x0f\x17\x03'\x0b\x0f\x0b\x0f\x13\x0b\x0b\x0b\x0b\x0f\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0bo\x05\x0f\x0f\x0f?\x17\x0f\x17\x0f\x01\x05\x0b\x0f\x03\x11\x07\x1b\x13\x13\x07\x1b\x13\x07\x02n\x03\x1f\x05\x13\x05\x15\x11\x03\x05\x03\x07\x0b\r\x0f\x07\x11\x07\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x17\x19\x05\x1f\x1d\x03\x1b\x17\x05\xfa\x055\x1d\x1f!\x05!\x1d\x03#\x17\x05\xfa\x05\x1d\x03\x07'I)K+_\x05#\x05%\x05'\x1d/1\x05)\x1d\x033\x17\x05\xfe\x05\x17\x03\x01\x03\x03Y#\t\x03\x03=\r\x03?A\x1d+\x1d-\x1d/\x1d1\x13\r\x01\r\x01\r\x03MO\x1d3\x1d5\x0b\x03\x1d7\x1d9\x05\x01\x1f\x111\x02\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x11\x03\x05\x15\t\t\r\x11!\x03a\x03e\x01\x01\x01\x01\x01\x13\x07[]c\x11\x03\t\x13\x07[]g\x11\x03\r\x01\t\x01\x02\x02\x1b)\x07\t\r!\x05\x11\x01\x03\x07)\x03a\x05\x1d)\x07\t\r\x11\x05)\x03\r\x13\x13\x04c\x05\x01Q\x01\t\x01\x07\x04Q\x03\x01\x05\x03P\x01\x03\x07\x04=\x03\x07\x11\x05B\x15\x05\x03\x0b\x07\x06\x1d\x03\x0f\x03\x01\tG-%\x07\x03\x07\x03\x03\x0b\x04\x01\x03\x05\x06\x03\x01\x05\x01\x00\xb2\x06;;\x03\x05\x1f\x0f\x0b\x0f!3%3)\x11\x0b\x19%)9_\x1d\x15\x1f\x17\x11\x11\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00func_v1\x00iota_v1\x00reshape_v1\x00custom_call_v1\x00return_v1\x00jit(<lambda>)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00iota\x00reshape\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00lu_pivots_to_permutation\x00jax.result_info\x00result\x00main\x00public\x00num_batch_dims\x002\x00\x00hip_lu_pivots_to_permutation\x00\x08+\t\x05'\x01\x0b59;CE\x03G\x11QSU5W757",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_rocsolver_getrf.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_rocsolver_getrf.py
new file mode 100644
index 000000000000..b940faa48f87
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_lu_rocsolver_getrf.py
@@ -0,0 +1,220 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# pyrefly: ignore-errors
+import datetime
+import numpy
+array = numpy.array
+complex64 = numpy.complex64
+float32 = numpy.float32
+int32 = numpy.int32
+
+
+data_2026_02_04 = {}
+
+
+data_2026_02_04['f32'] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_lu_pivots_to_permutation', 'hipsolver_getrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[ 8. ,  9. , 10. , 11. ],
+       [ 0. ,  1. ,  2. ,  3. ],
+       [ 0.5,  0.5,  0. ,  0. ]], dtype=float32), array([2, 2, 2], dtype=int32), array([2, 0, 1], dtype=int32)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<3x4xf32> {jax.result_info = "result[0]"}, tensor<3xi32> {jax.result_info = "result[1]"}, tensor<3xi32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc7)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc7)
+    %c_0 = stablehlo.constant dense<1> : tensor<i32> loc(#loc7)
+    %0 = stablehlo.iota dim = 0 : tensor<12xf32> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<12xf32>) -> tensor<3x4xf32> loc(#loc9)
+    %2:3 = stablehlo.custom_call @hipsolver_getrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<0> : tensor<1xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], [m], []) {i=3, j=4, k=3, l=4, m=3}, custom>} : (tensor<3x4xf32>) -> (tensor<3x4xf32>, tensor<3xi32>, tensor<i32>) loc(#loc7)
+    %3 = stablehlo.broadcast_in_dim %c_0, dims = [] : (tensor<i32>) -> tensor<3xi32> loc(#loc7)
+    %4 = stablehlo.subtract %2#1, %3 : tensor<3xi32> loc(#loc7)
+    %5 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc7)
+    %6 = stablehlo.compare  GE, %2#2, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc7)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc7)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<3x4xf32> loc(#loc7)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<3x4xi1> loc(#loc7)
+    %10 = stablehlo.select %9, %2#0, %8 : tensor<3x4xi1>, tensor<3x4xf32> loc(#loc7)
+    %11 = stablehlo.custom_call @hip_lu_pivots_to_permutation(%4) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<0> : tensor<1xindex>], result_layouts = [dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i])->([j]) {i=3, j=3}, custom>} : (tensor<3xi32>) -> tensor<3xi32> loc(#loc10)
+    return %10, %4, %11 : tensor<3x4xf32>, tensor<3xi32>, tensor<3xi32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":463:11)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:26)
+#loc3 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("lu"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01)\x07\x01\x05\t\x17\x01\x03\x0f\x03\x15\x13\x17\x1b\x1f#'+/37\x03\xe1\x9f+\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17##\x0f\x0b\x03K\x0b\x0f\x0b\x0b\x13\x0b\x0b\x0bO/\x0f\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f\x1f\x0f\x0b\x0b\x0b\x0f\x0f\x17\x17\x0f\x0b\x0bO\x0b\x05\x1b\x0f\x0fK\x13\x13\x0f\x0f\x0f\x0f\x0b7\x0f\x0f\x01\x05\x0b\x0f\x03'\x13\x0f\x17\x07\x07\x07\x07\x07\x0f\x1b\x13\x13\x13\x13\x13\x0f\x17\x17\x13\x02\xf6\x05\x1d\x1f\x0b\x1f\x05\x1d\x05\x1f\x11\x03\x05\x1d\x05!\x05!\x05#\x05%\x03\x07\x15\x17\x19\t\x1b\t\x05'\x11\x01\x00\x05)\x05+\x05-\x05/\x17\x07>\x07\x17\x1d%'\x051\x1d\x05)\x17\x07:\x075\x1d-/\x053\x1d\x051\x17\x07:\x07\x1d\x03\x07\rA\x0fC\x11\x89\x03\x07\rA\x0fC\x11\x99\x1d9\x0b\x055\x03\x01\x1f!\x01\x1d7\r\x01\r\x03mo\x0b\x03\x1d5\x05\x01\x1f\x1b!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f\x1d\x11\x00\x00\x00\x00\x00\x00\x00\x00\x03\x03M#\x17\x03\x07UY]\r\x03?W\x1d9\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\x15\t\x00\x00\xc0\x7f\x1f\x07\t\x00\x00\x00\x00\x1f\x07\t\x01\x00\x00\x00\x13\r\x01\x1dC\x1dE\x1dG\x03\x03K\x03\x03w\x15\x03\x01\x01\x01\x03\x07KM{\x1f\x1f\x01\t\x07\x07\x05\x1f)!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1dI\x11\x03\x01\x11\x03\x05\x15\x0b\r\x11\r\x11\r\x03\x8b\x07\x8d\x93\x97\x01\x01\x01\x01\x01\x13\x05\x85\x87\x13\x05\x8f\x91\x11\x03\t\x11\x03\r\x13\x03\x95\x11\x03\x11\x13\x01\x15\x05\r\r\x03\x9b\x03\x9d\x01\x01\x01\x01\x01\x13\x03\x85\x13\x03\x87\x01\t\x01\x02\x02)\x03\r\x13)\x01\x13)\x05\r\x11\x0b\t\x1d\x13\x01\x1b)\x01\x0b\x11\x01\x07\t\x05\x05)\x031\x0b)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0f)\x03\x01\r)\x01\x11)\x05\x05\x05\x11)\x05\r\x11\x11)\x03\t\r\x04N\x02\x05\x01Q\x03\x13\x01\x07\x04&\x02\x03\x01\x05\tP\x03\x03\x07\x04\xff\x03#A\x05B\x01\x05\x03\x15\x05B\x01\x07\x03\x07\x05B\x01\t\x03\x07\x0bB#\x0b\x03\x19\r\x06+\x03\t\x03\x07\x07G\x013\r\x07\t\x05\x07\x03\t\x03F\x01\x0f\x03\x05\x03\x05\x0f\x06\x01\x03\x05\x05\r\x11\x03F\x01\x0f\x03\x07\x03\x03\x11F\x01\x11\x03#\x05\x0f\x15\x03F\x01\x0f\x03%\x03\x17\x03F\x01\x0f\x03\t\x03\x01\x03F\x01\x13\x03'\x03\x19\x13\x06\x01\x03\t\x07\x1d\x0b\x1b\x07G75\x15\x03\x05\x03\x13\x15\x04\x03\x07\x1f\x13!\x06\x03\x01\x05\x01\x00*\x08K;)\x05\x1f\x0f\x0b\x15\x15\x15!\x03\x11\x0b\x07\x19%)9%3)_\x1d\x15\x15\x17\x19\x17\x11\x11\x1f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00iota_v1\x00reshape_v1\x00subtract_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00lu\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00num_batch_dims\x000\x00hipsolver_getrf_ffi\x00hip_lu_pivots_to_permutation\x00\x08W\x17\x05;\x01\x0b;QSac\x03e\x03g\x03i\x03k\x11EGq;Isuy\x03=\x05}\x7f\x03\x81\x11EG\x83;IO;O",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04['f64'] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_lu_pivots_to_permutation', 'hipsolver_getrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[ 8. ,  9. , 10. , 11. ],
+       [ 0. ,  1. ,  2. ,  3. ],
+       [ 0.5,  0.5,  0. ,  0. ]]), array([2, 2, 2], dtype=int32), array([2, 0, 1], dtype=int32)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<3x4xf64> {jax.result_info = "result[0]"}, tensor<3xi32> {jax.result_info = "result[1]"}, tensor<3xi32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc7)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc7)
+    %c_0 = stablehlo.constant dense<1> : tensor<i32> loc(#loc7)
+    %0 = stablehlo.iota dim = 0 : tensor<12xf64> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<12xf64>) -> tensor<3x4xf64> loc(#loc9)
+    %2:3 = stablehlo.custom_call @hipsolver_getrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<0> : tensor<1xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], [m], []) {i=3, j=4, k=3, l=4, m=3}, custom>} : (tensor<3x4xf64>) -> (tensor<3x4xf64>, tensor<3xi32>, tensor<i32>) loc(#loc7)
+    %3 = stablehlo.broadcast_in_dim %c_0, dims = [] : (tensor<i32>) -> tensor<3xi32> loc(#loc7)
+    %4 = stablehlo.subtract %2#1, %3 : tensor<3xi32> loc(#loc7)
+    %5 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc7)
+    %6 = stablehlo.compare  GE, %2#2, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc7)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc7)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<3x4xf64> loc(#loc7)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<3x4xi1> loc(#loc7)
+    %10 = stablehlo.select %9, %2#0, %8 : tensor<3x4xi1>, tensor<3x4xf64> loc(#loc7)
+    %11 = stablehlo.custom_call @hip_lu_pivots_to_permutation(%4) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<0> : tensor<1xindex>], result_layouts = [dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i])->([j]) {i=3, j=3}, custom>} : (tensor<3xi32>) -> tensor<3xi32> loc(#loc10)
+    return %10, %4, %11 : tensor<3x4xf64>, tensor<3xi32>, tensor<3xi32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":463:11)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:26)
+#loc3 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("lu"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01)\x07\x01\x05\t\x17\x01\x03\x0f\x03\x15\x13\x17\x1b\x1f#'+/37\x03\xe1\x9f+\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17##\x0f\x0b\x03K\x0b\x0f\x0b\x0b\x13\x0b\x0b\x0bO/\x0f\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x1f\x0f\x0b\x0b\x0b\x0f\x0f\x17\x17\x0f\x0b\x0bO\x0b\x05\x1b\x0f\x0fK\x13\x13\x0f\x0f\x0f\x0f\x0b7\x0f\x0f\x01\x05\x0b\x0f\x03'\x13\x0f\x17\x07\x07\x07\x07\x07\x0f\x1b\x13\x13\x13\x13\x13\x0f\x17\x17\x13\x02\x06\x06\x1d\x1f\x0b\x1f\x05\x1d\x05\x1f\x11\x03\x05\x1d\x05!\x05!\x05#\x05%\x03\x07\x15\x17\x19\t\x1b\t\x05'\x11\x01\x00\x05)\x05+\x05-\x05/\x17\x07>\x07\x17\x1d%'\x051\x1d\x05)\x17\x07:\x075\x1d-/\x053\x1d\x051\x17\x07:\x07\x1d\x03\x07\rA\x0fC\x11\x89\x03\x07\rA\x0fC\x11\x99\x1d9\x0b\x055\x03\x01\x1f!\x01\x1d7\r\x01\r\x03mo\x0b\x03\x1d5\x05\x01\x1f\x1b!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f\x1d\x11\x00\x00\x00\x00\x00\x00\x00\x00\x03\x03M#\x17\x03\x07UY]\r\x03?W\x1d9\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\x15\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x07\t\x00\x00\x00\x00\x1f\x07\t\x01\x00\x00\x00\x13\r\x01\x1dC\x1dE\x1dG\x03\x03K\x03\x03w\x15\x03\x01\x01\x01\x03\x07KM{\x1f\x1f\x01\t\x07\x07\x05\x1f)!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1dI\x11\x03\x01\x11\x03\x05\x15\x0b\r\x11\r\x11\r\x03\x8b\x07\x8d\x93\x97\x01\x01\x01\x01\x01\x13\x05\x85\x87\x13\x05\x8f\x91\x11\x03\t\x11\x03\r\x13\x03\x95\x11\x03\x11\x13\x01\x15\x05\r\r\x03\x9b\x03\x9d\x01\x01\x01\x01\x01\x13\x03\x85\x13\x03\x87\x01\t\x01\x02\x02)\x03\r\x13)\x01\x13)\x05\r\x11\x0b\x0b\x1d\x13\x01\x1b)\x01\x0b\x11\x01\x07\t\x05\x05)\x031\x0b)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0f)\x03\x01\r)\x01\x11)\x05\x05\x05\x11)\x05\r\x11\x11)\x03\t\r\x04N\x02\x05\x01Q\x03\x13\x01\x07\x04&\x02\x03\x01\x05\tP\x03\x03\x07\x04\xff\x03#A\x05B\x01\x05\x03\x15\x05B\x01\x07\x03\x07\x05B\x01\t\x03\x07\x0bB#\x0b\x03\x19\r\x06+\x03\t\x03\x07\x07G\x013\r\x07\t\x05\x07\x03\t\x03F\x01\x0f\x03\x05\x03\x05\x0f\x06\x01\x03\x05\x05\r\x11\x03F\x01\x0f\x03\x07\x03\x03\x11F\x01\x11\x03#\x05\x0f\x15\x03F\x01\x0f\x03%\x03\x17\x03F\x01\x0f\x03\t\x03\x01\x03F\x01\x13\x03'\x03\x19\x13\x06\x01\x03\t\x07\x1d\x0b\x1b\x07G75\x15\x03\x05\x03\x13\x15\x04\x03\x07\x1f\x13!\x06\x03\x01\x05\x01\x00*\x08K;)\x05\x1f\x0f\x0b\x15\x15\x15!\x03\x11\x0b\x07\x19%)9%3)_\x1d\x15\x15\x17\x19\x17\x11\x11\x1f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00iota_v1\x00reshape_v1\x00subtract_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00lu\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00num_batch_dims\x000\x00hipsolver_getrf_ffi\x00hip_lu_pivots_to_permutation\x00\x08W\x17\x05;\x01\x0b;QSac\x03e\x03g\x03i\x03k\x11EGq;Isuy\x03=\x05}\x7f\x03\x81\x11EG\x83;IO;O",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04['c64'] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_lu_pivots_to_permutation', 'hipsolver_getrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[ 8. +0.j,  9. +0.j, 10. +0.j, 11. +0.j],
+       [ 0. +0.j,  1. +0.j,  2. +0.j,  3. +0.j],
+       [ 0.5+0.j,  0.5+0.j,  0. +0.j,  0. +0.j]], dtype=complex64), array([2, 2, 2], dtype=int32), array([2, 0, 1], dtype=int32)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<3x4xcomplex<f32>> {jax.result_info = "result[0]"}, tensor<3xi32> {jax.result_info = "result[1]"}, tensor<3xi32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FC00000,0x7FC00000)> : tensor<complex<f32>> loc(#loc7)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc7)
+    %c_0 = stablehlo.constant dense<1> : tensor<i32> loc(#loc7)
+    %0 = stablehlo.iota dim = 0 : tensor<12xcomplex<f32>> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<12xcomplex<f32>>) -> tensor<3x4xcomplex<f32>> loc(#loc9)
+    %2:3 = stablehlo.custom_call @hipsolver_getrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<0> : tensor<1xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], [m], []) {i=3, j=4, k=3, l=4, m=3}, custom>} : (tensor<3x4xcomplex<f32>>) -> (tensor<3x4xcomplex<f32>>, tensor<3xi32>, tensor<i32>) loc(#loc7)
+    %3 = stablehlo.broadcast_in_dim %c_0, dims = [] : (tensor<i32>) -> tensor<3xi32> loc(#loc7)
+    %4 = stablehlo.subtract %2#1, %3 : tensor<3xi32> loc(#loc7)
+    %5 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc7)
+    %6 = stablehlo.compare  GE, %2#2, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc7)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc7)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<3x4xcomplex<f32>> loc(#loc7)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<3x4xi1> loc(#loc7)
+    %10 = stablehlo.select %9, %2#0, %8 : tensor<3x4xi1>, tensor<3x4xcomplex<f32>> loc(#loc7)
+    %11 = stablehlo.custom_call @hip_lu_pivots_to_permutation(%4) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<0> : tensor<1xindex>], result_layouts = [dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i])->([j]) {i=3, j=3}, custom>} : (tensor<3xi32>) -> tensor<3xi32> loc(#loc10)
+    return %10, %4, %11 : tensor<3x4xcomplex<f32>>, tensor<3xi32>, tensor<3xi32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":463:11)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:26)
+#loc3 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("lu"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01)\x07\x01\x05\t\x17\x01\x03\x0f\x03\x15\x13\x17\x1b\x1f#'+/37\x03\xe3\x9f-\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17##\x0f\x0b\x03K\x0b\x0f\x0b\x0b\x13\x0b\x0b\x0bO/\x0f\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x1f\x0f\x0b\x0b\x0b\x0f\x0f\x17\x17\x0f\x0b\x0bO\x0b\x05\x1b\x0f\x0fK\x13\x13\x0f\x0f\x0f\x0f\x0b7\x0f\x0f\x01\x05\x0b\x0f\x03)\x13\x0f\x17\x0b\x07\x07\x07\x07\x0f\x1b\x07\x13\x13\x13\x13\x13\x0f\x17\x17\x13\x02\x0e\x06\x1d\x1f\x0b\x1f\x05\x1d\x05\x1f\x11\x03\x05\x1d\x05!\x05!\x05#\x05%\x03\x07\x15\x17\x19\t\x1b\t\x05'\x11\x01\x00\x05)\x05+\x05-\x05/\x17\x07>\x07\x17\x1d%'\x051\x1d\x05)\x17\x07:\x075\x1d-/\x053\x1d\x051\x17\x07:\x07\x1d\x03\x07\rA\x0fC\x11\x89\x03\x07\rA\x0fC\x11\x99\x1d9\x0b\x055\x03\x01\x1f#\x01\x1d7\r\x01\r\x03mo\x0b\x03\x1d5\x05\x01\x1f\x1d!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f\x1f\x11\x00\x00\x00\x00\x00\x00\x00\x00\x03\x03M#\x17\x03\x07UY]\r\x03?W\x1d9\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\x15\x11\x00\x00\xc0\x7f\x00\x00\xc0\x7f\x1f\x07\t\x00\x00\x00\x00\x1f\x07\t\x01\x00\x00\x00\x13\r\x01\x1dC\x1dE\x1dG\x03\x03K\x03\x03w\x15\x03\x01\x01\x01\x03\x07KM{\x1f!\x01\t\x07\x07\x05\x1f+!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1dI\x11\x03\x01\x11\x03\x05\x15\x0b\r\x11\r\x11\r\x03\x8b\x07\x8d\x93\x97\x01\x01\x01\x01\x01\x13\x05\x85\x87\x13\x05\x8f\x91\x11\x03\t\x11\x03\r\x13\x03\x95\x11\x03\x11\x13\x01\x15\x05\r\r\x03\x9b\x03\x9d\x01\x01\x01\x01\x01\x13\x03\x85\x13\x03\x87\x01\t\x01\x02\x02)\x03\r\x13)\x01\x13)\x05\r\x11\x0b\x03\x19\x1d\x13\x01\x1b)\x01\x0b\x11\x01\x07\t\x05\x05\t)\x031\x0b)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0f)\x03\x01\r)\x01\x11)\x05\x05\x05\x11)\x05\r\x11\x11)\x03\t\r\x04N\x02\x05\x01Q\x03\x13\x01\x07\x04&\x02\x03\x01\x05\tP\x03\x03\x07\x04\xff\x03#A\x05B\x01\x05\x03\x15\x05B\x01\x07\x03\x07\x05B\x01\t\x03\x07\x0bB#\x0b\x03\x1b\r\x06+\x03\t\x03\x07\x07G\x013\r\x07\t\x05\x07\x03\t\x03F\x01\x0f\x03\x05\x03\x05\x0f\x06\x01\x03\x05\x05\r\x11\x03F\x01\x0f\x03\x07\x03\x03\x11F\x01\x11\x03%\x05\x0f\x15\x03F\x01\x0f\x03'\x03\x17\x03F\x01\x0f\x03\t\x03\x01\x03F\x01\x13\x03)\x03\x19\x13\x06\x01\x03\t\x07\x1d\x0b\x1b\x07G75\x15\x03\x05\x03\x13\x15\x04\x03\x07\x1f\x13!\x06\x03\x01\x05\x01\x00*\x08K;)\x05\x1f\x0f\x0b\x15\x15\x15!\x03\x11\x0b\x07\x19%)9%3)_\x1d\x15\x15\x17\x19\x17\x11\x11\x1f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00iota_v1\x00reshape_v1\x00subtract_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00lu\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00num_batch_dims\x000\x00hipsolver_getrf_ffi\x00hip_lu_pivots_to_permutation\x00\x08W\x17\x05;\x01\x0b;QSac\x03e\x03g\x03i\x03k\x11EGq;Isuy\x03=\x05}\x7f\x03\x81\x11EG\x83;IO;O",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04['c128'] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_lu_pivots_to_permutation', 'hipsolver_getrf_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[ 8. +0.j,  9. +0.j, 10. +0.j, 11. +0.j],
+       [ 0. +0.j,  1. +0.j,  2. +0.j,  3. +0.j],
+       [ 0.5+0.j,  0.5+0.j,  0. +0.j,  0. +0.j]]), array([2, 2, 2], dtype=int32), array([2, 0, 1], dtype=int32)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<3x4xcomplex<f64>> {jax.result_info = "result[0]"}, tensor<3xi32> {jax.result_info = "result[1]"}, tensor<3xi32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FF8000000000000,0x7FF8000000000000)> : tensor<complex<f64>> loc(#loc7)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc7)
+    %c_0 = stablehlo.constant dense<1> : tensor<i32> loc(#loc7)
+    %0 = stablehlo.iota dim = 0 : tensor<12xcomplex<f64>> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<12xcomplex<f64>>) -> tensor<3x4xcomplex<f64>> loc(#loc9)
+    %2:3 = stablehlo.custom_call @hipsolver_getrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<[0, 1]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[0, 1]> : tensor<2xindex>, dense<0> : tensor<1xindex>, dense<> : tensor<0xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j])->([k, l], [m], []) {i=3, j=4, k=3, l=4, m=3}, custom>} : (tensor<3x4xcomplex<f64>>) -> (tensor<3x4xcomplex<f64>>, tensor<3xi32>, tensor<i32>) loc(#loc7)
+    %3 = stablehlo.broadcast_in_dim %c_0, dims = [] : (tensor<i32>) -> tensor<3xi32> loc(#loc7)
+    %4 = stablehlo.subtract %2#1, %3 : tensor<3xi32> loc(#loc7)
+    %5 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<i32> loc(#loc7)
+    %6 = stablehlo.compare  GE, %2#2, %5,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1> loc(#loc7)
+    %7 = stablehlo.broadcast_in_dim %6, dims = [] : (tensor<i1>) -> tensor<1x1xi1> loc(#loc7)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<3x4xcomplex<f64>> loc(#loc7)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<1x1xi1>) -> tensor<3x4xi1> loc(#loc7)
+    %10 = stablehlo.select %9, %2#0, %8 : tensor<3x4xi1>, tensor<3x4xcomplex<f64>> loc(#loc7)
+    %11 = stablehlo.custom_call @hip_lu_pivots_to_permutation(%4) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "0"}, operand_layouts = [dense<0> : tensor<1xindex>], result_layouts = [dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i])->([j]) {i=3, j=3}, custom>} : (tensor<3xi32>) -> tensor<3xi32> loc(#loc10)
+    return %10, %4, %11 : tensor<3x4xcomplex<f64>>, tensor<3xi32>, tensor<3xi32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":463:11)
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:26)
+#loc3 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":462:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("lu"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01)\x07\x01\x05\t\x17\x01\x03\x0f\x03\x15\x13\x17\x1b\x1f#'+/37\x03\xe3\x9f-\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17##\x0f\x0b\x03K\x0b\x0f\x0b\x0b\x13\x0b\x0b\x0bO/\x0f\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0bO\x1f\x1f\x0f\x0b\x0b\x0b\x0f\x0f\x17\x17\x0f\x0b\x0bO\x0b\x05\x1b\x0f\x0fK\x13\x13\x0f\x0f\x0f\x0f\x0b7\x0f\x0f\x01\x05\x0b\x0f\x03)\x13\x0f\x17\x0b\x07\x07\x07\x07\x0f\x1b\x07\x13\x13\x13\x13\x13\x0f\x17\x17\x13\x02.\x06\x1d\x1f\x0b\x1f\x05\x1d\x05\x1f\x11\x03\x05\x1d\x05!\x05!\x05#\x05%\x03\x07\x15\x17\x19\t\x1b\t\x05'\x11\x01\x00\x05)\x05+\x05-\x05/\x17\x07>\x07\x17\x1d%'\x051\x1d\x05)\x17\x07:\x075\x1d-/\x053\x1d\x051\x17\x07:\x07\x1d\x03\x07\rA\x0fC\x11\x89\x03\x07\rA\x0fC\x11\x99\x1d9\x0b\x055\x03\x01\x1f#\x01\x1d7\r\x01\r\x03mo\x0b\x03\x1d5\x05\x01\x1f\x1d!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f\x1f\x11\x00\x00\x00\x00\x00\x00\x00\x00\x03\x03M#\x17\x03\x07UY]\r\x03?W\x1d9\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\x15!\x00\x00\x00\x00\x00\x00\xf8\x7f\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x07\t\x00\x00\x00\x00\x1f\x07\t\x01\x00\x00\x00\x13\r\x01\x1dC\x1dE\x1dG\x03\x03K\x03\x03w\x15\x03\x01\x01\x01\x03\x07KM{\x1f!\x01\t\x07\x07\x05\x1f+!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1dI\x11\x03\x01\x11\x03\x05\x15\x0b\r\x11\r\x11\r\x03\x8b\x07\x8d\x93\x97\x01\x01\x01\x01\x01\x13\x05\x85\x87\x13\x05\x8f\x91\x11\x03\t\x11\x03\r\x13\x03\x95\x11\x03\x11\x13\x01\x15\x05\r\r\x03\x9b\x03\x9d\x01\x01\x01\x01\x01\x13\x03\x85\x13\x03\x87\x01\t\x01\x02\x02)\x03\r\x13)\x01\x13)\x05\r\x11\x0b\x03\x19\x1d\x13\x01\x1b)\x01\x0b\x11\x01\x07\t\x05\x05\x0b)\x031\x0b)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0f)\x03\x01\r)\x01\x11)\x05\x05\x05\x11)\x05\r\x11\x11)\x03\t\r\x04N\x02\x05\x01Q\x03\x13\x01\x07\x04&\x02\x03\x01\x05\tP\x03\x03\x07\x04\xff\x03#A\x05B\x01\x05\x03\x15\x05B\x01\x07\x03\x07\x05B\x01\t\x03\x07\x0bB#\x0b\x03\x1b\r\x06+\x03\t\x03\x07\x07G\x013\r\x07\t\x05\x07\x03\t\x03F\x01\x0f\x03\x05\x03\x05\x0f\x06\x01\x03\x05\x05\r\x11\x03F\x01\x0f\x03\x07\x03\x03\x11F\x01\x11\x03%\x05\x0f\x15\x03F\x01\x0f\x03'\x03\x17\x03F\x01\x0f\x03\t\x03\x01\x03F\x01\x13\x03)\x03\x19\x13\x06\x01\x03\t\x07\x1d\x0b\x1b\x07G75\x15\x03\x05\x03\x13\x15\x04\x03\x07\x1f\x13!\x06\x03\x01\x05\x01\x00*\x08K;)\x05\x1f\x0f\x0b\x15\x15\x15!\x03\x11\x0b\x07\x19%)9%3)_\x1d\x15\x15\x17\x19\x17\x11\x11\x1f\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00iota_v1\x00reshape_v1\x00subtract_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00lu\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00num_batch_dims\x000\x00hipsolver_getrf_ffi\x00hip_lu_pivots_to_permutation\x00\x08W\x17\x05;\x01\x0b;QSac\x03e\x03g\x03i\x03k\x11EGq;Isuy\x03=\x05}\x7f\x03\x81\x11EG\x83;IO;O",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_qr_hipsolver_geqrf.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_qr_hipsolver_geqrf.py
new file mode 100644
index 000000000000..dbad849de98d
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_qr_hipsolver_geqrf.py
@@ -0,0 +1,284 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# pyrefly: ignore-errors
+# ruff: noqa
+
+import datetime
+import numpy as np
+
+array = np.array
+float32 = np.float32
+complex64 = np.complex64
+
+
+data_2026_02_04 = {}
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_geqrf_ffi', 'hipsolver_orgqr_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[[ 0.        ,  0.9128709 ,  0.40824834],
+        [-0.4472136 ,  0.3651484 , -0.81649655],
+        [-0.8944272 , -0.18257423,  0.40824828]],
+
+       [[-0.42426407,  0.8082909 ,  0.40824693],
+        [-0.5656854 ,  0.11546878, -0.81649673],
+        [-0.7071068 , -0.5773496 ,  0.40824923]]], dtype=float32), array([[[-6.7082038e+00, -8.0498447e+00, -9.3914852e+00],
+        [ 0.0000000e+00,  1.0954450e+00,  2.1908898e+00],
+        [ 0.0000000e+00,  0.0000000e+00,  4.8374091e-08]],
+
+       [[-2.1213203e+01, -2.2910263e+01, -2.4607315e+01],
+        [ 0.0000000e+00,  3.4641260e-01,  6.9282037e-01],
+        [ 0.0000000e+00,  0.0000000e+00, -1.8281829e-06]]], dtype=float32)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<2x3x3xf32> {jax.result_info = "result[0]"}, tensor<2x3x3xf32> {jax.result_info = "result[1]"}) {
+    %c = stablehlo.constant dense<-1> : tensor<i32> loc(#loc7)
+    %cst = stablehlo.constant dense<0.000000e+00> : tensor<f32> loc(#loc)
+    %0 = stablehlo.iota dim = 0 : tensor<18xf32> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<18xf32>) -> tensor<2x3x3xf32> loc(#loc9)
+    %2:2 = stablehlo.custom_call @hipsolver_geqrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xf32>) -> (tensor<2x3x3xf32>, tensor<2x3xf32>) loc(#loc10)
+    %3 = stablehlo.pad %2#0, %cst, low = [0, 0, 0], high = [0, 0, 0], interior = [0, 0, 0] : (tensor<2x3x3xf32>, tensor<f32>) -> tensor<2x3x3xf32> loc(#loc10)
+    %4 = stablehlo.custom_call @hipsolver_orgqr_ffi(%3, %2#1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k], [i, l])->([i, m, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xf32>, tensor<2x3xf32>) -> tensor<2x3x3xf32> loc(#loc10)
+    %5 = stablehlo.iota dim = 0 : tensor<3x3xi32> loc(#loc10)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<3x3xi32> loc(#loc10)
+    %7 = stablehlo.add %5, %6 : tensor<3x3xi32> loc(#loc10)
+    %8 = stablehlo.iota dim = 1 : tensor<3x3xi32> loc(#loc10)
+    %9 = stablehlo.compare  GE, %7, %8,  SIGNED : (tensor<3x3xi32>, tensor<3x3xi32>) -> tensor<3x3xi1> loc(#loc10)
+    %10 = stablehlo.broadcast_in_dim %9, dims = [1, 2] : (tensor<3x3xi1>) -> tensor<2x3x3xi1> loc(#loc10)
+    %11 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x3x3xf32> loc(#loc10)
+    %12 = stablehlo.select %10, %11, %2#0 : tensor<2x3x3xi1>, tensor<2x3x3xf32> loc(#loc10)
+    return %4, %12 : tensor<2x3x3xf32>, tensor<2x3x3xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":403:11)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:26)
+#loc3 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("qr"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xdf\x9d+\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17#\x0b#\x03I\x0b/\x0b\x0f\x0b\x13\x0b\x0b\x0b\x0fo\x13\x0f\x0b\x13\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f\x0b\x0b\x0b\x0f\x17O\x0b\x0f\x13\x0f\x0b\x0bO\x05\x1b\x0f\x17\x0f\x0f\x0fK\x0f\x0f\x17\x13K\x13\x17\x01\x05\x0b\x0f\x03'\x1b\x07\x07\x17\x0f\x07\x0f\x07\x07\x17\x13\x17\x13\x13\x13\x13\x17\x1b\x13\x02v\x06\x1d7\x0b\x1f\x05\x1f\x05!\x11\x03\x05\x1d\x05#\x05#\x05%\x05'\x03\x07\x15\x17\x19\t\x1b\t\x05)\x11\x01\x00\x05+\x05-\x05/\x1d!\x0b\x051\x17\x07N\x06\x17\x1d')\x053\x1d\x05+\x17\x07J\x065\x1d/1\x055\x1d\x053\x17\x07J\x06\x1d\x03\x07\rC\x0fE\x11\x8d\x057\x03\x07\rC\x0fE\x11\x97\x03\x01\x1f!\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1d9\x13\x07\x01\r\x01\r\x03ik\x0b\x03\x1d7\x05\x01\x03\x03O\x1f\x1d1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x05Os\x1f#\x01#\x17\x03\x05Y]\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\r\t\xff\xff\xff\xff\x1f\x11\t\x00\x00\x00\x00\x1dC\x1dE\x1dG\x03\x03q\x15\x03\x01\x01\x01\x1f\x1f!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1dI\x03\x03y\x15\x01\x01\x01\x13\x07\x05\t\x07\x07\x05\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x13\x07\x83\x8f\x91\x11\x03\r\x11\x03\x11\x11\x03\x15\x15\r\t\r\r\r\r\r\x03\x85\x05\x93\x95\x01\x01\x01\x01\x01\x11\x03\x05\x11\x03\t\x13\x07\x83\x87\x89\x13\x05\x83\x8b\x15\r\t\r\r\r\r\r\x05\x85\x99\x03\x9b\x01\x01\x01\x01\x01\x13\x05\x83\x87\x13\x07\x83\x89\x8b\x01\t\x01\x02\x02)\x07\t\r\r\t\x1d\t)\x05\r\r\x0f)\x01\x0f\x1b)\x01\t\x13\x01\x11\x01\x05\x05\x05)\x03I\t)\x05\t\r\t)\x03\r\x13)\x03\t\x13)\x03\r\x07)\x03\x01\x07)\x05\r\r\x15)\x07\t\r\r\x15)\x03\t\x07\x04F\x02\x05\x01Q\x03\x13\x01\x07\x04\x1e\x02\x03\x01\x05\x0bP\x03\x03\x07\x04\xfb\x03!A\x07B\x1f\x05\x03\r\x07B\x03\x07\x03\x11\x03B%\t\x03\x19\r\x06-\x03\x05\x03\x05\tG\x015\x0b\x05\x05\x1b\x03\x07\x0fF\x01\r\x03\x05\x05\t\x03\tG\x019\x0f\x03\x05\x05\r\x0b\x03B\x01\t\x03\x0b\x05F\x01\x11\x03\x0b\x03\x01\x11\x06\x01\x03\x0b\x05\x11\x13\x03B\x01\x13\x03\x0b\x13F\x01\x15\x03%\x05\x15\x17\x05F\x01\x17\x03'\x03\x19\x05F\x01\x11\x03\x05\x03\x03\x15\x06\x01\x03\x05\x07\x1b\x1d\t\x17\x04\x03\x05\x0f\x1f\x06\x03\x01\x05\x01\x00\x0e\x08K))\x05\x1f\x0f\x0b\x15\x15!\x03\x11\x0b\x07\x19%)9%3)s\x1d\x15\x15\x17\x0f\x0f\x17\x11\x1f\x19)\x11\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00iota_v1\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00reshape_v1\x00pad_v1\x00add_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00qr\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00main\x00public\x00num_batch_dims\x001\x00hipsolver_geqrf_ffi\x00hipsolver_orgqr_ffi\x00\x08_\x19\x05;\x01\x0b;UWac\x03e\x03g\x03A\x11GIm;KMoQ\x07===\x11GIu;KQwM\x03S\x03{\x05}\x7f\x03\x81",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["f64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_geqrf_ffi', 'hipsolver_orgqr_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[[ 0.                 ,  0.9128709291752773 ,
+          0.408248290463862  ],
+        [-0.447213595499958  ,  0.36514837167011   ,
+         -0.8164965809277264 ],
+        [-0.894427190999916  , -0.18257418583505472,
+          0.4082482904638633 ]],
+
+       [[-0.42426406871192857,  0.8082903768654768 ,
+          0.4082482904638614 ],
+        [-0.565685424949238  ,  0.11547005383792366,
+         -0.8164965809277263 ],
+        [-0.7071067811865476 , -0.577350269189625  ,
+          0.4082482904638642 ]]]), array([[[-6.7082039324993694e+00, -8.0498447189992444e+00,
+         -9.3914855054991175e+00],
+        [ 0.0000000000000000e+00,  1.0954451150103344e+00,
+          2.1908902300206661e+00],
+        [ 0.0000000000000000e+00,  0.0000000000000000e+00,
+         -1.7577018578317312e-15]],
+
+       [[-2.1213203435596427e+01, -2.2910259710444144e+01,
+         -2.4607315985291855e+01],
+        [ 0.0000000000000000e+00,  3.4641016151377924e-01,
+          6.9282032302755281e-01],
+        [ 0.0000000000000000e+00,  0.0000000000000000e+00,
+         -1.8103038069914667e-15]]])),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<2x3x3xf64> {jax.result_info = "result[0]"}, tensor<2x3x3xf64> {jax.result_info = "result[1]"}) {
+    %c = stablehlo.constant dense<-1> : tensor<i64> loc(#loc7)
+    %cst = stablehlo.constant dense<0.000000e+00> : tensor<f64> loc(#loc)
+    %0 = stablehlo.iota dim = 0 : tensor<18xf64> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<18xf64>) -> tensor<2x3x3xf64> loc(#loc9)
+    %2:2 = stablehlo.custom_call @hipsolver_geqrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xf64>) -> (tensor<2x3x3xf64>, tensor<2x3xf64>) loc(#loc10)
+    %3 = stablehlo.pad %2#0, %cst, low = [0, 0, 0], high = [0, 0, 0], interior = [0, 0, 0] : (tensor<2x3x3xf64>, tensor<f64>) -> tensor<2x3x3xf64> loc(#loc10)
+    %4 = stablehlo.custom_call @hipsolver_orgqr_ffi(%3, %2#1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k], [i, l])->([i, m, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xf64>, tensor<2x3xf64>) -> tensor<2x3x3xf64> loc(#loc10)
+    %5 = stablehlo.iota dim = 0 : tensor<3x3xi64> loc(#loc10)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i64>) -> tensor<3x3xi64> loc(#loc10)
+    %7 = stablehlo.add %5, %6 : tensor<3x3xi64> loc(#loc10)
+    %8 = stablehlo.iota dim = 1 : tensor<3x3xi64> loc(#loc10)
+    %9 = stablehlo.compare  GE, %7, %8,  SIGNED : (tensor<3x3xi64>, tensor<3x3xi64>) -> tensor<3x3xi1> loc(#loc10)
+    %10 = stablehlo.broadcast_in_dim %9, dims = [1, 2] : (tensor<3x3xi1>) -> tensor<2x3x3xi1> loc(#loc10)
+    %11 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x3x3xf64> loc(#loc10)
+    %12 = stablehlo.select %10, %11, %2#0 : tensor<2x3x3xi1>, tensor<2x3x3xf64> loc(#loc10)
+    return %4, %12 : tensor<2x3x3xf64>, tensor<2x3x3xf64> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":403:11)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:26)
+#loc3 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("qr"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xdd\x9d)\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17#\x0b#\x03I\x0b/\x0b\x0f\x0b\x13\x0b\x0b\x0b\x0fo\x13\x0f\x0b\x13\x13\x0b\x13\x0b\x0b\x0b//\x0b\x0b\x0b\x0f\x17O\x0b\x0f\x13\x0f\x0b\x0bO\x05\x1b\x0f\x17\x0f\x0f\x0fK\x0f\x0f\x17\x13K\x13\x17\x01\x05\x0b\x0f\x03%\x1b\x07\x07\x17\x0f\x0f\x07\x07\x17\x13\x17\x13\x13\x13\x13\x17\x1b\x13\x02\x92\x06\x1d7\x0b\x1f\x05\x1f\x05!\x11\x03\x05\x1d\x05#\x05#\x05%\x05'\x03\x07\x15\x17\x19\t\x1b\t\x05)\x11\x01\x00\x05+\x05-\x05/\x1d!\x0b\x051\x17\x07N\x06\x17\x1d')\x053\x1d\x05+\x17\x07J\x065\x1d/1\x055\x1d\x053\x17\x07J\x06\x1d\x03\x07\rC\x0fE\x11\x8d\x057\x03\x07\rC\x0fE\x11\x97\x03\x01\x1f\x1f\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1d9\x13\x07\x01\r\x01\r\x03ik\x0b\x03\x1d7\x05\x01\x03\x03O\x1f\x1b1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x05Os\x1f!\x01#\x15\x03\x05Y]\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\r\x11\xff\xff\xff\xff\xff\xff\xff\xff\x1f\x0f\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1dC\x1dE\x1dG\x03\x03q\x15\x03\x01\x01\x01\x1f\x1d!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1dI\x03\x03y\x15\x01\x01\x01\x13\x07\x05\t\x07\x07\x05\x1f'!\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x13\x07\x83\x8f\x91\x11\x03\r\x11\x03\x11\x11\x03\x15\x15\r\t\r\r\r\r\r\x03\x85\x05\x93\x95\x01\x01\x01\x01\x01\x11\x03\x05\x11\x03\t\x13\x07\x83\x87\x89\x13\x05\x83\x8b\x15\r\t\r\r\r\r\r\x05\x85\x99\x03\x9b\x01\x01\x01\x01\x01\x13\x05\x83\x87\x13\x07\x83\x89\x8b\x01\t\x01\x02\x02)\x07\t\r\r\t\x1d\x0b)\x05\r\r\x07)\x01\x07)\x01\t\x13\x01\x11\x01\x05\x05\x05)\x03I\t)\x05\t\r\t)\x03\r\x11)\x03\t\x11)\x03\r\x07)\x03\x01\x07)\x05\r\r\x13)\x07\t\r\r\x13)\x03\t\x07\x04F\x02\x05\x01Q\x03\x13\x01\x07\x04\x1e\x02\x03\x01\x05\x0bP\x03\x03\x07\x04\xfb\x03!A\x07B\x1f\x05\x03\r\x07B\x03\x07\x03\x0f\x03B%\t\x03\x17\r\x06-\x03\x05\x03\x05\tG\x015\x0b\x05\x05\x19\x03\x07\x0fF\x01\r\x03\x05\x05\t\x03\tG\x019\x0f\x03\x05\x05\r\x0b\x03B\x01\t\x03\x0b\x05F\x01\x11\x03\x0b\x03\x01\x11\x06\x01\x03\x0b\x05\x11\x13\x03B\x01\x13\x03\x0b\x13F\x01\x15\x03#\x05\x15\x17\x05F\x01\x17\x03%\x03\x19\x05F\x01\x11\x03\x05\x03\x03\x15\x06\x01\x03\x05\x07\x1b\x1d\t\x17\x04\x03\x05\x0f\x1f\x06\x03\x01\x05\x01\x00\x0e\x08K))\x05\x1f\x0f\x0b\x15\x15!\x03\x11\x0b\x07\x19%)9%3)s\x1d\x15\x15\x17\x0f\x0f\x17\x11\x1f\x19)\x11\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00iota_v1\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00reshape_v1\x00pad_v1\x00add_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00qr\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00main\x00public\x00num_batch_dims\x001\x00hipsolver_geqrf_ffi\x00hipsolver_orgqr_ffi\x00\x08_\x19\x05;\x01\x0b;UWac\x03e\x03g\x03A\x11GIm;KMoQ\x07===\x11GIu;KQwM\x03S\x03{\x05}\x7f\x03\x81",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["c64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_geqrf_ffi', 'hipsolver_orgqr_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[[ 0.         -0.j,  0.9128708  +0.j,  0.4082482  +0.j],
+        [-0.4472136  -0.j,  0.36514837 +0.j, -0.81649655 +0.j],
+        [-0.8944272  -0.j, -0.18257421 +0.j,  0.40824828 +0.j]],
+
+       [[-0.42426407 -0.j,  0.8082913  +0.j,  0.4082465  +0.j],
+        [-0.5656854  -0.j,  0.115468234+0.j, -0.81649685 +0.j],
+        [-0.7071068  -0.j, -0.57734936 +0.j,  0.4082496  +0.j]]],
+      dtype=complex64), array([[[-6.7082038e+00+0.j, -8.0498447e+00+0.j, -9.3914852e+00+0.j],
+        [ 0.0000000e+00+0.j,  1.0954450e+00+0.j,  2.1908901e+00+0.j],
+        [ 0.0000000e+00+0.j,  0.0000000e+00+0.j,  0.0000000e+00+0.j]],
+
+       [[-2.1213203e+01+0.j, -2.2910263e+01+0.j, -2.4607315e+01+0.j],
+        [ 0.0000000e+00+0.j,  3.4641233e-01+0.j,  6.9282043e-01+0.j],
+        [ 0.0000000e+00+0.j,  0.0000000e+00+0.j, -1.9669533e-06+0.j]]],
+      dtype=complex64)),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<2x3x3xcomplex<f32>> {jax.result_info = "result[0]"}, tensor<2x3x3xcomplex<f32>> {jax.result_info = "result[1]"}) {
+    %c = stablehlo.constant dense<-1> : tensor<i32> loc(#loc7)
+    %cst = stablehlo.constant dense<(0.000000e+00,0.000000e+00)> : tensor<complex<f32>> loc(#loc)
+    %0 = stablehlo.iota dim = 0 : tensor<18xcomplex<f32>> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<18xcomplex<f32>>) -> tensor<2x3x3xcomplex<f32>> loc(#loc9)
+    %2:2 = stablehlo.custom_call @hipsolver_geqrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xcomplex<f32>>) -> (tensor<2x3x3xcomplex<f32>>, tensor<2x3xcomplex<f32>>) loc(#loc10)
+    %3 = stablehlo.pad %2#0, %cst, low = [0, 0, 0], high = [0, 0, 0], interior = [0, 0, 0] : (tensor<2x3x3xcomplex<f32>>, tensor<complex<f32>>) -> tensor<2x3x3xcomplex<f32>> loc(#loc10)
+    %4 = stablehlo.custom_call @hipsolver_orgqr_ffi(%3, %2#1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k], [i, l])->([i, m, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xcomplex<f32>>, tensor<2x3xcomplex<f32>>) -> tensor<2x3x3xcomplex<f32>> loc(#loc10)
+    %5 = stablehlo.iota dim = 0 : tensor<3x3xi32> loc(#loc10)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<3x3xi32> loc(#loc10)
+    %7 = stablehlo.add %5, %6 : tensor<3x3xi32> loc(#loc10)
+    %8 = stablehlo.iota dim = 1 : tensor<3x3xi32> loc(#loc10)
+    %9 = stablehlo.compare  GE, %7, %8,  SIGNED : (tensor<3x3xi32>, tensor<3x3xi32>) -> tensor<3x3xi1> loc(#loc10)
+    %10 = stablehlo.broadcast_in_dim %9, dims = [1, 2] : (tensor<3x3xi1>) -> tensor<2x3x3xi1> loc(#loc10)
+    %11 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<2x3x3xcomplex<f32>> loc(#loc10)
+    %12 = stablehlo.select %10, %11, %2#0 : tensor<2x3x3xi1>, tensor<2x3x3xcomplex<f32>> loc(#loc10)
+    return %4, %12 : tensor<2x3x3xcomplex<f32>>, tensor<2x3x3xcomplex<f32>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":403:11)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:26)
+#loc3 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("qr"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xe1\x9d-\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17#\x0b#\x03I\x0b/\x0b\x0f\x0b\x13\x0b\x0b\x0b\x0fo\x13\x0f\x0b\x13\x13\x0b\x13\x0b\x0b\x0b\x1f/\x0b\x0b\x0b\x0f\x17O\x0b\x0f\x13\x0f\x0b\x0bO\x05\x1b\x0f\x17\x0f\x0f\x0fK\x0f\x0f\x17\x13K\x13\x17\x01\x05\x0b\x0f\x03)\x1b\x07\x0b\x17\x0f\x07\x0f\x07\x07\x17\x07\x13\x17\x13\x13\x13\x13\x17\x1b\x13\x02\x8e\x06\x1d7\x0b\x1f\x05\x1f\x05!\x11\x03\x05\x1d\x05#\x05#\x05%\x05'\x03\x07\x15\x17\x19\t\x1b\t\x05)\x11\x01\x00\x05+\x05-\x05/\x1d!\x0b\x051\x17\x07N\x06\x17\x1d')\x053\x1d\x05+\x17\x07J\x065\x1d/1\x055\x1d\x053\x17\x07J\x06\x1d\x03\x07\rC\x0fE\x11\x8d\x057\x03\x07\rC\x0fE\x11\x97\x03\x01\x1f#\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1d9\x13\x07\x01\r\x01\r\x03ik\x0b\x03\x1d7\x05\x01\x03\x03O\x1f\x1f1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x05Os\x1f%\x01#\x17\x03\x05Y]\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\r\t\xff\xff\xff\xff\x1f\x11\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1dC\x1dE\x1dG\x03\x03q\x15\x03\x01\x01\x01\x1f!!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1dI\x03\x03y\x15\x01\x01\x01\x13\x07\x05\t\x07\x07\x05\x1f+!\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x13\x07\x83\x8f\x91\x11\x03\r\x11\x03\x11\x11\x03\x15\x15\r\t\r\r\r\r\r\x03\x85\x05\x93\x95\x01\x01\x01\x01\x01\x11\x03\x05\x11\x03\t\x13\x07\x83\x87\x89\x13\x05\x83\x8b\x15\r\t\r\r\r\r\r\x05\x85\x99\x03\x9b\x01\x01\x01\x01\x01\x13\x05\x83\x87\x13\x07\x83\x89\x8b\x01\t\x01\x02\x02)\x07\t\r\r\t\x1d\x03\x19)\x05\r\r\x0f)\x01\x0f\x1b)\x01\t\x13\x01\x11\x01\x05\x05\x05\t)\x03I\t)\x05\t\r\t)\x03\r\x13)\x03\t\x13)\x03\r\x07)\x03\x01\x07)\x05\r\r\x15)\x07\t\r\r\x15)\x03\t\x07\x04F\x02\x05\x01Q\x03\x13\x01\x07\x04\x1e\x02\x03\x01\x05\x0bP\x03\x03\x07\x04\xfb\x03!A\x07B\x1f\x05\x03\r\x07B\x03\x07\x03\x11\x03B%\t\x03\x1b\r\x06-\x03\x05\x03\x05\tG\x015\x0b\x05\x05\x1d\x03\x07\x0fF\x01\r\x03\x05\x05\t\x03\tG\x019\x0f\x03\x05\x05\r\x0b\x03B\x01\t\x03\x0b\x05F\x01\x11\x03\x0b\x03\x01\x11\x06\x01\x03\x0b\x05\x11\x13\x03B\x01\x13\x03\x0b\x13F\x01\x15\x03'\x05\x15\x17\x05F\x01\x17\x03)\x03\x19\x05F\x01\x11\x03\x05\x03\x03\x15\x06\x01\x03\x05\x07\x1b\x1d\t\x17\x04\x03\x05\x0f\x1f\x06\x03\x01\x05\x01\x00\x0e\x08K))\x05\x1f\x0f\x0b\x15\x15!\x03\x11\x0b\x07\x19%)9%3)s\x1d\x15\x15\x17\x0f\x0f\x17\x11\x1f\x19)\x11\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00iota_v1\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00reshape_v1\x00pad_v1\x00add_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00qr\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00main\x00public\x00num_batch_dims\x001\x00hipsolver_geqrf_ffi\x00hipsolver_orgqr_ffi\x00\x08_\x19\x05;\x01\x0b;UWac\x03e\x03g\x03A\x11GIm;KMoQ\x07===\x11GIu;KQwM\x03S\x03{\x05}\x7f\x03\x81",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["c128"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_geqrf_ffi', 'hipsolver_orgqr_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(),
+    expected_outputs=(array([[[ 0.                 -0.j,  0.9128709291752763 +0.j,
+          0.4082482904638633 +0.j],
+        [-0.44721359549995787-0.j,  0.3651483716701112 +0.j,
+         -0.8164965809277258 +0.j],
+        [-0.8944271909999157 -0.j, -0.1825741858350558 +0.j,
+          0.4082482904638628 +0.j]],
+
+       [[-0.42426406871192857-0.j,  0.8082903768654766 +0.j,
+          0.4082482904638618 +0.j],
+        [-0.565685424949238  -0.j,  0.11547005383792402+0.j,
+         -0.8164965809277261 +0.j],
+        [-0.7071067811865476 -0.j, -0.5773502691896252 +0.j,
+          0.40824829046386385+0.j]]]), array([[[-6.7082039324993694e+00+0.j, -8.0498447189992426e+00+0.j,
+         -9.3914855054991158e+00+0.j],
+        [ 0.0000000000000000e+00+0.j,  1.0954451150103306e+00+0.j,
+          2.1908902300206621e+00+0.j],
+        [ 0.0000000000000000e+00+0.j,  0.0000000000000000e+00+0.j,
+          0.0000000000000000e+00+0.j]],
+
+       [[-2.1213203435596427e+01+0.j, -2.2910259710444144e+01+0.j,
+         -2.4607315985291855e+01+0.j],
+        [ 0.0000000000000000e+00+0.j,  3.4641016151378073e-01+0.j,
+          6.9282032302755370e-01+0.j],
+        [ 0.0000000000000000e+00+0.j,  0.0000000000000000e+00+0.j,
+         -2.1094237467877974e-15+0.j]]])),
+    mlir_module_text=r"""
+module @jit__lambda attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main() -> (tensor<2x3x3xcomplex<f64>> {jax.result_info = "result[0]"}, tensor<2x3x3xcomplex<f64>> {jax.result_info = "result[1]"}) {
+    %c = stablehlo.constant dense<-1> : tensor<i64> loc(#loc7)
+    %cst = stablehlo.constant dense<(0.000000e+00,0.000000e+00)> : tensor<complex<f64>> loc(#loc)
+    %0 = stablehlo.iota dim = 0 : tensor<18xcomplex<f64>> loc(#loc8)
+    %1 = stablehlo.reshape %0 : (tensor<18xcomplex<f64>>) -> tensor<2x3x3xcomplex<f64>> loc(#loc9)
+    %2:2 = stablehlo.custom_call @hipsolver_geqrf_ffi(%1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xcomplex<f64>>) -> (tensor<2x3x3xcomplex<f64>>, tensor<2x3xcomplex<f64>>) loc(#loc10)
+    %3 = stablehlo.pad %2#0, %cst, low = [0, 0, 0], high = [0, 0, 0], interior = [0, 0, 0] : (tensor<2x3x3xcomplex<f64>>, tensor<complex<f64>>) -> tensor<2x3x3xcomplex<f64>> loc(#loc10)
+    %4 = stablehlo.custom_call @hipsolver_orgqr_ffi(%3, %2#1) {mhlo.backend_config = {}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k], [i, l])->([i, m, n]) {i=2, j=3, k=3, l=3, m=3, n=3}, custom>} : (tensor<2x3x3xcomplex<f64>>, tensor<2x3xcomplex<f64>>) -> tensor<2x3x3xcomplex<f64>> loc(#loc10)
+    %5 = stablehlo.iota dim = 0 : tensor<3x3xi64> loc(#loc10)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i64>) -> tensor<3x3xi64> loc(#loc10)
+    %7 = stablehlo.add %5, %6 : tensor<3x3xi64> loc(#loc10)
+    %8 = stablehlo.iota dim = 1 : tensor<3x3xi64> loc(#loc10)
+    %9 = stablehlo.compare  GE, %7, %8,  SIGNED : (tensor<3x3xi64>, tensor<3x3xi64>) -> tensor<3x3xi1> loc(#loc10)
+    %10 = stablehlo.broadcast_in_dim %9, dims = [1, 2] : (tensor<3x3xi1>) -> tensor<2x3x3xi1> loc(#loc10)
+    %11 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<2x3x3xcomplex<f64>> loc(#loc10)
+    %12 = stablehlo.select %10, %11, %2#0 : tensor<2x3x3xi1>, tensor<2x3x3xcomplex<f64>> loc(#loc10)
+    return %4, %12 : tensor<2x3x3xcomplex<f64>>, tensor<2x3x3xcomplex<f64>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc1 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":403:11)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:26)
+#loc3 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":402:14)
+#loc4 = loc("jit(<lambda>)"(#loc1))
+#loc5 = loc("jit(<lambda>)"(#loc2))
+#loc6 = loc("jit(<lambda>)"(#loc3))
+#loc7 = loc("qr"(#loc4))
+#loc8 = loc("iota"(#loc5))
+#loc9 = loc("reshape"(#loc6))
+#loc10 = loc(""(#loc4))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01+\x07\x01\x05\t\x19\x01\x03\x0f\x03\x17\x13\x17\x1b\x1f#'+/37;\x03\xdf\x9d+\x01;\x0f\x07\x0b\x0b\x0f\x0f\x0b\x0b\x0b#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x17\x0f\x0b\x0f\x17\x0f\x0b\x0f\x17#\x0b#\x03I\x0b/\x0b\x0f\x0b\x13\x0b\x0b\x0b\x0fo\x13\x0f\x0b\x13\x13\x0b\x13\x0b\x0b\x0b/O\x0b\x0b\x0b\x0f\x17O\x0b\x0f\x13\x0f\x0b\x0bO\x05\x1b\x0f\x17\x0f\x0f\x0fK\x0f\x0f\x17\x13K\x13\x17\x01\x05\x0b\x0f\x03'\x1b\x07\x0b\x17\x0f\x0f\x07\x07\x17\x07\x13\x17\x13\x13\x13\x13\x17\x1b\x13\x02\xba\x06\x1d7\x0b\x1f\x05\x1f\x05!\x11\x03\x05\x1d\x05#\x05#\x05%\x05'\x03\x07\x15\x17\x19\t\x1b\t\x05)\x11\x01\x00\x05+\x05-\x05/\x1d!\x0b\x051\x17\x07N\x06\x17\x1d')\x053\x1d\x05+\x17\x07J\x065\x1d/1\x055\x1d\x053\x17\x07J\x06\x1d\x03\x07\rC\x0fE\x11\x8d\x057\x03\x07\rC\x0fE\x11\x97\x03\x01\x1f!\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1d9\x13\x07\x01\r\x01\r\x03ik\x0b\x03\x1d7\x05\x01\x03\x03O\x1f\x1d1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x05Os\x1f#\x01#\x15\x03\x05Y]\r\x03?[\x1d;\r\x03?_\x1d=\x1d?\x1dA\x1f\r\x11\xff\xff\xff\xff\xff\xff\xff\xff\x1f\x0f!\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1dC\x1dE\x1dG\x03\x03q\x15\x03\x01\x01\x01\x1f\x1f!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1dI\x03\x03y\x15\x01\x01\x01\x13\x07\x05\t\x07\x07\x05\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x13\x07\x83\x8f\x91\x11\x03\r\x11\x03\x11\x11\x03\x15\x15\r\t\r\r\r\r\r\x03\x85\x05\x93\x95\x01\x01\x01\x01\x01\x11\x03\x05\x11\x03\t\x13\x07\x83\x87\x89\x13\x05\x83\x8b\x15\r\t\r\r\r\r\r\x05\x85\x99\x03\x9b\x01\x01\x01\x01\x01\x13\x05\x83\x87\x13\x07\x83\x89\x8b\x01\t\x01\x02\x02)\x07\t\r\r\t\x1d\x03\x17)\x05\r\r\x07)\x01\x07)\x01\t\x13\x01\x11\x01\x05\x05\x05\x0b)\x03I\t)\x05\t\r\t)\x03\r\x11)\x03\t\x11)\x03\r\x07)\x03\x01\x07)\x05\r\r\x13)\x07\t\r\r\x13)\x03\t\x07\x04F\x02\x05\x01Q\x03\x13\x01\x07\x04\x1e\x02\x03\x01\x05\x0bP\x03\x03\x07\x04\xfb\x03!A\x07B\x1f\x05\x03\r\x07B\x03\x07\x03\x0f\x03B%\t\x03\x19\r\x06-\x03\x05\x03\x05\tG\x015\x0b\x05\x05\x1b\x03\x07\x0fF\x01\r\x03\x05\x05\t\x03\tG\x019\x0f\x03\x05\x05\r\x0b\x03B\x01\t\x03\x0b\x05F\x01\x11\x03\x0b\x03\x01\x11\x06\x01\x03\x0b\x05\x11\x13\x03B\x01\x13\x03\x0b\x13F\x01\x15\x03%\x05\x15\x17\x05F\x01\x17\x03'\x03\x19\x05F\x01\x11\x03\x05\x03\x03\x15\x06\x01\x03\x05\x07\x1b\x1d\t\x17\x04\x03\x05\x0f\x1f\x06\x03\x01\x05\x01\x00\x0e\x08K))\x05\x1f\x0f\x0b\x15\x15!\x03\x11\x0b\x07\x19%)9%3)s\x1d\x15\x15\x17\x0f\x0f\x17\x11\x1f\x19)\x11\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00iota_v1\x00broadcast_in_dim_v1\x00constant_v1\x00custom_call_v1\x00func_v1\x00reshape_v1\x00pad_v1\x00add_v1\x00compare_v1\x00select_v1\x00return_v1\x00jit(<lambda>)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit__lambda\x00qr\x00iota\x00reshape\x00\x00jax.result_info\x00result[0]\x00result[1]\x00main\x00public\x00num_batch_dims\x001\x00hipsolver_geqrf_ffi\x00hipsolver_orgqr_ffi\x00\x08_\x19\x05;\x01\x0b;UWac\x03e\x03g\x03A\x11GIm;KMoQ\x07===\x11GIu;KQwM\x03S\x03{\x05}\x7f\x03\x81",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_svd_hipsolver_gesvd.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_svd_hipsolver_gesvd.py
new file mode 100644
index 000000000000..0ab4f9d644cf
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_svd_hipsolver_gesvd.py
@@ -0,0 +1,908 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# type: ignore
+# ruff: noqa
+
+import datetime
+import numpy as np
+
+array = np.array
+float32 = np.float32
+complex64 = np.complex64
+
+data_2026_02_04 = {"jacobi": {}, "qr": {}, "gesdd": {}}
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["jacobi"]["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvdj_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 3.7223358 , -1.2193766 ,  1.795808  ,  1.0418197 ],
+        [ 4.6901207 ,  0.11149647,  3.8279397 ,  8.07944   ],
+        [-3.763075  ,  9.478659  ,  0.14772141,  0.86707467],
+        [ 3.7043862 , -5.310245  ,  7.1758327 ,  3.8767374 ]],
+
+       [[-3.2586122 ,  8.368001  ,  3.8854764 , -9.429428  ],
+        [ 1.1301196 ,  9.584712  , -0.7165561 , -3.439898  ],
+        [ 4.4551563 , -5.166789  ,  1.8632321 ,  4.3077874 ],
+        [-1.3375099 , -1.1678746 ,  7.680391  ,  1.983631  ]]],
+      dtype=float32),),
+    expected_outputs=(array([[[-0.26312542 , -0.02221384 ,  0.19764648 , -0.94403785 ],
+        [-0.5306547  , -0.6105559  ,  0.5214799  ,  0.27145126 ],
+        [ 0.44124788 , -0.7911463  , -0.3813815  , -0.18421714 ],
+        [-0.6741445  , -0.028558023, -0.73725355 ,  0.0342183  ]],
+
+       [[-0.741788   ,  0.3681162  ,  0.2151611  , -0.51763594 ],
+        [-0.51899517 , -0.25662977 , -0.7801523  ,  0.2369551  ],
+        [ 0.41801134 ,  0.17694637 , -0.549365   , -0.70153725 ],
+        [ 0.07524119 ,  0.87596905 , -0.20800538 ,  0.42866164 ]]],
+      dtype=float32), array([[14.886929 ,  9.745339 ,  3.74923  ,  2.0411706],
+       [17.598677 ,  8.969212 ,  5.1799684,  2.7928188]], dtype=float32), array([[[-0.5122628   ,  0.53899616  , -0.48876467  , -0.4562667   ],
+        [-0.007687226 , -0.75814134  , -0.27693856  , -0.59031165  ],
+        [ 0.5029314   ,  0.03124599  , -0.79899544  ,  0.32816154  ],
+        [-0.69612336  , -0.3656894   , -0.2145239   ,  0.57936424  ]],
+
+       [[ 0.20412575  , -0.76308864  , -0.06554903  ,  0.60969806  ],
+        [-0.20881027  , -0.14679018  ,  0.9668265   , -0.0098668765],
+        [-0.72434616  , -0.5011017   , -0.2367066   , -0.41010973  ],
+        [-0.6245429   ,  0.38084862  , -0.07014099  ,  0.6782189   ]]],
+      dtype=float32)),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf32> loc("operand")) -> (tensor<2x4x4xf32> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x4x4xf32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvdj_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xf32>) -> (tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32>, tensor<2x4x4xf32>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.transpose %0#3, dims = [0, 2, 1] : (tensor<2x4x4xf32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %2 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %3 = stablehlo.compare  EQ, %0#4, %2,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %6 = stablehlo.broadcast_in_dim %4, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %7 = stablehlo.select %6, %0#1, %5 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %10 = stablehlo.broadcast_in_dim %8, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %11 = stablehlo.select %10, %0#2, %9 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %14 = stablehlo.broadcast_in_dim %12, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %15 = stablehlo.select %14, %1, %13 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    return %11, %7, %15 : tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01%\x07\x01\x05\t\x13\x01\x03\x0f\x03\x11\x13\x17\x1b\x1f#'+/\x03\xe7\x9d3\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03So\x0f\x0b/\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f\x1b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/o\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x03/\x1b\x07\x17\x07\x07\x07\x0f\x0f\x07\x13\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x02~\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x19\x11\x01\x00\x05\x1b\x05\x1d\x05\x1f\x1d\x15\x03\x05!\x05#\x1d\x1b\x1d\x05%\x17\x1f\xb6\t\x1b\x05'\x03\x07#Q%W'}\x05)\x05+\x05-\x1f!1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f'\x01\x1d/\x1f-\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x1f\x191\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#\x1f\x03\x07=AE\r\x03-?\x1d1\r\x03-C\x1d3\r\x03-G\x1d5\x1d7\x1d9\x1f\x11\t\x00\x00\xc0\x7f\x1f\x13\t\x00\x00\x00\x00\r\x05S1U1\x1d;\x1d=\r\x03Y[\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x05\x01\x03\x03)\x03\x03k\x15\x03\x01\x01\x01\x03\x0b)o))q\x1f#!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f%\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x191\x00\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f1!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x7f\x0b\x85\x8b\x8f\x95\x9b\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x07{\x91\x93\x11\x03\x19\x11\x03\x1d\x13\x07{\x97\x99\x11\x03!\x11\x03%\x13\x03{\x01\t\x01\x02\x02)\x07\t\x11\x11\r\x01)\x05\t\x11\r\x1d\t\x13)\x01\r)\x01\x15\x1b)\x03\t\x15)\x03\r\x0b)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b\x04\xe2\x02\x05\x01Q\x03\x07\x01\x07\x04\xba\x02\x03\x01\x05\tP\x03\x03\x07\x04\x8e\x02\x03/O\x03\x0b\x13\x00\x07B\x03\x05\x03\x11\x07B\x01\x07\x03\x13\x0bG\x01!\t\x0b\x05\t\x05\x05\x17\x03\x01\rF\x01\x0b\x03\x05\x03\r\x03F\x01\r\x03\x17\x03\x05\x0fF\x01\x0f\x03)\x05\x0f\x13\x03F\x01\x11\x03+\x03\x15\x03F\x01\r\x03\t\x03\x03\x03F\x01\x13\x03/\x03\x17\x05\x06\x01\x03\t\x07\x1b\t\x19\x03F\x01\x11\x03\x1b\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1d\x03\x1f\x05\x06\x01\x03\x05\x07#\x0b!\x03F\x01\x11\x03\x1b\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1d\x03'\x05\x06\x01\x03\x05\x07+\x11)\x11\x04\x03\x07%\x1d-\x06\x03\x01\x05\x01\x00\xca\x07G+\x03\x05\x1f\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1b\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00transpose_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00num_batch_dims\x001\x00\x00hipsolver_gesvdj_ffi\x00\x08I\x17\x05#\x01\x0b59;IK\x03M\x03O\x11]_acegim\x03s\x03+\x05uw\x03/\x03y\x033",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["jacobi"]["f64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvdj_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 6.765010292858648 , -8.41155960620905  , -4.844896569854504 ,
+          9.95142460562528  ],
+        [-2.3172669439509725, -2.377110651443677 , -6.845706401083533 ,
+         -0.2688427639827662],
+        [ 5.816161074813861 , -1.7232775955098916,  5.541301732723863 ,
+          6.036680333196475 ],
+        [-8.991063432111106 , -5.6496730486346936,  6.836412081386392 ,
+         -0.5190364760940618]],
+
+       [[-6.141369069758367 ,  5.548388466467886 ,  0.3686736359214944,
+         -5.673263508349118 ],
+        [-6.44854045236065  , -6.90827339890318  , -3.6114354632331853,
+          1.485277184786895 ],
+        [ 5.029310351636605 ,  3.1332466505034784, -2.6674713013275557,
+         -3.478972614333551 ],
+        [-6.013442048617872 , -3.3540895366085755, -2.4965517430649165,
+          6.810791397528835 ]]]),),
+    expected_outputs=(array([[[-0.8582826839566826  ,  0.1513382685059182  ,
+          0.36013035494839635 , -0.3327967703426305  ],
+        [-0.06441044954508533 , -0.29407362148116534 ,
+          0.6308874214363143  ,  0.7150895472678866  ],
+        [-0.3777672731992751  ,  0.4538714107552889  ,
+         -0.5233373280534688  ,  0.61433758705165    ],
+        [ 0.34131219683611846 ,  0.8274165674758919  ,
+          0.4454270198181023  , -0.02196766198937948 ]],
+
+       [[-0.17339573460073665 , -0.9777805849977806  ,
+          0.05338819597560617 ,  0.10501784302745319 ],
+        [ 0.6262340205527418  , -0.1769136278875054  ,
+         -0.7175042887139369  , -0.24843533453825947 ],
+        [-0.41056955000343537 ,  0.11049263814893846 ,
+         -0.6153961832518882  ,  0.6637104482859019  ],
+        [ 0.6396854815724643  , -0.020930188340448217,
+          0.32190811398066105 ,  0.697667240190373   ]]]), array([[17.334179944404195 , 12.265833831731298 , 10.472378382078709 ,
+         0.3060234958213206],
+       [14.908186073428876 ,  9.911591222615328 ,  5.124458445072229 ,
+         3.603674967389374 ]]), array([[[-0.6301394090884883  ,  0.35163487969387064 ,
+          0.2791741088511297  , -0.6335132622474965  ],
+        [-0.25227095254238124 , -0.4916685588357358  ,
+          0.7705568653330496  ,  0.3175901636446802  ],
+        [-0.5800330711340123  , -0.5866488459963135  ,
+         -0.5651544995632785  ,  0.002271454472501866],
+        [-0.4503835343435822  ,  0.5389416212599115  ,
+         -0.09436273554037346 ,  0.7055439568214439  ]],
+
+       [[-0.5959813910148998  , -0.5849296973169651  ,
+         -0.18965121472926696 ,  0.5164260329537445  ],
+        [ 0.7897127913564964  , -0.3820311302146965  ,
+          0.003626822614449421,  0.47999246751645436 ],
+        [-0.14280833301192955 ,  0.438102406219792   ,
+          0.6730066572461373  ,  0.5785620977813557  ],
+        [ 0.027670720161007956,  0.5656639871938048  ,
+         -0.7148995049738235  ,  0.4100942362749819  ]]])),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf64> loc("operand")) -> (tensor<2x4x4xf64> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x4x4xf64> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvdj_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xf64>) -> (tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x4x4xf64>, tensor<2x4x4xf64>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.transpose %0#3, dims = [0, 2, 1] : (tensor<2x4x4xf64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %2 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %3 = stablehlo.compare  EQ, %0#4, %2,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %6 = stablehlo.broadcast_in_dim %4, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %7 = stablehlo.select %6, %0#1, %5 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %10 = stablehlo.broadcast_in_dim %8, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %11 = stablehlo.select %10, %0#2, %9 : tensor<2x4x4xi1>, tensor<2x4x4xf64> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %3, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %14 = stablehlo.broadcast_in_dim %12, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %15 = stablehlo.select %14, %1, %13 : tensor<2x4x4xi1>, tensor<2x4x4xf64> loc(#loc4)
+    return %11, %7, %15 : tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x4x4xf64> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01%\x07\x01\x05\t\x13\x01\x03\x0f\x03\x11\x13\x17\x1b\x1f#'+/\x03\xe7\x9d3\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03So\x0f\x0b/\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x1b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/o\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x03/\x1b\x07\x17\x07\x07\x07\x0f\x0f\x07\x13\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x02\x8e\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x19\x11\x01\x00\x05\x1b\x05\x1d\x05\x1f\x1d\x15\x03\x05!\x05#\x1d\x1b\x1d\x05%\x17\x1f\xb6\t\x1b\x05'\x03\x07#Q%W'}\x05)\x05+\x05-\x1f!1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f'\x01\x1d/\x1f-\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x1f\x191\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#\x1f\x03\x07=AE\r\x03-?\x1d1\r\x03-C\x1d3\r\x03-G\x1d5\x1d7\x1d9\x1f\x11\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x13\t\x00\x00\x00\x00\r\x05S1U1\x1d;\x1d=\r\x03Y[\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x05\x01\x03\x03)\x03\x03k\x15\x03\x01\x01\x01\x03\x0b)o))q\x1f#!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f%\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x191\x00\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f1!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x7f\x0b\x85\x8b\x8f\x95\x9b\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x07{\x91\x93\x11\x03\x19\x11\x03\x1d\x13\x07{\x97\x99\x11\x03!\x11\x03%\x13\x03{\x01\t\x01\x02\x02)\x07\t\x11\x11\r\x01)\x05\t\x11\r\x1d\x0b\x13)\x01\r)\x01\x15\x1b)\x03\t\x15)\x03\r\x0b)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b\x04\xe2\x02\x05\x01Q\x03\x07\x01\x07\x04\xba\x02\x03\x01\x05\tP\x03\x03\x07\x04\x8e\x02\x03/O\x03\x0b\x13\x00\x07B\x03\x05\x03\x11\x07B\x01\x07\x03\x13\x0bG\x01!\t\x0b\x05\t\x05\x05\x17\x03\x01\rF\x01\x0b\x03\x05\x03\r\x03F\x01\r\x03\x17\x03\x05\x0fF\x01\x0f\x03)\x05\x0f\x13\x03F\x01\x11\x03+\x03\x15\x03F\x01\r\x03\t\x03\x03\x03F\x01\x13\x03/\x03\x17\x05\x06\x01\x03\t\x07\x1b\t\x19\x03F\x01\x11\x03\x1b\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1d\x03\x1f\x05\x06\x01\x03\x05\x07#\x0b!\x03F\x01\x11\x03\x1b\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1d\x03'\x05\x06\x01\x03\x05\x07+\x11)\x11\x04\x03\x07%\x1d-\x06\x03\x01\x05\x01\x00\xca\x07G+\x03\x05\x1f\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1b\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00transpose_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00num_batch_dims\x001\x00\x00hipsolver_gesvdj_ffi\x00\x08I\x17\x05#\x01\x0b59;IK\x03M\x03O\x11]_acegim\x03s\x03+\x05uw\x03/\x03y\x033",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["jacobi"]["c64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvdj_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-6.511656   +3.9382665j ,  6.8709564  +2.5289335j ,
+         -9.411133   -9.168636j  , -7.3314643  +7.189627j  ],
+        [ 6.2476263  -2.9142983j , -0.060004584+2.8443305j ,
+          7.9243956  -7.338787j  ,  7.5318184  -4.295307j  ],
+        [-8.464032   -5.655291j  ,  5.0108194  +1.0293938j ,
+          1.2175745  +2.8760285j ,  4.345743   +0.604459j  ],
+        [ 9.876885   -8.447743j  ,  8.306228   +4.8012953j ,
+          7.807553   +3.5845838j ,  3.5843878  -7.8993335j ]],
+
+       [[-9.904369   +8.589717j  ,  6.794971   +2.5694795j ,
+          2.2921402  -6.3595896j ,  4.2440815  -4.766851j  ],
+        [ 7.0766907  -2.7424748j , -3.7027502  +2.6230326j ,
+         -5.010383   +4.308751j  ,  1.4581944  -0.17130353j],
+        [ 1.99838    -8.123547j  , -2.6369176  +7.5087905j ,
+         -0.5215636  -9.439996j  ,  9.993352   -3.7125206j ],
+        [-0.031122532+4.9268885j , -5.443708   -0.5684887j ,
+          2.8900268  +7.271322j  , -9.371372   +2.0711803j ]]],
+      dtype=complex64),),
+    expected_outputs=(array([[[-0.49599195 -0.3477366j   , -0.47453368 +0.21972746j  ,
+         -0.35997757 -0.35410944j  , -0.2512339  +0.20374799j  ],
+        [ 0.44907737 +0.002405172j , -0.24904558 -0.24744749j  ,
+         -0.5188636  -0.1262432j   ,  0.5398943  +0.3137309j   ],
+        [ 0.044145714-0.11281507j  ,  0.44468585 +0.40522593j  ,
+         -0.076412916-0.63636005j  ,  0.3233734  -0.32864404j  ],
+        [ 0.6423971  +0.06360132j  , -0.07980481 +0.484728j    ,
+         -0.2172295  +0.043406248j , -0.54105425 -0.011761099j ]],
+
+       [[-0.19801104 +0.5015972j   ,  0.2974156  -0.56987107j  ,
+         -0.14941728 +0.2827743j   , -0.044859245-0.43781692j  ],
+        [ 0.031362493-0.19080958j  , -0.38242713 +0.34200114j  ,
+         -0.05559378 +0.4285319j   ,  0.2569481  -0.66831154j  ],
+        [-0.6645802  -0.041444328j , -0.43262926 -0.0030564666j,
+         -0.3622315  +0.21935806j  , -0.34698528 +0.26402578j  ],
+        [ 0.44450504 -0.17558658j  ,  0.3494469  +0.11952038j  ,
+         -0.5150082  +0.5161587j   , -0.24080087 +0.2134198j   ]]],
+      dtype=complex64), array([[28.04699  , 15.29802  , 10.812811 ,  8.262912 ],
+       [24.471525 , 17.579378 ,  7.0476294,  4.6335263]], dtype=float32), array([[[ 0.3826026   -0.45641175j  ,  0.05130297  +0.1989237j   ,
+          0.5836618   +0.0010950209j,  0.2293342   -0.45808792j  ],
+        [-0.51104975  -0.089208454j ,  0.05988489  -0.6154523j   ,
+          0.33436182  +0.45249024j  ,  0.15088452  -0.09586868j  ],
+        [-0.01766008  -0.45967096j  , -0.58548707  +0.16145816j  ,
+         -0.0013295817+0.38968956j  , -0.47265458  +0.2103918j   ],
+        [-0.14836499  -0.37756056j  , -0.43804413  -0.12117417j  ,
+         -0.28388205  -0.33218026j  ,  0.65180457  +0.114404j    ]],
+
+       [[ 0.21023     +0.4984393j   , -0.06341874  -0.4433479j   ,
+         -0.15844418  +0.37922654j  , -0.5790327   +0.050856397j ],
+        [-0.66821074  +0.044658013j ,  0.11475918  +0.11917833j  ,
+          0.55912364  +0.3275715j   , -0.22622015  +0.23027979j  ],
+        [ 0.3396066   -0.19580403j  ,  0.8731466   +0.013714722j ,
+          0.052092    +0.071940996j , -0.09583993  +0.2582264j   ],
+        [-0.31174853  +0.08945723j  , -0.01018406  +0.09680383j  ,
+         -0.6347194   +0.020064345j ,  0.13741249  +0.680575j    ]]],
+      dtype=complex64)),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f32>> loc("operand")) -> (tensor<2x4x4xcomplex<f32>> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x4x4xcomplex<f32>> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FC00000,0x7FC00000)> : tensor<complex<f32>> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvdj_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xcomplex<f32>>) -> (tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x4x4xcomplex<f32>>, tensor<2x4x4xcomplex<f32>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.transpose %0#3, dims = [0, 2, 1] : (tensor<2x4x4xcomplex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %2 = stablehlo.real %1 : (tensor<2x4x4xcomplex<f32>>) -> tensor<2x4x4xf32> loc(#loc4)
+    %3 = stablehlo.imag %1 : (tensor<2x4x4xcomplex<f32>>) -> tensor<2x4x4xf32> loc(#loc4)
+    %4 = stablehlo.negate %3 : tensor<2x4x4xf32> loc(#loc4)
+    %5 = stablehlo.complex %2, %4 : tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %7 = stablehlo.compare  EQ, %0#4, %6,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %10 = stablehlo.broadcast_in_dim %8, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %11 = stablehlo.select %10, %0#1, %9 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %14 = stablehlo.broadcast_in_dim %12, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %15 = stablehlo.select %14, %0#2, %13 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %18 = stablehlo.broadcast_in_dim %16, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %19 = stablehlo.select %18, %5, %17 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    return %15, %11, %19 : tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x4x4xcomplex<f32>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01-\x07\x01\x05\t\x1b\x01\x03\x0f\x03\x19\x13\x17\x1b\x1f#'+/37;?\x03\xef\x9f9\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03Uo\x0f\x0b/\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x1f\x1b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/o\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x035\x1b\x07\x07\x17\x07\x07\x1b\x0b\x0f\x0f\x0f\x07\x13\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x02\xd6\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05!\x11\x01\x00\x05#\x05%\x05'\x1d\x15\x03\x05)\x05+\x1d\x1b\x1d\x05-\x17\x1f\xb6\t\x1b\x05/\x03\x07#S%Y'\x7f\x051\x053\x055\x1f'1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f-\x01\x1d7\x1f3\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x1f\x1f1\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#%\x03\x07=AE\r\x03-?\x1d9\r\x03-C\x1d;\r\x03-G\x1d=\x1d?\x1dA\x1f\x15\x11\x00\x00\xc0\x7f\x00\x00\xc0\x7f\x1f\x17\t\x00\x00\xc0\x7f\x1f\x19\t\x00\x00\x00\x00\r\x05U1W1\x1dC\x1dE\r\x03[]\x1dG\x1dI\x0b\x03\x1dK\x1dM\x03\x01\x05\x01\x03\x03)\x03\x03m\x15\x03\x01\x01\x01\x03\x0b)q))s\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x1f1\x00\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f7!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x81\x0b\x87\x8d\x91\x97\x9d\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x07}\x93\x95\x11\x03\x19\x11\x03\x1d\x13\x07}\x99\x9b\x11\x03!\x11\x03%\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x13\x01\t)\x05\t\x11\t\x1d\x13)\x07\t\x11\x11\t\x03\t)\x01\x13)\x01\t)\x01\x1b\x1b)\x03\t\x1b)\x03\r\r)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\x0b\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\r)\x03\t\x07)\x05\t\x05\x07)\x03\x05\r)\x05\t\x11\x07)\x03\t\r\x04n\x03\x05\x01Q\x03\x07\x01\x07\x04F\x03\x03\x01\x05\tP\x03\x03\x07\x04\x1a\x03\x039c\x03\x0b\x13\x00\x05B\x03\x05\x03\x15\x05B\x01\x07\x03\x17\x05B\x01\t\x03\x19\x0bG\x01!\x0b\x0b\x05\x0b\x05\x05\x1d\x03\x01\rF\x01\r\x03\x05\x03\x0f\x0f\x06\x01\x03\x11\x03\x13\x11\x06\x01\x03\x11\x03\x13\x13\x06\x01\x03\x11\x03\x17\x15\x06\x01\x03\x05\x05\x15\x19\x03F\x01\x0f\x03\x1d\x03\x07\x17F\x01\x11\x03/\x05\x11\x1d\x03F\x01\x13\x031\x03\x1f\x03F\x01\x0f\x03\x0b\x03\x05\x03F\x01\x15\x035\x03!\x07\x06\x01\x03\x0b\x07%\x0b#\x03F\x01\x13\x03!\x03\x1f\x03F\x01\x0f\x03\x05\x03\x03\x03F\x01\x17\x03#\x03)\x07\x06\x01\x03\x05\x07-\r+\x03F\x01\x13\x03!\x03\x1f\x03F\x01\x0f\x03\x05\x03\x03\x03F\x01\x17\x03#\x031\x07\x06\x01\x03\x05\x075\x1b3\x19\x04\x03\x07/'7\x06\x03\x01\x05\x01\x00n\x08O+\x03\x05\x1f\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x17\x15\x11\x11\x1b\x1f\x11\x15\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00select_v1\x00func_v1\x00custom_call_v1\x00transpose_v1\x00real_v1\x00imag_v1\x00negate_v1\x00complex_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00num_batch_dims\x001\x00\x00hipsolver_gesvdj_ffi\x00\x08M\x19\x05#\x01\x0b59;IK\x03M\x03O\x03Q\x11_acegiko\x03u\x03+\x05wy\x03/\x03{\x033",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["jacobi"]["c128"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvdj_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-4.305409063295221  +8.562910525232837j  ,
+          0.4575391541476215 +0.29707312893051707j,
+         -6.438158508718077  +7.685372543598643j  ,
+         -4.621486740450309  +2.022385511640895j  ],
+        [-3.5167752452788665 +2.745861246229973j  ,
+          5.0549083156572685 -2.880319974395058j  ,
+          2.5302278647207253 +9.906980376253383j  ,
+          1.574596247755391  -2.7961023138146217j ],
+        [-1.5784784544179953 +0.0829102322391222j ,
+         -9.237548951603042  +9.879555522852257j  ,
+          1.8891026618492859 +1.1401945748088593j ,
+          5.394099323297649  -3.921517130110881j  ],
+        [-2.7752654445789844 -5.990566343812964j  ,
+         -8.878414655317396  -4.134572951945792j  ,
+          5.958890395293434  -9.029222489105175j  ,
+         -6.2944520404181965 +0.45060194198164893j]],
+
+       [[-7.5785161987812755 -0.7677461987355709j ,
+         -2.040365479133275  +7.603905932243634j  ,
+         -3.691071372147059  +9.89712814444609j   ,
+          3.4952539163073126 -7.56289549560567j   ],
+        [ 1.3927209035377324 -5.2169992228732625j ,
+          0.8154615431862204 -5.117885610665862j  ,
+         -9.010010491559825  -4.203757768856371j  ,
+          2.9119697324078473 +5.922071817981767j  ],
+        [ 0.10728598047305837-2.507471821947698j  ,
+         -5.0232104603833605 -5.470368656051647j  ,
+         -8.321741577357662  +9.579011995819101j  ,
+          9.889795999159439  +1.972451322561211j  ],
+        [-7.955739588892468  +6.00000543801551j   ,
+         -2.931108343578779  +6.770562873038649j  ,
+         -6.313940666870044  +7.8176854249436865j ,
+          9.46517759029885   -0.29194868150852216j]]]),),
+    expected_outputs=(array([[[-0.3123156550421202  +0.334289656331932j  ,
+          0.23030981198221195 +0.4356027470031708j ,
+         -0.3877002524330693  +0.45470400435639374j,
+         -0.37575438848476694 -0.22284168553736483j],
+        [ 0.0787616912430086  +0.4683162862107368j ,
+          0.053391106496996105+0.05898993599000597j,
+         -0.506388304927506   -0.2242931168984999j ,
+          0.3627677994695937  +0.5742900271411976j ],
+        [-0.19117032519989163 -0.19935157910756654j,
+          0.5228407641137001  -0.6623932430619892j ,
+         -0.4086691211938215  -0.1222852659623192j ,
+         -0.1177858097416972  -0.12549082728150862j],
+        [ 0.3091438755425131  -0.6271592526880687j ,
+         -0.08376759919479365 +0.17813739292718545j,
+         -0.33697567172992837 +0.2016916577440831j ,
+         -0.3364442790211764  +0.45268588836087237j]],
+
+       [[-0.05334865675740175 +0.5161114058374165j ,
+          0.17087006804744356 -0.2815593776541724j ,
+          0.22716540797510043 +0.6924263330356862j ,
+          0.19836035173275507 -0.2278277768093274j ],
+        [-0.3731280907418766  -0.23027974587285818j,
+         -0.17809521970913889 +0.04907999950574157j,
+          0.06027805674221967 +0.36857770774438403j,
+         -0.7853175228581392  -0.13195957876015255j],
+        [-0.44247472043682406 +0.26036051542030303j,
+         -0.35552787026936694 +0.5455376957814335j ,
+          0.19677100058992886 -0.19168167356500643j,
+          0.24448011783021284 -0.42093450922860026j],
+        [-0.2178752955950242  +0.4769575279629936j ,
+         -0.3294494231631181  -0.5699584340865812j ,
+         -0.34372129423527903 -0.3685833165010564j ,
+         -0.18997371175984737 -0.03955164479974399j]]]), array([[23.168604748820908 , 15.485742042115662 , 11.129821974271639 ,
+         4.172163032990345 ],
+       [31.035300784567507 , 12.500953553782981 ,  6.796077120797179 ,
+         1.5199501235275763]]), array([[[ 0.36257669741978926 -0.14221175501714423j ,
+         -0.058250697282110166-0.5790785298475211j  ,
+          0.7050592229784634  +0.01949879578361566j ,
+         -0.06663926262442564 -0.08751780099928909j ],
+        [ 0.0644324594822553  +0.27093299962776496j ,
+         -0.712394512739288   +0.0252882035037107j  ,
+          0.04580605296283848 +0.4195153849647771j  ,
+          0.37202557799112873 +0.31273622986546246j ],
+        [ 0.6369967429219748  -0.10691103955907996j ,
+          0.24877842613377837 +0.02569569786047833j ,
+         -0.20245308774453494 -0.2601671253010774j  ,
+          0.2720824775068983  +0.5809915184734116j  ],
+        [-0.3815416405835403  +0.4560579773766533j  ,
+          0.2169579367540845  -0.20858513130029815j ,
+          0.20518865758270805 -0.416705369920401j   ,
+          0.5823815708987322  +0.030733529055695246j]],
+
+       [[ 0.1477206865428076  +0.315398845668301j   ,
+          0.3084825844834702  +0.20608887424285138j ,
+          0.6739221002092323  +0.003451102602297634j,
+         -0.4061164568347281  -0.34921992229904514j ],
+        [-0.30299017724213945 -0.5665496536910978j  ,
+         -0.5581728194563791  +0.19040909260866232j ,
+          0.3031519199482866  -0.25576049135034773j ,
+         -0.2314434986696236  -0.16889438974932564j ],
+        [-0.4513340696752332  -0.17983214863943056j ,
+          0.226097381405423   -0.42903008355691824j ,
+         -0.03866935846260517 +0.4630617127443596j  ,
+         -0.5388857439413695  +0.14983925812009435j ],
+        [ 0.409305316379769   +0.24969526059794167j ,
+         -0.48587930748034175 +0.20805723285421662j ,
+         -0.35061304467035664 +0.22282639217479672j ,
+         -0.5598471225880682  +0.06888405058400499j ]]])),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f64>> loc("operand")) -> (tensor<2x4x4xcomplex<f64>> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x4x4xcomplex<f64>> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FF8000000000000,0x7FF8000000000000)> : tensor<complex<f64>> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvdj_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xcomplex<f64>>) -> (tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x4x4xcomplex<f64>>, tensor<2x4x4xcomplex<f64>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.transpose %0#3, dims = [0, 2, 1] : (tensor<2x4x4xcomplex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %2 = stablehlo.real %1 : (tensor<2x4x4xcomplex<f64>>) -> tensor<2x4x4xf64> loc(#loc4)
+    %3 = stablehlo.imag %1 : (tensor<2x4x4xcomplex<f64>>) -> tensor<2x4x4xf64> loc(#loc4)
+    %4 = stablehlo.negate %3 : tensor<2x4x4xf64> loc(#loc4)
+    %5 = stablehlo.complex %2, %4 : tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %6 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %7 = stablehlo.compare  EQ, %0#4, %6,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %10 = stablehlo.broadcast_in_dim %8, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %11 = stablehlo.select %10, %0#1, %9 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %14 = stablehlo.broadcast_in_dim %12, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %15 = stablehlo.select %14, %0#2, %13 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %7, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %18 = stablehlo.broadcast_in_dim %16, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %19 = stablehlo.select %18, %5, %17 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    return %15, %11, %19 : tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x4x4xcomplex<f64>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01-\x07\x01\x05\t\x1b\x01\x03\x0f\x03\x19\x13\x17\x1b\x1f#'+/37;?\x03\xef\x9f9\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03Uo\x0f\x0b/\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0bO/\x1f\x1b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/o\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x035\x1b\x07\x07\x17\x07\x07\x1b\x0b\x0f\x0f\x0f\x07\x13\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x02\x06\x08\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05!\x11\x01\x00\x05#\x05%\x05'\x1d\x15\x03\x05)\x05+\x1d\x1b\x1d\x05-\x17\x1f\xb6\t\x1b\x05/\x03\x07#S%Y'\x7f\x051\x053\x055\x1f'1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f-\x01\x1d7\x1f3\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x1f\x1f1\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#%\x03\x07=AE\r\x03-?\x1d9\r\x03-C\x1d;\r\x03-G\x1d=\x1d?\x1dA\x1f\x15!\x00\x00\x00\x00\x00\x00\xf8\x7f\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x17\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x19\t\x00\x00\x00\x00\r\x05U1W1\x1dC\x1dE\r\x03[]\x1dG\x1dI\x0b\x03\x1dK\x1dM\x03\x01\x05\x01\x03\x03)\x03\x03m\x15\x03\x01\x01\x01\x03\x0b)q))s\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x1f1\x00\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f7!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x81\x0b\x87\x8d\x91\x97\x9d\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x07}\x93\x95\x11\x03\x19\x11\x03\x1d\x13\x07}\x99\x9b\x11\x03!\x11\x03%\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x13\x01\x0b)\x05\t\x11\t\x1d\x13)\x07\t\x11\x11\t\x03\t)\x01\x13)\x01\t)\x01\x1b\x1b)\x03\t\x1b)\x03\r\r)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\x0b\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\r)\x03\t\x07)\x05\t\x05\x07)\x03\x05\r)\x05\t\x11\x07)\x03\t\r\x04n\x03\x05\x01Q\x03\x07\x01\x07\x04F\x03\x03\x01\x05\tP\x03\x03\x07\x04\x1a\x03\x039c\x03\x0b\x13\x00\x05B\x03\x05\x03\x15\x05B\x01\x07\x03\x17\x05B\x01\t\x03\x19\x0bG\x01!\x0b\x0b\x05\x0b\x05\x05\x1d\x03\x01\rF\x01\r\x03\x05\x03\x0f\x0f\x06\x01\x03\x11\x03\x13\x11\x06\x01\x03\x11\x03\x13\x13\x06\x01\x03\x11\x03\x17\x15\x06\x01\x03\x05\x05\x15\x19\x03F\x01\x0f\x03\x1d\x03\x07\x17F\x01\x11\x03/\x05\x11\x1d\x03F\x01\x13\x031\x03\x1f\x03F\x01\x0f\x03\x0b\x03\x05\x03F\x01\x15\x035\x03!\x07\x06\x01\x03\x0b\x07%\x0b#\x03F\x01\x13\x03!\x03\x1f\x03F\x01\x0f\x03\x05\x03\x03\x03F\x01\x17\x03#\x03)\x07\x06\x01\x03\x05\x07-\r+\x03F\x01\x13\x03!\x03\x1f\x03F\x01\x0f\x03\x05\x03\x03\x03F\x01\x17\x03#\x031\x07\x06\x01\x03\x05\x075\x1b3\x19\x04\x03\x07/'7\x06\x03\x01\x05\x01\x00n\x08O+\x03\x05\x1f\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x17\x15\x11\x11\x1b\x1f\x11\x15\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00select_v1\x00func_v1\x00custom_call_v1\x00transpose_v1\x00real_v1\x00imag_v1\x00negate_v1\x00complex_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00num_batch_dims\x001\x00\x00hipsolver_gesvdj_ffi\x00\x08M\x19\x05#\x01\x0b59;IK\x03M\x03O\x03Q\x11_acegiko\x03u\x03+\x05wy\x03/\x03{\x033",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["qr"]["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-8.088836  , -2.6205542 , -7.2633333 ,  5.0895734 ],
+        [ 9.784253  ,  8.099774  , -8.470991  ,  3.0590599 ],
+        [-6.5720334 , -4.4796433 ,  5.5712957 ,  7.9569902 ],
+        [-7.765548  , -8.527966  ,  5.5323663 , -0.61520344]],
+
+       [[-6.685037  ,  5.1507697 , -8.878728  ,  8.7760725 ],
+        [ 2.2026582 ,  5.15965   ,  8.254493  ,  5.2088103 ],
+        [ 1.649047  , -3.3060083 , -4.6077223 , -0.92500544],
+        [-2.111105  ,  2.339333  ,  2.2933412 ,  1.7438462 ]]],
+      dtype=float32),),
+    expected_outputs=(array([[[-0.19646618 , -0.88533336 ,  0.40994054 , -0.097645864],
+        [ 0.6584475  , -0.35089356 , -0.3007529  ,  0.5940271  ],
+        [-0.46186477 , -0.27749717 , -0.8389231  , -0.07670852 ],
+        [-0.56082886 ,  0.126704   ,  0.19417621 ,  0.7948037  ]],
+
+       [[-0.9831455  , -0.14481494 , -0.070398524, -0.0865914  ],
+        [ 0.15959439 , -0.84682167 , -0.50710094 ,  0.016481   ],
+        [-0.06209982 ,  0.41913196 , -0.70081264 ,  0.5738761  ],
+        [-0.06402065 , -0.29368412 ,  0.49674392 ,  0.8141846  ]]],
+      dtype=float32), array([[22.384214 , 12.4938135,  7.4144673,  1.7072145],
+       [15.208481 , 12.81391  ,  3.4745562,  0.4607253]], dtype=float32), array([[[ 0.6889739  ,  0.56735736 , -0.4389969  , -0.10345369 ],
+        [ 0.3656113  , -0.028776985,  0.68496627 , -0.6295405  ],
+        [-0.30387047 , -0.1899195  , -0.5434635  , -0.75910497 ],
+        [ 0.54708886 , -0.80075485 , -0.20676109 ,  0.12936543 ]],
+
+       [[ 0.4574187  , -0.2751733  ,  0.6697428  , -0.5162291  ],
+        [ 0.03230872 , -0.5609443  , -0.64844155 , -0.51363546 ],
+        [-0.8204515  ,  0.14386664 ,  0.23241581 , -0.5021402  ],
+        [-0.3414436  , -0.7674136  ,  0.2774007  ,  0.4664135  ]]],
+      dtype=float32)),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf32> loc("operand")) -> (tensor<2x4x4xf32> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x4x4xf32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvd_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true, transposed = false}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xf32>) -> (tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32>, tensor<2x4x4xf32>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#1, %4 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#2, %8 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#3, %12 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    return %10, %6, %14 : tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b'ML\xefR\rStableHLO_v1.13.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#\'+\x03\xe7\x9d3\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03So\x0f\x0b/\x0b\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f#\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x03/\x1b\x07\x17\x07\x07\x07\x0f\x0f\x07\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x13\x02"\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xb6\t\x1b\x05%\x03\x07#S%[\'}\x05\'\x05)\x05+\x1f\x1f1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f%\x01\x1d-\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x05\x01\x1f11\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x039\r\x01#\x1d\x03\x07?CG\r\x03-A\x1d/\r\x03-E\x1d1\r\x03-I\x1d3\x1d5\x1d7\x1f\x11\t\x00\x00\xc0\x7f\x1f\x13\t\x00\x00\x00\x00\r\x07U1W1Y3\x1d9\x1d;\x1d=\r\x03]_\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x03\x03)\x03\x03m\x15\x03\x01\x01\x01\x03\x0b)q))s\x1f!!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f#\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f/!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x7f\x0b\x85\x8b\x8f\x95\x9b\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x07{\x91\x93\x11\x03\x19\x11\x03\x1d\x13\x07{\x97\x99\x11\x03!\x11\x03%\x13\x03{\x01\t\x01\x02\x02)\x07\t\x11\x11\r\x01)\x05\t\x11\r\x1d\t\x13)\x01\r)\x01\x15\x1b)\x03\t\x15)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b)\x03\r\x0b\x04\xc2\x02\x05\x01Q\x03\x07\x01\x07\x04\x9a\x02\x03\x01\x05\tP\x03\x03\x07\x04n\x02\x03-K\x03\x0b\x13\x00\x07B\x03\x05\x03\x11\x07B\x01\x07\x03\x13\x0bG\x01!\t\x0b\x05\t\x05\x05\x17\x03\x01\x03F\x01\x0b\x03\x17\x03\x05\rF\x01\r\x03\'\x05\x0f\x11\x03F\x01\x0f\x03)\x03\x13\x03F\x01\x0b\x03\t\x03\x03\x03F\x01\x11\x03-\x03\x15\x05\x06\x01\x03\t\x07\x19\t\x17\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03\x1d\x05\x06\x01\x03\x05\x07!\x0b\x1f\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03%\x05\x06\x01\x03\x05\x07)\r\'\x0f\x04\x03\x07#\x1b+\x06\x03\x01\x05\x01\x00\xbe\x07G)\x03\x05\x1f\x17\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00transposed\x00num_batch_dims\x001\x00\x00hipsolver_gesvd_ffi\x00\x08E\x15\x05#\x01\x0b7;=KM\x03O\x03Q\x11aceg3iko\x03+\x05uw\x03/\x03y\x035',
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# gesdd (divide-and-conquer) on ROCm; same I/O as qr but custom_call @hipsolver_gesdd_ffi.
+# Derived from qr f32 by replacing custom call target (inputs/outputs are algorithm-independent).
+data_2026_02_04["gesdd"]["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesdd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-8.088836  , -2.6205542 , -7.2633333 ,  5.0895734 ],
+        [ 9.784253  ,  8.099774  , -8.470991  ,  3.0590599 ],
+        [-6.5720334 , -4.4796433 ,  5.5712957 ,  7.9569902 ],
+        [-7.765548  , -8.527966  ,  5.5323663 , -0.61520344]],
+
+       [[-6.685037  ,  5.1507697 , -8.878728  ,  8.7760725 ],
+        [ 2.2026582 ,  5.15965   ,  8.254493  ,  5.2088103 ],
+        [ 1.649047  , -3.3060083 , -4.6077223 , -0.92500544],
+        [-2.111105  ,  2.339333  ,  2.2933412 ,  1.7438462 ]]],
+      dtype=float32),),
+    expected_outputs=(array([[[-0.19646618 , -0.88533336 ,  0.40994054 , -0.097645864],
+        [ 0.6584475  , -0.35089356 , -0.3007529  ,  0.5940271  ],
+        [-0.46186477 , -0.27749717 , -0.8389231  , -0.07670852 ],
+        [-0.56082886 ,  0.126704   ,  0.19417621 ,  0.7948037  ]],
+
+       [[-0.9831455  , -0.14481494 , -0.070398524, -0.0865914  ],
+        [ 0.15959439 , -0.84682167 , -0.50710094 ,  0.016481   ],
+        [-0.06209982 ,  0.41913196 , -0.70081264 ,  0.5738761  ],
+        [-0.06402065 , -0.29368412 ,  0.49674392 ,  0.8141846  ]]],
+      dtype=float32), array([[22.384214 , 12.4938135,  7.4144673,  1.7072145],
+       [15.208481 , 12.81391  ,  3.4745562,  0.4607253]], dtype=float32), array([[[ 0.6889739  ,  0.56735736 , -0.4389969  , -0.10345369 ],
+        [ 0.3656113  , -0.028776985,  0.68496627 , -0.6295405  ],
+        [-0.30387047 , -0.1899195  , -0.5434635  , -0.75910497 ],
+        [ 0.54708886 , -0.80075485 , -0.20676109 ,  0.12936543 ]],
+
+       [[ 0.4574187  , -0.2751733  ,  0.6697428  , -0.5162291  ],
+        [ 0.03230872 , -0.5609443  , -0.64844155 , -0.51363546 ],
+        [-0.8204515  ,  0.14386664 ,  0.23241581 , -0.5021402  ],
+        [-0.3414436  , -0.7674136  ,  0.2774007  ,  0.4664135  ]]],
+      dtype=float32)),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf32> loc("operand")) -> (tensor<2x4x4xf32> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x4x4xf32> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesdd_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true, transposed = false}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xf32>) -> (tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32>, tensor<2x4x4xf32>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#1, %4 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#2, %8 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#3, %12 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    return %10, %6, %14 : tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x4x4xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b'ML\xefR\rStableHLO_v1.13.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#\'+\x03\xe7\x9d3\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03So\x0f\x0b/\x0b\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f#\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x03/\x1b\x07\x17\x07\x07\x07\x0f\x0f\x07\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x13\x02"\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xb6\t\x1b\x05%\x03\x07#S%[\'}\x05\'\x05)\x05+\x1f\x1f1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f%\x01\x1d-\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x05\x01\x1f11\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x039\r\x01#\x1d\x03\x07?CG\r\x03-A\x1d/\r\x03-E\x1d1\r\x03-I\x1d3\x1d5\x1d7\x1f\x11\t\x00\x00\xc0\x7f\x1f\x13\t\x00\x00\x00\x00\r\x07U1W1Y3\x1d9\x1d;\x1d=\r\x03]_\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x03\x03)\x03\x03m\x15\x03\x01\x01\x01\x03\x0b)q))s\x1f!!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f#\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f/!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x7f\x0b\x85\x8b\x8f\x95\x9b\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x07{\x91\x93\x11\x03\x19\x11\x03\x1d\x13\x07{\x97\x99\x11\x03!\x11\x03%\x13\x03{\x01\t\x01\x02\x02)\x07\t\x11\x11\r\x01)\x05\t\x11\r\x1d\t\x13)\x01\r)\x01\x15\x1b)\x03\t\x15)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b)\x03\r\x0b\x04\xc2\x02\x05\x01Q\x03\x07\x01\x07\x04\x9a\x02\x03\x01\x05\tP\x03\x03\x07\x04n\x02\x03-K\x03\x0b\x13\x00\x07B\x03\x05\x03\x11\x07B\x01\x07\x03\x13\x0bG\x01!\t\x0b\x05\t\x05\x05\x17\x03\x01\x03F\x01\x0b\x03\x17\x03\x05\rF\x01\r\x03\'\x05\x0f\x11\x03F\x01\x0f\x03)\x03\x13\x03F\x01\x0b\x03\t\x03\x03\x03F\x01\x11\x03-\x03\x15\x05\x06\x01\x03\t\x07\x19\t\x17\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03\x1d\x05\x06\x01\x03\x05\x07!\x0b\x1f\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03%\x05\x06\x01\x03\x05\x07)\r\'\x0f\x04\x03\x07#\x1b+\x06\x03\x01\x05\x01\x00\xbe\x07G)\x03\x05\x1f\x17\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00transposed\x00num_batch_dims\x001\x00\x00hipsolver_gesdd_ffi\x00\x08E\x15\x05#\x01\x0b7;=KM\x03O\x03Q\x11aceg3iko\x03+\x05uw\x03/\x03y\x035',
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["qr"]["f64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 7.516621433947318  ,  9.495925414094074  ,
+          4.361961694107173  ,  5.57838011364683   ],
+        [-7.294446875834851  , -9.622183592984825  ,
+          4.291499000204173  , -2.5015601805990517 ],
+        [-2.40944749022721   ,  6.628440455612534  ,
+         -1.6017329763895418 , -8.169012011427746  ],
+        [-0.9524103592344364 ,  2.6056644652182754 ,
+         -1.7707069509199496 ,  9.079755164737282  ]],
+
+       [[-8.292072309603471  ,  4.387200699980834  ,
+         -6.17701480971335   ,  2.3067167339225403 ],
+        [-8.572355700016178  ,  9.039479678554585  ,
+          4.690587216470503  ,  9.421807731360794  ],
+        [-0.40052116228612533, -9.00913849115783   ,
+          4.660812984455196  , -0.39685471313335086],
+        [ 6.85836794331054   , -0.7762372063612624 ,
+         -1.9062402955103508 ,  8.146374381579843  ]]]),),
+    expected_outputs=(array([[[ 0.710593156752799   ,  0.04339323803857607 ,
+          0.6108799359169268  , -0.3464103006013976  ],
+        [-0.6414551962489828  ,  0.2654507519818231  ,
+          0.3810239670429581  , -0.6106487255503853  ],
+        [ 0.002097973122686177, -0.8301780287591775  ,
+         -0.23115175512952152 , -0.5073153902404739  ],
+        [ 0.28911623145379906 ,  0.48832096589265755 ,
+         -0.6543816214820828  , -0.49973906435868637 ]],
+
+       [[-0.4845794420083184  ,  0.36379198830363746 ,
+          0.3585778089804869  ,  0.7101127435384802  ],
+        [-0.8117357808096087  , -0.2737011928801392  ,
+         -0.48805327524177633 , -0.16726230805289055 ],
+        [ 0.32303983104156553 , -0.02153072337219175 ,
+         -0.7310502778628764  ,  0.6006223328750929  ],
+        [ 0.043738473875528   , -0.8901008224988602  ,
+          0.31431106673030207 ,  0.32713303871781874 ]]]), array([[18.683935768333495 , 12.662275558869085 ,  6.8338862408024434,
+         4.845264432750695 ],
+       [18.74775820344496  , 11.410736777937716 ,  9.946895692662434 ,
+         6.137629336027487 ]]), array([[[ 5.2129853559569894e-01,  7.3256436071718900e-01,
+         -9.0197653754896436e-03,  4.3762533978891865e-01],
+        [-5.9197451292344128e-03, -5.0326988476028811e-01,
+          1.4164211376179620e-01,  8.5242119361267688e-01],
+        [ 4.3790339491604441e-01, -1.6135574983257261e-01,
+          8.5292030374161054e-01, -2.3394848617225703e-01],
+        [ 7.3242979876871994e-01, -4.2899091190414557e-01,
+         -5.0237745859759764e-01, -1.6471270889728379e-01]],
+
+       [[ 5.9459087097069763e-01, -6.6183264336451042e-01,
+          3.2429963316260670e-02, -4.5539822772465766e-01],
+        [-5.9298019579717476e-01,  5.9722166419666663e-04,
+         -1.6953966020379732e-01, -7.8716607798901594e-01],
+        [ 3.6784091434819871e-01,  3.5222631382775416e-01,
+         -8.5560743787328120e-01, -9.2550515042935433e-02],
+        [-3.9941112313270993e-01, -6.6175057185524333e-01,
+         -4.8799642760291367e-01,  4.0548294910380545e-01]]])),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf64> loc("operand")) -> (tensor<2x4x4xf64> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x4x4xf64> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvd_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true, transposed = false}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xf64>) -> (tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x4x4xf64>, tensor<2x4x4xf64>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#1, %4 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#2, %8 : tensor<2x4x4xi1>, tensor<2x4x4xf64> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#3, %12 : tensor<2x4x4xi1>, tensor<2x4x4xf64> loc(#loc4)
+    return %10, %6, %14 : tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x4x4xf64> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#'+\x03\xe7\x9d3\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03So\x0f\x0b/\x0b\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f#\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x03/\x1b\x07\x17\x07\x07\x07\x0f\x0f\x07\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x13\x022\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xb6\t\x1b\x05%\x03\x07#S%['}\x05'\x05)\x05+\x1f\x1f1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f%\x01\x1d-\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x05\x01\x1f11\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x039\r\x01#\x1d\x03\x07?CG\r\x03-A\x1d/\r\x03-E\x1d1\r\x03-I\x1d3\x1d5\x1d7\x1f\x11\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x13\t\x00\x00\x00\x00\r\x07U1W1Y3\x1d9\x1d;\x1d=\r\x03]_\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x03\x03)\x03\x03m\x15\x03\x01\x01\x01\x03\x0b)q))s\x1f!!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f#\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f/!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x7f\x0b\x85\x8b\x8f\x95\x9b\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x07{\x91\x93\x11\x03\x19\x11\x03\x1d\x13\x07{\x97\x99\x11\x03!\x11\x03%\x13\x03{\x01\t\x01\x02\x02)\x07\t\x11\x11\r\x01)\x05\t\x11\r\x1d\x0b\x13)\x01\r)\x01\x15\x1b)\x03\t\x15)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b)\x03\r\x0b\x04\xc2\x02\x05\x01Q\x03\x07\x01\x07\x04\x9a\x02\x03\x01\x05\tP\x03\x03\x07\x04n\x02\x03-K\x03\x0b\x13\x00\x07B\x03\x05\x03\x11\x07B\x01\x07\x03\x13\x0bG\x01!\t\x0b\x05\t\x05\x05\x17\x03\x01\x03F\x01\x0b\x03\x17\x03\x05\rF\x01\r\x03'\x05\x0f\x11\x03F\x01\x0f\x03)\x03\x13\x03F\x01\x0b\x03\t\x03\x03\x03F\x01\x11\x03-\x03\x15\x05\x06\x01\x03\t\x07\x19\t\x17\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03\x1d\x05\x06\x01\x03\x05\x07!\x0b\x1f\x03F\x01\x0f\x03\x19\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1b\x03%\x05\x06\x01\x03\x05\x07)\r'\x0f\x04\x03\x07#\x1b+\x06\x03\x01\x05\x01\x00\xbe\x07G)\x03\x05\x1f\x17\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00transposed\x00num_batch_dims\x001\x00\x00hipsolver_gesvd_ffi\x00\x08E\x15\x05#\x01\x0b7;=KM\x03O\x03Q\x11aceg3iko\x03+\x05uw\x03/\x03y\x035",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["qr"]["c64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 5.1529994  -1.2366186j,  3.4151247  -4.7387176j,
+          9.5636425  -8.201898j ,  6.536134   -4.6525245j],
+        [-8.4091     +6.4209814j, -3.8424058  -0.511163j ,
+         -2.1341999  +4.956986j , -0.68947995 +2.1529553j],
+        [-0.30219    -9.666059j , -0.044237416+4.2940593j,
+         -4.1715403  +5.2976294j, -1.3943245  +1.8789417j],
+        [-9.0755005  +7.546829j , -7.630291   -3.62061j  ,
+          6.448428   -4.0384274j, -7.065759   -9.805366j ]],
+
+       [[ 4.286493   +0.7896354j, -4.024747   +2.2482893j,
+         -8.564833   +5.948362j , -9.7399845  -3.4490995j],
+        [ 6.6070595  -8.43279j  ,  1.6180693  +5.6450553j,
+         -8.772443   -2.9169078j, -1.2268616  -4.769274j ],
+        [ 1.3227078  +1.7313296j,  3.9845204  -0.5684758j,
+          9.138408   +6.9373603j, -4.7926993  -4.8423553j],
+        [ 3.4307988  -5.6387033j,  5.9531016  -0.8393127j,
+         -2.0458186  -6.3643475j, -4.3651037  -8.67327j  ]]],
+      dtype=complex64),),
+    expected_outputs=(array([[[ 0.30495852 +0.096999586j,  0.72827613 +0.03194175j ,
+          0.20767818 +0.042641692j, -0.28966787 -0.4871642j  ],
+        [ 0.115591295-0.1449632j  , -0.49115598 +0.23452608j ,
+         -0.013264754-0.5263807j  , -0.35325044 -0.5170581j  ],
+        [-0.2174027  +0.29466262j , -0.2795165  -0.27255905j ,
+         -0.27765262 +0.6150545j  , -0.34620082 -0.37182543j ],
+        [ 0.60895675 -0.59857947j , -0.12601145 +0.06371821j ,
+         -0.22057684 +0.4168473j  ,  0.15328544 -0.07087361j ]],
+
+       [[-0.022096228+0.5509537j  ,  0.10202758 +0.25620914j ,
+          0.46818483 +0.513836j   ,  0.31120205 -0.19959508j ],
+        [-0.4309677  +0.4594079j  ,  0.15301313 -0.036881473j,
+          0.22284088 -0.48527643j , -0.05199984 +0.53905755j ],
+        [ 0.26196426 -0.032041073j,  0.6947033  -0.22732396j ,
+         -0.117719345+0.40873566j , -0.19235809 +0.42206088j ],
+        [-0.3937812  +0.2728696j  ,  0.23826325 -0.55508226j ,
+         -0.22510253 +0.005555059j, -0.16906178 -0.5712348j  ]]],
+      dtype=complex64), array([[23.247055 , 20.633308 ,  7.335599 ,  2.013584 ],
+       [22.780914 , 15.782362 , 12.775513 ,  1.0651652]], dtype=float32), array([[[-0.57116145 -0.j         , -0.042698324-0.4338231j  ,
+          0.4287732  -0.07257515j ,  0.15371813 -0.5205827j  ],
+        [ 0.6636313  +0.j         ,  0.17815456 -0.12978375j ,
+          0.36668688 -0.52016j    ,  0.271322   -0.17991613j ],
+        [-0.40411592 -0.j         ,  0.49817383 -0.045163676j,
+          0.049928322-0.5456577j  , -0.1296575  +0.51906395j ],
+        [ 0.2646859  +0.j         ,  0.22178493 -0.6796956j  ,
+          0.08210006 +0.3144607j  , -0.5465213  +0.12022976j ]],
+
+       [[-0.39417964 -0.j         ,  0.07517068 -0.10199716j ,
+          0.3137599  +0.6606039j  , -0.22367497 +0.4936552j  ],
+        [ 0.40769133 +0.j         ,  0.31594533 +0.36745775j ,
+          0.45824614 +0.397673j   , -0.021774545-0.47993127j ],
+        [ 0.6047127  -0.j         , -0.4034314  +0.29415658j ,
+          0.054178037-0.06489535j , -0.3735269  +0.48823014j ],
+        [-0.55922544 +0.j         , -0.25889853 +0.6578646j  ,
+          0.17150019 -0.24589685j , -0.2621226  -0.1699021j  ]]],
+      dtype=complex64)),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f32>> loc("operand")) -> (tensor<2x4x4xcomplex<f32>> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x4x4xcomplex<f32>> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FC00000,0x7FC00000)> : tensor<complex<f32>> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvd_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true, transposed = false}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xcomplex<f32>>) -> (tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x4x4xcomplex<f32>>, tensor<2x4x4xcomplex<f32>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#1, %4 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#2, %8 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#3, %12 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    return %10, %6, %14 : tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x4x4xcomplex<f32>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#'+\x03\xed\x9f7\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03Uo\x0f\x0b/\x0b\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x1f#\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x033\x1b\x07\x17\x07\x07\x07\x0b\x0f\x0f\x0f\x07\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x13\x02b\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xb6\t\x1b\x05%\x03\x07#U%]'\x7f\x05'\x05)\x05+\x1f#1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f)\x01\x1d-\x1f/\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x05\x01\x1f51\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x039\r\x01#!\x03\x07?CG\r\x03-A\x1d/\r\x03-E\x1d1\r\x03-I\x1d3\x1d5\x1d7\x1f\x13\x11\x00\x00\xc0\x7f\x00\x00\xc0\x7f\x1f\x15\t\x00\x00\xc0\x7f\x1f\x17\t\x00\x00\x00\x00\r\x07W1Y1[3\x1d9\x1d;\x1d=\r\x03_a\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x03\x03)\x03\x03o\x15\x03\x01\x01\x01\x03\x0b)s))u\x1f%!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f'\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f3!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x81\x0b\x87\x8d\x91\x97\x9d\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x07}\x93\x95\x11\x03\x19\x11\x03\x1d\x13\x07}\x99\x9b\x11\x03!\x11\x03%\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x11\x01)\x05\t\x11\r\x1d\t\x13\x03\r)\x01\x11)\x01\r)\x01\x19\x1b)\x03\t\x19)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b)\x03\r\x0b\x04\xda\x02\x05\x01Q\x03\x07\x01\x07\x04\xb2\x02\x03\x01\x05\tP\x03\x03\x07\x04\x86\x02\x03/O\x03\x0b\x13\x00\x05B\x03\x05\x03\x13\x05B\x01\x07\x03\x15\x05B\x01\t\x03\x17\x0bG\x01!\x0b\x0b\x05\t\x05\x05\x1b\x03\x01\x03F\x01\r\x03\x1b\x03\x07\rF\x01\x0f\x03+\x05\x11\x13\x03F\x01\x11\x03-\x03\x15\x03F\x01\r\x03\t\x03\x05\x03F\x01\x13\x031\x03\x17\x07\x06\x01\x03\t\x07\x1b\x0b\x19\x03F\x01\x11\x03\x1d\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1f\x03\x1f\x07\x06\x01\x03\x05\x07#\r!\x03F\x01\x11\x03\x1d\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1f\x03'\x07\x06\x01\x03\x05\x07+\x0f)\x0f\x04\x03\x07%\x1d-\x06\x03\x01\x05\x01\x00\xbe\x07G)\x03\x05\x1f\x17\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1f\x11\x15\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00select_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00transposed\x00num_batch_dims\x001\x00\x00hipsolver_gesvd_ffi\x00\x08I\x17\x05#\x01\x0b7;=KM\x03O\x03Q\x03S\x11cegi3kmq\x03+\x05wy\x03/\x03{\x035",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["qr"]["c128"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_gesvd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-1.9905224803805588-1.8349519681179167j,
+          5.735842655793476 +9.800262022922936j ,
+          9.930770453807153 -7.660992394369175j ,
+         -3.2929936512332603-0.3833378170735138j],
+        [ 4.341007948722385 +6.667554829993922j ,
+          1.5156378758308087+7.411002120943763j ,
+          2.4340125691446453-3.0850645481331496j,
+          9.875989691331203 -6.1366179498083735j],
+        [ 3.818748621455894 +4.606673418196037j ,
+          2.3537469571912517-2.9500306466751454j,
+         -7.202066665251294 +9.776480393608004j ,
+          1.520165382948818 +3.0178751445902474j],
+        [-0.2425449354190654-6.241013740812507j ,
+         -4.519117705886435 +3.868789479046006j ,
+         -1.1661731919174017-2.2818202948221833j,
+         -4.660958033035887 +8.360465211846016j ]],
+
+       [[-6.145471273178405 -1.0978433303755946j,
+          9.51601108696423  +5.991155719658801j ,
+          1.5805963559425624+8.308317987231838j ,
+          3.5484468974281995+9.934912177588416j ],
+        [ 7.09882908688272  +9.89156207005951j  ,
+          9.567356209650448 -4.229572146087315j ,
+         -2.044167232859591 -7.774476424929708j ,
+          3.1765005877310397+6.075776012012803j ],
+        [ 3.117187801988422 +7.826519832345586j ,
+          4.6711728079985235+2.922980100012577j ,
+         -9.474622452988285 +9.198398274345259j ,
+         -9.629383830755769 -0.6972018625578293j],
+        [ 7.526887742226929 +8.892734666231693j ,
+          3.629557229748798 -6.978519004131796j ,
+         -8.884252532467453 +9.982683952825951j ,
+          0.7061661847199137-1.6717995600652547j]]]),),
+    expected_outputs=(array([[[-0.35905865386373553  -0.6657106780577163j  ,
+          0.10967295665724751  +0.0725422808481802j  ,
+         -0.06540584145175349  +0.4126017403819886j  ,
+         -0.001892455755736052 -0.48589498312068874j ],
+        [-0.019365762327029423 -0.3458402738996379j  ,
+         -0.16646314362343423  -0.7163119320774831j  ,
+         -0.2931706961839591   -0.30249907055652614j ,
+         -0.3813721127443      +0.12769994835294057j ],
+        [ 0.23695882564468548  +0.4995905479185137j  ,
+         -0.08616434176653853  -0.2306488965643763j  ,
+         -0.4047944302869717   +0.45289367548195103j ,
+         -0.20089033683194188  -0.4736121330643781j  ],
+        [-0.019328042734500266 -0.04256611971555387j ,
+          0.40686973660845127  +0.4644679838261983j  ,
+         -0.528195531188617    -0.008087255323249769j,
+         -0.49750847736278525  +0.29995075218256234j ]],
+
+       [[-0.05849782863570836  +0.1349108572724311j  ,
+          0.6915190647040965   -0.00724172047557089j ,
+          0.35050509142457625  +0.5154062016013146j  ,
+          0.3335086644994931   +0.02001509955933467j ],
+        [ 0.12409676403141817  +0.46965841967658595j ,
+         -0.0010071875014091454-0.47363472964505565j ,
+         -0.6419183280668094   +0.10040875952807082j ,
+          0.3407897981969638   +0.03756787161969258j ],
+        [ 0.18961104008215124  +0.4852170511373144j  ,
+          0.10670334298673206  +0.512049704917858j   ,
+         -0.004857315166004077 -0.2903275987339464j  ,
+          0.11649485988968188  -0.5976176056439488j  ],
+        [ 0.5193617369970899   +0.44863512961725066j ,
+         -0.10599623987661626  +0.11226024453798102j ,
+          0.3132053628168187   -0.08336823102264292j ,
+         -0.10592214730187742  +0.6236064293405494j  ]]]), array([[21.932220876405268 , 18.880687206540177 ,  9.052253933601701 ,
+         6.147242993662446 ],
+       [27.125418969190424 , 23.667528381493124 , 12.813953745318111 ,
+         2.4083691203679507]]), array([[[ 0.1378321823471533  -0.j                  ,
+         -0.5548648056348718  -0.0666549568767057j  ,
+          0.2667942513133091  +0.7373836529036589j  ,
+          0.22664082543819475 +0.049036372646054247j],
+        [-0.5423046445376736  +0.j                  ,
+         -0.20047141262021817 +0.26380919119352203j ,
+         -0.04399203613481576 -0.11619433399764471j ,
+          0.18656608276051542 +0.7388357531574219j  ],
+        [-0.35321469731224603 -0.j                  ,
+          0.11589839419447341 -0.7372405155817185j  ,
+          0.48459340421596897 -0.16079096916727068j ,
+          0.23904452001415227 -0.021367645785028748j],
+        [-0.7497648562215402  -0.j                  ,
+         -0.011601857648442198+0.14424794231622187j ,
+         -0.14742701295968097 +0.2953481438482363j  ,
+         -0.20589294112027193 -0.5153187702614431j  ]],
+
+       [[ 0.6645194179564081  +0.j                  ,
+          0.01882587817102112 -0.5020226405475181j  ,
+         -0.012734677138399427+0.5459009841135211j  ,
+          0.06757793695402495 +0.05741048533823283j ],
+        [-0.18562298018354922 +0.j                  ,
+          0.3953840883722747  +0.2957581208145406j  ,
+          0.4427410359357688  +0.4465462969959478j  ,
+         -0.09067453282761491 +0.5640013960056106j  ],
+        [-0.5427543454444135  +0.j                  ,
+          0.05497243001630322 -0.1241954144322904j  ,
+         -0.06802220053499675 +0.5372137093245434j  ,
+          0.4327322582872426  -0.45441000743718807j ],
+        [ 0.478931908404379   -0.j                  ,
+          0.18941886075062406 +0.670441225975174j   ,
+          0.11217879809210324 +0.024434632932612357j,
+          0.3614901872681235  -0.37602791824264514j ]]])),
+    mlir_module_text=r"""
+#loc1 = loc("operand")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f64>> loc("operand")) -> (tensor<2x4x4xcomplex<f64>> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x4x4xcomplex<f64>> {jax.result_info = "result[2]"}) {
+    %cst = stablehlo.constant dense<(0x7FF8000000000000,0x7FF8000000000000)> : tensor<complex<f64>> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc4)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_gesvd_ffi(%arg0) {mhlo.backend_config = {compute_uv = true, full_matrices = true, transposed = false}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 2, 0]> : tensor<3xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o, p], [i, q, r], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=4, p=4, q=4, r=4}, custom>} : (tensor<2x4x4xcomplex<f64>>) -> (tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x4x4xcomplex<f64>>, tensor<2x4x4xcomplex<f64>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#1, %4 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#2, %8 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<complex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#3, %12 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    return %10, %6, %14 : tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x4x4xcomplex<f64>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":621:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("svd"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#'+\x03\xed\x9f7\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03Uo\x0f\x0b/\x0b\x0bo\x0f\x0b\x0b\x17\x13\x0b\x13\x0b\x13\x0b\x0b\x0bO/\x1f#\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1fO/\x0b\x0bO\x05#\x0fg\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x17\x0f\x0f\x17\x0f\x0f\x0f\x01\x05\x0b\x0f\x033\x1b\x07\x17\x07\x07\x07\x0b\x0f\x0f\x0f\x07\x13\x1b\x1b\x1f\x13\x13\x13\x13\x13\x17\x13\x17\x13\x13\x02\x92\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xb6\t\x1b\x05%\x03\x07#U%]'\x7f\x05'\x05)\x05+\x1f#1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f)\x01\x1d-\x1f/\x11\x00\x00\x00\x00\x00\x00\x00\x00\x05\x03\x05\x01\x1f51\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x03\x039\r\x01#!\x03\x07?CG\r\x03-A\x1d/\r\x03-E\x1d1\r\x03-I\x1d3\x1d5\x1d7\x1f\x13!\x00\x00\x00\x00\x00\x00\xf8\x7f\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x15\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x17\t\x00\x00\x00\x00\r\x07W1Y1[3\x1d9\x1d;\x1d=\r\x03_a\x1d?\x1dA\x0b\x03\x1dC\x1dE\x03\x01\x03\x03)\x03\x03o\x15\x03\x01\x01\x01\x03\x0b)s))u\x1f%!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f'\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f3!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x15\t\x11\x11\x11\x11\x11\x11\x11\x11\x11\x03\x81\x0b\x87\x8d\x91\x97\x9d\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x07}\x93\x95\x11\x03\x19\x11\x03\x1d\x13\x07}\x99\x9b\x11\x03!\x11\x03%\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x11\x01)\x05\t\x11\r\x1d\x0b\x13\x03\r)\x01\x11)\x01\r)\x01\x19\x1b)\x03\t\x19)\x07\t\x05\x05\x07)\x07\t\x11\x11\x07\x11\x03\x05\x07\x05\t\x05)\x03\r\x0f)\x03\t\x0f)\x03\x05\x0f)\x03\x01\x0b)\x03\t\x07)\x05\t\x05\x07)\x03\x05\x0b)\x05\t\x11\x07)\x03\t\x0b)\x03\r\x0b\x04\xda\x02\x05\x01Q\x03\x07\x01\x07\x04\xb2\x02\x03\x01\x05\tP\x03\x03\x07\x04\x86\x02\x03/O\x03\x0b\x13\x00\x05B\x03\x05\x03\x13\x05B\x01\x07\x03\x15\x05B\x01\t\x03\x17\x0bG\x01!\x0b\x0b\x05\t\x05\x05\x1b\x03\x01\x03F\x01\r\x03\x1b\x03\x07\rF\x01\x0f\x03+\x05\x11\x13\x03F\x01\x11\x03-\x03\x15\x03F\x01\r\x03\t\x03\x05\x03F\x01\x13\x031\x03\x17\x07\x06\x01\x03\t\x07\x1b\x0b\x19\x03F\x01\x11\x03\x1d\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1f\x03\x1f\x07\x06\x01\x03\x05\x07#\r!\x03F\x01\x11\x03\x1d\x03\x15\x03F\x01\r\x03\x05\x03\x03\x03F\x01\x15\x03\x1f\x03'\x07\x06\x01\x03\x05\x07+\x0f)\x0f\x04\x03\x07%\x1d-\x06\x03\x01\x05\x01\x00\xbe\x07G)\x03\x05\x1f\x17\x1d\x17\x0f\x0b\x15\x15\x15!%3)s\x15\t\x11\x13%)9\x15\x17\x1f\x11\x15\x19)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00constant_v1\x00select_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00operand\x00svd\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00main\x00public\x00compute_uv\x00full_matrices\x00transposed\x00num_batch_dims\x001\x00\x00hipsolver_gesvd_ffi\x00\x08I\x17\x05#\x01\x0b7;=KM\x03O\x03Q\x03S\x11cegi3kmq\x03+\x05wy\x03/\x03{\x035",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_threefry2x32.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_threefry2x32.py
new file mode 100644
index 000000000000..7f1bb542ddcb
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_threefry2x32.py
@@ -0,0 +1,106 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import datetime
+import numpy as np
+array = np.array
+uint32 = np.uint32
+float32 = np.float32
+
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_05 = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hip_threefry2x32_ffi'],
+    serialized_date=datetime.date(2026, 2, 5),
+    inputs=(array([0, 42], dtype=uint32),),
+    expected_outputs=(array([[0.6878003   , 0.599579    , 0.2652017   , 0.24115169  ],
+       [0.76292205  , 0.28484797  , 0.040389538 , 0.0032066107]],
+      dtype=float32),),
+    mlir_module_text=r"""
+#loc = loc(unknown)
+#loc1 = loc("x")
+#loc2 = loc("/rocm-jax/jax/tests/export_back_compat_test.py":808:15)
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  sdy.mesh @empty_mesh = <[]> loc(#loc)
+  func.func public @main(%arg0: tensor<2xui32> loc("x")) -> (tensor<2x4xf32> {jax.result_info = "result"}) {
+    %cst = stablehlo.constant dense<1.000000e+00> : tensor<f32> loc(#loc)
+    %cst_0 = stablehlo.constant dense<0.000000e+00> : tensor<f32> loc(#loc)
+    %0 = sdy.sharding_constraint %arg0 <@empty_mesh, [{}]> : tensor<2xui32> loc(#loc)
+    %1 = call @_uniform(%0, %cst_0, %cst) : (tensor<2xui32>, tensor<f32>, tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    return %1 : tensor<2x4xf32> loc(#loc)
+  } loc(#loc)
+  func.func private @_uniform(%arg0: tensor<2xui32> loc(unknown), %arg1: tensor<f32> loc(unknown), %arg2: tensor<f32> loc(unknown)) -> tensor<2x4xf32> {
+    %cst = stablehlo.constant dense<1.000000e+00> : tensor<f32> loc(#loc16)
+    %c = stablehlo.constant dense<1065353216> : tensor<ui32> loc(#loc16)
+    %c_0 = stablehlo.constant dense<9> : tensor<ui32> loc(#loc16)
+    %0 = stablehlo.convert %arg1 : tensor<f32> loc(#loc6)
+    %1 = stablehlo.convert %arg2 : tensor<f32> loc(#loc6)
+    %2 = stablehlo.broadcast_in_dim %0, dims = [] : (tensor<f32>) -> tensor<1x1xf32> loc(#loc7)
+    %3 = stablehlo.broadcast_in_dim %1, dims = [] : (tensor<f32>) -> tensor<1x1xf32> loc(#loc7)
+    %4 = stablehlo.iota dim = 0 : tensor<8xui32> loc(#loc8)
+    %5 = stablehlo.slice %arg0 [0:1] : (tensor<2xui32>) -> tensor<1xui32> loc(#loc8)
+    %6 = stablehlo.reshape %5 : (tensor<1xui32>) -> tensor<ui32> loc(#loc8)
+    %7 = stablehlo.slice %arg0 [1:2] : (tensor<2xui32>) -> tensor<1xui32> loc(#loc8)
+    %8 = stablehlo.reshape %7 : (tensor<1xui32>) -> tensor<ui32> loc(#loc8)
+    %9 = stablehlo.slice %4 [0:4] : (tensor<8xui32>) -> tensor<4xui32> loc(#loc8)
+    %10 = stablehlo.slice %4 [4:8] : (tensor<8xui32>) -> tensor<4xui32> loc(#loc8)
+    %11:2 = call @threefry2x32(%6, %8, %9, %10) : (tensor<ui32>, tensor<ui32>, tensor<4xui32>, tensor<4xui32>) -> (tensor<4xui32>, tensor<4xui32>) loc(#loc8)
+    %12 = stablehlo.concatenate %11#0, %11#1, dim = 0 : (tensor<4xui32>, tensor<4xui32>) -> tensor<8xui32> loc(#loc8)
+    %13 = stablehlo.reshape %12 : (tensor<8xui32>) -> tensor<2x4xui32> loc(#loc8)
+    %14 = stablehlo.broadcast_in_dim %c_0, dims = [] : (tensor<ui32>) -> tensor<2x4xui32> loc(#loc9)
+    %15 = stablehlo.shift_right_logical %13, %14 : tensor<2x4xui32> loc(#loc9)
+    %16 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<ui32>) -> tensor<2x4xui32> loc(#loc10)
+    %17 = stablehlo.or %15, %16 : tensor<2x4xui32> loc(#loc10)
+    %18 = stablehlo.bitcast_convert %17 : (tensor<2x4xui32>) -> tensor<2x4xf32> loc(#loc11)
+    %19 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc12)
+    %20 = stablehlo.subtract %18, %19 : tensor<2x4xf32> loc(#loc12)
+    %21 = stablehlo.subtract %3, %2 : tensor<1x1xf32> loc(#loc12)
+    %22 = stablehlo.broadcast_in_dim %21, dims = [0, 1] : (tensor<1x1xf32>) -> tensor<2x4xf32> loc(#loc13)
+    %23 = stablehlo.multiply %20, %22 : tensor<2x4xf32> loc(#loc13)
+    %24 = stablehlo.broadcast_in_dim %2, dims = [0, 1] : (tensor<1x1xf32>) -> tensor<2x4xf32> loc(#loc14)
+    %25 = stablehlo.add %23, %24 : tensor<2x4xf32> loc(#loc14)
+    %26 = stablehlo.broadcast_in_dim %2, dims = [0, 1] : (tensor<1x1xf32>) -> tensor<2x4xf32> loc(#loc15)
+    %27 = stablehlo.maximum %26, %25 : tensor<2x4xf32> loc(#loc15)
+    return %27 : tensor<2x4xf32> loc(#loc16)
+  } loc(#loc16)
+  func.func private @threefry2x32(%arg0: tensor<ui32> loc("/rocm-jax/jax/tests/export_back_compat_test.py":808:15), %arg1: tensor<ui32> loc("/rocm-jax/jax/tests/export_back_compat_test.py":808:15), %arg2: tensor<4xui32> loc("/rocm-jax/jax/tests/export_back_compat_test.py":808:15), %arg3: tensor<4xui32> loc("/rocm-jax/jax/tests/export_back_compat_test.py":808:15)) -> (tensor<4xui32>, tensor<4xui32>) {
+    %0 = stablehlo.broadcast_in_dim %arg0, dims = [] : (tensor<ui32>) -> tensor<4xui32> loc(#loc3)
+    %1 = stablehlo.broadcast_in_dim %arg1, dims = [] : (tensor<ui32>) -> tensor<4xui32> loc(#loc3)
+    %2 = stablehlo.broadcast_in_dim %arg2, dims = [0] : (tensor<4xui32>) -> tensor<4xui32> loc(#loc3)
+    %3 = stablehlo.broadcast_in_dim %arg3, dims = [0] : (tensor<4xui32>) -> tensor<4xui32> loc(#loc3)
+    %4:2 = stablehlo.custom_call @hip_threefry2x32_ffi(%0, %1, %2, %3) {mhlo.backend_config = {}, operand_layouts = [dense<0> : tensor<1xindex>, dense<0> : tensor<1xindex>, dense<0> : tensor<1xindex>, dense<0> : tensor<1xindex>], result_layouts = [dense<0> : tensor<1xindex>, dense<0> : tensor<1xindex>]} : (tensor<4xui32>, tensor<4xui32>, tensor<4xui32>, tensor<4xui32>) -> (tensor<4xui32>, tensor<4xui32>) loc(#loc3)
+    return %4#0, %4#1 : tensor<4xui32>, tensor<4xui32> loc(#loc2)
+  } loc(#loc2)
+} loc(#loc)
+#loc3 = loc("threefry2x32")
+#loc4 = loc("jit(func)/jit(_uniform)"(#loc2))
+#loc5 = loc("jit(func)/jit"(#loc2))
+#loc6 = loc("convert_element_type"(#loc2))
+#loc7 = loc("broadcast_in_dim"(#loc2))
+#loc8 = loc(""(#loc2))
+#loc9 = loc("shift_right_logical"(#loc2))
+#loc10 = loc("or"(#loc2))
+#loc11 = loc("bitcast_convert_type"(#loc2))
+#loc12 = loc("sub"(#loc2))
+#loc13 = loc("mul"(#loc2))
+#loc14 = loc("add"(#loc2))
+#loc15 = loc("max"(#loc2))
+#loc16 = loc("jit:"(#loc5))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.13.1\x00\x01C\x07\x01\x05\t-\x01\x05\x0f\x13\x03\x05\x17\x1b\x05%\x1f#'+/37;?CGKOSW[_c\x03\xed\xa51\x01Y\x17\x07\x0f\x0f\x0f\x0f\x0f\x0b\x0f\x0f\x0f\x0f\x0f\x0f\x0f\x0f\x0f#\x0b\x0f\x0b\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x03\x07\x0f\x17\x13\x05G\x0f//\x0b\x0b/O\x0f\x0b\x0b\x0b\x1f\x0f/\x0b\x0f\x13\x0b\x0b\x0b\x0b\x17\x0b\x0b\x0b\x0b\x0b\x0b\x1b\x13\x1f\x1f//\x1f\x01\t\x13\x0b\x0f\x0f\x05)\x13\x17\x0f\x0f\x07\x13\x13\x17\x07\x07\x17\x13\x13\x17\x1f'\x13\x13\x07\x13\x02&\x06\x175\xa2\x0c\x1f\x1f\x1dA\x01\x1d/1\x1d7\x03\x1dK\x01\x11\x05\x05\x053\x1d=\x01\x1d?\x01\x1dC\x01\x1dE\x01\x1dM\x01\x1dO\x01\x1dQ\x01\x1dS\x03\x1dW\x01\x03\x07%')\r+\r\x055\x11\x03\x00\x057\x059\x05;\x05=\x1d3\x01\x05?\x05A\x05C\x03\x03;e\x05E\x05G\x05I\x05K\x05M\x05O\x1dI\x01\x05Q\x05S\x05U\x05W\x05Y\x05[\t\x0f\x05]\x05\x01\x01\rU\x03]\x01\x0b\x01\x01\x01\x1f)\x01\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f\x15\x11\x01\x00\x00\x00\x00\x00\x00\x00\r\x01\x03\x01\x1f\x15\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f/!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x03\x03e\x1d_\x1da\x1dC\x1f\r\t\x00\x00\x80?\x13\x19\x01\x1f\x15\x11\x04\x00\x00\x00\x00\x00\x00\x00##\x03\x03\x7f\r\x03\x81\x83\x1dc\x1de\x1dg\x1di\x03\x07eee#%#'\x0b\x03\x1dK\x1dk\x05\x01\x03\taaaa\x03\x05aa\x1f\x0f\t\x00\x00\x80?\x1f\x0f\t\t\x00\x00\x00\x1f\x15\x11\x02\x00\x00\x00\x00\x00\x00\x00\x1f\x15\x11\x08\x00\x00\x00\x00\x00\x00\x00\x1f\r\t\x00\x00\x00\x00\x1b\x03\t\x07\x01\t\x01\x02\x02\x01\n\x02)\x03\x11\x11)\x05\t\x11\x1b)\x01\x1b)\x01\x11%)\x03\t\x11)\x03\x05\x19)\x05\t\x11\x11\x1d\t)\x05\x05\x05\x1b)\x03!\x11)\x03\x05\x11\x11\x03\x13\x03\x0b\x11\x07\x13\r\r\x03\x0b\x11\t\x0f\x0f\t\t\x05\t\t)\x03\x01\x19)\x03\x05-\x13)\x03\t\x19\x04n\x06\x05\x03Q\x03#\x01\x07\x04F\x06\x03\x01\x11\x05@\x03\x03\x0fP\x03\x05\x07\x04q\x03\x0f\x1f\x03'\x1f\x00\x01\x06\x1f\x03\x01\x03\x01\x0bB\x03\x07\x03\r\x0bB\x03\t\x03\r\x07F\x03\x0b\x03\x01\x03\x03\x01\x06!\x03\x13\x03\t\x17F!\r\x03\x0b\x07\x0b\x07\x05\x11\x04\x03\x03\r\x0fP\x07\x0f\x07\x04\xf2\x03\x03G\x83\x07%\x19\x19\x00\x0bB\x07\x07\x03\r\x0bB\x07\x11\x03\x0f\x0bB\x07\x13\x03\x0f\x15\x06\x11\x03\r\x03\x03\x15\x06\x11\x03\r\x03\x05\tF\x13\x15\x03\x1d\x03\r\tF\x13\x15\x03\x1d\x03\x0f\x1dB\x05\x17\x03\x1f\rF\x05\x19\x03!\x03\x01\x13\x06\x05\x03\x0f\x03\x17\rF\x05\x1b\x03!\x03\x01\x13\x06\x05\x03\x0f\x03\x1b\rF\x05\x1d\x03\t\x03\x15\rF\x05\x1f\x03\t\x03\x15\x17F\x05!\x05\t\t\t\x19\x1d\x1f!\x1fF\x05\x17\x03\x1f\x05#%\x13\x06\x05\x03\x17\x03'\tF\x15\x15\x03\x17\x03\x0b!\x06\x15\x03\x17\x05)+\tF\x17\x15\x03\x17\x03\t#\x06\x17\x03\x17\x05-/%\x06G\x03\x0b\x031\tF\x0b\x15\x03\x0b\x03\x07\x19\x06\x0b\x03\x0b\x0535\x19\x06\x0b\x03\x1d\x05\x13\x11\tF\x19#\x03\x0b\x039'\x06\x19\x03\x0b\x057;\tF\x1b#\x03\x0b\x03\x11)\x06\x1b\x03\x0b\x05=?\tF\x1d#\x03\x0b\x03\x11+\x06\x1d\x03\x0b\x05CA\x11\x04\x07\x03E\x0fP\x01%\x07\x04\x81\x03\x15\x1b\t\x1f\x01\x1f\x01\x13\x01\x13\x01\x00\tF\t\x15\x03\t\x03\x01\tF\t\x15\x03\t\x03\x03\tF\t'\x03\t\x03\x05\tF\t'\x03\t\x03\x07\x1bG\t9)\x05\t\t\t\t\x0b\r\x0f\x11\x04\x01\x05\x11\x13\x06\x03\x01\x05\x01\x00n\x0bm+\x0f\x0b\x0f!\x11\x131\x05\t\t\t\t+\x07)\x03#+)\x1b_\x1d\x0b\x13%)9\x17\x17\x0f\x19'\r/\x1f\x11\x1f\x19\x11\x17\x17\x15\x11\x13\x19))\x0b\x0f7\x0b\t\x11builtin\x00sdy\x00vhlo\x00unrealized_conversion_cast\x00module\x00mesh\x00sharding_constraint\x00broadcast_in_dim_v1\x00constant_v1\x00slice_v1\x00func_v1\x00return_v1\x00reshape_v1\x00convert_v1\x00call_v1\x00subtract_v1\x00custom_call_v1\x00iota_v1\x00concatenate_v1\x00shift_right_logical_v1\x00or_v1\x00bitcast_convert_v1\x00multiply_v1\x00add_v1\x00maximum_v1\x00empty_mesh\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00jit:\x00jit(func)/jit\x00/rocm-jax/jax/tests/export_back_compat_test.py\x00threefry2x32\x00mhlo.backend_config\x00convert_element_type\x00broadcast_in_dim\x00\x00shift_right_logical\x00or\x00bitcast_convert_type\x00sub\x00mul\x00add\x00max\x00x\x00jit(func)/jit(_uniform)\x00_uniform\x00private\x00jax.result_info\x00result\x00main\x00public\x00hip_threefry2x32_ffi\x00\x08\x91+\x05[\x01\x05Y\x0f\x0bm{}\x85\x87\x03u\x03\xa3\x03[\x03o\x0b\x89\x8bmoq\x03\x9b\x03\x9d\x03_\x03w\x07cic\x07\x9fcc\x07yic\x07\xa1yc\x03s\x03k\x0bg\x8dgsq\x03i\x11\x8f\x91\x93g\x95\x97g\x99",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/internal_test_util/export_back_compat_test_data/rocm_tridiagonal_hipsolver_sytrd.py b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_tridiagonal_hipsolver_sytrd.py
new file mode 100644
index 000000000000..7e7caf653932
--- /dev/null
+++ b/jax/_src/internal_test_util/export_back_compat_test_data/rocm_tridiagonal_hipsolver_sytrd.py
@@ -0,0 +1,383 @@
+# Copyright 2026 The JAX Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# pyrefly: ignore-errors
+# ruff: noqa
+
+import datetime
+import numpy as np
+
+array = np.array
+float32 = np.float32
+complex64 = np.complex64
+
+data_2026_02_04 = {}
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["f32"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_sytrd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 3.517052  ,  7.324363  ,  0.17285964,  6.048615  ],
+        [ 2.634785  , -1.5823158 ,  5.00702   , -9.524221  ],
+        [-9.572195  , -1.6510249 , -7.1607885 ,  0.27307302],
+        [-3.616519  ,  9.1224375 ,  8.262698  , -9.876812  ]],
+
+       [[-9.066103  ,  0.91170084, -9.563753  , -2.7974956 ],
+        [ 1.9257098 , -3.1175334 ,  3.5549293 , -7.2144737 ],
+        [-0.92147785,  5.217206  ,  3.3423822 ,  3.6858516 ],
+        [ 4.3601804 ,  6.6677866 , -5.461852  , -6.232803  ]]],
+      dtype=float32),),
+    expected_outputs=(array([[[  3.517052  ,   7.324363  ,   0.17285964,   6.048615  ],
+        [-10.566372  ,  -2.8193984 ,   5.00702   ,  -9.524221  ],
+        [ -0.7251028 ,  -3.1670432 ,  -4.499419  ,   0.27307302],
+        [ -0.27395472,   0.9202458 ,  11.912114  , -11.301102  ]],
+
+       [[ -9.066103  ,   0.91170084,  -9.563753  ,  -2.7974956 ],
+        [ -4.854756  ,   0.4297719 ,   3.5549293 ,  -7.2144737 ],
+        [ -0.13590185,  -5.4479847 , -12.038837  ,   3.6858516 ],
+        [  0.6430503 ,   0.5523631 ,   3.6679316 ,   5.6011105 ]]],
+      dtype=float32), array([[  3.517052 ,  -2.8193984,  -4.499419 , -11.301102 ],
+       [ -9.066103 ,   0.4297719, -12.038837 ,   5.6011105]],
+      dtype=float32), array([[-10.566372 ,  -3.1670432,  11.912114 ],
+       [ -4.854756 ,  -5.4479847,   3.6679316]], dtype=float32), array([[1.2493557, 1.0829235, 0.       ],
+       [1.3966646, 1.5324438, 0.       ]], dtype=float32)),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf32> loc("x")) -> (tensor<2x4x4xf32> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x3xf32> {jax.result_info = "result[2]"}, tensor<2x3xf32> {jax.result_info = "result[3]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_sytrd_ffi(%arg0) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o], [i, p], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=3, p=3}, custom>} : (tensor<2x4x4xf32>) -> (tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x3xf32>, tensor<2x3xf32>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4x4xf32> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#0, %4 : tensor<2x4x4xi1>, tensor<2x4x4xf32> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#1, %8 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x3xf32> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#2, %12 : tensor<2x3xi1>, tensor<2x3xf32> loc(#loc4)
+    %15 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x3xf32> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %15, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %18 = stablehlo.select %17, %0#3, %16 : tensor<2x3xi1>, tensor<2x3xf32> loc(#loc4)
+    return %6, %10, %14, %18 : tensor<2x4x4xf32>, tensor<2x4xf32>, tensor<2x3xf32>, tensor<2x3xf32> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":764:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("tridiagonal"(#loc3))
+""",
+    mlir_module_serialized=b'ML\xefR\rStableHLO_v1.12.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#\'+\x03\xe7\x997\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03S\x0f\x0b/OOo\x0f\x0b\x0b\x1b\x13\x0b\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f\x1f\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1f/\x0b\x0bo\x05\x1f\x0f_\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x13\x0f\x13\x0f\x0f\x01\x05\x0b\x0f\x033\x17\x1b\x07\x07\x17\x07\x07\x17\x0f\x0f\x07\x13\x17#\x13\x13\x13\x13\x13\x1b\x13\x1b\x13\x17\x13\x02"\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xf2\x0b\x1b\x05%\x03\x07#U%[\'}\x05\'\x05)\x05+\x1f\'\x01\x1d-\x1f-\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f#!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f5!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f!1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#\x1f\x03\t=AEI\r\x03+?\x1d/\r\x03+C\x1d1\r\x03+G\x1d3\r\x03+K\x1d5\x1d7\x1d9\x1f\x15\t\x00\x00\xc0\x7f\x1f\x17\t\x00\x00\x00\x00\r\x03WY\x1d;\x05\x03\r\x03]_\x1d=\x1d?\x0b\x03\x1dA\x1dC\x03\x01\x05\x01\x03\x033\x03\x03o\x15\x03\x01\x01\x01\x03\x0b3///s\x1f%\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f11\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x11\t\x11\x11\x11\x11\x11\r\r\x03\x7f\x0b\x85\x8b\x8f\x93\x97\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x05{\x91\x11\x03\x19\x13\x05{\x95\x11\x03\x1d\x13\x03{\x01\t\x01\x02\x02)\x05\t\r\x0b)\x07\t\x11\x11\x0b\x01\t)\x05\t\x11\x0b\x1d\x13)\x05\t\x05\t)\x01\x0b)\x01\x19\x1b)\x03\t\x19)\x05\t\r\t\x11\x03\x07\t\x07\r\x05\x05)\x03\r\x11)\x03\t\x11)\x03\x05\x11)\x03\x01\x0f)\x03\t\t)\x07\t\x05\x05\t)\x03\x05\x0f)\x07\t\x11\x11\t)\x03\r\x0f)\x05\t\x11\t)\x03\t\x0f\x04J\x03\x05\x01Q\x03\x07\x01\x07\x04"\x03\x03\x01\x05\tP\x03\x03\x07\x04\xf6\x02\x035[\x03\x0f\x13\x00\x07B\x03\x05\x03\x15\x07B\x01\x07\x03\x17\x0bG\x01!\t\x0b\x07\r\x05\x05\x1b\x03\x01\x03F\x01\x0b\x03\x1b\x03\x05\rF\x01\r\x03)\x05\x0f\x11\x03F\x01\x0f\x03+\x03\x13\x03F\x01\x0b\x03\x07\x03\x03\x03F\x01\x11\x03/\x03\x15\x05\x06\x01\x03\x07\x07\x19\x07\x17\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\r\x03\x03\x03F\x01\x13\x033\x03\x1d\x05\x06\x01\x03\r\x07!\t\x1f\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1d\x03%\x05\x06\x01\x03\x05\x07)\x0b\'\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1d\x03-\x05\x06\x01\x03\x05\x071\r/\x0f\x04\x03\t\x1b#+3\x06\x03\x01\x05\x01\x00r\x07E)\x03\x05\x1f\r\x0f\x0b\x15\x15\x15\x15!%3)s\x15\x19\x05\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00x\x00tridiagonal\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00result[3]\x00main\x00public\x00lower\x00num_batch_dims\x001\x00\x00hipsolver_sytrd_ffi\x00\x08E\x15\x05#\x01\x0b59;MO\x03Q\x03S\x11acegikmq\x03)\x05uw\x03-\x03y\x031',
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["f64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_sytrd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 7.035349169825569  ,  1.484998381764381  ,
+          8.018528146255836  , -4.530334856568022  ],
+        [ 9.878251523361389  ,  4.093041770635891  ,
+         -9.877581529120809  ,  6.311932164866882  ],
+        [-7.49184464571486   , -6.59107026401994   ,
+          1.1241396190859394 ,  7.700650796628231  ],
+        [ 4.63003758138132   , -0.04006710103875122,
+          1.3302998218441715 ,  1.4217252024769529 ]],
+
+       [[ 9.87349262986562   , -0.7610867121172475 ,
+         -5.8439127140031255 ,  7.363308757108598  ],
+        [-8.602243503020022  ,  1.0149675283651831 ,
+          6.189214809971542  ,  3.8755163293613073 ],
+        [-7.2550065371548556 , -0.8199129790471194 ,
+          3.3263222105883834 ,  9.414314634323905  ],
+        [ 9.50720541720979   ,  8.190248152372803  ,
+          6.1792809430264235 , -3.395527362127919  ]]]),),
+    expected_outputs=(array([[[  7.035349169825569  ,   1.484998381764381  ,
+           8.018528146255836  ,  -4.530334856568022  ],
+        [-13.234229760712234  ,   7.836821389949192  ,
+          -9.877581529120809  ,   6.311932164866882  ],
+        [ -0.32414713736847234,  -3.231749037742704  ,
+           2.91526168804856   ,   7.700650796628231  ],
+        [  0.20032628796856145,   0.8955299566988397 ,
+           1.1712939642530218 ,  -4.113176485798968  ]],
+
+       [[  9.87349262986562   ,  -0.7610867121172475 ,
+          -5.8439127140031255 ,   7.363308757108598  ],
+        [ 14.731621363055496  , -10.83373801371347   ,
+           6.189214809971542  ,   3.8755163293613073 ],
+        [  0.31092176880233485,   4.1168822837917665 ,
+           8.31687010427185   ,   9.414314634323905  ],
+        [ -0.4074423792104866 ,   0.5649683724391054 ,
+          -1.2386684521243119 ,   3.4626302862672684 ]]]), array([[  7.035349169825569 ,   7.836821389949192 ,   2.91526168804856  ,
+         -4.113176485798968 ],
+       [  9.87349262986562  , -10.83373801371347  ,   8.31687010427185  ,
+          3.4626302862672684]]), array([[-13.234229760712234 ,  -3.231749037742704 ,   1.1712939642530218],
+       [ 14.731621363055496 ,   4.1168822837917665,  -1.2386684521243119]]), array([[1.7464168071712372, 1.109893986970275 , 0.                ],
+       [1.5839305322218669, 1.51608268641105  , 0.                ]])),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xf64> loc("x")) -> (tensor<2x4x4xf64> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x3xf64> {jax.result_info = "result[2]"}, tensor<2x3xf64> {jax.result_info = "result[3]"}) {
+    %cst = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_sytrd_ffi(%arg0) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o], [i, p], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=3, p=3}, custom>} : (tensor<2x4x4xf64>) -> (tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x3xf64>, tensor<2x3xf64>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4x4xf64> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#0, %4 : tensor<2x4x4xi1>, tensor<2x4x4xf64> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#1, %8 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x3xf64> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#2, %12 : tensor<2x3xi1>, tensor<2x3xf64> loc(#loc4)
+    %15 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x3xf64> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %15, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %18 = stablehlo.select %17, %0#3, %16 : tensor<2x3xi1>, tensor<2x3xf64> loc(#loc4)
+    return %6, %10, %14, %18 : tensor<2x4x4xf64>, tensor<2x4xf64>, tensor<2x3xf64>, tensor<2x3xf64> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":764:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("tridiagonal"(#loc3))
+""",
+    mlir_module_serialized=b'ML\xefR\rStableHLO_v1.12.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#\'+\x03\xe7\x997\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03S\x0f\x0b/OOo\x0f\x0b\x0b\x1b\x13\x0b\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/\x1f\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1f/\x0b\x0bo\x05\x1f\x0f_\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x13\x0f\x13\x0f\x0f\x01\x05\x0b\x0f\x033\x17\x1b\x07\x07\x17\x07\x07\x17\x0f\x0f\x07\x13\x17#\x13\x13\x13\x13\x13\x1b\x13\x1b\x13\x17\x13\x022\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xf2\x0b\x1b\x05%\x03\x07#U%[\'}\x05\'\x05)\x05+\x1f\'\x01\x1d-\x1f-\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f#!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f5!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f!1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#\x1f\x03\t=AEI\r\x03+?\x1d/\r\x03+C\x1d1\r\x03+G\x1d3\r\x03+K\x1d5\x1d7\x1d9\x1f\x15\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x17\t\x00\x00\x00\x00\r\x03WY\x1d;\x05\x03\r\x03]_\x1d=\x1d?\x0b\x03\x1dA\x1dC\x03\x01\x05\x01\x03\x033\x03\x03o\x15\x03\x01\x01\x01\x03\x0b3///s\x1f%\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f11\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x11\t\x11\x11\x11\x11\x11\r\r\x03\x7f\x0b\x85\x8b\x8f\x93\x97\x01\x01\x01\x01\x01\x13\x07{\x81\x83\x11\x03\x05\x11\x03\t\x13\x07{\x87\x89\x11\x03\r\x11\x03\x11\x13\x05{\x8d\x11\x03\x15\x13\x05{\x91\x11\x03\x19\x13\x05{\x95\x11\x03\x1d\x13\x03{\x01\t\x01\x02\x02)\x05\t\r\x0b)\x07\t\x11\x11\x0b\x01\x0b)\x05\t\x11\x0b\x1d\x13)\x05\t\x05\t)\x01\x0b)\x01\x19\x1b)\x03\t\x19)\x05\t\r\t\x11\x03\x07\t\x07\r\x05\x05)\x03\r\x11)\x03\t\x11)\x03\x05\x11)\x03\x01\x0f)\x03\t\t)\x07\t\x05\x05\t)\x03\x05\x0f)\x07\t\x11\x11\t)\x03\r\x0f)\x05\t\x11\t)\x03\t\x0f\x04J\x03\x05\x01Q\x03\x07\x01\x07\x04"\x03\x03\x01\x05\tP\x03\x03\x07\x04\xf6\x02\x035[\x03\x0f\x13\x00\x07B\x03\x05\x03\x15\x07B\x01\x07\x03\x17\x0bG\x01!\t\x0b\x07\r\x05\x05\x1b\x03\x01\x03F\x01\x0b\x03\x1b\x03\x05\rF\x01\r\x03)\x05\x0f\x11\x03F\x01\x0f\x03+\x03\x13\x03F\x01\x0b\x03\x07\x03\x03\x03F\x01\x11\x03/\x03\x15\x05\x06\x01\x03\x07\x07\x19\x07\x17\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\r\x03\x03\x03F\x01\x13\x033\x03\x1d\x05\x06\x01\x03\r\x07!\t\x1f\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1d\x03%\x05\x06\x01\x03\x05\x07)\x0b\'\x03F\x01\x0f\x03\x13\x03\x13\x03F\x01\x0b\x03\x05\x03\x03\x03F\x01\x13\x03\x1d\x03-\x05\x06\x01\x03\x05\x071\r/\x0f\x04\x03\t\x1b#+3\x06\x03\x01\x05\x01\x00r\x07E)\x03\x05\x1f\r\x0f\x0b\x15\x15\x15\x15!%3)s\x15\x19\x05\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00x\x00tridiagonal\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00result[3]\x00main\x00public\x00lower\x00num_batch_dims\x001\x00\x00hipsolver_sytrd_ffi\x00\x08E\x15\x05#\x01\x0b59;MO\x03Q\x03S\x11acegikmq\x03)\x05uw\x03-\x03y\x031',
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["c64"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_sytrd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[-4.489628   -1.9558684j , -8.210964   +7.1605806j ,
+         -1.546595   +3.65443j   , -0.42576104 +4.1540704j ],
+        [ 1.2732816  +4.58178j   , -4.3097434  +1.9485371j ,
+         -7.340492   -4.6551476j ,  0.51207775 -1.5729961j ],
+        [-1.6132524  +9.396326j  , -8.6812315  +0.57193804j,
+         -4.0404854  +5.580052j  ,  7.198982   -7.8558793j ],
+        [ 5.0999346  -5.281331j  , -0.20722196 -8.790846j  ,
+         -8.34889    +5.4901276j ,  1.5386024  -7.8014874j ]],
+
+       [[-3.7505336  +4.8419423j , -6.9383445  -6.1508617j ,
+         -5.090222   +8.55102j   , -2.8638835  -2.8485649j ],
+        [ 0.39724413 -9.112975j  ,  5.8403125  -4.28845j   ,
+         -5.876785   +5.7571j    ,  0.81345195 -8.658585j  ],
+        [-9.730914   -4.9138327j ,  4.2365274  +0.08631961j,
+         -0.020483766+2.811939j  , -3.4501777  -7.5303087j ],
+        [-6.0442333  +6.9959636j , -9.286192   +0.29182708j,
+          3.5280166  +8.255178j  ,  5.123959   -3.4980805j ]]],
+      dtype=complex64),),
+    expected_outputs=(array([[[-4.4896278e+00+0.j        , -8.2109642e+00+7.1605806j ,
+         -1.5465950e+00+3.65443j   , -4.2576104e-01+4.1540704j ],
+        [-1.2938673e+01+0.j        , -1.0068893e-02+0.j        ,
+         -7.3404918e+00-4.6551476j ,  5.1207775e-01-1.5729961j ],
+        [ 9.0255260e-02+0.63205916j, -1.2945498e+01+0.j        ,
+          2.4201365e+00+0.j        ,  7.1989818e+00-7.8558793j ],
+        [ 2.1653868e-01-0.44142157j,  5.5885059e-03+0.24181136j,
+          7.6457381e+00+0.j        , -9.2216911e+00+0.j        ]],
+
+       [[-3.7505336e+00+0.j        , -6.9383445e+00-6.1508617j ,
+         -5.0902219e+00+8.55102j   , -2.8638835e+00-2.8485649j ],
+        [-1.6956322e+01+0.j        ,  3.5084348e+00+0.j        ,
+         -5.8767848e+00+5.7571j    ,  8.1345195e-01-8.658585j  ],
+        [-3.2297978e-01-0.45276803j,  8.2233658e+00+0.j        ,
+          1.4219294e+00+0.j        , -3.4501777e+00-7.5303087j ],
+        [-4.3895450e-01+0.1726321j , -7.5097442e-02-0.18226749j,
+          1.1053572e+01+0.j        ,  6.0134225e+00+0.j        ]]],
+      dtype=complex64), array([[-4.489628   , -0.010068893,  2.4201365  , -9.221691   ],
+       [-3.7505336  ,  3.5084348  ,  1.4219294  ,  6.0134225  ]],
+      dtype=float32), array([[-12.938673, -12.945498,   7.645738],
+       [-16.956322,   8.223366,  11.053572]], dtype=float32), array([[1.0984089+0.35411513j, 1.7074363+0.55748767j,
+        1.634002 -0.77333146j],
+       [1.0234275-0.5374382j , 1.904741 +0.19733457j,
+        1.2192558+0.9756674j ]], dtype=complex64)),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f32>> loc("x")) -> (tensor<2x4x4xcomplex<f32>> {jax.result_info = "result[0]"}, tensor<2x4xf32> {jax.result_info = "result[1]"}, tensor<2x3xf32> {jax.result_info = "result[2]"}, tensor<2x3xcomplex<f32>> {jax.result_info = "result[3]"}) {
+    %cst = stablehlo.constant dense<0x7FC00000> : tensor<f32> loc(#loc)
+    %cst_0 = stablehlo.constant dense<(0x7FC00000,0x7FC00000)> : tensor<complex<f32>> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_sytrd_ffi(%arg0) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o], [i, p], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=3, p=3}, custom>} : (tensor<2x4x4xcomplex<f32>>) -> (tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x3xf32>, tensor<2x3xcomplex<f32>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f32>>) -> tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#0, %4 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f32>> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x4xf32> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#1, %8 : tensor<2x4xi1>, tensor<2x4xf32> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f32>) -> tensor<2x3xf32> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#2, %12 : tensor<2x3xi1>, tensor<2x3xf32> loc(#loc4)
+    %15 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f32>>) -> tensor<2x3xcomplex<f32>> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %15, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %18 = stablehlo.select %17, %0#3, %16 : tensor<2x3xi1>, tensor<2x3xcomplex<f32>> loc(#loc4)
+    return %6, %10, %14, %18 : tensor<2x4x4xcomplex<f32>>, tensor<2x4xf32>, tensor<2x3xf32>, tensor<2x3xcomplex<f32>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":764:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("tridiagonal"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.12.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#'+\x03\xef\x9b=\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03U\x0f\x0b/OOo\x0f\x0b\x0b\x1b\x13\x0b\x13\x0b\x13\x0b\x13\x0b\x0b\x0b\x1f/\x1f\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1f/\x0b\x0bo\x05\x1f\x0f_\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x13\x0f\x13\x0f\x0f\x01\x05\x0b\x0f\x039\x1b\x07\x07\x17\x17\x17\x07\x0b\x07\x17\x0f\x0f\x0f\x07\x13\x17#\x13\x13\x13\x13\x13\x1b\x13\x1b\x13\x17\x13\x02v\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xf2\x0b\x1b\x05%\x03\x07#W%]'\x7f\x05'\x05)\x05+\x1f-\x01\x1d-\x1f3\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f;!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f'1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#%\x03\t=AEI\r\x03+?\x1d/\r\x03+C\x1d1\r\x03+G\x1d3\r\x03+K\x1d5\x1d7\x1d9\x1f\x19\t\x00\x00\xc0\x7f\x1f\x1b\x11\x00\x00\xc0\x7f\x00\x00\xc0\x7f\x1f\x1d\t\x00\x00\x00\x00\r\x03Y[\x1d;\x05\x03\r\x03_a\x1d=\x1d?\x0b\x03\x1dA\x1dC\x03\x01\x05\x01\x03\x033\x03\x03q\x15\x03\x01\x01\x01\x03\x0b3///u\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f71\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x11\t\x11\x11\x11\x11\x11\r\r\x03\x81\x0b\x87\x8d\x91\x95\x99\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x05}\x93\x11\x03\x19\x13\x05}\x97\x11\x03\x1d\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x13\x01\t)\x05\t\x11\t)\x05\t\r\t)\x05\t\r\x13\x1d\x03\t\x13)\x05\t\x05\x07)\x01\t)\x01\x13)\x01\x1f\x1b)\x03\t\x1f)\x05\t\r\x07\x11\x03\x05\t\x05\x0b\r\x0f)\x03\r\x15)\x03\t\x15)\x03\x05\x15)\x03\x01\x11)\x03\t\x07)\x07\t\x05\x05\x07)\x03\x05\x11)\x07\t\x11\x11\x07)\x03\r\x11)\x05\t\x11\x07)\x03\t\x11\x04b\x03\x05\x01Q\x03\x07\x01\x07\x04:\x03\x03\x01\x05\tP\x03\x03\x07\x04\x0e\x03\x037_\x03\x0b\x13\x00\x07B\x03\x05\x03\x19\x07B\x03\x07\x03\x1b\x07B\x01\t\x03\x1d\x0bG\x01!\x0b\x0b\x05\x0b\r\x0f!\x03\x01\x03F\x01\r\x03!\x03\x07\rF\x01\x0f\x03/\x05\x11\x13\x03F\x01\x11\x031\x03\x15\x03F\x01\r\x03\x05\x03\x05\x03F\x01\x13\x035\x03\x17\x05\x06\x01\x03\x05\x07\x1b\t\x19\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\x0b\x03\x03\x03F\x01\x15\x039\x03\x1f\x05\x06\x01\x03\x0b\x07#\x0b!\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\r\x03\x03\x03F\x01\x15\x03#\x03'\x05\x06\x01\x03\r\x07+\r)\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\x0f\x03\x05\x03F\x01\x15\x03#\x03/\x05\x06\x01\x03\x0f\x073\x0f1\x0f\x04\x03\t\x1d%-5\x06\x03\x01\x05\x01\x00r\x07E)\x03\x05\x1f\r\x0f\x0b\x15\x15\x15\x15!%3)s\x15\x19\x05\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00x\x00tridiagonal\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00result[3]\x00main\x00public\x00lower\x00num_batch_dims\x001\x00\x00hipsolver_sytrd_ffi\x00\x08I\x17\x05#\x01\x0b59;MO\x03Q\x03S\x03U\x11cegikmos\x03)\x05wy\x03-\x03{\x031",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
+
+# Pasted from the test output (see export_back_compat_test_util.py module docstring)
+data_2026_02_04["c128"] = dict(
+    testdata_version=1,
+    platform='rocm',
+    custom_call_targets=['hipsolver_sytrd_ffi'],
+    serialized_date=datetime.date(2026, 2, 4),
+    inputs=(array([[[ 9.636811089187177  -5.5483943045483075j ,
+         -0.7013595675721049 +9.280476944337625j  ,
+          6.277881297993044  +9.583766011933022j  ,
+          1.5176610958978305 -6.759859673083863j  ],
+        [-0.3885087082062455 +0.5895084066496903j ,
+          6.964207617750493  +2.527176875608994j  ,
+          5.538066653380939  -7.747050813954031j  ,
+         -8.175356094532935  -4.1980578398170625j ],
+        [ 1.0279072759095182 +3.4596945172274793j ,
+          8.950471968823695  -2.304755231947957j  ,
+          5.421547479246534  +4.581737009453139j  ,
+         -4.897557901418952  +3.5957170627858677j ],
+        [ 8.035494168741337  +3.544344260400223j  ,
+          9.975999717803504  +6.346230772630385j  ,
+          4.740819751509449  +2.756160834913411j  ,
+         -3.4198929512643    +0.8932196515922382j ]],
+
+       [[ 9.53448278116884   -2.772437604863242j  ,
+         -6.107167742373565  +1.7555826763979088j ,
+          0.8426783600121581 -1.4969268724718319j ,
+         -7.791881813923409  +2.569663008343241j  ],
+        [-0.23022736962356838+5.931740292160859j  ,
+          0.19505301380201168+5.199989565595661j  ,
+          1.6452867779721974 +7.611177005682343j  ,
+          6.421835818993721  +7.956773248634036j  ],
+        [ 4.514416045392142  +0.24019209063138547j,
+          2.7074137337969297 +7.481936712692281j  ,
+         -4.349739517583451  -7.480660445679543j  ,
+         -4.16307684864292   -9.500272650463366j  ],
+        [-7.187003466047763  -4.305905192850112j  ,
+         -2.790206322615103  -1.8113900331362842j ,
+          3.92920022932449   +4.618786545064131j  ,
+          8.34362192900138   -7.169529907261547j  ]]]),),
+    expected_outputs=(array([[[  9.636811089187177  +0.j                 ,
+          -0.7013595675721049 +9.280476944337625j  ,
+           6.277881297993044  +9.583766011933022j  ,
+           1.5176610958978305 -6.759859673083863j  ],
+        [  9.52134872118296   +0.j                 ,
+          -2.0750820650530635 +0.j                 ,
+           5.538066653380939  -7.747050813954031j  ,
+          -8.175356094532935  -4.1980578398170625j ],
+        [ -0.08266529223728494-0.3540339936208098j ,
+         -12.876186833321775  +0.j                 ,
+          12.221606003386894  +0.j                 ,
+          -4.897557901418952  +3.5957170627858677j ],
+        [ -0.7867983987261797 -0.4044627845907229j ,
+           0.3731807938459702 +0.29875225015983237j,
+          -7.533551178724111  +0.j                 ,
+          -1.1806617926011036 +0.j                 ]],
+
+       [[  9.53448278116884   +0.j                 ,
+          -6.107167742373565  +1.7555826763979088j ,
+           0.8426783600121581 -1.4969268724718319j ,
+          -7.791881813923409  +2.569663008343241j  ],
+        [ 11.219181358613488  +0.j                 ,
+          -2.758824792396279  +0.j                 ,
+           1.6452867779721974 +7.611177005682343j  ,
+           6.421835818993721  +7.956773248634036j  ],
+        [ -0.3022871001148797 -0.17758826769531866j,
+          11.759659907134653  +0.j                 ,
+           3.455913613847388  +0.j                 ,
+          -4.16307684864292   -9.500272650463366j  ],
+        [  0.34127558839537164+0.5528899789954966j ,
+           0.29825641618428594+0.3179804603998629j ,
+          -1.1276010073572176 +0.j                 ,
+           3.4918466037688343 +0.j                 ]]]), array([[ 9.636811089187177 , -2.0750820650530635, 12.221606003386894 ,
+        -1.1806617926011036],
+       [ 9.53448278116884  , -2.758824792396279 ,  3.455913613847388 ,
+         3.4918466037688343]]), array([[  9.52134872118296  , -12.876186833321775 ,  -7.533551178724111 ],
+       [ 11.219181358613488 ,  11.759659907134653 ,  -1.1276010073572176]]), array([[1.0408039574626542-0.06191438040055822j,
+        1.4371627190112481+0.5236740849282041j ,
+        1.5581940209289933-0.8297104525068505j ],
+       [1.0205208706646687-0.5287141817710955j ,
+        1.6435963381260008-0.24653387207157834j,
+        1.809618408219541 -0.586956585338351j  ]])),
+    mlir_module_text=r"""
+#loc1 = loc("x")
+module @jit_func attributes {jax.uses_shape_polymorphism = false, mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
+  func.func public @main(%arg0: tensor<2x4x4xcomplex<f64>> loc("x")) -> (tensor<2x4x4xcomplex<f64>> {jax.result_info = "result[0]"}, tensor<2x4xf64> {jax.result_info = "result[1]"}, tensor<2x3xf64> {jax.result_info = "result[2]"}, tensor<2x3xcomplex<f64>> {jax.result_info = "result[3]"}) {
+    %cst = stablehlo.constant dense<0x7FF8000000000000> : tensor<f64> loc(#loc)
+    %cst_0 = stablehlo.constant dense<(0x7FF8000000000000,0x7FF8000000000000)> : tensor<complex<f64>> loc(#loc)
+    %c = stablehlo.constant dense<0> : tensor<i32> loc(#loc4)
+    %0:5 = stablehlo.custom_call @hipsolver_sytrd_ffi(%arg0) {mhlo.backend_config = {lower = true}, mhlo.frontend_attributes = {num_batch_dims = "1"}, operand_layouts = [dense<[1, 2, 0]> : tensor<3xindex>], output_operand_aliases = [#stablehlo.output_operand_alias<output_tuple_indices = [0], operand_index = 0, operand_tuple_indices = []>], result_layouts = [dense<[1, 2, 0]> : tensor<3xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<[1, 0]> : tensor<2xindex>, dense<0> : tensor<1xindex>], sdy.sharding_rule = #sdy.op_sharding_rule<([i, j, k])->([i, l, m], [i, n], [i, o], [i, p], [i]) {i=2, j=4, k=4, l=4, m=4, n=4, o=3, p=3}, custom>} : (tensor<2x4x4xcomplex<f64>>) -> (tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x3xf64>, tensor<2x3xcomplex<f64>>, tensor<2xi32>) loc(#loc4)
+    %1 = stablehlo.broadcast_in_dim %c, dims = [] : (tensor<i32>) -> tensor<2xi32> loc(#loc4)
+    %2 = stablehlo.compare  EQ, %0#4, %1,  SIGNED : (tensor<2xi32>, tensor<2xi32>) -> tensor<2xi1> loc(#loc4)
+    %3 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1x1xi1> loc(#loc4)
+    %4 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f64>>) -> tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %5 = stablehlo.broadcast_in_dim %3, dims = [0, 1, 2] : (tensor<2x1x1xi1>) -> tensor<2x4x4xi1> loc(#loc4)
+    %6 = stablehlo.select %5, %0#0, %4 : tensor<2x4x4xi1>, tensor<2x4x4xcomplex<f64>> loc(#loc4)
+    %7 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %8 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x4xf64> loc(#loc4)
+    %9 = stablehlo.broadcast_in_dim %7, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x4xi1> loc(#loc4)
+    %10 = stablehlo.select %9, %0#1, %8 : tensor<2x4xi1>, tensor<2x4xf64> loc(#loc4)
+    %11 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %12 = stablehlo.broadcast_in_dim %cst, dims = [] : (tensor<f64>) -> tensor<2x3xf64> loc(#loc4)
+    %13 = stablehlo.broadcast_in_dim %11, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %14 = stablehlo.select %13, %0#2, %12 : tensor<2x3xi1>, tensor<2x3xf64> loc(#loc4)
+    %15 = stablehlo.broadcast_in_dim %2, dims = [0] : (tensor<2xi1>) -> tensor<2x1xi1> loc(#loc4)
+    %16 = stablehlo.broadcast_in_dim %cst_0, dims = [] : (tensor<complex<f64>>) -> tensor<2x3xcomplex<f64>> loc(#loc4)
+    %17 = stablehlo.broadcast_in_dim %15, dims = [0, 1] : (tensor<2x1xi1>) -> tensor<2x3xi1> loc(#loc4)
+    %18 = stablehlo.select %17, %0#3, %16 : tensor<2x3xi1>, tensor<2x3xcomplex<f64>> loc(#loc4)
+    return %6, %10, %14, %18 : tensor<2x4x4xcomplex<f64>>, tensor<2x4xf64>, tensor<2x3xf64>, tensor<2x3xcomplex<f64>> loc(#loc)
+  } loc(#loc)
+} loc(#loc)
+#loc = loc(unknown)
+#loc2 = loc("/workspace/rocm-jax/jax/tests/export_back_compat_test.py":764:13)
+#loc3 = loc("jit(func)"(#loc2))
+#loc4 = loc("tridiagonal"(#loc3))
+""",
+    mlir_module_serialized=b"ML\xefR\rStableHLO_v1.12.1\x00\x01#\x07\x01\x05\t\x11\x01\x03\x0f\x03\x0f\x13\x17\x1b\x1f#'+\x03\xef\x9b=\x01)\x0f\x07\x0f#\x0b\x0f\x0b\x0b\x0b\x0f\x0b\x0b\x0f\x0b\x17\x0b#\x0b\x0b\x0b\x03U\x0f\x0b/OOo\x0f\x0b\x0b\x1b\x13\x0b\x13\x0b\x13\x0b\x13\x0b\x0b\x0b/O\x1f\x13\x0b\x0b\x13\x0b\x0b\x0b\x0b\x0b\x0b\x0b\x0f\x0f\x17\x1f/\x0b\x0bo\x05\x1f\x0f_\x17\x0f\x0f\x17\x0f\x0f\x13\x0f\x13\x0f\x13\x0f\x0f\x01\x05\x0b\x0f\x039\x1b\x07\x07\x17\x17\x17\x07\x0b\x07\x17\x0f\x0f\x0f\x07\x13\x17#\x13\x13\x13\x13\x13\x1b\x13\x1b\x13\x17\x13\x02\xa6\x07\x1d\x17\x19\x1f\x11\x03\x05\x03\x07\t\x0b\r\x05\x0f\x05\x05\x17\x11\x01\x00\x05\x19\x05\x1b\x05\x1d\x1d\x15\x03\x05\x1f\x05!\x1d\x1b\x1d\x05#\x17\x1f\xf2\x0b\x1b\x05%\x03\x07#W%]'\x7f\x05'\x05)\x05+\x1f-\x01\x1d-\x1f3\x11\x00\x00\x00\x00\x00\x00\x00\x00\x1f)!\x01\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x1f;!\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x1f'1\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00\x03\x037\r\x01#%\x03\t=AEI\r\x03+?\x1d/\r\x03+C\x1d1\r\x03+G\x1d3\r\x03+K\x1d5\x1d7\x1d9\x1f\x19\x11\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x1b!\x00\x00\x00\x00\x00\x00\xf8\x7f\x00\x00\x00\x00\x00\x00\xf8\x7f\x1f\x1d\t\x00\x00\x00\x00\r\x03Y[\x1d;\x05\x03\r\x03_a\x1d=\x1d?\x0b\x03\x1dA\x1dC\x03\x01\x05\x01\x03\x033\x03\x03q\x15\x03\x01\x01\x01\x03\x0b3///u\x1f+\x11\x00\x00\x00\x00\x00\x00\x00\x00\t\x07\x07\x01\x1f71\x00\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x02\x00\x00\x00\x00\x00\x00\x00\x11\x03\x01\x15\x11\t\x11\x11\x11\x11\x11\r\r\x03\x81\x0b\x87\x8d\x91\x95\x99\x01\x01\x01\x01\x01\x13\x07}\x83\x85\x11\x03\x05\x11\x03\t\x13\x07}\x89\x8b\x11\x03\r\x11\x03\x11\x13\x05}\x8f\x11\x03\x15\x13\x05}\x93\x11\x03\x19\x13\x05}\x97\x11\x03\x1d\x13\x03}\x01\t\x01\x02\x02)\x07\t\x11\x11\x13\x01\x0b)\x05\t\x11\t)\x05\t\r\t)\x05\t\r\x13\x1d\x03\t\x13)\x05\t\x05\x07)\x01\t)\x01\x13)\x01\x1f\x1b)\x03\t\x1f)\x05\t\r\x07\x11\x03\x05\t\x05\x0b\r\x0f)\x03\r\x15)\x03\t\x15)\x03\x05\x15)\x03\x01\x11)\x03\t\x07)\x07\t\x05\x05\x07)\x03\x05\x11)\x07\t\x11\x11\x07)\x03\r\x11)\x05\t\x11\x07)\x03\t\x11\x04b\x03\x05\x01Q\x03\x07\x01\x07\x04:\x03\x03\x01\x05\tP\x03\x03\x07\x04\x0e\x03\x037_\x03\x0b\x13\x00\x07B\x03\x05\x03\x19\x07B\x03\x07\x03\x1b\x07B\x01\t\x03\x1d\x0bG\x01!\x0b\x0b\x05\x0b\r\x0f!\x03\x01\x03F\x01\r\x03!\x03\x07\rF\x01\x0f\x03/\x05\x11\x13\x03F\x01\x11\x031\x03\x15\x03F\x01\r\x03\x05\x03\x05\x03F\x01\x13\x035\x03\x17\x05\x06\x01\x03\x05\x07\x1b\t\x19\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\x0b\x03\x03\x03F\x01\x15\x039\x03\x1f\x05\x06\x01\x03\x0b\x07#\x0b!\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\r\x03\x03\x03F\x01\x15\x03#\x03'\x05\x06\x01\x03\r\x07+\r)\x03F\x01\x11\x03\x17\x03\x15\x03F\x01\r\x03\x0f\x03\x05\x03F\x01\x15\x03#\x03/\x05\x06\x01\x03\x0f\x073\x0f1\x0f\x04\x03\t\x1d%-5\x06\x03\x01\x05\x01\x00r\x07E)\x03\x05\x1f\r\x0f\x0b\x15\x15\x15\x15!%3)s\x15\x19\x05\x13%)9\x15\x17\x1f\x11\x19\x15)\x0f\t\x0b\x11builtin\x00vhlo\x00sdy\x00module\x00broadcast_in_dim_v1\x00select_v1\x00constant_v1\x00func_v1\x00custom_call_v1\x00compare_v1\x00return_v1\x00jax.uses_shape_polymorphism\x00mhlo.num_partitions\x00mhlo.num_replicas\x00jit_func\x00x\x00tridiagonal\x00jit(func)\x00/workspace/rocm-jax/jax/tests/export_back_compat_test.py\x00mhlo.backend_config\x00mhlo.frontend_attributes\x00sdy.sharding_rule\x00jax.result_info\x00result[0]\x00result[1]\x00result[2]\x00result[3]\x00main\x00public\x00lower\x00num_batch_dims\x001\x00\x00hipsolver_sytrd_ffi\x00\x08I\x17\x05#\x01\x0b59;MO\x03Q\x03S\x03U\x11cegikmos\x03)\x05wy\x03-\x03{\x031",
+    xla_call_module_version=10,
+    nr_devices=1,
+)  # End paste
diff --git a/jax/_src/lax/linalg.py b/jax/_src/lax/linalg.py
index bcd9148e07d1..868e1fe97fc5 100644
--- a/jax/_src/lax/linalg.py
+++ b/jax/_src/lax/linalg.py
@@ -361,9 +361,8 @@ def lu_pivots_to_permutation(pivots: ArrayLike, permutation_size: int) -> Array:
   return lu_pivots_to_permutation_p.bind(
       pivots, permutation_size=permutation_size)
 
-
 @overload
-def qr(x: ArrayLike, *, pivoting: Literal[False], full_matrices: bool = True,
+def qr(x: ArrayLike, *, pivoting: Literal[False] = False, full_matrices: bool = True,
       use_magma: bool | None = None) -> tuple[Array, Array]:
   ...
 
@@ -1023,13 +1022,13 @@ def _eig_cpu_lowering(ctx, operand, *, compute_left_eigenvectors,
     output.append(vr)
   return output
 
-def _unpack_conjugate_pairs(w, vr):
+def _unpack_conjugate_pairs(w: Array, vr: Array) -> Array:
   # cusolver, like LAPACK, uses a packed representation of the complex
   # eigenvectors, where the (re, im) vectors are adjacent and shared by the
   # conjugate pair:
   # https://docs.nvidia.com/cuda/cusolver/index.html?highlight=geev#cusolverdnxgeev
   if w.size == 0:
-    return lax.complex(vr, lax.zeros_like_array(vr))
+    return lax.complex(vr, lax.full_like(vr, 0))
 
   is_real = ((w.imag == 0) | (w.imag == np.nan))
   # Finds the positions at which each conjugate pair starts, via the parity of
@@ -1042,13 +1041,13 @@ def _unpack_conjugate_pairs(w, vr):
   vr_shifted_left = lax.pad(vr, lax._zero(vr), pads)
   pads[-1] = (1, -1, 0)
   vr_shifted_right = lax.pad(vr, lax._zero(vr), pads)
-  dims = np.delete(np.arange(len(vr.shape), dtype=np.int32), -2)
+  dims = list(np.delete(np.arange(len(vr.shape), dtype=np.int32), -2))
   is_real = lax.broadcast_in_dim(is_real, vr.shape, broadcast_dimensions=dims)
   conj_pair_start = lax.broadcast_in_dim(conj_pair_start, vr.shape,
                                          broadcast_dimensions=dims)
   re = lax.select(is_real | conj_pair_start, vr, vr_shifted_right)
   im = lax.select(conj_pair_start, vr_shifted_left, -vr)
-  im = lax.select(is_real, lax.zeros_like_array(vr), im)
+  im = lax.select(is_real, lax.full_like(vr, 0), im)
   return lax.complex(re, im)
 
 
@@ -1368,7 +1367,7 @@ def _householder_product_lowering(ctx, a, taus):
     result_shapes = None
   op = mlir.custom_call(
       "ProductOfElementaryHouseholderReflectors",
-      result_types=[mlir.aval_to_ir_type(aval_out)],
+      result_types=mlir.flatten_ir_types([mlir.aval_to_ir_type(aval_out)]),
       operands=[a, taus],
       api_version=1,
       result_shapes=result_shapes)
@@ -1528,8 +1527,8 @@ def _lu_jvp_rule(primals, tangents):
     lu_dot_fun = api.vmap(lu_dot_fun)
   lu_dot = lu_dot_fun(lu, a_dot, permutation)
 
-  return (lu, pivots, permutation), (lu_dot, ad_util.Zero.from_primal_value(pivots),
-                                     ad_util.Zero.from_primal_value(permutation))
+  return (lu, pivots, permutation), (lu_dot, ad_util.p2tz(pivots),
+                                     ad_util.p2tz(permutation))
 
 
 def _lu_cpu_gpu_lowering(ctx, operand, *, target_name_prefix: str):
@@ -1562,10 +1561,11 @@ def _lu_cpu_gpu_lowering(ctx, operand, *, target_name_prefix: str):
 
 
 def _lu_tpu_lowering_rule(ctx, operand):
-  result_types = [
-    mlir.aval_to_ir_type(ctx.avals_out[0]),
-    mlir.aval_to_ir_type(ctx.avals_out[1]),
-    mlir.aval_to_ir_type(ctx.avals_out[2])]
+  result_types = mlir.flatten_ir_types([
+      mlir.aval_to_ir_type(ctx.avals_out[0]),
+      mlir.aval_to_ir_type(ctx.avals_out[1]),
+      mlir.aval_to_ir_type(ctx.avals_out[2]),
+  ])
   if any(not is_constant_shape(a.shape) for a in ctx.avals_out):
     result_shapes = [
       mlir.eval_dynamic_shape_as_tensor(ctx, a.shape)
@@ -1767,7 +1767,7 @@ def _geqrf_dtype_rule(dtype):
 def _geqrf_lowering_rule(ctx, operand):
   ts_type = mlir.aval_to_ir_type(ctx.avals_out[0])
   r_type = mlir.aval_to_ir_type(ctx.avals_out[1])
-  result_types = [ts_type, r_type]
+  result_types = mlir.flatten_ir_types([ts_type, r_type])
   if any(not is_constant_shape(aval_out.shape)
          for aval_out in ctx.avals_out):
     result_shapes = [
@@ -1879,7 +1879,7 @@ def qr_jvp_rule(primals, tangents, *, pivoting, full_matrices, use_magma):
   dq = q @ (do - qt_dx_rinv) + dx_rinv
   dr = (qt_dx_rinv - do) @ r
   if pivoting:
-    dp = ad_util.Zero.from_primal_value(p[0])
+    dp = ad_util.p2tz(p[0])
     return (q, r, p[0]), (dq, dr, dp)
   return (q, r), (dq, dr)
 
@@ -1896,12 +1896,14 @@ def _qr_lowering(a, *, pivoting, full_matrices, use_magma):
       return q, r, p
     return q, r
 
+  p = None
   if pivoting:
     jpvt = lax.full((*batch_dims, n), 0, dtype=np.dtype(np.int32))
     r, p, taus = geqp3(a, jpvt, use_magma=use_magma)
     p -= 1  # Convert geqp3's 1-based indices to 0-based indices by subtracting 1.
   else:
     r, taus = geqrf(a)
+    p = None
 
   if m < n:
     q = householder_product(r[..., :m, :m], taus)
@@ -1914,6 +1916,7 @@ def _qr_lowering(a, *, pivoting, full_matrices, use_magma):
     r = r[..., :n, :n]
   r = _triu(r)
   if pivoting:
+    assert p is not None
     return q, r, p
   return q, r
 
@@ -2179,28 +2182,25 @@ def _svd_gpu_sub_lowering(ctx, operand, *, full_matrices, compute_uv,
   transposed = False
   kwargs = {}
 
-  # The Jacobi algorithm appears to outperform the default QR algorithm for
-  # small to medium sized matrices. See:
+  # The Jacobi algorithm (gesvdj) appears to outperform the default QR
+  # algorithm (gesvd) on CUDA for small to medium matrices. See:
   # https://developer.download.nvidia.com/video/gputechconf/gtc/2019/presentation/s9226-fast-singular-value-decomposition-on-gpus-v2.pdf
-  # slide 5. With this in mind, we default to using the Jacobi algorithm for
-  # matrices smaller than 1024x1024.
+  # slide 5. So on CUDA we default to Jacobi for matrices with m, n <= 1024.
   #
-  # Note that the Jacobi algorithm is only used by default for matrices with
-  # concrete matrix dimensions. When using dynamic shapes, we always use the
-  # default QR algorithm, but users can (in principle) override this behavior
-  # by passing `use_jacobi=True`.
+  # On ROCm, rocsolver benchmarks show gesdd (divide-and-conquer) is faster
+  # than gesvdj for all tested sizes (e.g. ~3x faster at m=256,512). We
+  # therefore use gesdd by default on ROCm for all dimensions and do not
+  # default to Jacobi there.
   #
-  # TODO(danfm): Since this was originally implemented, hipSolver appears to
-  # have added support for the Jacobi algorithm, so we should investigate
-  # removing this condition.
-  # TODO(phawkins): Consider making polar decomposition the default.
+  # Note that the Jacobi algorithm is only used by default for matrices with
+  # concrete dimensions. When using dynamic shapes we use the default path.
+  # Users can override via algorithm=SvdAlgorithm.JACOBI or .DEFAULT.
   use_jacobi = False
   use_polar = False
   if algorithm is None or algorithm == SvdAlgorithm.DEFAULT:
     try:
-      gpu_available = target_name_prefix == "cu" or \
-                      target_name_prefix == "hip"
-      use_jacobi = gpu_available and m <= 1024 and n <= 1024
+      # Only CUDA: use Jacobi for small/medium; ROCm uses gesdd for all sizes.
+      use_jacobi = (target_name_prefix == "cu") and m <= 1024 and n <= 1024
     except core.InconclusiveDimensionOperation:
       use_jacobi = False
   elif algorithm == SvdAlgorithm.JACOBI:
@@ -2209,28 +2209,46 @@ def _svd_gpu_sub_lowering(ctx, operand, *, full_matrices, compute_uv,
     use_polar = True
 
   column_major = True
+  econ = not full_matrices
+  transposed = False
+  kwargs = {}
   if use_jacobi:
     target_name = f"{target_name_prefix}solver_gesvdj_ffi"
-    # The gesvdjbatched kernel doesn't support "econ" mode, but it also only
-    # supports matrices up to 32x32, so it's always worth using the batched
-    # version and then slicing afterwards when the matrix is small enough.
-    try:
-      econ = not full_matrices and m > 32 and n > 32
-    except core.InconclusiveDimensionOperation:
-      econ = False
+  elif algorithm == SvdAlgorithm.QR:
+    # Explicit QR (gesvd) path: use gesvd on both CUDA and ROCm for back-compat.
+    target_name = f"{target_name_prefix}solver_gesvd_ffi"
+    econ = not full_matrices
+    transposed = m < n
+    kwargs = {"transposed": transposed}
+    if transposed:
+      column_major = False
   elif use_polar:
     target_name = f"{target_name_prefix}solver_gesvdp_ffi"
     econ = not full_matrices
   else:
-    target_name = f"{target_name_prefix}solver_gesvd_ffi"
+    # On ROCm, use gesdd (divide-and-conquer) for better performance when
+    # rocsolver is available; on CUDA use gesvd (QR-based).
+    if target_name_prefix == "hip":
+      target_name = f"{target_name_prefix}solver_gesdd_ffi"
+    else:
+      target_name = f"{target_name_prefix}solver_gesvd_ffi"
     econ = not full_matrices
     # Because the base gesvd kernel only supports matrices where m >= n, we
-    # conceptually transpose the matrix if m < n.
-    transposed = m < n
+    # conceptually transpose the matrix if m < n. gesdd supports any shape.
+    transposed = m < n and target_name_prefix != "hip"
     kwargs = {"transposed": transposed}
     if transposed:
       column_major = False
 
+  if use_jacobi:
+    # The gesvdjbatched kernel doesn't support "econ" mode, but it also only
+    # supports matrices up to 32x32, so it's always worth using the batched
+    # version and then slicing afterwards when the matrix is small enough.
+    try:
+      econ = not full_matrices and m > 32 and n > 32
+    except core.InconclusiveDimensionOperation:
+      econ = False
+
   if use_jacobi or use_polar:
     # When using the Jacobi or polar algorithms, the U and V matrices must
     # always be allocated even if compute_uv is False.
@@ -2250,7 +2268,7 @@ def _svd_gpu_sub_lowering(ctx, operand, *, full_matrices, compute_uv,
   if (use_jacobi or use_polar) and compute_uv:
     vt = hlo.transpose(
         vt,
-        mlir.dense_int_array(np.array(tuple(range(nb)) + (nb + 1, nb))))
+        mlir.dense_int_array(tuple(range(nb)) + (nb + 1, nb)))
     if np.issubdtype(operand_aval.dtype, np.complexfloating):
       vt = hlo.complex(hlo.real(vt), hlo.negate(hlo.imag(vt)))
     if not full_matrices and not econ:
@@ -2421,7 +2439,7 @@ def _triangular_solve_lowering(
   out = hlo.triangular_solve(a, b, ir.BoolAttr.get(left_side),
                              ir.BoolAttr.get(lower),
                              ir.BoolAttr.get(unit_diagonal),
-                             hlo.TransposeAttr.get(transpose))
+                             hlo.TransposeAttr.get(transpose))  # pyrefly: ignore[missing-attribute]
   return [mlir.lower_with_sharding_in_types(ctx, out, out_aval)]
 
 
@@ -2458,6 +2476,7 @@ def _triangular_solve_cpu_lower(
     return [hlo.triangular_solve(a, b, ir.BoolAttr.get(left_side),
                                  ir.BoolAttr.get(lower),
                                  ir.BoolAttr.get(unit_diagonal),
+                                 # pyrefly: ignore[missing-attribute]
                                  hlo.TransposeAttr.get(transpose))]
 
 triangular_solve_p = linalg_primitive(
@@ -2562,6 +2581,7 @@ def _tridiagonal_solve_jvp_rule(primals, tangents):
   if all(type(p) is ad_util.Zero for p in diags_dot):
     rhs = b_dot
   else:
+    # pyrefly: ignore[bad-argument-count]  # pyrefly#2468
     matvec_dot = _tridiagonal_product(*map(ad.instantiate_zeros, diags_dot), ans)
     rhs = ad.add_tangents(b_dot, -matvec_dot)
   ans_dot = tridiagonal_solve_p.bind(*diags, rhs)
@@ -2575,9 +2595,9 @@ def _tridiagonal_solve_transpose_rule(cotangent, dl, d, du, b):
   if type(cotangent) is ad_util.Zero:
     cotangent_b = ad_util.Zero(b.aval)
   else:
-    dl_trans = lax.concatenate((lax.zeros_like_array(du[..., -1:]), du[..., :-1]),
+    dl_trans = lax.concatenate((lax.full_like(du[..., -1:], 0), du[..., :-1]),
                                du.ndim-1)
-    du_trans = lax.concatenate((dl[..., 1:], lax.zeros_like_array(dl[..., :1])),
+    du_trans = lax.concatenate((dl[..., 1:], lax.full_like(dl[..., :1], 0)),
                                dl.ndim-1)
     cotangent_b = tridiagonal_solve(dl_trans, d, du_trans, cotangent)
   return [None, None, None, cotangent_b]
@@ -2707,12 +2727,12 @@ def symmetrize(x: Array) -> Array: return (x + _H(x)) / 2
 def _tril(m: Array, k:int = 0) -> Array:
   *_, N, M = m.shape
   mask = lax._tri(bool, (N, M), k)
-  return lax.select(lax.broadcast(mask, m.shape[:-2]), m, lax.zeros_like_array(m))
+  return lax.select(lax.broadcast(mask, m.shape[:-2]), m, lax.full_like(m, 0))
 
 def _triu(m: Array, k:int = 0) -> Array:
   *_, N, M = m.shape
   mask = lax._tri(bool, (N, M), k - 1)
-  return lax.select(lax.broadcast(mask, m.shape[:-2]), lax.zeros_like_array(m), m)
+  return lax.select(lax.broadcast(mask, m.shape[:-2]), lax.full_like(m, 0), m)
 
 def _construct_diagonal(s: Array) -> Array:
   """Construct a (batched) diagonal matrix"""
diff --git a/jaxlib/gpu/solver.cc b/jaxlib/gpu/solver.cc
index 6eb76b570722..096fdbabc8aa 100644
--- a/jaxlib/gpu/solver.cc
+++ b/jaxlib/gpu/solver.cc
@@ -37,6 +37,10 @@ nb::dict Registrations() {
   dict[JAX_GPU_PREFIX "solver_gesvdj_ffi"] = EncapsulateFfiHandler(GesvdjFfi);
   dict[JAX_GPU_PREFIX "solver_sytrd_ffi"] = EncapsulateFfiHandler(SytrdFfi);
 
+#ifdef JAX_GPU_HIP
+  dict[JAX_GPU_PREFIX "solver_gesdd_ffi"] = EncapsulateFfiHandler(GesddFfi);
+#endif  // JAX_GPU_HIP
+
 #ifdef JAX_GPU_CUDA
   dict[JAX_GPU_PREFIX "solver_gesvdp_ffi"] = EncapsulateFfiHandler(GesvdpFfi);
   dict[JAX_GPU_PREFIX "solver_csrlsvqr_ffi"] =
diff --git a/jaxlib/gpu/solver_interface.cc b/jaxlib/gpu/solver_interface.cc
index 8866c7bea2fe..ee128fb5f836 100644
--- a/jaxlib/gpu/solver_interface.cc
+++ b/jaxlib/gpu/solver_interface.cc
@@ -15,8 +15,13 @@ limitations under the License.
 
 #include "jaxlib/gpu/solver_interface.h"
 
+#include <map>
+#include <tuple>
+
 #include "absl/status/status.h"
+#include "absl/synchronization/mutex.h"
 #include "absl/status/statusor.h"
+#include "absl/strings/str_format.h"
 #include "jaxlib/gpu/gpu_kernel_helpers.h"
 #include "jaxlib/gpu/vendor.h"
 
@@ -62,8 +67,8 @@ JAX_GPU_DEFINE_GETRF(gpuDoubleComplex, gpusolverDnZgetrf);
 
 JAX_GPU_DEFINE_GETRF_BATCHED(float, gpublasSgetrfBatched);
 JAX_GPU_DEFINE_GETRF_BATCHED(double, gpublasDgetrfBatched);
-JAX_GPU_DEFINE_GETRF_BATCHED(gpuComplex, gpublasCgetrfBatched);
-JAX_GPU_DEFINE_GETRF_BATCHED(gpuDoubleComplex, gpublasZgetrfBatched);
+JAX_GPU_DEFINE_GETRF_BATCHED(gpublasComplex, gpublasCgetrfBatched);
+JAX_GPU_DEFINE_GETRF_BATCHED(gpublasDoubleComplex, gpublasZgetrfBatched);
 #undef JAX_GPU_DEFINE_GETRF_BATCHED
 
 // QR decomposition: geqrf
@@ -101,8 +106,8 @@ JAX_GPU_DEFINE_GEQRF(gpuDoubleComplex, gpusolverDnZgeqrf);
 
 JAX_GPU_DEFINE_GEQRF_BATCHED(float, gpublasSgeqrfBatched);
 JAX_GPU_DEFINE_GEQRF_BATCHED(double, gpublasDgeqrfBatched);
-JAX_GPU_DEFINE_GEQRF_BATCHED(gpuComplex, gpublasCgeqrfBatched);
-JAX_GPU_DEFINE_GEQRF_BATCHED(gpuDoubleComplex, gpublasZgeqrfBatched);
+JAX_GPU_DEFINE_GEQRF_BATCHED(gpublasComplex, gpublasCgeqrfBatched);
+JAX_GPU_DEFINE_GEQRF_BATCHED(gpublasDoubleComplex, gpublasZgeqrfBatched);
 #undef JAX_GPU_DEFINE_GEQRF_BATCHED
 
 // Householder transformations: orgqr
@@ -272,8 +277,8 @@ JAX_GPU_DEFINE_SYEVD(gpuDoubleComplex, gpusolverDnZheevd);
 
 JAX_GPU_DEFINE_SYRK(float, gpublasSsyrk);
 JAX_GPU_DEFINE_SYRK(double, gpublasDsyrk);
-JAX_GPU_DEFINE_SYRK(gpuComplex, gpublasCsyrk);
-JAX_GPU_DEFINE_SYRK(gpuDoubleComplex, gpublasZsyrk);
+JAX_GPU_DEFINE_SYRK(gpublasComplex, gpublasCsyrk);
+JAX_GPU_DEFINE_SYRK(gpublasDoubleComplex, gpublasZsyrk);
 #undef JAX_GPU_DEFINE_SYRK
 
 // Singular Value Decomposition: gesvd
@@ -357,6 +362,238 @@ JAX_GPU_DEFINE_GESVDJ_BATCHED(gpuComplex, gpusolverDnCgesvdjBatched);
 JAX_GPU_DEFINE_GESVDJ_BATCHED(gpuDoubleComplex, gpusolverDnZgesvdjBatched);
 #undef JAX_GPU_DEFINE_GESVDJ_BATCHED
 
+#ifdef JAX_GPU_HIP
+// GESDD (divide-and-conquer SVD) is provided by rocsolver; hipSOLVER does not
+// expose it. rocsolver uses rocblas_handle; on ROCm the solver handle is
+// compatible with rocblas_handle.
+#include "rocm/include/rocsolver/rocsolver.h"
+
+namespace {
+rocblas_svect JobToRocblasSvect(signed char job) {
+  switch (job) {
+    case 'A':
+      return rocblas_svect_all;
+    case 'S':
+      return rocblas_svect_singular;
+    case 'N':
+    default:
+      return rocblas_svect_none;
+  }
+}
+
+absl::Status RocblasStatusToStatus(rocblas_status status, const char* file,
+                                  int line, const char* expr) {
+  if (ABSL_PREDICT_FALSE(status != rocblas_status_success)) {
+    return absl::InternalError(
+        absl::StrFormat("%s:%d: %s failed: rocblas_status %d", file, line, expr,
+                        static_cast<int>(status)));
+  }
+  return absl::OkStatus();
+}
+}  // namespace
+
+#define JAX_GPU_DEFINE_GESDD_REAL(Type, Name)                                  \
+  template <>                                                                  \
+  absl::Status Gesdd<Type>(                                                    \
+      gpusolverDnHandle_t handle, signed char jobu, signed char jobvt,        \
+      int m, int n, Type *a, int lda, RealType<Type>::value *s, Type *u,      \
+      int ldu, Type *v, int ldv, int *info) {                                  \
+    auto h = reinterpret_cast<rocblas_handle>(handle);                        \
+    rocblas_status st = Name(h, JobToRocblasSvect(jobu),                       \
+                             JobToRocblasSvect(jobvt), m, n, a, lda, s, u,    \
+                             ldu, v, ldv, info);                               \
+    return RocblasStatusToStatus(st, __FILE__, __LINE__, #Name);               \
+  }
+
+JAX_GPU_DEFINE_GESDD_REAL(float, rocsolver_sgesdd);
+JAX_GPU_DEFINE_GESDD_REAL(double, rocsolver_dgesdd);
+#undef JAX_GPU_DEFINE_GESDD_REAL
+
+template <>
+absl::Status Gesdd<gpuComplex>(
+    gpusolverDnHandle_t handle, signed char jobu, signed char jobvt, int m,
+    int n, gpuComplex *a, int lda, float *s, gpuComplex *u, int ldu,
+    gpuComplex *v, int ldv, int *info) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  rocblas_status st = rocsolver_cgesdd(
+      h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt), m, n,
+      reinterpret_cast<rocblas_float_complex*>(a), lda, s,
+      reinterpret_cast<rocblas_float_complex*>(u), ldu,
+      reinterpret_cast<rocblas_float_complex*>(v), ldv, info);
+  return RocblasStatusToStatus(st, __FILE__, __LINE__, "rocsolver_cgesdd");
+}
+
+template <>
+absl::Status Gesdd<gpuDoubleComplex>(
+    gpusolverDnHandle_t handle, signed char jobu, signed char jobvt, int m,
+    int n, gpuDoubleComplex *a, int lda, double *s, gpuDoubleComplex *u,
+    int ldu, gpuDoubleComplex *v, int ldv, int *info) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  rocblas_status st = rocsolver_zgesdd(
+      h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt), m, n,
+      reinterpret_cast<rocblas_double_complex*>(a), lda, s,
+      reinterpret_cast<rocblas_double_complex*>(u), ldu,
+      reinterpret_cast<rocblas_double_complex*>(v), ldv, info);
+  return RocblasStatusToStatus(st, __FILE__, __LINE__, "rocsolver_zgesdd");
+}
+
+// Workspace size query and set for rocsolver (two-phase memory model).
+absl::Status SetWorkspace(gpusolverDnHandle_t handle, void* ptr, size_t size) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  rocblas_status st = rocblas_set_workspace(h, ptr, size);
+  return RocblasStatusToStatus(st, __FILE__, __LINE__, "rocblas_set_workspace");
+}
+
+namespace {
+template <typename T>
+rocblas_status GesddQueryImpl(gpusolverDnHandle_t handle, signed char jobu,
+                              signed char jobvt, int m, int n);
+template <>
+rocblas_status GesddQueryImpl<float>(gpusolverDnHandle_t handle, signed char jobu,
+                                     signed char jobvt, int m, int n) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  return rocsolver_sgesdd(h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt),
+                          m, n, nullptr, m, nullptr, nullptr, m, nullptr, n,
+                          nullptr);
+}
+template <>
+rocblas_status GesddQueryImpl<double>(gpusolverDnHandle_t handle, signed char jobu,
+                                      signed char jobvt, int m, int n) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  return rocsolver_dgesdd(h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt),
+                          m, n, nullptr, m, nullptr, nullptr, m, nullptr, n,
+                          nullptr);
+}
+template <>
+rocblas_status GesddQueryImpl<gpuComplex>(gpusolverDnHandle_t handle,
+                                          signed char jobu, signed char jobvt,
+                                          int m, int n) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  return rocsolver_cgesdd(h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt),
+                          m, n, nullptr, m, nullptr, nullptr, m, nullptr, n,
+                          nullptr);
+}
+template <>
+rocblas_status GesddQueryImpl<gpuDoubleComplex>(gpusolverDnHandle_t handle,
+                                                 signed char jobu,
+                                                 signed char jobvt, int m,
+                                                 int n) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  return rocsolver_zgesdd(h, JobToRocblasSvect(jobu), JobToRocblasSvect(jobvt),
+                          m, n, nullptr, m, nullptr, nullptr, m, nullptr, n,
+                          nullptr);
+}
+}  // namespace
+
+// Cache workspace size per (m, n, job) to avoid the expensive query (which
+// runs the full rocsolver path with nullptr) on every call. Same shape =>
+// same size; query once per (m, n, job) and dtype.
+namespace {
+absl::Mutex& GesddWorkspaceCacheMutex() {
+  static absl::Mutex mu;
+  return mu;
+}
+
+// Dedicated handle for workspace size queries (no stream set → default stream).
+gpusolverDnHandle_t GetGesddQueryHandleImpl() {
+  thread_local gpusolverDnHandle_t h = nullptr;
+  if (h == nullptr) {
+    if (gpusolverDnCreate(&h) != GPUSOLVER_STATUS_SUCCESS) return nullptr;
+  }
+  return h;
+}
+}  // namespace
+
+gpusolverDnHandle_t GetGesddQueryHandle() {
+  return GetGesddQueryHandleImpl();
+}
+
+// Query only (no cache). Kernel uses this with GetGesddQueryHandle so the
+// cache lives in the kernel .cc and is shared across all invocations.
+template <typename T>
+absl::StatusOr<size_t> GesddWorkspaceSizeQuery(gpusolverDnHandle_t handle,
+                                               signed char jobu,
+                                               signed char jobvt, int m,
+                                               int n) {
+  auto h = reinterpret_cast<rocblas_handle>(handle);
+  rocblas_status st = rocblas_start_device_memory_size_query(h);
+  JAX_RETURN_IF_ERROR(RocblasStatusToStatus(st, __FILE__, __LINE__,
+                                            "rocblas_start_device_memory_size_query"));
+  st = GesddQueryImpl<T>(handle, jobu, jobvt, m, n);
+  if (st != rocblas_status_success) {
+    (void)rocblas_stop_device_memory_size_query(h, nullptr);
+    return RocblasStatusToStatus(st, __FILE__, __LINE__, "rocsolver_*gesdd (query)");
+  }
+  size_t size = 0;
+  st = rocblas_stop_device_memory_size_query(h, &size);
+  JAX_RETURN_IF_ERROR(RocblasStatusToStatus(st, __FILE__, __LINE__,
+                                            "rocblas_stop_device_memory_size_query"));
+  return size;
+}
+
+template <typename T>
+absl::StatusOr<size_t> GesddWorkspaceSize(gpusolverDnHandle_t handle,
+                                         signed char jobu, signed char jobvt,
+                                         int m, int n) {
+  using Key = std::tuple<int, int, signed char>;
+  static std::map<Key, size_t> cache;
+
+  Key key(m, n, jobu);
+  {
+    absl::MutexLock lock(&GesddWorkspaceCacheMutex());
+    auto it = cache.find(key);
+    if (it != cache.end()) return it->second;
+  }
+
+  gpusolverDnHandle_t query_handle = GetGesddQueryHandleImpl();
+  if (query_handle == nullptr) {
+    return absl::InternalError("Failed to create gesdd query handle");
+  }
+  auto h = reinterpret_cast<rocblas_handle>(query_handle);
+  rocblas_status st = rocblas_start_device_memory_size_query(h);
+  JAX_RETURN_IF_ERROR(RocblasStatusToStatus(st, __FILE__, __LINE__,
+                                            "rocblas_start_device_memory_size_query"));
+  st = GesddQueryImpl<T>(query_handle, jobu, jobvt, m, n);
+  if (st != rocblas_status_success) {
+    (void)rocblas_stop_device_memory_size_query(h, nullptr);
+    return RocblasStatusToStatus(st, __FILE__, __LINE__, "rocsolver_*gesdd (query)");
+  }
+  size_t size = 0;
+  st = rocblas_stop_device_memory_size_query(h, &size);
+  JAX_RETURN_IF_ERROR(RocblasStatusToStatus(st, __FILE__, __LINE__,
+                                            "rocblas_stop_device_memory_size_query"));
+  {
+    absl::MutexLock lock(&GesddWorkspaceCacheMutex());
+    cache[key] = size;
+  }
+  return size;
+}
+
+template absl::StatusOr<size_t> GesddWorkspaceSize<float>(gpusolverDnHandle_t,
+                                                          signed char, signed char,
+                                                          int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSize<double>(gpusolverDnHandle_t,
+                                                           signed char, signed char,
+                                                           int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSize<gpuComplex>(gpusolverDnHandle_t,
+                                                               signed char, signed char,
+                                                               int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSize<gpuDoubleComplex>(
+    gpusolverDnHandle_t, signed char, signed char, int, int);
+
+template absl::StatusOr<size_t> GesddWorkspaceSizeQuery<float>(gpusolverDnHandle_t,
+                                                                signed char, signed char,
+                                                                int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSizeQuery<double>(gpusolverDnHandle_t,
+                                                                 signed char, signed char,
+                                                                 int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSizeQuery<gpuComplex>(gpusolverDnHandle_t,
+                                                                    signed char, signed char,
+                                                                    int, int);
+template absl::StatusOr<size_t> GesddWorkspaceSizeQuery<gpuDoubleComplex>(
+    gpusolverDnHandle_t, signed char, signed char, int, int);
+#endif  // JAX_GPU_HIP
+
 #ifdef JAX_GPU_CUDA
 
 #define JAX_GPU_DEFINE_CSRLSVQR(Type, Scalar, Name)                          \
diff --git a/jaxlib/gpu/solver_interface.h b/jaxlib/gpu/solver_interface.h
index fb284ec984dd..67bbb6ec831d 100644
--- a/jaxlib/gpu/solver_interface.h
+++ b/jaxlib/gpu/solver_interface.h
@@ -227,6 +227,37 @@ JAX_GPU_SOLVER_EXPAND_DEFINITION(absl::StatusOr<int>, GesvdjBatchedBufferSize);
 JAX_GPU_SOLVER_EXPAND_DEFINITION(absl::Status, GesvdjBatched);
 #undef JAX_GPU_SOLVER_GesvdjBatched_ARGS
 
+// Singular Value Decomposition (divide-and-conquer): gesdd (ROCm only, via
+// rocsolver; CUDA cusolver does not expose gesdd).
+#define JAX_GPU_SOLVER_Gesdd_ARGS(Type, Real)                                  \
+  gpusolverDnHandle_t handle, signed char jobu, signed char jobvt, int m,      \
+      int n, Type *a, int lda, Real *s, Type *u, int ldu, Type *v, int ldv,   \
+      int *info
+JAX_GPU_SOLVER_EXPAND_DEFINITION(absl::Status, Gesdd);
+#undef JAX_GPU_SOLVER_Gesdd_ARGS
+
+#ifdef JAX_GPU_HIP
+// Query workspace size required by rocsolver gesdd (two-phase memory model).
+// Returns the size in bytes to pass to SetWorkspace before calling Gesdd.
+template <typename T>
+absl::StatusOr<size_t> GesddWorkspaceSize(gpusolverDnHandle_t handle,
+                                         signed char jobu, signed char jobvt,
+                                         int m, int n);
+// Run workspace size query on the given handle (no cache). Used by the kernel
+// with a dedicated query handle so the cache lives in the kernel translation
+// unit and is shared across warmup and timed runs.
+template <typename T>
+absl::StatusOr<size_t> GesddWorkspaceSizeQuery(gpusolverDnHandle_t handle,
+                                              signed char jobu, signed char jobvt,
+                                              int m, int n);
+// Handle used only for workspace size queries (no stream set). Kernel uses
+// this so query work is not on the execution stream.
+gpusolverDnHandle_t GetGesddQueryHandle();
+// Set user-owned workspace for rocsolver/rocblas (HIP only). Call with
+// (handle, ptr, size) before Gesdd; call with (handle, nullptr, 0) to clear.
+absl::Status SetWorkspace(gpusolverDnHandle_t handle, void* ptr, size_t size);
+#endif  // JAX_GPU_HIP
+
 #ifdef JAX_GPU_CUDA
 
 #define JAX_GPU_SOLVER_Csrlsvqr_ARGS(Type, ...)                          \
diff --git a/jaxlib/gpu/solver_kernels_ffi.cc b/jaxlib/gpu/solver_kernels_ffi.cc
index e568a49d58f0..35502b23046a 100644
--- a/jaxlib/gpu/solver_kernels_ffi.cc
+++ b/jaxlib/gpu/solver_kernels_ffi.cc
@@ -17,8 +17,13 @@ limitations under the License.
 
 #include <algorithm>
 #include <cstdint>
+#include <cstring>
+#include <cstdio>
+#include <cstdlib>
+#include <map>
 #include <memory>
 #include <string_view>
+#include <tuple>
 
 #if JAX_GPU_HAVE_64_BIT
 #include <cstddef>
@@ -1146,6 +1151,169 @@ XLA_FFI_DEFINE_HANDLER_SYMBOL(GesvdjFfi, GesvdjDispatch,
                                   .Ret<ffi::Buffer<ffi::S32>>()  // info
 );
 
+#ifdef JAX_GPU_HIP
+// Workspace size from LAPACK formula instead of querying rocsolver. rocsolver
+// does support a workspace query via rocblas_start_device_memory_size_query +
+// a dummy rocsolver_*gesdd call (see GesddWorkspaceSize in solver_interface.cc),
+// but that two-phase query can fail with rocblas_status 8/9 in some
+// environments; the formula avoids that and never blocks. rocsolver gesdd
+// needs more than LAPACK minimum (syevd+geqrf+orgqr buffers). Use 8x: 2x was
+// too small (slow path for 1536/2048); 16x caused ~1GB for N=2048 and
+// allocation cost. 8x gives ~512MB for 2048. LAPACK for JOBZ='S':
+// 4*mn^2+7*mn elements.
+namespace {
+template <typename T>
+size_t GesddWorkspaceSizeFromFormula(signed char job, int m, int n) {
+  int mn = std::min(m, n);
+  int mx = std::max(m, n);
+  int64_t min_elements;
+  switch (job) {
+    case 'N':
+      min_elements = 3 * mn + std::max(mx, 7 * mn);
+      break;
+    case 'O':
+      min_elements = 3 * mn + std::max(mx, 5 * mn * mn + 4 * mn);
+      break;
+    case 'S':
+      min_elements = 4 * static_cast<int64_t>(mn) * mn + 7 * mn;
+      break;
+    case 'A':
+      min_elements = 4 * static_cast<int64_t>(mn) * mn + 6 * mn + mx;
+      break;
+    default:
+      min_elements = 4 * static_cast<int64_t>(mn) * mn + 7 * mn;
+  }
+  min_elements = std::max(int64_t(1), min_elements);
+  int64_t elements = min_elements * 8;
+  elements += 4096;
+  return static_cast<size_t>(elements) * sizeof(T);
+}
+}  // namespace
+
+// Singular Value Decomposition (divide-and-conquer): gesdd (ROCm rocsolver).
+template <typename T>
+ffi::Error GesddImpl(int64_t batch, int64_t rows, int64_t cols,
+                     gpuStream_t stream, ffi::ScratchAllocator& scratch,
+                     bool full_matrices, bool compute_uv, ffi::AnyBuffer a,
+                     ffi::Result<ffi::AnyBuffer> out,
+                     ffi::Result<ffi::AnyBuffer> s,
+                     ffi::Result<ffi::AnyBuffer> u,
+                     ffi::Result<ffi::AnyBuffer> vt,
+                     ffi::Result<ffi::Buffer<ffi::S32>> info) {
+  FFI_ASSIGN_OR_RETURN(auto m, MaybeCastNoOverflow<int>(rows));
+  FFI_ASSIGN_OR_RETURN(auto n, MaybeCastNoOverflow<int>(cols));
+  FFI_ASSIGN_OR_RETURN(auto handle, SolverHandlePool::Borrow(stream));
+  // For square matrices, 'A' and 'S' produce the same output shapes.
+  // Prefer 'S' to avoid slower rocsolver code paths observed for some sizes
+  // (notably n=1536) with job='A'.
+  signed char job =
+      compute_uv ? ((full_matrices && m != n) ? 'A' : 'S') : 'N';
+
+  // Formula-based workspace (no query) to avoid rocblas_status 8/9 in some envs.
+  size_t workspace_size = GesddWorkspaceSizeFromFormula<T>(job, m, n);
+  auto maybe_workspace = scratch.Allocate(workspace_size);
+  if (!maybe_workspace.has_value()) {
+    return ffi::Error(ffi::ErrorCode::kResourceExhausted,
+                      "Unable to allocate device workspace for gesdd");
+  }
+  void* workspace_ptr = maybe_workspace.value();
+  FFI_RETURN_IF_ERROR_STATUS(
+      solver::SetWorkspace(handle.get(), workspace_ptr, workspace_size));
+
+  auto a_data = static_cast<T*>(a.untyped_data());
+  auto out_data = static_cast<T*>(out->untyped_data());
+  auto s_data =
+      static_cast<typename solver::RealType<T>::value*>(s->untyped_data());
+  auto u_data = compute_uv ? static_cast<T*>(u->untyped_data()) : nullptr;
+  auto vt_data = compute_uv ? static_cast<T*>(vt->untyped_data()) : nullptr;
+  auto info_data = info->typed_data();
+
+  if (a_data != out_data) {
+    JAX_FFI_RETURN_IF_GPU_ERROR(gpuMemcpyAsync(
+        out_data, a_data, a.size_bytes(), gpuMemcpyDeviceToDevice, stream));
+  }
+
+  int out_step = m * n;
+  int k = std::min(m, n);
+  int ldu = m;
+  int ldv = full_matrices ? n : k;
+  int u_step = compute_uv ? m * (full_matrices ? m : k) : 0;
+  int vt_step = compute_uv ? ldv * n : 0;
+  int s_step = k;
+
+  for (auto i = 0; i < batch; ++i) {
+    FFI_RETURN_IF_ERROR_STATUS(solver::Gesdd<T>(
+        handle.get(), job, job, m, n, out_data, m, s_data, u_data, ldu,
+        vt_data, ldv, info_data));
+    out_data += out_step;
+    s_data += s_step;
+    if (u_data) u_data += u_step;
+    if (vt_data) vt_data += vt_step;
+    ++info_data;
+  }
+
+  return ffi::Error::Success();
+}
+
+ffi::Error GesddDispatch(gpuStream_t stream, ffi::ScratchAllocator scratch,
+                         bool full_matrices, bool compute_uv, bool transposed,
+                         ffi::AnyBuffer a, ffi::Result<ffi::AnyBuffer> out,
+                         ffi::Result<ffi::AnyBuffer> s,
+                         ffi::Result<ffi::AnyBuffer> u,
+                         ffi::Result<ffi::AnyBuffer> vt,
+                         ffi::Result<ffi::Buffer<ffi::S32>> info) {
+  auto dataType = a.element_type();
+  if (out->element_type() != dataType ||
+      s->element_type() != ffi::ToReal(dataType) ||
+      u->element_type() != dataType || vt->element_type() != dataType) {
+    return ffi::Error::InvalidArgument(
+        "The inputs and outputs to gesdd must have the same element type");
+  }
+  FFI_ASSIGN_OR_RETURN((auto [batch, rows, cols]),
+                       SplitBatch2D(a.dimensions()));
+  int64_t m = transposed ? cols : rows;
+  int64_t n = transposed ? rows : cols;
+  int64_t k = std::min(m, n);
+  FFI_RETURN_IF_ERROR(
+      CheckShape(out->dimensions(), {batch, rows, cols}, "out", "gesdd"));
+  FFI_RETURN_IF_ERROR(CheckShape(s->dimensions(), {batch, k}, "s", "gesdd"));
+  if (compute_uv) {
+    if (full_matrices) {
+      FFI_RETURN_IF_ERROR(
+          CheckShape(u->dimensions(), {batch, m, m}, "u", "gesdd"));
+      FFI_RETURN_IF_ERROR(
+          CheckShape(vt->dimensions(), {batch, n, n}, "vt", "gesdd"));
+    } else {
+      FFI_RETURN_IF_ERROR(
+          CheckShape(u->dimensions(), {batch, m, k}, "u", "gesdd"));
+      FFI_RETURN_IF_ERROR(
+          CheckShape(vt->dimensions(), {batch, k, n}, "vt", "gesdd"));
+    }
+  }
+  FFI_RETURN_IF_ERROR(CheckShape(info->dimensions(), batch, "info", "gesdd"));
+
+  SOLVER_DISPATCH_IMPL(GesddImpl, batch, m, n, stream, scratch, full_matrices,
+                       compute_uv, a, out, s, u, vt, info);
+  return ffi::Error::InvalidArgument(absl::StrFormat(
+      "Unsupported dtype %s in gesdd", absl::FormatStreamed(dataType)));
+}
+
+XLA_FFI_DEFINE_HANDLER_SYMBOL(GesddFfi, GesddDispatch,
+                              ffi::Ffi::Bind()
+                                  .Ctx<ffi::PlatformStream<gpuStream_t>>()
+                                  .Ctx<ffi::ScratchAllocator>()
+                                  .Attr<bool>("full_matrices")
+                                  .Attr<bool>("compute_uv")
+                                  .Attr<bool>("transposed")
+                                  .Arg<ffi::AnyBuffer>()         // a
+                                  .Ret<ffi::AnyBuffer>()         // out
+                                  .Ret<ffi::AnyBuffer>()         // s
+                                  .Ret<ffi::AnyBuffer>()         // u
+                                  .Ret<ffi::AnyBuffer>()         // vt
+                                  .Ret<ffi::Buffer<ffi::S32>>()  // info
+);
+#endif  // JAX_GPU_HIP
+
 // Singular Value Decomposition: gesvdp (Polar decomposition)
 
 #ifdef JAX_GPU_CUDA
@@ -1277,10 +1445,6 @@ XLA_FFI_DEFINE_HANDLER_SYMBOL(GesvdpFfi, GesvdpDispatch,
                                   .Ret<ffi::Buffer<ffi::S32>>()  // info
 );
 
-#endif  // JAX_GPU_CUDA
-
-#ifdef JAX_GPU_CUDA
-
 // csrlsvqr: Linear system solve via Sparse QR
 
 template <typename T>
diff --git a/jaxlib/gpu/solver_kernels_ffi.h b/jaxlib/gpu/solver_kernels_ffi.h
index 176ab9932886..628db058ca2a 100644
--- a/jaxlib/gpu/solver_kernels_ffi.h
+++ b/jaxlib/gpu/solver_kernels_ffi.h
@@ -40,6 +40,10 @@ XLA_FFI_DECLARE_HANDLER_SYMBOL(GesvdFfi);
 XLA_FFI_DECLARE_HANDLER_SYMBOL(GesvdjFfi);
 XLA_FFI_DECLARE_HANDLER_SYMBOL(SytrdFfi);
 
+#ifdef JAX_GPU_HIP
+XLA_FFI_DECLARE_HANDLER_SYMBOL(GesddFfi);
+#endif  // JAX_GPU_HIP
+
 #ifdef JAX_GPU_CUDA
 XLA_FFI_DECLARE_HANDLER_SYMBOL(GesvdpFfi);
 XLA_FFI_DECLARE_HANDLER_SYMBOL(CsrlsvqrFfi);
diff --git a/jaxlib/rocm/BUILD b/jaxlib/rocm/BUILD
index 1b8e8dd1e64b..fc2424e45857 100644
--- a/jaxlib/rocm/BUILD
+++ b/jaxlib/rocm/BUILD
@@ -155,6 +155,7 @@ cc_library(
         "@com_google_absl//absl/strings:str_format",
         "@local_config_rocm//rocm:hipblas",
         "@local_config_rocm//rocm:hipsolver",
+        "@local_config_rocm//rocm:rocsolver",
     ],
 )
 
diff --git a/tests/export_back_compat_test.py b/tests/export_back_compat_test.py
index 41a4b99ed944..4688747f7bcc 100644
--- a/tests/export_back_compat_test.py
+++ b/tests/export_back_compat_test.py
@@ -34,12 +34,14 @@
 from jax._src.internal_test_util.export_back_compat_test_data import annotate_data_placement
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_cholesky_lapack_potrf
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_cholesky_solver_potrf
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_cholesky_solver_potrf
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_eig_lapack_geev
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_eigh_cusolver_syev
 from jax._src.internal_test_util.export_back_compat_test_data import rocm_eigh_hipsolver_syev
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_eigh_lapack_syev
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_lu_lapack_getrf
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_qr_cusolver_geqrf
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_qr_hipsolver_geqrf
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_qr_lapack_geqrf
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_schur_lapack_gees
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_svd_lapack_gesdd
@@ -48,10 +50,15 @@
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_tridiagonal_lapack_sytrd_hetrd
 from jax._src.internal_test_util.export_back_compat_test_data import cpu_tridiagonal_solve_lapack_gtsv
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_threefry2x32
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_threefry2x32
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_lu_pivots_to_permutation
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_lu_pivots_to_permutation
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_lu_cusolver_getrf
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_lu_rocsolver_getrf
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_svd_cusolver_gesvd
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_svd_hipsolver_gesvd
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_tridiagonal_cusolver_sytrd
+from jax._src.internal_test_util.export_back_compat_test_data import rocm_tridiagonal_hipsolver_sytrd
 from jax._src.internal_test_util.export_back_compat_test_data import cuda_tridiagonal_solve
 from jax._src.internal_test_util.export_back_compat_test_data import tpu_Eigh
 from jax._src.internal_test_util.export_back_compat_test_data import tpu_Lu
@@ -129,18 +136,25 @@ def test_custom_call_coverage(self):
     covering_testdatas = [
         *cpu_ffi_testdatas,
         cuda_cholesky_solver_potrf.data_2025_10_15,
+        rocm_cholesky_solver_potrf.data_2026_02_05,
         cuda_threefry2x32.data_2024_07_30,
+        rocm_threefry2x32.data_2026_02_05,
         cuda_lu_pivots_to_permutation.data_2025_04_01,
+        rocm_lu_pivots_to_permutation.data_2026_02_04,
         cuda_lu_cusolver_getrf.data_2024_08_19,
+        rocm_lu_rocsolver_getrf.data_2026_02_04,
         cuda_qr_cusolver_geqrf.data_2024_09_26,
+        rocm_qr_hipsolver_geqrf.data_2026_02_04,
         cuda_eigh_cusolver_syev.data_2024_09_30,
         cuda_svd_cusolver_gesvd.data_2024_10_08,
+        rocm_svd_hipsolver_gesvd.data_2026_02_04,
         cpu_tridiagonal_solve_lapack_gtsv.data_2025_01_09,
         cuda_tridiagonal_cusolver_sytrd.data_2025_01_09,
+        rocm_tridiagonal_hipsolver_sytrd.data_2026_02_04,
         cuda_tridiagonal_solve.data_2025_06_16,
         rocm_eigh_hipsolver_syev.data_2024_08_05,
         tpu_Eigh.data, tpu_Lu.data_2023_03_21, tpu_Qr.data_2023_03_17,
-        tpu_Sharding.data_2023_03_16, tpu_ApproxTopK.data_2023_04_17,
+        tpu_Sharding.data_2025_06_30, tpu_ApproxTopK.data_2023_04_17,
         tpu_ApproxTopK.data_2023_05_16,
         tpu_stablehlo_dynamic_reduce_window.data_unary_2023_06_17,
         tpu_stablehlo_dynamic_reduce_window.data_variadic_2023_06_17,
@@ -150,6 +164,7 @@ def test_custom_call_coverage(self):
         stablehlo_dynamic_approx_top_k.data_2024_05_30,
         annotate_data_placement.data_2025_04_07_tpu,
         annotate_data_placement.data_2025_04_07_cuda,
+        annotate_data_placement.data_2026_02_04_rocm,
     ]
     # Some of the above are nested structures.
     covering_testdatas = itertools.chain(
@@ -169,10 +184,9 @@ def test_custom_call_coverage(self):
       "AllocateBuffer",  # tested in pallas/export_back_compat_pallas_test.py
       "__gpu$xla.gpu.triton",  # tested in pallas/export_back_compat_pallas_test.py
       # The following require ROCm to test
-      "hip_lu_pivots_to_permutation", "hipsolver_getrf_ffi",
       "hipsolver_geqrf_ffi", "hipsolver_orgqr_ffi", "hipsolver_syevd_ffi",
       "hipsolver_gesvd_ffi", "hipsolver_gesvdj_ffi",
-      "hipsolver_potrf_ffi",
+      # hipsolver_gesdd_ffi is covered by rocm_svd_hipsolver_gesvd (gesdd f32).
     })
     not_covered = targets_to_cover.difference(covered_targets)
     self.assertEmpty(not_covered,
@@ -222,7 +236,14 @@ def test_gpu_cholesky_solver_potrf(self, dtype_name="f32"):
     rtol = dict(f32=1e-3, f64=1e-5, c64=1e-3, c128=1e-5)[dtype_name]
     atol = dict(f32=1e-4, f64=1e-12, c64=1e-4, c128=1e-12)[dtype_name]
 
-    info = cuda_cholesky_solver_potrf.data_2025_10_15[dtype_name]
+    # Select test data based on platform
+    if jtu.test_device_matches(["rocm"]):
+      info = rocm_cholesky_solver_potrf.data_2026_02_05[dtype_name]
+    elif jtu.test_device_matches(["cuda"]):
+      info = cuda_cholesky_solver_potrf.data_2025_10_15[dtype_name]
+    else:
+      self.skipTest("Unsupported platform")
+
     data = self.load_testdata(info)
     self.run_one_test(func, data, rtol=rtol, atol=atol)
 
@@ -334,7 +355,6 @@ def test_cpu_eigh_lapack_syevd(self, dtype_name="f32"):
     rtol = dict(f32=1e-3, f64=1e-5, c64=1e-3, c128=1e-5)[dtype_name]
     atol = dict(f32=1e-4, f64=1e-12, c64=1e-4, c128=1e-12)[dtype_name]
 
-    info = cpu_eigh_lapack_syev.data_2024_08_19[dtype_name]
     data = self.load_testdata(cpu_eigh_lapack_syev.data_2024_08_19[dtype_name])
     self.run_one_test(func, data, rtol=rtol, atol=atol,
                       check_results=partial(self.check_eigh_results, operand))
@@ -382,6 +402,12 @@ def test_cuda_lu_pivots_to_permutation(self):
     data = self.load_testdata(cuda_lu_pivots_to_permutation.data_2025_04_01)
     self.run_one_test(func, data)
 
+  def test_rocm_lu_pivots_to_permutation(self):
+    shape = (2, 3, 4)
+    func = lambda: CompatTest.lu_pivots_to_permutation_harness(shape)
+    data = self.load_testdata(rocm_lu_pivots_to_permutation.data_2026_02_04)
+    self.run_one_test(func, data)
+
   @parameterized.named_parameters(
       dict(testcase_name=f"_dtype={dtype_name}",
            dtype_name=dtype_name)
@@ -396,6 +422,23 @@ def test_cuda_lu_cusolver_getrf(self, dtype_name:str):
     data = self.load_testdata(cuda_lu_cusolver_getrf.data_2024_08_19[dtype_name])
     self.run_one_test(func, data)
 
+  @parameterized.named_parameters(
+      dict(testcase_name=f"_dtype={dtype_name}",
+           dtype_name=dtype_name)
+      for dtype_name in ("f32", "f64", "c64", "c128"))
+  def test_rocm_lu_rocsolver_getrf(self, dtype_name:str):
+    if not jtu.test_device_matches(["rocm"]):
+      self.skipTest("ROCm only test")
+    if not config.enable_x64.value and dtype_name in ["f64", "c128"]:
+      self.skipTest("Test disabled for x32 mode")
+    dtype = dict(f32=np.float32, f64=np.float64,
+                 c64=np.complex64, c128=np.complex128)[dtype_name]
+    shape = (3, 4)
+    func = lambda: CompatTest.lu_harness(shape, dtype)
+    data = self.load_testdata(rocm_lu_rocsolver_getrf.data_2026_02_04[dtype_name])
+    self.run_one_test(func, data)
+
+
   @staticmethod
   def qr_harness(shape, dtype):
     # In order to keep inputs small, we construct the input programmatically
@@ -421,8 +464,6 @@ def test_cpu_qr_lapack_geqrf(self, dtype_name="f32"):
       dict(testcase_name=f"_dtype={dtype_name}", dtype_name=dtype_name)
       for dtype_name in ("f32", "f64", "c64", "c128"))
   def test_gpu_qr_solver_geqrf(self, dtype_name="f32"):
-    if not jtu.test_device_matches(["cuda"]):
-      self.skipTest("Unsupported platform")
     if not config.enable_x64.value and dtype_name in ["f64", "c128"]:
       self.skipTest("Test disabled for x32 mode")
     dtype = dict(f32=np.float32, f64=np.float64,
@@ -430,7 +471,18 @@ def test_gpu_qr_solver_geqrf(self, dtype_name="f32"):
     rtol = dict(f32=1e-3, f64=1e-5, c64=1e-3, c128=1e-5)[dtype_name]
     shape = (2, 3, 3)
     func = lambda: CompatTest.qr_harness(shape, dtype)
-    data = self.load_testdata(cuda_qr_cusolver_geqrf.data_2024_09_26[dtype_name])
+
+    platform_data = None
+    if jtu.test_device_matches(["cuda"]):
+      platform_data = \
+          cuda_qr_cusolver_geqrf.data_2024_09_26[dtype_name]
+    elif jtu.test_device_matches(["rocm"]):
+      platform_data = \
+          rocm_qr_hipsolver_geqrf.data_2026_02_04[dtype_name]
+    else:
+      self.skipTest("Unsupported platform")
+
+    data = self.load_testdata(platform_data)
     self.run_one_test(func, data, rtol=rtol)
 
   def test_tpu_Qr(self):
@@ -606,26 +658,59 @@ def func(operand):
                                             *data.inputs))
 
   @parameterized.named_parameters(
-      dict(testcase_name=f"_dtype={dtype_name}_algorithm={algorithm_name}",
-           dtype_name=dtype_name, algorithm_name=algorithm_name)
-      for dtype_name in ("f32", "f64", "c64", "c128")
-      for algorithm_name in ("qr", "jacobi"))
+      [
+          dict(testcase_name=f"_dtype={dtype_name}_algorithm={algorithm_name}",
+               dtype_name=dtype_name, algorithm_name=algorithm_name)
+          for dtype_name in ("f32", "f64", "c64", "c128")
+          for algorithm_name in ("qr", "jacobi")
+      ] + [
+          dict(testcase_name=f"_dtype={dtype_name}_algorithm=gesdd",
+               dtype_name=dtype_name, algorithm_name="gesdd")
+          for dtype_name in ("f32", "f64", "c64", "c128")
+      ])
   @jax.default_matmul_precision("float32")
   def test_gpu_svd_solver_gesvd(self, dtype_name, algorithm_name):
     if not config.enable_x64.value and dtype_name in ["f64", "c128"]:
       self.skipTest("Test disabled for x32 mode")
 
+    algorithm = dict(
+        qr=lax.linalg.SvdAlgorithm.QR,
+        jacobi=lax.linalg.SvdAlgorithm.JACOBI,
+        gesdd=lax.linalg.SvdAlgorithm.DEFAULT,  # ROCm uses gesdd by default
+    )[algorithm_name]
+
     def func(operand):
       return lax.linalg.svd(operand, full_matrices=True, compute_uv=True,
                             algorithm=algorithm)
 
     rtol = dict(f32=1e-3, f64=1e-5, c64=1e-3, c128=1e-5)[dtype_name]
     atol = dict(f32=1e-4, f64=1e-12, c64=1e-4, c128=1e-12)[dtype_name]
-    algorithm = dict(qr=lax.linalg.SvdAlgorithm.QR,
-                     jacobi=lax.linalg.SvdAlgorithm.JACOBI)[algorithm_name]
 
-    info = cuda_svd_cusolver_gesvd.data_2024_10_08[algorithm_name][dtype_name]
-    data = self.load_testdata(info)
+    # The `platform_data_map` dictionary allows additional testdata modules
+    # to be easily added to the unit test. If no acceptable testdata is found
+    # for the current platform, the test will be skipped. "gesdd" exists only
+    # for ROCm (CUDA uses gesvd/gesvdj).
+    platform_data = None
+    platform_data_map = {
+        "cuda": cuda_svd_cusolver_gesvd.data_2024_10_08,
+        "rocm": rocm_svd_hipsolver_gesvd.data_2026_02_04,
+    }
+
+    for platform, data_module in platform_data_map.items():
+      if jtu.test_device_matches([platform]):
+        if algorithm_name not in data_module:
+          continue  # e.g. CUDA has no "gesdd" data
+        if dtype_name not in data_module[algorithm_name]:
+          self.skipTest(
+              f"Test data for {algorithm_name} {dtype_name} not yet generated "
+              "(run on ROCm and paste into rocm_svd_hipsolver_gesvd.py)")
+        platform_data = data_module[algorithm_name][dtype_name]
+        break
+
+    if platform_data is None:
+      self.skipTest("Unsupported platform: " + jtu.device_under_test())
+
+    data = self.load_testdata(platform_data)
     self.run_one_test(func, data, rtol=rtol, atol=atol,
                       check_results=partial(self.check_svd_results,
                                             *data.inputs))
@@ -742,9 +827,17 @@ def func(x):
     rtol = dict(f32=1e-3, f64=1e-5, c64=1e-3, c128=1e-5)[dtype_name]
     atol = dict(f32=1e-4, f64=1e-12, c64=1e-4, c128=1e-12)[dtype_name]
 
-    data = self.load_testdata(
-        cuda_tridiagonal_cusolver_sytrd.data_2025_01_09[dtype_name]
-    )
+    platform_data = None
+    if jtu.test_device_matches(["cuda"]):
+      platform_data = \
+          cuda_tridiagonal_cusolver_sytrd.data_2025_01_09[dtype_name]
+    elif jtu.test_device_matches(["rocm"]):
+      platform_data = \
+          rocm_tridiagonal_hipsolver_sytrd.data_2026_02_04[dtype_name]
+    else:
+      self.skipTest("Unsupported platform")
+
+    data = self.load_testdata(platform_data)
     self.run_one_test(func, data, rtol=rtol, atol=atol)
 
   @parameterized.named_parameters(
@@ -755,7 +848,6 @@ def test_gpu_tridiagonal_solve(self, dtype_name):
     if not config.enable_x64.value and dtype_name == "f64":
       self.skipTest("Test disabled for x32 mode")
 
-    dtype = dict(f32=np.float32, f64=np.float64)[dtype_name]
     def func(dl, d, du, b):
       return lax.linalg.tridiagonal_solve(dl, d, du, b)
 
@@ -784,6 +876,13 @@ def func(x):
       data = self.load_testdata(cuda_threefry2x32.data_2024_07_30)
       self.run_one_test(func, data)
 
+  def test_rocm_threefry2x32(self):
+    with config.threefry_partitionable(False):
+      def func(x):
+        return jax.random.uniform(x, (2, 4), dtype=np.float32)
+      data = self.load_testdata(rocm_threefry2x32.data_2026_02_05)
+      self.run_one_test(func, data)
+
   def test_tpu_sharding(self):
     # Tests "Sharding", "SPMDShardToFullShape", "SPMDFullToShardShape" on TPU
     if not jtu.test_device_matches(["tpu"]) or len(jax.devices()) < 2:
@@ -805,7 +904,6 @@ def func(x):  # b: f32[2, 4]
       return lax.ppermute(x, "a", perm=perm)
 
     data = [
-        (tpu_Sharding.data_2023_03_16, []),
         (tpu_Sharding.data_2025_06_30, None),
     ]
     # Due to changes in how Shardy is serialized, from using custom calls to
@@ -840,11 +938,16 @@ def test_annotate_device_placement(self, platform):
     def func(x, y):
       return x + y
 
+    # Check the actual GPU backend type to load appropriate test data
     if platform == "tpu":
       data = [(annotate_data_placement.data_2025_04_07_tpu,
                ["annotate_device_placement"]),
               (annotate_data_placement.data_2025_06_30_tpu, None)]
-    else:
+    elif jtu.test_device_matches(["rocm"]):
+      # ROCm test data - currently only have one version (Feb 2026)
+      data = [(annotate_data_placement.data_2026_02_04_rocm,
+               ["annotate_device_placement"])]
+    else:  # cuda
       data = [(annotate_data_placement.data_2025_04_07_cuda,
                ["annotate_device_placement"]),
               (annotate_data_placement.data_2025_06_30_cuda, None)]
@@ -1031,7 +1134,6 @@ def shard_map_func(x):  # b: f32[2, 4]
       return shard_map_func(x)
 
     data = [
-        (shardy_sharding_ops_with_different_meshes.data_2025_04_14, []),
         (shardy_sharding_ops_with_different_meshes.data_2025_06_30, None),
     ]
 
diff --git a/tests/lax_scipy_test.py b/tests/lax_scipy_test.py
index fbc74cc6d072..7ca2bc4a66b1 100644
--- a/tests/lax_scipy_test.py
+++ b/tests/lax_scipy_test.py
@@ -616,8 +616,11 @@ def testPolar(
     elif side == "left":
       recon = jnp.matmul(posdef, unitary, precision=lax.Precision.HIGHEST)
     with self.subTest('Test reconstruction.'):
-      self.assertAllClose(
-        matrix, recon, atol=tol * jnp.linalg.norm(matrix))
+      recon_atol = tol * jnp.linalg.norm(matrix)
+      if method == "svd" and not jtu.test_device_matches(["cpu"]):
+        # SVD-backed polar reconstruction can accumulate error on GPU (e.g. ROCm).
+        recon_atol = max(recon_atol, 6e-5)
+      self.assertAllClose(matrix, recon, atol=recon_atol)
 
   @jtu.sample_product(
     n_obs=[1, 3, 5],
diff --git a/tests/svd_test.py b/tests/svd_test.py
index a04b25046370..b97a40dbcaf6 100644
--- a/tests/svd_test.py
+++ b/tests/svd_test.py
@@ -309,6 +309,55 @@ def testSvdSubsetByIndex(self, start, end):
     s_slice = full_s[start:end]
     self.assertAllClose(s_slice, s, atol=tol, rtol=tol)
 
+  @jtu.sample_product(
+      shape=[(8, 8), (16, 12), (32, 32), (64, 48)],
+      full_matrices=[True, False],
+  )
+  @jtu.run_on_devices('rocm')
+  def testGesddRocm(self, shape, full_matrices):
+    """Unit test for ROCm gesdd (divide-and-conquer SVD) backend."""
+    m, n = shape
+    dtype = np.float32
+    rng = jtu.rand_default(self.rng())
+    tol = 50 * np.finfo(dtype).eps
+    # Reconstruction and orthogonality can accumulate error in float32 on GPU.
+    # ROCm gesdd numerics can vary across drivers/hardware (CI vs local).
+    recon_tol = max(tol, 2e-2)
+    recon_rtol = max(tol, 1e-2)
+    # Orthogonality (u.T@u, vt@vt.T): relaxed for ROCm float32 (~2.5e-3).
+    _orth = 2.5e-3
+
+    def args_maker():
+      return [rng((m, n), dtype)]
+
+    a, = args_maker()
+    u, s, vt = jnp.linalg.svd(a, full_matrices=full_matrices)
+    k = min(m, n)
+    self.assertEqual(u.shape, (m, m if full_matrices else k))
+    self.assertEqual(s.shape, (k,))
+    self.assertEqual(vt.shape, (n if full_matrices else k, n))
+
+    # Reconstruct using first k components (u[:, :k], s, vt[:k, :]) so shapes
+    # broadcast correctly for both full_matrices=True and False.
+    a_recon = (u[:, :k] * s) @ vt[:k, :]
+    self.assertAllClose(a, a_recon, atol=recon_tol, rtol=recon_rtol)
+
+    # Compare singular values to NumPy
+    expected_s = np.linalg.svd(np.asarray(a), compute_uv=False)
+    self.assertAllClose(s, expected_s, atol=tol, rtol=tol)
+
+    # U and Vt are orthogonal (up to tolerance). Use _orth for ROCm float32.
+    with jax.numpy_rank_promotion('allow'):
+      self.assertAllClose(
+          u.T @ u, np.eye(u.shape[1], dtype=dtype), atol=_orth, rtol=_orth)
+      self.assertAllClose(
+          vt @ vt.T, np.eye(vt.shape[0], dtype=dtype), atol=_orth, rtol=_orth)
+
+    # JIT compatibility
+    def svd_fn(x):
+      return jnp.linalg.svd(x, full_matrices=full_matrices)
+    self._CompileAndCheck(svd_fn, args_maker, rtol=_SVD_RTOL, atol=1e-5)
+
 
 if __name__ == '__main__':
   absltest.main(testLoader=jtu.JaxTestLoader())