[XLA:GPU] NFC: Avoid redundant BitcastMap.

There is no need to first bitcast to the hero shape and then to the root shape. We can directly bitcast to the root shape. PiperOrigin-RevId: 664678219
Intel-tensorflow · Aug 19, 2024 · a6b5bdb · a6b5bdb
1 parent 1fd3fa4
commit a6b5bdb
Showing 1 changed file with 2 additions and 6 deletions.
diff --git a/third_party/xla/xla/service/gpu/fusions/transpose_mlir.cc b/third_party/xla/xla/service/gpu/fusions/transpose_mlir.cc
@@ -167,12 +167,8 @@ std::optional<IndexingMap> MlirTransposeFusion::ComputeThreadIdToOutputIndexing(
           analysis_.fusion_root(root_index).instruction(), hero)) {
     // The shape of non-transpose roots are bitcast compatible with the input
     // shape of transpose heroes.
-    auto map = ComposeIndexingMaps(
-        GetIndexing(/*input=*/true, hero.shape(), mlir_context),
-        GetBitcastMap(hero.shape(), analysis_.fusion_root(root_index).shape(),
-                      mlir_context));
-    map.Simplify();
-    return map;
+    return GetIndexing(/*input=*/true,
+                       analysis_.fusion_root(root_index).shape(), mlir_context);
   }
   return GetIndexing(/*input=*/false, hero.shape(), mlir_context);
 }