alibaba · eedalong · Feb 26, 2024 · Jan 22, 2024 · Jan 22, 2024 · Feb 22, 2024
diff --git a/tao_compiler/mlir/disc/transforms/disc_lower_to_library_call.cc b/tao_compiler/mlir/disc/transforms/disc_lower_to_library_call.cc
@@ -494,7 +494,7 @@ struct TransposeConverter : public OpRewritePattern<lmhlo::TransposeOp> {
     if (rank != 2 && rank != 3) return failure();
     // only rewriter custom library when switch 1 and 2 dimensions of
     // a 3d tensor, that means permute = [0, 2, 1]
-    if (rank == 3 && permutation[1] != 2 && permutation[2] != 1)
+    if (rank == 3 && (permutation[1] != 2 || permutation[2] != 1))
       return failure();
     bool on_gpu = placement_utils::isGpuMemRef(op->getOperand(0));
     // TODO: support other device
@@ -914,8 +914,7 @@ struct DiscLowerToLibraryCallPass
       SendOutputOpConvertor
     >(context);
     // clang-format on
-    if (enableTransposeLibraryCall())
-      patterns.insert<TransposeConverter>(context);
+    patterns.insert<TransposeConverter>(context);
 
     // GPU copy related ops
     patterns.insert<GpuCopyOpConvertor<H2DOp>>(context, "h2d");