Add simple heuristic to decide if TensorReshape should be folded during fusion (#5797) This solves a performance regression on MobileBert.

commit: 59c709831d0ce86373a78df3ccaa36335f112e1b [log] [tgz]
author: Thomas <thomasraoux@google.com> Fri May 07 14:18:47 2021 -0700
committer: GitHub <noreply@github.com> Fri May 07 14:18:47 2021 -0700
tree: 7b2ffe569c4773522b85cd95bdc3e9fb867fe177
parent: dcc38a9eb96e93d397376d255689bc6a4a1ed13e [diff]
diff --git a/iree/compiler/Conversion/HLOToLinalg/FusionOfTensorOps.cpp b/iree/compiler/Conversion/HLOToLinalg/FusionOfTensorOps.cpp
index f6e3b9e..3034e91 100644
--- a/iree/compiler/Conversion/HLOToLinalg/FusionOfTensorOps.cpp
+++ b/iree/compiler/Conversion/HLOToLinalg/FusionOfTensorOps.cpp

@@ -108,14 +108,20 @@
           }
           return numUsers.empty();
         };
-    linalg::ControlElementwiseOpsFusionFn foldAllFn =
+    // Simple heuristic to decide if a reshape should be folded into the linalg
+    // op. If the source of the reshape is a linalg op, fold it to potentially
+    // allow the two linalg ops to be fused. Otherwise leave it to avoid adding
+    // dimensions to the consumer linalg op.
+    linalg::ControlElementwiseOpsFusionFn foldReshapeBetweenLinalgFn =
         [](const OpResult &producer, const OpOperand &consumer) {
-          return true;
+          auto reshapeOp = producer.getDefiningOp<linalg::TensorReshapeOp>();
+          return reshapeOp.src().getDefiningOp<linalg::LinalgOp>() != nullptr;
         };
     linalg::populateElementwiseOpsFusionPatterns(
-        fusionPatterns, linalg::LinalgElementwiseFusionOptions()
-                            .setControlFoldingReshapes(foldAllFn)
-                            .setControlElementwiseOpsFusionFn(controlFn));
+        fusionPatterns,
+        linalg::LinalgElementwiseFusionOptions()
+            .setControlFoldingReshapes(foldReshapeBetweenLinalgFn)
+            .setControlElementwiseOpsFusionFn(controlFn));
 
     (void)applyPatternsAndFoldGreedily(op->getRegions(),
                                        std::move(fusionPatterns));
commit	59c709831d0ce86373a78df3ccaa36335f112e1b	[log] [tgz]
author	Thomas <thomasraoux@google.com>	Fri May 07 14:18:47 2021 -0700
committer	GitHub <noreply@github.com>	Fri May 07 14:18:47 2021 -0700
tree	7b2ffe569c4773522b85cd95bdc3e9fb867fe177
parent	dcc38a9eb96e93d397376d255689bc6a4a1ed13e [diff]