IntelPython
diff --git a/‎mlir-compiler/mlir-compiler/src/pipelines/plier_to_linalg.cpp‎
Lines changed: 149 additions & 42 deletions b/‎mlir-compiler/mlir-compiler/src/pipelines/plier_to_linalg.cpp‎
Lines changed: 149 additions & 42 deletions
diff --git a/‎mlir-compiler/mlir-compiler/src/py_linalg_resolver.cpp‎
Lines changed: 4 additions & 2 deletions b/‎mlir-compiler/mlir-compiler/src/py_linalg_resolver.cpp‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎mlir-compiler/plier/CMakeLists.txt‎
Lines changed: 4 additions & 0 deletions b/‎mlir-compiler/plier/CMakeLists.txt‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎mlir-compiler/plier/include/plier/PlierOps.td‎
Lines changed: 14 additions & 0 deletions b/‎mlir-compiler/plier/include/plier/PlierOps.td‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎mlir-compiler/plier/include/plier/rewrites/common_opts.hpp‎
Lines changed: 12 additions & 0 deletions b/‎mlir-compiler/plier/include/plier/rewrites/common_opts.hpp‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎mlir-compiler/plier/include/plier/rewrites/cse.hpp‎
Lines changed: 3 additions & 3 deletions b/‎mlir-compiler/plier/include/plier/rewrites/cse.hpp‎
Lines changed: 3 additions & 3 deletions
@@ -27,6 +27,7 @@
 #include "plier/rewrites/call_lowering.hpp"
 #include "plier/rewrites/canonicalize_reductions.hpp"
 #include "plier/rewrites/cast_lowering.hpp"
+#include "plier/rewrites/common_opts.hpp"
 #include "plier/rewrites/cse.hpp"
 #include "plier/rewrites/promote_to_parallel.hpp"
 #include "plier/rewrites/type_conversion.hpp"
@@ -722,6 +723,103 @@ struct BinopRewriter : public mlir::OpRewritePattern<plier::BinOp>
     resolver_t resolver;
 };
 
+struct SimplifyExpandDims : public mlir::OpRewritePattern<mlir::linalg::GenericOp> // Turns constant-0 results of the input indexing map into plain dim expressions where the output extent is statically 1.
+{
+    using mlir::OpRewritePattern<mlir::linalg::GenericOp>::OpRewritePattern; // Inherit the base pattern constructors.
+
+    mlir::LogicalResult matchAndRewrite( // Succeeds only if the input indexing map was rewritten; otherwise `op` is left untouched.
+        mlir::linalg::GenericOp op, mlir::PatternRewriter &rewriter) const override
+    {
+        if (!op.hasTensorSemantics()) // Only tensor-semantics generics are handled.
+        {
+            return mlir::failure();
+        }
+        if (op.getNumInputs() != 1 || op.getNumOutputs() != 1) // Restrict to the one-input / one-output form.
+        {
+            return mlir::failure();
+        }
+
+        auto context = op.getContext();
+        auto parallel_attr = mlir::StringAttr::get(context, "parallel");
+        if (llvm::any_of(op.iterator_types(), [&](auto attr) { return  attr != parallel_attr; })) // Any iterator that is not "parallel" disqualifies the op.
+        {
+            return mlir::failure();
+        }
+
+        auto maps = op.indexing_maps();
+        assert(maps.size() == 2); // maps[0] is read as the input map and maps[1] as the output map below.
+        auto out_map = maps[1].cast<mlir::AffineMapAttr>().getValue();
+        if (!out_map.isIdentity()) // The output must be indexed by the identity map.
+        {
+            return mlir::failure();
+        }
+        auto in_map = maps[0].cast<mlir::AffineMapAttr>().getValue();
+        auto num_dims = op.getNumLoops();
+        if (in_map.getNumResults() != num_dims) // One input-map result per loop is required so result i can be paired with out_shape[i].
+        {
+            return mlir::failure();
+        }
+
+        bool changed = false; // Set once at least one map result has been replaced.
+        auto out_shape = op.getOutput(0).getType().cast<mlir::RankedTensorType>().getShape();
+        llvm::SmallVector<mlir::AffineExpr> exprs(num_dims); // Results of the rebuilt input map.
+        for (unsigned i = 0; i < num_dims; ++i)
+        {
+            auto prev_expr = in_map.getResult(i);
+            bool can_convert = [&]() // True when out_shape[i] is exactly 1 and the current result is the constant 0.
+            {
+                if (out_shape[i] == 1)
+                {
+                    auto const_expr = prev_expr.dyn_cast<mlir::AffineConstantExpr>();
+                    if (const_expr && const_expr.getValue() == 0)
+                    {
+                        return true;
+                    }
+                }
+                return false;
+            }();
+            if (can_convert)
+            {
+                changed = true;
+                exprs[i] = mlir::getAffineDimExpr(i, context); // Use d_i instead of 0; presumably equivalent because d_i can only be 0 over a unit extent - TODO confirm.
+            }
+            else
+            {
+                exprs[i] = prev_expr; // Keep every other result as it was.
+            }
+        }
+
+        if (changed)
+        {
+            const mlir::Attribute new_maps[] = { // Rebuilt input map followed by the unchanged output map.
+                mlir::AffineMapAttr::get(mlir::AffineMap::get(num_dims, 0, exprs, context)),
+                maps[1]
+            };
+            auto new_maps_attr = mlir::ArrayAttr::get(context, new_maps);
+            rewriter.updateRootInPlace(op, [&]() // The attribute is swapped in place, through the rewriter.
+            {
+                op.indexing_mapsAttr(new_maps_attr);
+            });
+        }
+
+        return mlir::success(changed); // Reports failure when nothing was rewritten.
+    }
+};
+
+struct LowerEnforceShape : public mlir::OpRewritePattern<plier::EnforceShapeOp> // Replaces every plier::EnforceShapeOp with a tensor::CastOp to the op's result type.
+{
+    using mlir::OpRewritePattern<plier::EnforceShapeOp>::OpRewritePattern; // Inherit the base pattern constructors.
+
+    mlir::LogicalResult matchAndRewrite( // Always succeeds; there is no bail-out path.
+        plier::EnforceShapeOp op, mlir::PatternRewriter &rewriter) const override
+    {
+        auto type = op.getType(); // Result type of the op, used as the cast target.
+        auto src = op.value(); // Tensor operand; the op's `sizes` operands are not read here.
+        rewriter.replaceOpWithNewOp<mlir::tensor::CastOp>(op, type, src);
+        return mlir::success();
+    }
+};
+
 void PlierToLinalgPass::runOnOperation()
 {
     auto context = &getContext();
@@ -801,38 +899,61 @@ void LowerLinalgPass::runOnOperation()
     (void)mlir::applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
 }
 
-struct CommonOptPass :
-    public mlir::PassWrapper<CommonOptPass, mlir::OperationPass<mlir::ModuleOp>>
+struct PostPlierToLinalgPass : // Module-level pass scheduled right after PlierToLinalgPass in the gen pipeline.
+    public mlir::PassWrapper<PostPlierToLinalgPass, mlir::OperationPass<mlir::ModuleOp>>
 {
-    virtual void getDependentDialects(
-        mlir::DialectRegistry &registry) const override
-    {
-        registry.insert<mlir::StandardOpsDialect>();
-        registry.insert<mlir::linalg::LinalgDialect>();
-        registry.insert<mlir::scf::SCFDialect>();
-        registry.insert<mlir::AffineDialect>();
-    }
+    void runOnOperation() override; // Defined out of line below.
+};
+
+void PostPlierToLinalgPass::runOnOperation() // Greedily applies the common optimization patterns plus SimplifyExpandDims to the module.
+{
+    mlir::OwningRewritePatternList patterns;
+
+    auto& context = getContext();
+    plier::populate_common_opts_patterns(context, patterns); // Shared pattern set declared in plier/rewrites/common_opts.hpp.
 
+    patterns.insert<
+        SimplifyExpandDims
+        >(&getContext()); // NOTE(review): the local `context` could be used here, as PostLinalgOptPass does.
+
+    (void)mlir::applyPatternsAndFoldGreedily(getOperation(), std::move(patterns)); // The result is explicitly discarded via (void).
+}
+
+struct TensorFusionPass : // Module-level pass added first in populate_plier_to_linalg_opt_pipeline.
+    public mlir::PassWrapper<TensorFusionPass, mlir::OperationPass<mlir::ModuleOp>>
+{
     void runOnOperation() override;
 };
 
-void CommonOptPass::runOnOperation()
+void TensorFusionPass::runOnOperation() // Runs common opts, SimplifyExpandDims, LowerEnforceShape and the linalg tensor-fusion patterns in a single greedy rewrite.
 {
     mlir::OwningRewritePatternList patterns;
 
     auto& context = getContext();
-    for (auto *op : context.getRegisteredOperations())
-    {
-        op->getCanonicalizationPatterns(patterns, &context);
-    }
+    plier::populate_common_opts_patterns(context, patterns); // Shared pattern set declared in plier/rewrites/common_opts.hpp.
 
     patterns.insert<
-        //        LoopInvariantCodeMotion, TODO
-        plier::ForceInline,
-        plier::CSERewrite<mlir::FuncOp>
-        >(&context);
+        SimplifyExpandDims,
+        LowerEnforceShape
+        >(&getContext()); // NOTE(review): the local `context` could be used here, as on the fusion call below.
+
+    mlir::populateLinalgTensorOpsFusionPatterns(&context, patterns); // Pattern-based form of the fusion previously run via createLinalgFusionOfTensorOpsPass in the opt pipeline.
 
-    plier::populate_index_propagate_patterns(context, patterns);
+    (void)mlir::applyPatternsAndFoldGreedily(getOperation(), std::move(patterns)); // The result is explicitly discarded via (void).
+}
+
+struct CommonOptPass : // Module-level pass that applies only the shared common-opts pattern set.
+    public mlir::PassWrapper<CommonOptPass, mlir::OperationPass<mlir::ModuleOp>>
+{
+    void runOnOperation() override; // Defined out of line below.
+};
+
+void CommonOptPass::runOnOperation() // Greedily applies the patterns from plier::populate_common_opts_patterns to the module.
+{
+    mlir::OwningRewritePatternList patterns;
+
+    auto& context = getContext();
+    plier::populate_common_opts_patterns(context, patterns); // No pass-specific patterns are added on top.
 
     (void)mlir::applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
 }
@@ -897,15 +1018,6 @@ void RetainArgsPass::runOnFunction()
 struct PostLinalgOptPass : // Module-level pass; the opt pipeline schedules it after LowerLinalgPass.
     public mlir::PassWrapper<PostLinalgOptPass, mlir::OperationPass<mlir::ModuleOp>>
 {
-    virtual void getDependentDialects(
-        mlir::DialectRegistry &registry) const override
-    {
-        registry.insert<mlir::StandardOpsDialect>();
-        registry.insert<mlir::linalg::LinalgDialect>();
-        registry.insert<mlir::scf::SCFDialect>();
-        registry.insert<mlir::AffineDialect>();
-    }
-
     void runOnOperation() override; // Defined out of line below.
 };
 
@@ -914,35 +1026,26 @@ void PostLinalgOptPass::runOnOperation()
     mlir::OwningRewritePatternList patterns;
 
     auto& context = getContext();
-    for (auto *op : context.getRegisteredOperations())
-    {
-        op->getCanonicalizationPatterns(patterns, &context);
-    }
+    plier::populate_common_opts_patterns(context, patterns);
 
     patterns.insert<
         plier::CanonicalizeReduction,
-//        LoopInvariantCodeMotion, TODO
-        plier::PromoteToParallel,
-        plier::CmpLoopBoundsSimplify,
-        plier::CSERewrite<mlir::FuncOp>
+        plier::PromoteToParallel
         >(&context);
 
-    plier::populate_index_propagate_patterns(context, patterns);
-
     (void)mlir::applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
 }
 
 void populate_plier_to_linalg_gen_pipeline(mlir::OpPassManager& pm) // Appends the plier-to-linalg generation passes to `pm` in the order below.
 {
     pm.addPass(std::make_unique<PlierToLinalgPass>());
-    pm.addPass(std::make_unique<CommonOptPass>());
+    pm.addPass(std::make_unique<PostPlierToLinalgPass>()); // Common opts plus SimplifyExpandDims; takes the slot CommonOptPass used to occupy.
     pm.addPass(mlir::createSymbolDCEPass());
 }
 
 void populate_plier_to_linalg_opt_pipeline(mlir::OpPassManager& pm)
 {
-    pm.addPass(mlir::createLinalgFusionOfTensorOpsPass());
-    pm.addPass(std::make_unique<CommonOptPass>());
+    pm.addPass(std::make_unique<TensorFusionPass>());
 
     pm.addPass(mlir::createTensorConstantBufferizePass());
     pm.addNestedPass<mlir::FuncOp>(mlir::createSCFBufferizePass());
@@ -958,10 +1061,14 @@ void populate_plier_to_linalg_opt_pipeline(mlir::OpPassManager& pm)
 
     pm.addNestedPass<mlir::FuncOp>(std::make_unique<RetainArgsPass>());
     pm.addNestedPass<mlir::FuncOp>(mlir::createBufferDeallocationPass());
+    pm.addPass(mlir::createCopyRemovalPass());
 
     pm.addPass(std::make_unique<LowerLinalgPass>());
+    pm.addPass(mlir::createParallelLoopFusionPass());
     pm.addPass(std::make_unique<PostLinalgOptPass>());
     pm.addPass(mlir::createSymbolDCEPass());
+    pm.addPass(mlir::createParallelLoopFusionPass()); // TODO: make this rewrite and add to PostLinalgOptPass
+    pm.addPass(std::make_unique<PostLinalgOptPass>());
 }
 }
 
 
@@ -452,8 +452,9 @@ mlir::Value expand_dim(mlir::OpBuilder& builder, mlir::Location loc, mlir::Value
     {
         assert(dim < shape.size());
         shape[dim] = 1;
-        mlir::Type casted_type = mlir::RankedTensorType::get(shape, src_type.getElementType());
-        auto casted = builder.create<mlir::tensor::CastOp>(loc, casted_type, src).getResult();
+//        mlir::Type casted_type = mlir::RankedTensorType::get(shape, src_type.getElementType());
+//        auto casted = builder.create<mlir::tensor::CastOp>(loc, casted_type, src).getResult();
+        auto casted = src; // TODO
         auto init = builder.create<mlir::linalg::InitTensorOp>(loc, new_shape, src_type.getElementType()).getResult();
         llvm::SmallVector<mlir::AffineExpr> exprs(num_dims);
         for (unsigned i = 0; i < num_dims; ++i)
@@ -503,6 +504,7 @@ mlir::Value expand_dims(mlir::OpBuilder& builder, mlir::Location loc, mlir::Valu
     {
         current = expand_dim(builder, loc, val, current, i, target_shape);
     }
+    current = builder.create<plier::EnforceShapeOp>(loc, current, target_shape);
     return current;
 }
 
 
@@ -18,9 +18,11 @@ set(SOURCES_LIST
     src/rewrites/call_lowering.cpp
     src/rewrites/canonicalize_reductions.cpp
     src/rewrites/cast_lowering.cpp
+    src/rewrites/common_opts.cpp
     src/rewrites/cse.cpp
     src/rewrites/force_inline.cpp
     src/rewrites/index_type_propagation.cpp
+    include/plier/rewrites/if_rewrites.cpp # NOTE(review): every other source visible in this list is under src/rewrites/ - confirm this .cpp really lives under include/.
     src/rewrites/loop_rewrites.cpp
     src/rewrites/promote_to_parallel.cpp
     src/rewrites/type_conversion.cpp
@@ -39,9 +41,11 @@ set(HEADERS_LIST
     include/plier/rewrites/call_lowering.hpp
     include/plier/rewrites/canonicalize_reductions.hpp
     include/plier/rewrites/cast_lowering.hpp
+    include/plier/rewrites/common_opts.hpp
     include/plier/rewrites/cse.hpp
     include/plier/rewrites/force_inline.hpp
     include/plier/rewrites/index_type_propagation.hpp
+    include/plier/rewrites/if_rewrites.hpp
     include/plier/rewrites/loop_rewrites.hpp
     include/plier/rewrites/promote_to_parallel.hpp
     include/plier/rewrites/type_conversion.hpp
 
@@ -214,6 +214,20 @@ def GetattrOp : Plier_Op<"getattr", [NoSideEffect]> {
     ];
 }
 
+def EnforceShapeOp : Plier_Op<"enforce_shape"> { // NOTE(review): declared without traits, unlike GetattrOp's [NoSideEffect] - confirm intentional.
+    let arguments = (ins AnyRankedTensor:$value, // Ranked tensor operand.
+                         Variadic<Index>:$sizes); // Zero or more index operands; presumably the target extents - TODO confirm.
+
+    let results = (outs AnyRankedTensor:$result);
+
+    let builders = [
+        OpBuilderDAG<(ins "::mlir::Value":$value, "::mlir::ValueRange":$shape)> // Custom builder taking a value and a shape range; no result type is passed in.
+    ];
+
+    let hasFolder = 1; // Requests a fold hook for this op.
+    let hasCanonicalizer = 1; // Requests a canonicalization-pattern hook for this op.
+}
+
 def RetainOp : Plier_Op<"retain"> {
     let arguments = (ins AnyMemRef:$value);
 
 
@@ -0,0 +1,12 @@
+#pragma once
+
+namespace mlir // Forward declarations only, so this header pulls in no MLIR includes.
+{
+class OwningRewritePatternList;
+class MLIRContext;
+}
+
+namespace plier
+{
+void populate_common_opts_patterns(mlir::MLIRContext& context, mlir::OwningRewritePatternList& patterns); // Takes the context and the pattern list by reference; presumably appends the shared optimization patterns to `patterns` - confirm in common_opts.cpp.
+}
@@ -7,10 +7,10 @@ namespace plier
 {
 namespace detail
 {
-mlir::LogicalResult applyCSE(mlir::Region& region, mlir::PatternRewriter& rewriter);
+mlir::LogicalResult applyCSE(mlir::Region& region, mlir::PatternRewriter& rewriter, bool recursive); // Entry point called by CSERewrite::matchAndRewrite with the op's region; `recursive` receives CSERewrite's `Recursive` template flag - presumably enables descent into nested regions, confirm in cse.cpp.
 }
 
-template<typename Op>
+template<typename Op, bool Recursive>
 struct CSERewrite : public mlir::OpRewritePattern<Op>
 {
     CSERewrite(mlir::MLIRContext *context):
@@ -19,7 +19,7 @@ struct CSERewrite : public mlir::OpRewritePattern<Op>
     mlir::LogicalResult matchAndRewrite(
         Op op, mlir::PatternRewriter &rewriter) const override
     {
-        return ::plier::detail::applyCSE(op.getRegion(), rewriter);
+        return ::plier::detail::applyCSE(op.getRegion(), rewriter, Recursive);
     }
 };
 }
Original file line number	Diff line number	Diff line change
`@@ -452,8 +452,9 @@ mlir::Value expand_dim(mlir::OpBuilder& builder, mlir::Location loc, mlir::Value`
`452`	`452`	`{`
`453`	`453`	`assert(dim < shape.size());`
`454`	`454`	`shape[dim] = 1;`
`455`		`- mlir::Type casted_type = mlir::RankedTensorType::get(shape, src_type.getElementType());`
`456`		`- auto casted = builder.create<mlir::tensor::CastOp>(loc, casted_type, src).getResult();`
	`455`	`+// mlir::Type casted_type = mlir::RankedTensorType::get(shape, src_type.getElementType());`
	`456`	`+// auto casted = builder.create<mlir::tensor::CastOp>(loc, casted_type, src).getResult();`
	`457`	`+ auto casted = src; // TODO`
`457`	`458`	`auto init = builder.create<mlir::linalg::InitTensorOp>(loc, new_shape, src_type.getElementType()).getResult();`
`458`	`459`	`llvm::SmallVector<mlir::AffineExpr> exprs(num_dims);`
`459`	`460`	`for (unsigned i = 0; i < num_dims; ++i)`
`@@ -503,6 +504,7 @@ mlir::Value expand_dims(mlir::OpBuilder& builder, mlir::Location loc, mlir::Valu`
`503`	`504`	`{`
`504`	`505`	`current = expand_dim(builder, loc, val, current, i, target_shape);`
`505`	`506`	`}`
	`507`	`+ current = builder.create<plier::EnforceShapeOp>(loc, current, target_shape);`
`506`	`508`	`return current;`
`507`	`509`	`}`
`508`	`510`
Original file line number	Diff line number	Diff line change
`@@ -7,10 +7,10 @@ namespace plier`
`7`	`7`	`{`
`8`	`8`	`namespace detail`
`9`	`9`	`{`
`10`		`-mlir::LogicalResult applyCSE(mlir::Region& region, mlir::PatternRewriter& rewriter);`
	`10`	`+mlir::LogicalResult applyCSE(mlir::Region& region, mlir::PatternRewriter& rewriter, bool recursive);`
`11`	`11`	`}`
`12`	`12`
`13`		`-template<typename Op>`
	`13`	`+template<typename Op, bool Recursive>`
`14`	`14`	`struct CSERewrite : public mlir::OpRewritePattern<Op>`
`15`	`15`	`{`
`16`	`16`	`CSERewrite(mlir::MLIRContext *context):`
`@@ -19,7 +19,7 @@ struct CSERewrite : public mlir::OpRewritePattern<Op>`
`19`	`19`	`mlir::LogicalResult matchAndRewrite(`
`20`	`20`	`Op op, mlir::PatternRewriter &rewriter) const override`
`21`	`21`	`{`
`22`		`- return ::plier::detail::applyCSE(op.getRegion(), rewriter);`
	`22`	`+ return ::plier::detail::applyCSE(op.getRegion(), rewriter, Recursive);`
`23`	`23`	`}`
`24`	`24`	`};`
`25`	`25`	`}`