// blob: 4bfa83d3b87f71424e2c8df636b730b404ce4376 [file] [log] [blame]
// RUN: iree-dialects-opt %s --transform-dialect-interpreter --split-input-file | FileCheck %s
// CHECK-LABEL: func.func @matmul_tensors_1(
func.func @matmul_tensors_1(
    %lhs: tensor<128x128xf32>, %rhs: tensor<128x128xf32>,
    %init: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // The matmul carries only test.attrA, so of the two transforms in the
  // script below only the tiling one (tile sizes 4, 4, 4) targets it.
  // CHECK-COUNT-3: scf.for
  // CHECK-COUNT-2: tensor.extract_slice
  // CHECK: linalg.matmul
  // CHECK-SAME: -> tensor<4x4xf32>
  %product = linalg.matmul { test.attrA }
      ins(%lhs, %rhs : tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%init : tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %product : tensor<128x128xf32>
}
// Anchor the checks below to this function's output so they cannot be
// satisfied by IR printed for a neighbouring function.
// CHECK-LABEL: func.func @matmul_tensors_2(
func.func @matmul_tensors_2(
    %arg0: tensor<128x128xf32>, %arg1: tensor<128x128xf32>,
    %arg2: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // This operation is marked for tiling and vectorization: it carries both
  // test.attrA and test.attrC, which the transform script below matches.
  // Note that the loop-invariant read is hoisted out of the innermost loop.
  // CHECK: scf.for
  // CHECK: scf.for
  // CHECK: vector.transfer_read
  // CHECK: scf.for
  // CHECK: vector.transfer_read
  // CHECK: vector.transfer_read
  // CHECK: vector.contract
  // CHECK-NOT: linalg.matmul
  // CHECK: vector.transfer_write
  %0 = linalg.matmul { test.attrA, test.attrC }
      ins(%arg0, %arg1: tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%arg2: tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %0 : tensor<128x128xf32>
}
// Anchor the checks below to this function's output. Without the anchor the
// leading negative check would start scanning from the last match made in the
// preceding function instead of from the start of this one.
// CHECK-LABEL: func.func @matmul_tensors_3(
func.func @matmul_tensors_3(
    %arg0: tensor<128x128xf32>, %arg1: tensor<128x128xf32>,
    %arg2: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // This operation is marked for vectorization only (test.attrC, no
  // test.attrA), so no tiling loops are expected and the contraction works on
  // the full 128x128 vectors.
  // CHECK-NOT: scf.for
  // CHECK-COUNT-3: vector.transfer_read
  // CHECK: vector.contract
  // CHECK-SAME: into vector<128x128xf32>
  // CHECK: vector.transfer_write
  %0 = linalg.matmul { test.attrC }
      ins(%arg0, %arg1: tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%arg2: tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %0 : tensor<128x128xf32>
}
// Transform script for the @matmul_tensors_* functions: tile every matmul
// tagged test.attrA, then vectorize the enclosing isolated parent of every
// matmul tagged test.attrC.
transform.with_pdl_patterns {
^bb0(%root: !pdl.operation):
  // Selects linalg.matmul operations that have a test.attrA attribute. The
  // operands, result types and attribute value are left unconstrained.
  pdl.pattern @pdl_target_attrA : benefit(1) {
    %ins = operands
    %tys = types
    %marker = attribute
    %matmul = operation "linalg.matmul"(%ins : !pdl.range<value>) {"test.attrA" = %marker}-> (%tys : !pdl.range<type>)
    // TODO: we don't want this, but it is the required terminator for pdl.pattern
    rewrite %matmul with "transform.dialect"
  }

  // Same selection as above, keyed on test.attrC instead of test.attrA.
  pdl.pattern @pdl_target_attrC : benefit(1) {
    %ins = operands
    %tys = types
    %marker = attribute
    %matmul = operation "linalg.matmul"(%ins : !pdl.range<value>) {"test.attrC" = %marker}-> (%tys : !pdl.range<type>)
    // TODO: we don't want this, but it is the required terminator for pdl.pattern
    rewrite %matmul with "transform.dialect"
  }

  transform.structured.canonicalized_sequence %root failures(propagate) {
  ^bb1(%scope: !pdl.operation):
    // Step 1: tile the test.attrA matmuls with sizes 4, 4, 4. The handles
    // returned by the tile op are not used afterwards.
    %to_tile = pdl_match @pdl_target_attrA in %scope : (!pdl.operation) -> !pdl.operation
    transform.structured.tile %to_tile [4, 4, 4]
      : (!pdl.operation) -> (!pdl.operation, !pdl.operation, !pdl.operation, !pdl.operation)

    // Step 2: vectorization is applied to the closest isolated parent of each
    // test.attrC matmul rather than to the matmul itself.
    %to_vectorize = pdl_match @pdl_target_attrC in %scope : (!pdl.operation) -> !pdl.operation
    %enclosing = transform.get_closest_isolated_parent %to_vectorize : (!pdl.operation) -> !pdl.operation
    transform.structured.vectorize %enclosing
  }
}
// -----
// CHECK-LABEL: @vectorize_one
func.func @vectorize_one(
    %lhs: tensor<128x128xf32>, %rhs: tensor<128x128xf32>,
    %init: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // The matmul is tagged test.attrA, which the pattern in this split matches,
  // so the enclosing function is vectorized.
  // CHECK: vector.contract
  %product = linalg.matmul {test.attrA}
      ins(%lhs, %rhs : tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%init : tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %product : tensor<128x128xf32>
}
// Anchor the check below to this function's output so that it only passes
// when the matmul printed for this particular function is left in place.
// CHECK-LABEL: @vectorize_none
func.func @vectorize_none(
    %arg0: tensor<128x128xf32>, %arg1: tensor<128x128xf32>,
    %arg2: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // The matmul has no test.attrA attribute, so the pattern in this split does
  // not select it and it is expected to stay a linalg.matmul.
  // CHECK: linalg.matmul
  %0 = linalg.matmul ins(%arg0, %arg1: tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%arg2: tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %0 : tensor<128x128xf32>
}
// Transform script for @vectorize_one / @vectorize_none: vectorize the
// closest isolated parent of every matmul tagged test.attrA.
transform.with_pdl_patterns {
^bb0(%root: !pdl.operation):
  // Selects linalg.matmul operations that have a test.attrA attribute. The
  // operands, result types and attribute value are left unconstrained.
  pdl.pattern @pdl_target : benefit(1) {
    %ins = operands
    %tys = types
    %marker = attribute
    %matmul = operation "linalg.matmul"(%ins : !pdl.range<value>) {"test.attrA" = %marker}-> (%tys : !pdl.range<type>)
    // TODO: we don't want this, but it is the required terminator for pdl.pattern
    rewrite %matmul with "transform.dialect"
  }

  transform.structured.canonicalized_sequence %root failures(propagate) {
  ^bb1(%scope: !pdl.operation):
    %tagged = pdl_match @pdl_target in %scope : (!pdl.operation) -> !pdl.operation
    // Vectorization is requested on the enclosing isolated parent, not on the
    // matched matmul itself.
    %enclosing = transform.get_closest_isolated_parent %tagged : (!pdl.operation) -> !pdl.operation
    transform.structured.vectorize %enclosing
  }
}
// -----
// CHECK-LABEL: @vectorize_all
func.func @vectorize_all(
    %a: tensor<128x128xf32>, %b: tensor<128x128xf32>, %init0: tensor<128x128xf32>,
    %init1: tensor<128x128xf32> {linalg.inplaceable = true})
    -> tensor<128x128xf32> {
  // First matmul: tagged with test.attrA.
  // CHECK: vector.contract
  %first = linalg.matmul {test.attrA}
      ins(%a, %b : tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%init0 : tensor<128x128xf32>)
      -> tensor<128x128xf32>
  // Second matmul: untagged, consumes the first result as its right-hand
  // input. Both are expected to be vectorized.
  // CHECK: vector.contract
  %second = linalg.matmul ins(%a, %first : tensor<128x128xf32>, tensor<128x128xf32>)
      outs(%init1 : tensor<128x128xf32>)
      -> tensor<128x128xf32>
  func.return %second : tensor<128x128xf32>
}
// Transform script for @vectorize_all: no matching step, vectorization is
// requested directly on the handle the sequence receives.
transform.structured.canonicalized_sequence failures(propagate) {
^bb0(%root: !pdl.operation):
  transform.structured.vectorize %root
}