// RUN: mlir-opt %s -test-vector-scan-lowering -convert-vector-to-scf -convert-scf-to-cf -convert-vector-to-llvm -convert-func-to-llvm -reconcile-unrealized-casts | \
// RUN: mlir-cpu-runner -e entry -entry-point-result=void \
// RUN: -shared-libs=%mlir_c_runner_utils | \
// RUN: FileCheck %s
// Entry point invoked by the runner. Builds a 3x2 f32 matrix, prints it, then
// applies inclusive and exclusive <add> scans along each dimension and prints
// both results of every scan so the output can be matched by FileCheck.
func.func @entry() {
  // Scalar elements of the input matrix. The value 6.0 is also used to fill
  // the initial-value vectors handed to the scans.
  %one = arith.constant 1.0 : f32
  %two = arith.constant 2.0 : f32
  %three = arith.constant 3.0 : f32
  %four = arith.constant 4.0 : f32
  %five = arith.constant 5.0 : f32
  %six = arith.constant 6.0 : f32

  // Start from an all-ones matrix and overwrite every element except [0, 0],
  // which keeps the broadcast value 1.0.
  %ones = vector.broadcast %one : f32 to vector<3x2xf32>
  %m01 = vector.insert %two, %ones[0, 1] : f32 into vector<3x2xf32>
  %m10 = vector.insert %three, %m01[1, 0] : f32 into vector<3x2xf32>
  %m11 = vector.insert %four, %m10[1, 1] : f32 into vector<3x2xf32>
  %m20 = vector.insert %five, %m11[2, 0] : f32 into vector<3x2xf32>
  %input = vector.insert %six, %m20[2, 1] : f32 into vector<3x2xf32>
  vector.print %input : vector<3x2xf32>
  // CHECK: ( ( 1, 2 ), ( 3, 4 ), ( 5, 6 ) )

  // Initial values: one element per column for the scans along dimension 0,
  // one element per row for the scans along dimension 1.
  %init_cols = vector.broadcast %six : f32 to vector<2xf32>
  %init_rows = vector.broadcast %six : f32 to vector<3xf32>

  // Inclusive scan along dimension 0. Per the expected output below, the
  // initial value does not contribute to the inclusive results.
  %incl_d0:2 = vector.scan <add>, %input, %init_cols
      {inclusive = true, reduction_dim = 0} :
      vector<3x2xf32>, vector<2xf32>
  vector.print %incl_d0#0 : vector<3x2xf32>
  // CHECK: ( ( 1, 2 ), ( 4, 6 ), ( 9, 12 ) )
  vector.print %incl_d0#1 : vector<2xf32>
  // CHECK: ( 9, 12 )

  // Inclusive scan along dimension 1.
  %incl_d1:2 = vector.scan <add>, %input, %init_rows
      {inclusive = true, reduction_dim = 1} :
      vector<3x2xf32>, vector<3xf32>
  vector.print %incl_d1#0 : vector<3x2xf32>
  // CHECK: ( ( 1, 3 ), ( 3, 7 ), ( 5, 11 ) )
  vector.print %incl_d1#1 : vector<3xf32>
  // CHECK: ( 3, 7, 11 )

  // Exclusive scan along dimension 0. Per the expected output below, the
  // first row of the result is the initial value itself.
  %excl_d0:2 = vector.scan <add>, %input, %init_cols
      {inclusive = false, reduction_dim = 0} :
      vector<3x2xf32>, vector<2xf32>
  vector.print %excl_d0#0 : vector<3x2xf32>
  // CHECK: ( ( 6, 6 ), ( 7, 8 ), ( 10, 12 ) )
  vector.print %excl_d0#1 : vector<2xf32>
  // CHECK: ( 10, 12 )

  // Exclusive scan along dimension 1.
  %excl_d1:2 = vector.scan <add>, %input, %init_rows
      {inclusive = false, reduction_dim = 1} :
      vector<3x2xf32>, vector<3xf32>
  vector.print %excl_d1#0 : vector<3x2xf32>
  // CHECK: ( ( 6, 7 ), ( 6, 9 ), ( 6, 11 ) )
  vector.print %excl_d1#1 : vector<3xf32>
  // CHECK: ( 7, 9, 11 )

  return
}