// RUN: mlir-opt -convert-to-spirv="run-signature-conversion=false run-vector-unrolling=false" -split-input-file %s | FileCheck %s
// CHECK-LABEL: @combined
// CHECK: %[[C0_F32:.*]] = spirv.Constant 0.000000e+00 : f32
// CHECK: %[[C1_F32:.*]] = spirv.Constant 1.000000e+00 : f32
// CHECK: %[[C0_I32:.*]] = spirv.Constant 0 : i32
// CHECK: %[[C4_I32:.*]] = spirv.Constant 4 : i32
// CHECK: %[[C0_I32_0:.*]] = spirv.Constant 0 : i32
// CHECK: %[[C4_I32_0:.*]] = spirv.Constant 4 : i32
// CHECK: %[[C1_I32:.*]] = spirv.Constant 1 : i32
// CHECK: %[[VEC:.*]] = spirv.Constant dense<1.000000e+00> : vector<4xf32>
// CHECK: %[[VARIABLE:.*]] = spirv.Variable : !spirv.ptr<f32, Function>
// CHECK: spirv.mlir.loop {
// CHECK: spirv.Branch ^[[HEADER:.*]](%[[C0_I32_0]], %[[C0_F32]] : i32, f32)
// CHECK: ^[[HEADER]](%[[INDVAR_0:.*]]: i32, %[[INDVAR_1:.*]]: f32):
// CHECK: %[[SLESSTHAN:.*]] = spirv.SLessThan %[[INDVAR_0]], %[[C4_I32_0]] : i32
// CHECK: spirv.BranchConditional %[[SLESSTHAN]], ^[[BODY:.*]], ^[[MERGE:.*]]
// CHECK: ^[[BODY]]:
// CHECK: %[[FADD:.*]] = spirv.FAdd %[[INDVAR_1]], %[[C1_F32]] : f32
// CHECK: %[[INSERT:.*]] = spirv.CompositeInsert %[[FADD]], %[[VEC]][0 : i32] : f32 into vector<4xf32>
// CHECK: spirv.Store "Function" %[[VARIABLE]], %[[FADD]] : f32
// CHECK: %[[IADD:.*]] = spirv.IAdd %[[INDVAR_0]], %[[C1_I32]] : i32
// CHECK: spirv.Branch ^[[HEADER]](%[[IADD]], %[[FADD]] : i32, f32)
// CHECK: ^[[MERGE]]:
// CHECK: spirv.mlir.merge
// CHECK: }
// CHECK: %[[LOAD:.*]] = spirv.Load "Function" %[[VARIABLE]] : f32
// CHECK: %[[UNDEF:.*]] = spirv.Undef : f32
// CHECK: spirv.ReturnValue %[[UNDEF]] : f32
// Test input mixing arith, index, vector, scf and ub operations in a single
// function so that they are all lowered together. The function takes no
// arguments and returns an f32.
func.func @combined() -> f32 {
  // Scalar constants: accumulator seed, the broadcast value, and the raw i32
  // loop bounds.
  %zero_f32 = arith.constant 0.0 : f32
  %one_f32 = arith.constant 1.0 : f32
  %lo_i32 = arith.constant 0 : i32
  %hi_i32 = arith.constant 4 : i32
  // The loop bounds are obtained by casting the i32 constants to index; the
  // step is a plain index constant.
  %lower = index.casts %lo_i32 : i32 to index
  %upper = index.casts %hi_i32 : i32 to index
  %stride = arith.constant 1 : index
  // 4-element vector filled with 1.0; the loop body reads element 0 from it.
  %ones = vector.broadcast %one_f32 : f32 to vector<4xf32>
  // Loop carrying a running f32 sum, seeded with 0.0.
  %total = scf.for %i = %lower to %upper step %stride iter_args(%acc = %zero_f32) -> f32 {
    %lane0 = vector.extract %ones[0] : f32 from vector<4xf32>
    %acc_next = arith.addf %acc, %lane0 : f32
    // The vector produced by this insert has no users inside the function.
    %ones_updated = vector.insert %acc_next, %ones[0] : f32 into vector<4xf32>
    scf.yield %acc_next : f32
  }
  // The loop result is not used; the function returns a poison value instead.
  %poison = ub.poison : f32
  return %poison : f32
}