; RUN: llc < %s -march=nvptx64 -mcpu=sm_53 -mattr=+ptx42 | FileCheck %s
; RUN: %if ptxas %{ llc < %s -march=nvptx64 -mcpu=sm_53 -mattr=+ptx42 | %ptxas-verify -arch=sm_53 %}
; Declarations of the NVVM fused multiply-add intrinsics exercised by the
; functions in this file. Every intrinsic takes three operands of one type and
; returns a value of that same type.
;
; Scalar `half` variants: plain, .ftz, .sat and .ftz.sat.
declare half @llvm.nvvm.fma.rn.f16(half, half, half)
declare half @llvm.nvvm.fma.rn.ftz.f16(half, half, half)
declare half @llvm.nvvm.fma.rn.sat.f16(half, half, half)
declare half @llvm.nvvm.fma.rn.ftz.sat.f16(half, half, half)
; Packed `<2 x half>` variants with the same four modifier combinations.
declare <2 x half> @llvm.nvvm.fma.rn.f16x2(<2 x half>, <2 x half>, <2 x half>)
declare <2 x half> @llvm.nvvm.fma.rn.ftz.f16x2(<2 x half>, <2 x half>, <2 x half>)
declare <2 x half> @llvm.nvvm.fma.rn.sat.f16x2(<2 x half>, <2 x half>, <2 x half>)
declare <2 x half> @llvm.nvvm.fma.rn.ftz.sat.f16x2(<2 x half>, <2 x half>, <2 x half>)
; Scalar half, no modifiers: the llvm.nvvm.fma.rn.f16 intrinsic is expected to
; be selected to an `fma.rn.f16` instruction, with no `call` appearing ahead of
; it in this function's output.
; CHECK-LABEL: fma_rn_f16
; CHECK-NOT: call
; CHECK: fma.rn.f16
define half @fma_rn_f16(half %a, half %b, half %c) {
  %fma = call half @llvm.nvvm.fma.rn.f16(half %a, half %b, half %c)
  ret half %fma
}
; Scalar half, .ftz modifier: the llvm.nvvm.fma.rn.ftz.f16 intrinsic is expected
; to be selected to an `fma.rn.ftz.f16` instruction, with no `call` appearing
; ahead of it in this function's output.
; CHECK-LABEL: fma_rn_ftz_f16
; CHECK-NOT: call
; CHECK: fma.rn.ftz.f16
define half @fma_rn_ftz_f16(half %a, half %b, half %c) {
  %fma = call half @llvm.nvvm.fma.rn.ftz.f16(half %a, half %b, half %c)
  ret half %fma
}
; Scalar half, .sat modifier: the llvm.nvvm.fma.rn.sat.f16 intrinsic is expected
; to be selected to an `fma.rn.sat.f16` instruction, with no `call` appearing
; ahead of it in this function's output.
; CHECK-LABEL: fma_rn_sat_f16
; CHECK-NOT: call
; CHECK: fma.rn.sat.f16
define half @fma_rn_sat_f16(half %a, half %b, half %c) {
  %fma = call half @llvm.nvvm.fma.rn.sat.f16(half %a, half %b, half %c)
  ret half %fma
}
; Scalar half, .ftz and .sat modifiers combined: the
; llvm.nvvm.fma.rn.ftz.sat.f16 intrinsic is expected to be selected to an
; `fma.rn.ftz.sat.f16` instruction, with no `call` appearing ahead of it in
; this function's output.
; CHECK-LABEL: fma_rn_ftz_sat_f16
; CHECK-NOT: call
; CHECK: fma.rn.ftz.sat.f16
define half @fma_rn_ftz_sat_f16(half %a, half %b, half %c) {
  %fma = call half @llvm.nvvm.fma.rn.ftz.sat.f16(half %a, half %b, half %c)
  ret half %fma
}
; Packed <2 x half>, no modifiers: the llvm.nvvm.fma.rn.f16x2 intrinsic is
; expected to be selected to an `fma.rn.f16x2` instruction, with no `call`
; appearing ahead of it in this function's output.
; CHECK-LABEL: fma_rn_f16x2
; CHECK-NOT: call
; CHECK: fma.rn.f16x2
define <2 x half> @fma_rn_f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c) {
  %fma = call <2 x half> @llvm.nvvm.fma.rn.f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c)
  ret <2 x half> %fma
}
; Packed <2 x half>, .ftz modifier: the llvm.nvvm.fma.rn.ftz.f16x2 intrinsic is
; expected to be selected to an `fma.rn.ftz.f16x2` instruction, with no `call`
; appearing ahead of it in this function's output.
; CHECK-LABEL: fma_rn_ftz_f16x2
; CHECK-NOT: call
; CHECK: fma.rn.ftz.f16x2
define <2 x half> @fma_rn_ftz_f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c) {
  %fma = call <2 x half> @llvm.nvvm.fma.rn.ftz.f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c)
  ret <2 x half> %fma
}
; Packed <2 x half>, .sat modifier: the llvm.nvvm.fma.rn.sat.f16x2 intrinsic is
; expected to be selected to an `fma.rn.sat.f16x2` instruction, with no `call`
; appearing ahead of it in this function's output.
; CHECK-LABEL: fma_rn_sat_f16x2
; CHECK-NOT: call
; CHECK: fma.rn.sat.f16x2
define <2 x half> @fma_rn_sat_f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c) {
  %fma = call <2 x half> @llvm.nvvm.fma.rn.sat.f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c)
  ret <2 x half> %fma
}
; Packed <2 x half>, .ftz and .sat modifiers combined: the
; llvm.nvvm.fma.rn.ftz.sat.f16x2 intrinsic is expected to be selected to an
; `fma.rn.ftz.sat.f16x2` instruction, with no `call` appearing ahead of it in
; this function's output.
; CHECK-LABEL: fma_rn_ftz_sat_f16x2
; CHECK-NOT: call
; CHECK: fma.rn.ftz.sat.f16x2
define <2 x half> @fma_rn_ftz_sat_f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c) {
  %fma = call <2 x half> @llvm.nvvm.fma.rn.ftz.sat.f16x2(<2 x half> %a, <2 x half> %b, <2 x half> %c)
  ret <2 x half> %fma
}