fpmath.cl | Explore in Territory

// RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown | FileCheck --check-prefix=CHECK --check-prefix=NODIVOPT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown -cl-fp32-correctly-rounded-divide-sqrt | FileCheck --check-prefix=CHECK --check-prefix=DIVOPT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -DNOFP64 -cl-std=CL1.2 -triple r600-unknown-unknown -target-cpu r600 -pedantic | FileCheck --check-prefix=CHECK-FLT %s
// RUN: %clang_cc1 %s -emit-llvm -o - -DFP64 -cl-std=CL1.2 -triple spir-unknown-unknown -pedantic | FileCheck --check-prefix=CHECK-DBL %s

typedef __attribute__(( ext_vector_type(4) )) float float4;

float spscalardiv(float a, float b) {
  // CHECK: @spscalardiv
  // CHECK: fdiv{{.*}},
  // NODIVOPT: !fpmath ![[MD_FDIV:[0-9]+]]
  // DIVOPT-NOT: !fpmath !{{[0-9]+}}
  return a / b;
}

float4 spvectordiv(float4 a, float4 b) {
  // CHECK: @spvectordiv
  // CHECK: fdiv{{.*}},
  // NODIVOPT: !fpmath ![[MD_FDIV]]
  // DIVOPT-NOT: !fpmath !{{[0-9]+}}
  return a / b;
}

float spscalarsqrt(float a) {
  // CHECK-LABEL: @spscalarsqrt
  // NODIVOPT: call float @llvm.sqrt.f32(float %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
  // DIVOPT: call float @llvm.sqrt.f32(float %{{.+}}){{$}}
  return __builtin_sqrtf(a);
}

float elementwise_sqrt_f32(float a) {
  // CHECK-LABEL: @elementwise_sqrt_f32
  // NODIVOPT: call float @llvm.sqrt.f32(float %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
  // DIVOPT: call float @llvm.sqrt.f32(float %{{.+}}){{$}}
  return __builtin_elementwise_sqrt(a);
}

float4 elementwise_sqrt_v4f32(float4 a) {
  // CHECK-LABEL: @elementwise_sqrt_v4f32
  // NODIVOPT: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{.+}}), !fpmath ![[MD_SQRT:[0-9]+]]
  // DIVOPT: call <4 x float> @llvm.sqrt.v4f32(<4 x float> %{{.+}}){{$}}
  return __builtin_elementwise_sqrt(a);
}


#if __OPENCL_C_VERSION__ >=120
void printf(constant char* fmt, ...);

void testdbllit(long *val) {
  // CHECK-FLT: float noundef 2.000000e+01
  // CHECK-DBL: double noundef 2.000000e+01
  printf("%f", 20.0);
}

#endif

#ifndef NOFP64
#pragma OPENCL EXTENSION cl_khr_fp64 : enable
typedef __attribute__(( ext_vector_type(4) )) double double4;

double dpscalardiv(double a, double b) {
  // CHECK: @dpscalardiv
  // CHECK-NOT: !fpmath
  return a / b;
}

double4 dpvectordiv(double4 a, double4 b) {
  // CHECK: @dpvectordiv
  // CHECK-NOT: !fpmath
  return a / b;
}

double dpscalarsqrt(double a) {
  // CHECK-LABEL: @dpscalarsqrt
  // CHECK: call double @llvm.sqrt.f64(double %{{.+}}){{$}}
  return __builtin_sqrt(a);
}

double elementwise_sqrt_f64(double a) {
  // CHECK-LABEL: @elementwise_sqrt_f64
  // CHECK: call double @llvm.sqrt.f64(double %{{.+}}){{$}}
  return __builtin_elementwise_sqrt(a);
}

double4 elementwise_sqrt_v4f64(double4 a) {
  // CHECK-LABEL: @elementwise_sqrt_v4f64
  // CHECK: call <4 x double> @llvm.sqrt.v4f64(<4 x double> %{{.+}}){{$}}
  return __builtin_elementwise_sqrt(a);
}

#endif

// NODIVOPT: ![[MD_FDIV]] = !{float 2.500000e+00}
// NODIVOPT: ![[MD_SQRT]] = !{float 3.000000e+00}
llvm/clang/test/CodeGenOpenCL/fpmath.cl