// RUN: %clangxx_nsan -O0 -mllvm -nsan-shadow-type-mapping=dqq -g -DSUM=NaiveSum -DFLT=float %s -o %t
// RUN: env NSAN_OPTIONS=halt_on_error=1,log2_max_relative_error=19 not %run %t 2>&1 | FileCheck %s
// RUN: %clangxx_nsan -O3 -mllvm -nsan-shadow-type-mapping=dqq -g -DSUM=NaiveSum -DFLT=float %s -o %t
// RUN: env NSAN_OPTIONS=halt_on_error=1,log2_max_relative_error=19 not %run %t 2>&1 | FileCheck %s
// RUN: %clangxx_nsan -O0 -mllvm -nsan-shadow-type-mapping=dqq -g -DSUM=KahanSum -DFLT=float %s -o %t
// RUN: env NSAN_OPTIONS=halt_on_error=1,log2_max_relative_error=19 %run %t
// RUN: %clangxx_nsan -O3 -mllvm -nsan-shadow-type-mapping=dqq -g -DSUM=KahanSum -DFLT=float %s -o %t
// RUN: env NSAN_OPTIONS=halt_on_error=1,log2_max_relative_error=19 %run %t
#include <chrono>
#include <iostream>
#include <random>
#include <vector>
// A naive, unstable summation.
template <typename T>
__attribute__((noinline)) // To check call stack reporting.
T NaiveSum(const std::vector<T>& values) {
T sum = 0;
for (T v : values) {
sum += v;
}
return sum;
// CHECK: WARNING: NumericalStabilitySanitizer: inconsistent shadow results while checking return
// CHECK: float{{ *}}precision (native):
// CHECK: double{{ *}}precision (shadow):
// CHECK: {{#0 .*in .* NaiveSum}}
}
// Kahan's summation is a numerically stable sum.
// https://en.wikipedia.org/wiki/Kahan_summation_algorithm
template <typename T>
__attribute__((noinline)) T KahanSum(const std::vector<T> &values) {
T sum = 0;
T c = 0;
for (T v : values) {
T y = v - c;
T t = sum + y;
c = (t - sum) - y;
sum = t;
}
return sum;
}
int main() {
std::vector<FLT> values;
constexpr int kNumValues = 1000000;
values.reserve(kNumValues);
// Using a seed to avoid flakiness.
constexpr uint32_t kSeed = 0x123456;
std::mt19937 gen(kSeed);
std::uniform_real_distribution<FLT> dis(0.0f, 1000.0f);
for (int i = 0; i < kNumValues; ++i) {
values.push_back(dis(gen));
}
const auto t1 = std::chrono::high_resolution_clock::now();
const auto sum = SUM(values);
const auto t2 = std::chrono::high_resolution_clock::now();
printf("sum: %.8f\n", sum);
std::cout << "runtime: "
<< std::chrono::duration_cast<std::chrono::microseconds>(t2 - t1)
.count() /
1000.0
<< "ms\n";
return 0;
}