| // RUN: %clangxx_nsan -O0 -g -mavx %s -o %t |
| // RUN: env NSAN_OPTIONS=check_nan=true,halt_on_error=0 %run %t 2>&1 | FileCheck %s |
| // RUN: %clangxx_nsan -O3 -g -mavx %s -o %t |
| // RUN: env NSAN_OPTIONS=check_nan=true,halt_on_error=0 %run %t 2>&1 | FileCheck %s |
| |
| #include <cmath> |
| #include <immintrin.h> |
| #include <iostream> |
| |
// Stores the square root of each of the first `size` floats of `input` into
// the corresponding element of `output`.
//
// Full groups of eight floats go through the 256-bit AVX square-root
// intrinsic; whatever is left over (fewer than eight elements) is handled one
// value at a time with std::sqrt. Unaligned load/store intrinsics are used, so
// neither buffer needs any particular alignment.
void simd_sqrt(const float *input, float *output, size_t size) {
  constexpr size_t kLanes = 8; // floats held by one __m256 register
  size_t pos = 0;

  // Vector body: only entered while a complete group of eight remains.
  while (pos + (kLanes - 1) < size) {
    const __m256 lanes = _mm256_loadu_ps(input + pos);
    _mm256_storeu_ps(output + pos, _mm256_sqrt_ps(lanes));
    pos += kLanes;
  }

  // Scalar tail. The directive below is consumed by FileCheck when the test
  // runs; it must stay textually intact.
  while (pos < size) {
    output[pos] = std::sqrt(input[pos]);
    // CHECK: WARNING: NumericalStabilitySanitizer: NaN detected
    ++pos;
  }
}
| |
| int main() { |
| float input[] = {1.0, 2.0, -3.0, 4.0, 5.0, 6.0, 7.0, |
| 8.0, 9.0, -10.0, 11.0, 12.0, 13.0, 14.0, |
| 15.0, -16.0, 17.0, -18.0, -19.0, -20.0}; |
| float output[20]; |
| simd_sqrt(input, output, 20); |
| for (int i = 0; i < 20; ++i) { |
| std::cout << output[i] << std::endl; |
| // CHECK: WARNING: NumericalStabilitySanitizer: NaN detected |
| } |
| return 0; |
| } |