static void fma4_test (void) { int i; init_nmaccps (); for (i = 0; i < NUM; i++) dst.x[i] = _mm256_nmacc_ps (src1.x[i], src2.x[i], src3.x[i]); if (check_nmaccps ()) abort (); init_nmaccpd (); for (i = 0; i < NUM; i++) dst.y[i] = _mm256_nmacc_pd (src1.y[i], src2.y[i], src3.y[i]); if (check_nmaccpd ()) abort (); }
__m256d test_mm256_nmacc_pd(__m256d a, __m256d b, __m256d c) { // CHECK: @llvm.x86.fma.vfnmadd.pd.256 // CHECK-ASM: vfnmaddpd %ymm{{.*}}, %ymm{{.*}}, %ymm{{.*}}, %ymm{{.*}} return _mm256_nmacc_pd(a, b, c); }
__m256d test_mm256_nmacc_pd(__m256d a, __m256d b, __m256d c) { // CHECK-LABEL: test_mm256_nmacc_pd // CHECK: [[NEG:%.+]] = fsub <4 x double> <double -0.000000e+00, double -0.000000e+00, double -0.000000e+00, double -0.000000e+00>, %{{.+}} // CHECK: @llvm.x86.fma.vfmadd.pd.256(<4 x double> [[NEG]], <4 x double> %{{.+}}, <4 x double> %{{.+}}) return _mm256_nmacc_pd(a, b, c); }