Commit 7d4d6829 authored by Andreas Marek

Wrong preprocessor ifdef in complex block2 kernel

parent 150880a4
@@ -443,7 +443,7 @@ static __forceinline void hh_trafo_complex_kernel_8_AVX_2hv(double complex* q, d
q1 = _mm256_add_pd(q1, _mm256_addsub_pd( _mm256_mul_pd(h2_real, y1), _mm256_shuffle_pd(tmp1, tmp1, 0x5)));
#endif
tmp2 = _mm256_mul_pd(h2_imag, y2);
-#ifdef __FMA4__
+#ifdef __ELPA_USE_FMA__
q2 = _mm256_add_pd(q2, _mm256_FMADDSUB_pd(h2_real, y2, _mm256_shuffle_pd(tmp2, tmp2, 0x5)));
#else
q2 = _mm256_add_pd(q2, _mm256_addsub_pd( _mm256_mul_pd(h2_real, y2), _mm256_shuffle_pd(tmp2, tmp2, 0x5)));
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment