Skip to content
GitLab
Menu
Projects
Groups
Snippets
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
elpa
elpa
Commits
554d2785
Commit
554d2785
authored
Aug 18, 2016
by
Andreas Marek
Browse files
Remove SSE references from AVX kernels
parent
1e1812bc
Changes
2
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
src/elpa2_kernels/elpa2_kernels_real_avx-avx2_2hv_single_precision.c
View file @
554d2785
...
...
@@ -860,6 +860,8 @@ void double_hh_trafo_real_avx_avx2_2hv_single(float* q, float* hh, int* pnb, int
#endif
}
#if 0
/**
* Unrolled kernel that computes
* 4 rows of Q simultaneously, a
...
...
@@ -958,6 +960,7 @@ __forceinline void hh_trafo_kernel_4_sse_instead_of_avx_2hv_single(float* q, flo
q1 = _mm_add_ps(q1, _mm_mul_ps(x1, h1));
_mm_store_ps(&q[nb*ldq],q1);
}
#endif
/**
* Unrolled kernel that computes
...
...
src/elpa2_kernels/elpa2_kernels_real_avx-avx2_6hv_single_precision.c
View file @
554d2785
...
...
@@ -196,7 +196,7 @@ void hexa_hh_trafo_real_avx_avx2_6hv_single(float* q, float* hh, int* pnb, int*
}
// Production level kernel calls with padding
#ifdef __AVX__
//
#ifdef __AVX__
for
(
i
=
0
;
i
<
nq
-
4
;
i
+=
8
)
{
hh_trafo_kernel_8_AVX_6hv_single
(
&
q
[
i
],
hh
,
nb
,
ldq
,
ldh
,
scalarprods
);
...
...
@@ -209,20 +209,20 @@ void hexa_hh_trafo_real_avx_avx2_6hv_single(float* q, float* hh, int* pnb, int*
{
hh_trafo_kernel_4_AVX_6hv_single
(
&
q
[
i
],
hh
,
nb
,
ldq
,
ldh
,
scalarprods
);
}
#else
for
(
i
=
0
;
i
<
nq
-
2
;
i
+=
4
)
{
hh_trafo_kernel_4_SSE_6hv_single
(
&
q
[
i
],
hh
,
nb
,
ldq
,
ldh
,
scalarprods
);
}
if
(
nq
==
i
)
{
return
;
}
else
{
hh_trafo_kernel_2_SSE_6hv_single
(
&
q
[
i
],
hh
,
nb
,
ldq
,
ldh
,
scalarprods
);
}
#endif
//
#else
//
for (i = 0; i < nq-2; i+=4)
//
{
//
hh_trafo_kernel_4_SSE_6hv_single(&q[i], hh, nb, ldq, ldh, scalarprods);
//
}
//
if (nq == i)
//
{
//
return;
//
}
//
else
//
{
//
hh_trafo_kernel_2_SSE_6hv_single(&q[i], hh, nb, ldq, ldh, scalarprods);
//
}
//
#endif
}
...
...
Write
Preview
Supports
Markdown
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment