Skip to content
GitLab
Menu
Projects
Groups
Snippets
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
elpa
elpa
Commits
a5a5ef89
Commit
a5a5ef89
authored
Jun 18, 2019
by
Andreas Marek
Browse files
Test new kernel
parent
41896071
Changes
1
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
src/elpa2/kernels/complex_128bit_256bit_512bit_BLOCK_template.c
View file @
a5a5ef89
...
...
@@ -5703,7 +5703,7 @@ static __forceinline void CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIM
#endif
/* VEC_SET == AVX_512 */
#if (VEC_SET == AVX_512 && BLOCK == 1) || VEC_SET != AVX_512
//
#if (VEC_SET == AVX_512 && BLOCK == 1) || VEC_SET != AVX_512
static
__forceinline
void
CONCAT_8ARGS
(
hh_trafo_complex_kernel_
,
ROW_LENGTH
,
_
,
SIMD_SET
,
_
,
BLOCK
,
hv_
,
WORD_LENGTH
)
(
DATA_TYPE_PTR
q
,
DATA_TYPE_PTR
hh
,
int
nb
,
int
ldq
#ifdef BLOCK1
...
...
@@ -6263,7 +6263,7 @@ static __forceinline void CONCAT_8ARGS(hh_trafo_complex_kernel_,ROW_LENGTH,_,SIM
#endif
/* BLOCK2 */
}
#endif
//
#endif
#if 0
...
...
@@ -6354,8 +6354,7 @@ static __forceinline void hh_trafo_complex_kernel_8_AVX512_1hv_single(float comp
}
#endif
#if VEC_SET == AVX_512 && BLOCK == 2
#if 0
#ifdef DOUBLE_PRECISION_COMPLEX
static __forceinline void hh_trafo_complex_kernel_4_AVX512_2hv_double(double complex* q, double complex* hh, int nb, int ldq, int ldh, double complex s)
#endif
...
...
@@ -6564,5 +6563,5 @@ static __forceinline void hh_trafo_complex_kernel_8_AVX512_2hv_single(float comp
_SIMD_STORE(&q_dbl[(2*nb*ldq)+0], q1);
}
#endif
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment