Skip to content
GitLab
Menu
Projects
Groups
Snippets
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
elpa
elpa
Commits
b6369e22
Commit
b6369e22
authored
May 02, 2019
by
Andreas Marek
Browse files
Unify 128bit kernels real block2 and block4
parent
9233720a
Changes
13
Pipelines
1
Expand all
Hide whitespace changes
Inline
Side-by-side
Doxyfile.in
View file @
b6369e22
...
...
@@ -905,7 +905,6 @@ EXCLUDE = @top_srcdir@/src/GPU/check_for_gpu.F90 \
@top_srcdir@/src/elpa2/kernels/complex_avx-avx2_2hv_double_precision.c \
@top_srcdir@/src/elpa2/kernels/real_avx512_2hv_double_precision.c \
@top_srcdir@/src/elpa2/kernels/real_avx512_2hv_single_precision.c \
@top_srcdir@/src/elpa2/kernels/real_sse_4hv_template.c \
@top_srcdir@/src/elpa2/kernels/complex_avx-avx2_2hv_single_precision.c \
@top_srcdir@/src/elpa2/kernels/complex_avx512_1hv_double_precision.c \
@top_srcdir@/src/elpa2/kernels/real_sse_6hv_single_precision.c \
...
...
@@ -913,7 +912,6 @@ EXCLUDE = @top_srcdir@/src/GPU/check_for_gpu.F90 \
@top_srcdir@/src/elpa2/kernels/asm_x86_64_double_precision.s \
@top_srcdir@/src/elpa2/kernels/real_avx512_4hv_double_precision.c \
@top_srcdir@/src/elpa2/kernels/real_sse_6hv_double_precision.c \
@top_srcdir@/src/elpa2/kernels/real_sse_2hv_template.c \
@top_srcdir@/src/elpa2/kernels/complex_avx512_1hv_single_precision.c \
@top_srcdir@/src/elpa2/kernels/asm_x86_64_single_precision.s \
@top_srcdir@/src/elpa2/kernels/real_avx512_6hv_template.c \
...
...
Makefile.am
View file @
b6369e22
...
...
@@ -784,8 +784,7 @@ EXTRA_DIST = \
src/elpa2/kernels/real_vsx_2hv_template.c \
src/elpa2/kernels/real_vsx_4hv_template.c \
src/elpa2/kernels/real_vsx_6hv_template.c \
src/elpa2/kernels/real_sse_2hv_template.c \
src/elpa2/kernels/real_sse_4hv_template.c \
src/elpa2/kernels/real_128bit_BLOCK_template.c \
src/elpa2/kernels/real_sse_6hv_template.c \
src/elpa2/kernels/real_template.F90 \
src/elpa2/kernels/simple_template.F90 \
...
...
src/elpa2/kernels/real_128bit_BLOCK_template.c
0 → 100644
View file @
b6369e22
This diff is collapsed.
Click to expand it.
src/elpa2/kernels/real_sparc64_2hv_double_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define DOUBLE_PRECISION 1
#define BLOCK2
#include "../../general/precision_macros.h"
#include "real_sse_2hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef REALCASE
#undef BLOCK2
#undef DOUBLE_PRECISION
src/elpa2/kernels/real_sparc64_2hv_single_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define SINGLE_PRECISION 1
#define BLOCK2
#include "../../general/precision_macros.h"
#include "real_sse_2hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK2
#undef REALCASE
#undef SINGLE_PRECISION
src/elpa2/kernels/real_sparc64_4hv_double_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define DOUBLE_PRECISION 1
#define BLOCK4 1
#include "../../general/precision_macros.h"
#include "real_sse_4hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK4
#undef REALCASE
#undef DOUBLE_PRECISION
src/elpa2/kernels/real_sparc64_4hv_single_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define SINGLE_PRECISION 1
#define BLOCK4
#include "../../general/precision_macros.h"
#include "real_sse_4hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK4
#undef REALCASE
#undef SINGLE_PRECISION
src/elpa2/kernels/real_sse_2hv_double_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define DOUBLE_PRECISION 1
#define BLOCK2 1
#include "../../general/precision_macros.h"
#include "real_sse_2hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK2
#undef REALCASE
#undef DOUBLE_PRECISION
src/elpa2/kernels/real_sse_2hv_single_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define SINGLE_PRECISION 1
#define BLOCK2 1
#include "../../general/precision_macros.h"
#include "real_sse_2hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK2
#undef REALCASE
#undef SINGLE_PRECISION
src/elpa2/kernels/real_sse_2hv_template.c
deleted
100644 → 0
View file @
9233720a
This diff is collapsed.
Click to expand it.
src/elpa2/kernels/real_sse_4hv_double_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define DOUBLE_PRECISION 1
#define BLOCK4 1
#include "../../general/precision_macros.h"
#include "real_sse_4hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK4
#undef REALCASE
#undef DOUBLE_PRECISION
src/elpa2/kernels/real_sse_4hv_single_precision.c
View file @
b6369e22
...
...
@@ -48,8 +48,10 @@
#define REALCASE 1
#define SINGLE_PRECISION 1
#define BLOCK4 1
#include "../../general/precision_macros.h"
#include "real_sse_4hv_template.c"
#include "real_128bit_BLOCK_template.c"
#undef BLOCK4
#undef REALCASE
#undef SINGLE_PRECISION
src/elpa2/kernels/real_sse_4hv_template.c
deleted
100644 → 0
View file @
9233720a
This diff is collapsed.
Click to expand it.
Write
Preview
Supports
Markdown
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment