test_skewsymmetric.F90 11.6 KB
Newer Older
Andreas Marek's avatar
Andreas Marek committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
!    This file is part of ELPA.
!
!    The ELPA library was originally created by the ELPA consortium,
!    consisting of the following organizations:
!
!    - Max Planck Computing and Data Facility (MPCDF), formerly known as
!      Rechenzentrum Garching der Max-Planck-Gesellschaft (RZG),
!    - Bergische Universität Wuppertal, Lehrstuhl für angewandte
!      Informatik,
!    - Technische Universität München, Lehrstuhl für Informatik mit
!      Schwerpunkt Wissenschaftliches Rechnen ,
!    - Fritz-Haber-Institut, Berlin, Abt. Theorie,
!    - Max-Planck-Institut für Mathematik in den Naturwissenschaften,
!      Leipzig, Abt. Komplexe Strukturen in Biologie und Kognition,
!      and
!    - IBM Deutschland GmbH
!
!
!    More information can be found here:
!    http://elpa.mpcdf.mpg.de/
!
!    ELPA is free software: you can redistribute it and/or modify
!    it under the terms of the version 3 of the license of the
!    GNU Lesser General Public License as published by the Free
!    Software Foundation.
!
!    ELPA is distributed in the hope that it will be useful,
!    but WITHOUT ANY WARRANTY; without even the implied warranty of
!    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
!    GNU Lesser General Public License for more details.
!
!    You should have received a copy of the GNU Lesser General Public License
!    along with ELPA.  If not, see <http://www.gnu.org/licenses/>
!
!    ELPA reflects a substantial effort on the part of the original
!    ELPA consortium, and we ask you to respect the spirit of the
!    license that we chose: i.e., please contribute any changes you
!    may have back to the original ELPA library distribution, and keep
!    any derivatives of ELPA under the same license that we chose for
!    the original distribution, the GNU Lesser General Public License.
!
!
#include "config-f90.h"

! Define one of TEST_REAL or TEST_COMPLEX
! Define one of TEST_SINGLE or TEST_DOUBLE
! Define one of TEST_SOLVER_1STAGE or TEST_SOLVER_2STAGE
! Define TEST_GPU \in [0, 1]
! Define either TEST_ALL_KERNELS or a TEST_KERNEL \in [any valid kernel]

#if !(defined(TEST_REAL) ^ defined(TEST_COMPLEX))
error: define exactly one of TEST_REAL or TEST_COMPLEX
#endif

#if !(defined(TEST_SINGLE) ^ defined(TEST_DOUBLE))
error: define exactly one of TEST_SINGLE or TEST_DOUBLE
#endif

#ifdef TEST_SINGLE
#  define EV_TYPE real(kind=C_FLOAT)
#  ifdef TEST_REAL
#    define MATRIX_TYPE real(kind=C_FLOAT)
#  else
#    define MATRIX_TYPE complex(kind=C_FLOAT_COMPLEX)
#  endif
#else
#  define EV_TYPE real(kind=C_DOUBLE)
#  ifdef TEST_REAL
#    define MATRIX_TYPE real(kind=C_DOUBLE)
#  else
#    define MATRIX_TYPE complex(kind=C_DOUBLE_COMPLEX)
#  endif
#endif

75
76
77
78
79
80
81
#ifdef TEST_SINGLE
#define MATRIX_TYPE_COMPLEX complex(kind=C_FLOAT_COMPLEX)
#define EV_TYPE_COMPLEX complex(kind=C_FLOAT_COMPLEX)
#else
#define MATRIX_TYPE_COMPLEX complex(kind=C_DOUBLE_COMPLEX)
#define EV_TYPE_COMPLEX complex(kind=C_DOUBLE_COMPLEX)
#endif
Andreas Marek's avatar
Andreas Marek committed
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121

#ifdef TEST_REAL
#  define AUTOTUNE_DOMAIN ELPA_AUTOTUNE_DOMAIN_REAL
#else
#  define AUTOTUNE_DOMAIN ELPA_AUTOTUNE_DOMAIN_COMPLEX
#endif

#include "assert.h"

program test
   use elpa

   use test_util
   use test_setup_mpi
   use test_prepare_matrix
   use test_read_input_parameters
   use test_blacs_infrastructure
   use test_check_correctness
   use iso_fortran_env

#ifdef HAVE_REDIRECT
   use test_redirect
#endif
   implicit none

   ! matrix dimensions
   integer                     :: na, nev, nblk

   ! mpi
   integer                     :: myid, nprocs
   integer                     :: na_cols, na_rows  ! local matrix size
   integer                     :: np_cols, np_rows  ! number of MPI processes per column/row
   integer                     :: my_prow, my_pcol  ! local MPI task position (my_prow, my_pcol) in the grid (0..np_cols -1, 0..np_rows -1)
   integer                     :: mpierr, ierr

   ! blacs
   character(len=1)            :: layout
   integer                     :: my_blacs_ctxt, sc_desc(9), info, nprow, npcol

   ! The Matrix
122
123
   MATRIX_TYPE, allocatable    :: a_skewsymmetric(:,:), as_skewsymmetric(:,:)
   MATRIX_TYPE_COMPLEX, allocatable    :: a_complex(:,:), as_complex(:,:)
Andreas Marek's avatar
Andreas Marek committed
124
   ! eigenvectors
125
126
   MATRIX_TYPE, allocatable    :: z_skewsymmetric(:,:)
   MATRIX_TYPE_COMPLEX, allocatable    :: z_complex(:,:)
Andreas Marek's avatar
Andreas Marek committed
127
   ! eigenvalues
128
   EV_TYPE, allocatable:: ev_skewsymmetric(:), ev_complex(:)
Andreas Marek's avatar
Andreas Marek committed
129

130
   integer                     :: error, status, i, j
Andreas Marek's avatar
Andreas Marek committed
131
132

   type(output_t)              :: write_to_file
133
134
   class(elpa_t), pointer      :: e_complex, e_skewsymmetric
           
Andreas Marek's avatar
Andreas Marek committed
135
136
137
138
139
140
141
142
143
144
145
146
147
   ! Obtain na, nev, nblk and the output settings, then initialise the
   ! parallel environment (myid = own rank, nprocs = number of ranks).
   call read_input_parameters(na, nev, nblk, write_to_file)
   call setup_mpi(myid, nprocs)

   ! redirect_stdout is only called when the redirect helper is available
   ! and the test is built with MPI.
#if defined(HAVE_REDIRECT) && defined(WITH_MPI)
   call MPI_BARRIER(MPI_COMM_WORLD, mpierr)
   call redirect_stdout(myid)
#endif

   ! Stop right away if the library rejects the API version this test was
   ! compiled against.
   if (elpa_init(CURRENT_API_VERSION) .ne. ELPA_OK) then
     print *, "ELPA API version not supported"
     stop 1
   end if
Carolin Penke's avatar
Carolin Penke committed
148
! 
Andreas Marek's avatar
Andreas Marek committed
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
   ! Layout flag handed to set_up_blacsgrid and echoed in the banner below.
   layout = 'C'

   ! Choose the number of process columns: start at nint(sqrt(nprocs)) and
   ! walk downwards until a divisor of nprocs is found. If no divisor >= 2
   ! exists the search ends with np_cols == 1.
   np_cols = nint(sqrt(real(nprocs)))
   do while (np_cols >= 2)
      if (mod(nprocs, np_cols) == 0) exit
      np_cols = np_cols - 1
   end do
   np_rows = nprocs/np_cols
   assert(nprocs == np_rows * np_cols)

   ! Only rank 0 prints the run configuration.
   if (myid == 0) then
     print '((a,i0))', 'Matrix size: ', na
     print '((a,i0))', 'Num eigenvectors: ', nev
     print '((a,i0))', 'Blocksize: ', nblk
#ifdef WITH_MPI
     print '((a,i0))', 'Num MPI proc: ', nprocs
     print '(3(a,i0))','Number of processor rows=',np_rows,', cols=',np_cols,', total=',nprocs
     print '(a)',      'Process layout: ' // layout
#endif
     print *,''
   end if

   ! Create the BLACS grid; my_blacs_ctxt, my_prow and my_pcol are presumably
   ! outputs of this call (they are not assigned anywhere before it).
   call set_up_blacsgrid(mpi_comm_world, np_rows, np_cols, layout, &
                         my_blacs_ctxt, my_prow, my_pcol)

   ! Set up the descriptor for an na x na matrix with block size nblk.
   ! na_rows / na_cols are used as the local array extents from here on.
   call set_up_blacs_descriptor(na, nblk, my_prow, my_pcol, &
                                np_rows, np_cols, &
                                na_rows, na_cols, sc_desc, my_blacs_ctxt, info)

174
175
   allocate(a_skewsymmetric (na_rows,na_cols))
   allocate(as_skewsymmetric(na_rows,na_cols))
Carolin Penke's avatar
Carolin Penke committed
176
   allocate(z_skewsymmetric (na_rows,2*na_cols))
177
   allocate(ev_skewsymmetric(na))
Andreas Marek's avatar
Andreas Marek committed
178

179
180
181
   a_skewsymmetric(:,:) = 0.0
   z_skewsymmetric(:,:) = 0.0
   ev_skewsymmetric(:) = 0.0
Andreas Marek's avatar
Andreas Marek committed
182

Carolin Penke's avatar
Carolin Penke committed
183
184
   ! Fill the test matrix via prepare_matrix_random with the skew-symmetric
   ! option switched on. The first na_cols columns of z_skewsymmetric are
   ! passed as the second matrix argument.
   call prepare_matrix_random(na, myid, sc_desc, a_skewsymmetric, &
                              z_skewsymmetric(:,1:na_cols), as_skewsymmetric, &
                              is_skewsymmetric=1)

   ! MPI routines may only be referenced in MPI builds; every other barrier
   ! in this program is guarded the same way.
#ifdef WITH_MPI
   call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif

   ! Copy of the input matrix; it is handed to the residual check later on.
   as_skewsymmetric(:,:) = a_skewsymmetric(:,:)
Carolin Penke's avatar
Carolin Penke committed
188
   
Andreas Marek's avatar
Andreas Marek committed
189

190
191
192
193
194
   ! prepare the complex matrix for the "brute force" case
   allocate(a_complex (na_rows,na_cols))
   allocate(as_complex(na_rows,na_cols))
   allocate(z_complex (na_rows,na_cols))
   allocate(ev_complex(na))
Andreas Marek's avatar
Andreas Marek committed
195

Carolin Penke's avatar
Carolin Penke committed
196
197
198
   a_complex(1:na_rows,1:na_cols) = 0.0
   z_complex(1:na_rows,1:na_cols) = 0.0
   as_complex(1:na_rows,1:na_cols) = 0.0
Carolin Penke's avatar
Carolin Penke committed
199
   
Andreas Marek's avatar
Andreas Marek committed
200

Carolin Penke's avatar
Carolin Penke committed
201
202
      ! Build the matrix for the "brute force" complex solve: every entry is
      ! a_complex(i,j) = i * a_skewsymmetric(i,j) (zero real part).
      ! The standard cmplx intrinsic with an explicit kind is used so that
      ! the result has the kind of a_complex in both the single and the
      ! double precision build (dcmplx is a non-standard extension that
      ! always produces double complex).
      do j = 1, na_cols
         do i = 1, na_rows
            a_complex(i,j) = cmplx(0.0, a_skewsymmetric(i,j), kind=kind(a_complex))
         end do
      end do
   
Carolin Penke's avatar
Carolin Penke committed
207
208
   z_complex(1:na_rows,1:na_cols)  = a_complex(1:na_rows,1:na_cols)
   as_complex(1:na_rows,1:na_cols) = a_complex(1:na_rows,1:na_cols)
Andreas Marek's avatar
Andreas Marek committed
209

210
211
212
   ! first set up and solve the brute force problem
   e_complex => elpa_allocate()
   call set_basic_params(e_complex, na, nev, na_rows, na_cols, my_prow, my_pcol)
Andreas Marek's avatar
Andreas Marek committed
213

214
   call e_complex%set("timings",1, error)
Andreas Marek's avatar
Andreas Marek committed
215

216
   call e_complex%set("debug",1)
Carolin Penke's avatar
Carolin Penke committed
217
218
   call e_complex%set("gpu", 0)
   call e_complex%set("omp_threads", 8, error)
Andreas Marek's avatar
Andreas Marek committed
219

220
   assert_elpa_ok(e_complex%setup())
221
   call e_complex%set("solver", elpa_solver_2stage, error)
Andreas Marek's avatar
Andreas Marek committed
222

223
224
225
   call e_complex%timer_start("eigenvectors: brute force ")
   call e_complex%eigenvectors(a_complex, ev_complex, z_complex, error)
   call e_complex%timer_stop("eigenvectors: brute force ")
Andreas Marek's avatar
Andreas Marek committed
226

227
228
   if (myid .eq. 0) then
     print *, ""
Carolin Penke's avatar
Carolin Penke committed
229
     call e_complex%print_times("eigenvectors: brute force")
230
   endif 
Carolin Penke's avatar
Carolin Penke committed
231
232
233
234
#ifdef WITH_MPI
     call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif     
!      as_complex(:,:) = z_complex(:,:)
235
236
237
238
239
#ifdef TEST_SINGLE
     status = check_correctness_evp_numeric_residuals_complex_single(na, nev, as_complex, z_complex, ev_complex, sc_desc, &
                                                    nblk, myid, np_rows,np_cols, my_prow, my_pcol)
#else
     status = check_correctness_evp_numeric_residuals_complex_double(na, nev, as_complex, z_complex, ev_complex, sc_desc, &
240
                                                    nblk, myid, np_rows,np_cols, my_prow, my_pcol)
241
#endif
Carolin Penke's avatar
Carolin Penke committed
242
243
!    status = 0
!    call check_status(status, myid)
Andreas Marek's avatar
Andreas Marek committed
244
245
246
247

#ifdef WITH_MPI
     call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif
248
249
250
   ! now run the skewsymmetric case
   e_skewsymmetric => elpa_allocate()
   call set_basic_params(e_skewsymmetric, na, nev, na_rows, na_cols, my_prow, my_pcol)
Andreas Marek's avatar
Andreas Marek committed
251

252
253
254
   call e_skewsymmetric%set("timings",1, error)

   call e_skewsymmetric%set("debug",1)
Carolin Penke's avatar
Carolin Penke committed
255
256
   call e_skewsymmetric%set("gpu", 0)
   call e_skewsymmetric%set("omp_threads",8, error)
257
258
259

   call e_skewsymmetric%set("is_skewsymmetric",1)
   assert_elpa_ok(e_skewsymmetric%setup())
Carolin Penke's avatar
Carolin Penke committed
260
261
   
   call e_skewsymmetric%set("solver", elpa_solver_2stage, error)
262

Carolin Penke's avatar
Carolin Penke committed
263
264
   call e_skewsymmetric%get("is_skewsymmetric", i,error)
   
265
266
267
   call e_skewsymmetric%timer_start("eigenvectors: skewsymmetric ")
   call e_skewsymmetric%eigenvectors(a_skewsymmetric, ev_skewsymmetric, z_skewsymmetric, error)
   call e_skewsymmetric%timer_stop("eigenvectors: skewsymmetric ")
Andreas Marek's avatar
Andreas Marek committed
268
269
270

   if (myid .eq. 0) then
     print *, ""
Carolin Penke's avatar
Carolin Penke committed
271
     call e_skewsymmetric%print_times("eigenvectors: skewsymmetric")
Carolin Penke's avatar
Carolin Penke committed
272
   endif
Carolin Penke's avatar
Carolin Penke committed
273
274
   
   
Carolin Penke's avatar
Carolin Penke committed
275
276
   ! Check eigenvalues: on rank 0, compare the eigenvalues of the
   ! skew-symmetric solve against those of the brute-force complex solve
   ! with a relative tolerance of 1e-10.
   ! The test is written as |diff| > tol*|ref| instead of |diff|/|ref| > tol
   ! so that a reference eigenvalue of exactly zero does not trigger a
   ! division by zero.
   ! NOTE(review): status is reassigned by the residual check further down,
   ! so a mismatch found here is reported on stdout but does not by itself
   ! determine the exit code - confirm that this is intended.
   if (myid == 0) then
     do i = 1, na
!          print *,"ev(", i,")=",ev_skewsymmetric(i)
       if (abs(ev_complex(i)-ev_skewsymmetric(i)) .gt. 1e-10 * abs(ev_complex(i))) then
         print *,"ev: i=",i,ev_complex(i),ev_skewsymmetric(i)
         status = 1
       endif
     enddo
   endif
285
!    call check_status(status, myid)
Carolin Penke's avatar
Carolin Penke committed
286
   
Carolin Penke's avatar
Carolin Penke committed
287
288
289
   ! Assemble complex eigenvectors from the output of the skew-symmetric
   ! solve: column j of z_skewsymmetric is used as the real part and column
   ! na_cols+j as the imaginary part of column j of z_complex.
   ! cmplx with an explicit kind replaces the non-standard dcmplx so the
   ! result matches the kind of z_complex in single and double builds.
   z_complex(:,:) = 0
   do j = 1, na_cols
     do i = 1, na_rows
       z_complex(i,j) = cmplx(z_skewsymmetric(i,j), z_skewsymmetric(i,na_cols+j), &
                              kind=kind(z_complex))
     end do
   end do

   ! MPI routines may only be referenced in MPI builds.
#ifdef WITH_MPI
   call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif

   ! Residual check of the skew-symmetric result against the saved input
   ! matrix; its return value becomes the status of the test.
   status = check_correctness_evp_numeric_residuals_ss(na, nev, as_skewsymmetric, z_complex, ev_skewsymmetric, &
                              sc_desc, nblk, myid, np_rows,np_cols, my_prow, my_pcol)

Carolin Penke's avatar
Carolin Penke committed
298
   
299
#ifdef WITH_MPI
Carolin Penke's avatar
Carolin Penke committed
300
!    call MPI_BARRIER(MPI_COMM_WORLD, ierr)
301
302
303
304
#endif
   call elpa_deallocate(e_complex)
   call elpa_deallocate(e_skewsymmetric)

Andreas Marek's avatar
Andreas Marek committed
305

306
307
308
   ! TODO:
   ! - check whether the brute-force check_correctness_evp_numeric_residuals works (complex ev)
   ! - invent a test for skewsymmetric residuals
Andreas Marek's avatar
Andreas Marek committed
309

310
311
312
313
   deallocate(a_complex)
   deallocate(as_complex)
   deallocate(z_complex)
   deallocate(ev_complex)
Andreas Marek's avatar
Andreas Marek committed
314

315
316
317
318
   deallocate(a_skewsymmetric)
   deallocate(as_skewsymmetric)
   deallocate(z_skewsymmetric)
   deallocate(ev_skewsymmetric)
Andreas Marek's avatar
Andreas Marek committed
319
320
   call elpa_uninit()

321
322


Andreas Marek's avatar
Andreas Marek committed
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
#ifdef WITH_MPI
   ! MPI builds only: release the BLACS grid, then shut down MPI.
   call blacs_gridexit(my_blacs_ctxt)
   call mpi_finalize(mpierr)
#endif

   ! Hand the status of the last check to the caller as the exit code.
   ! NOTE(review): exit is not a standard Fortran intrinsic; it is assumed to
   ! be provided by the compiler as an extension.
   call exit(status)

contains
   ! Apply the settings shared by both solver objects of this test.
   !
   ! elpa             : ELPA object to configure
   ! na, nev          : values stored under the keys "na" and "nev"
   ! na_rows, na_cols : values stored under "local_nrows" and "local_ncols"
   ! my_prow, my_pcol : values stored under "process_row" and "process_col"
   !                    (MPI builds only)
   !
   ! The block size nblk and the return code error are NOT arguments: both
   ! are variables of the enclosing program, reached by host association.
   ! Every set call is followed by assert_elpa_ok(error).
   subroutine set_basic_params(elpa, na, nev, na_rows, na_cols, my_prow, my_pcol)
     implicit none
     class(elpa_t), pointer      :: elpa
     integer, intent(in)         :: na, nev
     integer, intent(in)         :: na_rows, na_cols
     integer, intent(in)         :: my_prow, my_pcol

     ! global problem size and number of eigenvectors
     call elpa%set("na", na, error)
     assert_elpa_ok(error)
     call elpa%set("nev", nev, error)
     assert_elpa_ok(error)

     ! extents of the local matrix and the block size (nblk from the host)
     call elpa%set("local_nrows", na_rows, error)
     assert_elpa_ok(error)
     call elpa%set("local_ncols", na_cols, error)
     assert_elpa_ok(error)
     call elpa%set("nblk", nblk, error)
     assert_elpa_ok(error)

#ifdef WITH_MPI
     ! communicator and position of this rank in the process grid
     call elpa%set("mpi_comm_parent", MPI_COMM_WORLD, error)
     assert_elpa_ok(error)
     call elpa%set("process_row", my_prow, error)
     assert_elpa_ok(error)
     call elpa%set("process_col", my_pcol, error)
     assert_elpa_ok(error)
#endif
   end subroutine set_basic_params
356
357
358
359
360
361
362
363
364
365
366
367
   ! Terminate the test when a check reported a failure.
   !
   ! status : result code of a check; nothing happens when it is 0
   ! myid   : rank of the caller; only rank 0 prints the failure message
   !
   ! For a non-zero status, rank 0 prints "Result incorrect!", MPI is
   ! finalized in MPI builds, and exit(status) is called.
   subroutine check_status(status, myid)
     implicit none
     integer, intent(in) :: status, myid
     integer :: mpierr

     ! success: return to the caller untouched
     if (status == 0) return

     if (myid == 0) then
       print *, "Result incorrect!"
     end if
#ifdef WITH_MPI
     call mpi_finalize(mpierr)
#endif
     call exit(status)
   end subroutine check_status
Andreas Marek's avatar
Andreas Marek committed
368
end program