test_skewsymmetric.F90 11.7 KB
Newer Older
Andreas Marek's avatar
Andreas Marek committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
!    This file is part of ELPA.
!
!    The ELPA library was originally created by the ELPA consortium,
!    consisting of the following organizations:
!
!    - Max Planck Computing and Data Facility (MPCDF), formerly known as
!      Rechenzentrum Garching der Max-Planck-Gesellschaft (RZG),
!    - Bergische Universität Wuppertal, Lehrstuhl für angewandte
!      Informatik,
!    - Technische Universität München, Lehrstuhl für Informatik mit
!      Schwerpunkt Wissenschaftliches Rechnen ,
!    - Fritz-Haber-Institut, Berlin, Abt. Theorie,
!    - Max-Planck-Institut für Mathematik in den Naturwissenschaften,
!      Leipzig, Abt. Komplexe Strukturen in Biologie und Kognition,
!      and
!    - IBM Deutschland GmbH
!
!
!    More information can be found here:
!    http://elpa.mpcdf.mpg.de/
!
!    ELPA is free software: you can redistribute it and/or modify
!    it under the terms of the version 3 of the license of the
!    GNU Lesser General Public License as published by the Free
!    Software Foundation.
!
!    ELPA is distributed in the hope that it will be useful,
!    but WITHOUT ANY WARRANTY; without even the implied warranty of
!    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
!    GNU Lesser General Public License for more details.
!
!    You should have received a copy of the GNU Lesser General Public License
!    along with ELPA.  If not, see <http://www.gnu.org/licenses/>
!
!    ELPA reflects a substantial effort on the part of the original
!    ELPA consortium, and we ask you to respect the spirit of the
!    license that we chose: i.e., please contribute any changes you
!    may have back to the original ELPA library distribution, and keep
!    any derivatives of ELPA under the same license that we chose for
!    the original distribution, the GNU Lesser General Public License.
!
!
#include "config-f90.h"

! Define one of TEST_REAL or TEST_COMPLEX
! Define one of TEST_SINGLE or TEST_DOUBLE
! Define one of TEST_SOLVER_1STAGE or TEST_SOLVER_2STAGE
! Define TEST_GPU \in [0, 1]
! Define either TEST_ALL_KERNELS or a TEST_KERNEL \in [any valid kernel]

#if !(defined(TEST_REAL) ^ defined(TEST_COMPLEX))
error: define exactly one of TEST_REAL or TEST_COMPLEX
#endif

#if !(defined(TEST_SINGLE) ^ defined(TEST_DOUBLE))
error: define exactly one of TEST_SINGLE or TEST_DOUBLE
#endif

#ifdef TEST_SINGLE
#  define EV_TYPE real(kind=C_FLOAT)
#  ifdef TEST_REAL
#    define MATRIX_TYPE real(kind=C_FLOAT)
#  else
#    define MATRIX_TYPE complex(kind=C_FLOAT_COMPLEX)
#  endif
#else
#  define EV_TYPE real(kind=C_DOUBLE)
#  ifdef TEST_REAL
#    define MATRIX_TYPE real(kind=C_DOUBLE)
#  else
#    define MATRIX_TYPE complex(kind=C_DOUBLE_COMPLEX)
#  endif
#endif

75
76
77
78
79
80
81
#ifdef TEST_SINGLE
#define MATRIX_TYPE_COMPLEX complex(kind=C_FLOAT_COMPLEX)
#define EV_TYPE_COMPLEX complex(kind=C_FLOAT_COMPLEX)
#else
#define MATRIX_TYPE_COMPLEX complex(kind=C_DOUBLE_COMPLEX)
#define EV_TYPE_COMPLEX complex(kind=C_DOUBLE_COMPLEX)
#endif
Andreas Marek's avatar
Andreas Marek committed
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121

#ifdef TEST_REAL
#  define AUTOTUNE_DOMAIN ELPA_AUTOTUNE_DOMAIN_REAL
#else
#  define AUTOTUNE_DOMAIN ELPA_AUTOTUNE_DOMAIN_COMPLEX
#endif

#include "assert.h"

program test
   use elpa

   use test_util
   use test_setup_mpi
   use test_prepare_matrix
   use test_read_input_parameters
   use test_blacs_infrastructure
   use test_check_correctness
   use iso_fortran_env

#ifdef HAVE_REDIRECT
   use test_redirect
#endif
   implicit none

   ! matrix dimensions
   integer                     :: na, nev, nblk

   ! mpi
   integer                     :: myid, nprocs
   integer                     :: na_cols, na_rows  ! local matrix size
   integer                     :: np_cols, np_rows  ! number of MPI processes per column/row
   integer                     :: my_prow, my_pcol  ! local MPI task position (my_prow, my_pcol) in the grid (0..np_cols -1, 0..np_rows -1)
   integer                     :: mpierr, ierr

   ! blacs
   character(len=1)            :: layout
   integer                     :: my_blacs_ctxt, sc_desc(9), info, nprow, npcol

   ! The Matrix
122
123
   MATRIX_TYPE, allocatable    :: a_skewsymmetric(:,:), as_skewsymmetric(:,:)
   MATRIX_TYPE_COMPLEX, allocatable    :: a_complex(:,:), as_complex(:,:)
Andreas Marek's avatar
Andreas Marek committed
124
   ! eigenvectors
125
126
   MATRIX_TYPE, allocatable    :: z_skewsymmetric(:,:)
   MATRIX_TYPE_COMPLEX, allocatable    :: z_complex(:,:)
Andreas Marek's avatar
Andreas Marek committed
127
   ! eigenvalues
128
   EV_TYPE, allocatable:: ev_skewsymmetric(:), ev_complex(:)
Andreas Marek's avatar
Andreas Marek committed
129

130
   integer                     :: error, status, i, j
Andreas Marek's avatar
Andreas Marek committed
131
132

   type(output_t)              :: write_to_file
133
134
   class(elpa_t), pointer      :: e_complex, e_skewsymmetric
           
Andreas Marek's avatar
Andreas Marek committed
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
   ! --- Start-up: read the problem size, bring up MPI and ELPA, build the process grid ---

   ! Obtain matrix size (na), number of eigenvectors (nev), block size (nblk)
   ! and the output settings (write_to_file) from the test input helper.
   call read_input_parameters(na, nev, nblk, write_to_file)
   ! Obtain the rank of this task (myid) and the total number of tasks (nprocs).
   call setup_mpi(myid, nprocs)
#ifdef HAVE_REDIRECT
#ifdef WITH_MPI
   ! Synchronise all tasks before stdout is redirected for this rank.
   call MPI_BARRIER(MPI_COMM_WORLD, mpierr)
   call redirect_stdout(myid)
#endif
#endif

   ! Refuse to continue if the library does not support the requested API version.
   if (elpa_init(CURRENT_API_VERSION) /= ELPA_OK) then
     print *, "ELPA API version not supported"
     stop 1
   endif

   ! NOTE(review): 'C' presumably selects a column-major process ordering in
   ! set_up_blacsgrid; confirm against that helper.
   layout = 'C'
   ! Choose np_cols as the largest divisor of nprocs, searching downwards from
   ! the rounded square root of nprocs to 2. If no divisor is found (or the
   ! loop does not execute at all) np_cols ends up as 1.
   do np_cols = NINT(SQRT(REAL(nprocs))),2,-1
      if(mod(nprocs,np_cols) == 0 ) exit
   enddo
   np_rows = nprocs/np_cols
   ! The grid must use every task exactly once.
   assert(nprocs == np_rows * np_cols)

   ! Only the first task reports the run configuration.
   if (myid == 0) then
     print '((a,i0))', 'Matrix size: ', na
     print '((a,i0))', 'Num eigenvectors: ', nev
     print '((a,i0))', 'Blocksize: ', nblk
#ifdef WITH_MPI
     print '((a,i0))', 'Num MPI proc: ', nprocs
     print '(3(a,i0))','Number of processor rows=',np_rows,', cols=',np_cols,', total=',nprocs
     print '(a)',      'Process layout: ' // layout
#endif
     print *,''
   endif

   ! Create the BLACS process grid; my_prow and my_pcol are later passed on to
   ! ELPA as this task's grid coordinates.
   call set_up_blacsgrid(mpi_comm_world, np_rows, np_cols, layout, &
                         my_blacs_ctxt, my_prow, my_pcol)

   ! Build the matrix descriptor; na_rows and na_cols are used below as the
   ! extents of the local matrix arrays.
   ! NOTE(review): info is not inspected here; presumably the helper checks it.
   call set_up_blacs_descriptor(na, nblk, my_prow, my_pcol, np_rows, np_cols, &
                                na_rows, na_cols, sc_desc, my_blacs_ctxt, info)

174
175
176
177
   allocate(a_skewsymmetric (na_rows,na_cols))
   allocate(as_skewsymmetric(na_rows,na_cols))
   allocate(z_skewsymmetric (na_rows,na_cols))
   allocate(ev_skewsymmetric(na))
Andreas Marek's avatar
Andreas Marek committed
178

179
180
181
   a_skewsymmetric(:,:) = 0.0
   z_skewsymmetric(:,:) = 0.0
   ev_skewsymmetric(:) = 0.0
Andreas Marek's avatar
Andreas Marek committed
182

183
184
   call prepare_matrix_random(na, myid, sc_desc, a_skewsymmetric, z_skewsymmetric, as_skewsymmetric, is_skewsymmetric=1)
   as_skewsymmetric(:,:) = a_skewsymmetric(:,:)
Andreas Marek's avatar
Andreas Marek committed
185

186
187
188
189
190
   ! prepare the complex matrix for the "brute force" case
   allocate(a_complex (na_rows,na_cols))
   allocate(as_complex(na_rows,na_cols))
   allocate(z_complex (na_rows,na_cols))
   allocate(ev_complex(na))
Andreas Marek's avatar
Andreas Marek committed
191

192
193
194
   a_complex(:,:) = 0.0
   z_complex(:,:) = 0.0
   as_complex(:,:) = 0.0
Andreas Marek's avatar
Andreas Marek committed
195

196
197
198
199
200
   ! Build the "brute force" reference matrix i*A from the skew-symmetric
   ! input A: for real skew-symmetric A, i*A is Hermitian and can be handed to
   ! the ordinary complex solver.
   ! The kind argument is essential: without it cmplx() returns a
   ! default-kind (single precision) complex value, which would silently
   ! truncate the matrix entries in the double precision build.
   do j=1, na_cols
     do i=1,na_rows
       a_complex(i,j) = cmplx(0.0, a_skewsymmetric(i,j), kind=kind(a_complex))
     enddo
   enddo
Andreas Marek's avatar
Andreas Marek committed
201

202
203
   z_complex(:,:)  = a_complex(:,:)
   as_complex(:,:) = a_complex(:,:)
Andreas Marek's avatar
Andreas Marek committed
204

205
206
207
   ! first set up and solve the brute force problem
   e_complex => elpa_allocate()
   call set_basic_params(e_complex, na, nev, na_rows, na_cols, my_prow, my_pcol)
Andreas Marek's avatar
Andreas Marek committed
208

209
   ! Enable timing collection and make sure the setting was accepted.
   call e_complex%set("timings",1, error)
   assert_elpa_ok(error)
Andreas Marek's avatar
Andreas Marek committed
210

211
212
   ! Request debug output and the CPU code path; check each setting instead
   ! of silently ignoring a rejected key or value.
   call e_complex%set("debug",1, error)
   assert_elpa_ok(error)
   call e_complex%set("gpu", 0, error)
   assert_elpa_ok(error)
Andreas Marek's avatar
Andreas Marek committed
213

214
   assert_elpa_ok(e_complex%setup())
Andreas Marek's avatar
Andreas Marek committed
215

216
217
218
   ! Solve the complex reference problem. The solver status is checked after
   ! the timer is stopped so that a failed solve aborts the test here rather
   ! than surfacing later as a confusing residual error.
   call e_complex%timer_start("eigenvectors: brute force ")
   call e_complex%eigenvectors(a_complex, ev_complex, z_complex, error)
   call e_complex%timer_stop("eigenvectors: brute force ")
   assert_elpa_ok(error)
Andreas Marek's avatar
Andreas Marek committed
219

220
221
222
223
   if (myid .eq. 0) then
     print *, ""
     call e_complex%print_times("eigenvectors: brute force")
   endif 
Andreas Marek's avatar
Andreas Marek committed
224

225
226
227
   status = check_correctness_evp_numeric_residuals(na, nev, as_complex, z_complex, ev_complex, sc_desc, &
                                                    nblk, myid, np_rows,np_cols, my_prow, my_pcol)
   call check_status(status, myid)
Andreas Marek's avatar
Andreas Marek committed
228
229
230
231

#ifdef WITH_MPI
     call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif
232
233
234
   ! now run the skewsymmetric case
   e_skewsymmetric => elpa_allocate()
   call set_basic_params(e_skewsymmetric, na, nev, na_rows, na_cols, my_prow, my_pcol)
Andreas Marek's avatar
Andreas Marek committed
235

236
237
238
239
240
241
242
243
244
245
246
   ! Configure the skew-symmetric solver object. Every setting is verified so
   ! that a rejected key or value stops the test immediately.
   call e_skewsymmetric%set("timings",1, error)
   assert_elpa_ok(error)

   call e_skewsymmetric%set("debug",1, error)
   assert_elpa_ok(error)
   call e_skewsymmetric%set("gpu", 0, error)
   assert_elpa_ok(error)

   ! Select the dedicated skew-symmetric code path.
   call e_skewsymmetric%set("is_skewsymmetric",1, error)
   assert_elpa_ok(error)
   assert_elpa_ok(e_skewsymmetric%setup())

   ! Solve; the solver status is checked once the timer has been stopped.
   call e_skewsymmetric%timer_start("eigenvectors: skewsymmetric ")
   call e_skewsymmetric%eigenvectors(a_skewsymmetric, ev_skewsymmetric, z_skewsymmetric, error)
   call e_skewsymmetric%timer_stop("eigenvectors: skewsymmetric ")
   assert_elpa_ok(error)
Andreas Marek's avatar
Andreas Marek committed
247
248
249

   if (myid .eq. 0) then
     print *, ""
250
251
252
253
254
255
256
257
     call e_skewsymmetric%print_times("eigenvectors: skewsymmetric")
   endif  
#ifdef WITH_MPI
   call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif
   call elpa_deallocate(e_complex)
   call elpa_deallocate(e_skewsymmetric)

Andreas Marek's avatar
Andreas Marek committed
258

259
260
261
262
   ! TODO:
   ! - compare ev results from brute-force and skewsymmetric
   ! - check whether brute-force check_correctness_evp_numeric_residuals works (complex ev)
   ! - invent a test for skewsymmetric residuals
Andreas Marek's avatar
Andreas Marek committed
263

264
265
266
267
   deallocate(a_complex)
   deallocate(as_complex)
   deallocate(z_complex)
   deallocate(ev_complex)
Andreas Marek's avatar
Andreas Marek committed
268

269
270
271
272
   deallocate(a_skewsymmetric)
   deallocate(as_skewsymmetric)
   deallocate(z_skewsymmetric)
   deallocate(ev_skewsymmetric)
Andreas Marek's avatar
Andreas Marek committed
273
274
   call elpa_uninit()

275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325



   !  if (myid .eq. 0) then
   !    print *, ""
   !    call e_ptr%print_times("eigenvectors: iteration "//trim(iter_string))
   !  endif
   !  status = check_correctness_analytic(na, nev, ev, z, nblk, myid, np_rows, np_cols, my_prow, my_pcol, &
   !                                      .true., .true., print_times=.false.)
   !  a(:,:) = as(:,:)
   !  call e_ptr%autotune_print_state(tune_state)
   !  call e_ptr%autotune_save_state(tune_state, "saved_state_"//trim(iter_string)//".txt")
#ifdef WITH_MPI
   !  call MPI_BARRIER(MPI_COMM_WORLD, ierr)
#endif
   !  call e_ptr%autotune_load_state(tune_state, "saved_state_"//trim(iter_string)//".txt")
   !end do

   !! set and print the autotuned-settings
   !call e_ptr%autotune_set_best(tune_state)
   !if (myid .eq. 0) then
   !  print *, "The best combination found by the autotuning:"
   !  flush(output_unit)
   !  call e_ptr%autotune_print_best(tune_state)
   !endif
   !! de-allocate autotune object
   !call elpa_autotune_deallocate(tune_state)

   !if (myid .eq. 0) then
   !  print *, "Running once more time with the best found setting..."
   !endif
   !call e_ptr%timer_start("eigenvectors: best setting")
   !call e_ptr%eigenvectors(a, ev, z, error)
   !call e_ptr%timer_stop("eigenvectors: best setting")
   !assert_elpa_ok(error)
   !if (myid .eq. 0) then
   !  print *, ""
   !  call e_ptr%print_times("eigenvectors: best setting")
   !endif
   !status = check_correctness_analytic(na, nev, ev, z, nblk, myid, np_rows, np_cols, my_prow, my_pcol, &
   !                                    .true., .true., print_times=.false.)

   !call elpa_deallocate(e_ptr)

   !deallocate(a)
   !deallocate(as)
   !deallocate(z)
   !deallocate(ev)

   !call elpa_uninit()

Andreas Marek's avatar
Andreas Marek committed
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
#ifdef WITH_MPI
   call blacs_gridexit(my_blacs_ctxt)
   call mpi_finalize(mpierr)
#endif

   call exit(status)

contains
   !> Apply the settings shared by all solver objects of this test: global
   !> matrix size, number of eigenvectors, local array extents, block size
   !> and (in MPI builds) the communicator and process-grid coordinates.
   !> Each setting is verified with assert_elpa_ok.
   !>
   !> elpa              solver object to configure (the association itself is not changed)
   !> na, nev           global matrix size and number of requested eigenvectors
   !> na_rows, na_cols  extents of the local part of the distributed matrix
   !> my_prow, my_pcol  process-grid coordinates of this task (only used with MPI)
   !>
   !> Note: the block size nblk is not an argument; it is taken from the host
   !> program by host association.
   subroutine set_basic_params(elpa, na, nev, na_rows, na_cols, my_prow, my_pcol)
     implicit none
     class(elpa_t), pointer, intent(in) :: elpa
     integer, intent(in)         :: na, nev, na_rows, na_cols, my_prow, my_pcol
     ! Local status variable so that this helper no longer overwrites the
     ! host program's "error" as a hidden side effect.
     integer                     :: error

     call elpa%set("na", na, error)
     assert_elpa_ok(error)
     call elpa%set("nev", nev, error)
     assert_elpa_ok(error)
     call elpa%set("local_nrows", na_rows, error)
     assert_elpa_ok(error)
     call elpa%set("local_ncols", na_cols, error)
     assert_elpa_ok(error)
     ! nblk comes from the enclosing program (host association).
     call elpa%set("nblk", nblk, error)
     assert_elpa_ok(error)

#ifdef WITH_MPI
     call elpa%set("mpi_comm_parent", MPI_COMM_WORLD, error)
     assert_elpa_ok(error)
     call elpa%set("process_row", my_prow, error)
     assert_elpa_ok(error)
     call elpa%set("process_col", my_pcol, error)
     assert_elpa_ok(error)
#endif
   end subroutine
359
360
361
362
363
364
365
366
367
368
369
370
   !> Terminate the test when a correctness check has failed.
   !>
   !> status  result code of the preceding check; zero means success
   !> myid    rank of the calling task; only rank 0 prints the failure message
   !>
   !> On a non-zero status the routine finalizes MPI (in MPI builds) and
   !> leaves the program with status as exit code; otherwise it returns
   !> without doing anything.
   subroutine check_status(status, myid)
     implicit none
     integer, intent(in) :: status, myid
     integer :: finalize_err

     ! Success: hand control straight back to the caller.
     if (status == 0) return

     if (myid == 0) then
       print *, "Result incorrect!"
     endif
#ifdef WITH_MPI
     call mpi_finalize(finalize_err)
#endif
     call exit(status)
   end subroutine
Andreas Marek's avatar
Andreas Marek committed
371
end program