bioem.cpp 27.7 KB
Newer Older
Pilar Cossio's avatar
License    
Pilar Cossio committed
1
2
3
4
/* ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
        < BioEM software for Bayesian inference of Electron Microscopy images>
            Copyright (C) 2014 Pilar Cossio, David Rohr and Gerhard Hummer.
            Max Planck Institute of Biophysics, Frankfurt, Germany.
5

Pilar Cossio's avatar
License    
Pilar Cossio committed
6
7
8
9
                See license statement for terms of distribution.

   ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++*/

10
11
12
13
14
15
16
17
#include <mpi.h>

// Checks the result of an MPI call and reports a failure on stderr.
// The argument is parenthesised so that expressions containing operators of
// lower precedence than `!=` (e.g. an assignment) are compared as a whole.
// The message names the failing expression followed by file and line.
// The macro only reports the error; it neither aborts nor returns.
#define MPI_CHK(expr) \
	if ((expr) != MPI_SUCCESS) \
	{ \
		fprintf(stderr, "Error in MPI function %s (%s: %d)\n", #expr, __FILE__, __LINE__); \
	}

18
19
20
21
22
23
24
25
26
#include <stdio.h>
#include <stdlib.h>

#include <algorithm>
#include <cmath>
#include <fstream>
#include <iostream>
#include <iterator>
#include <string>
#include <vector>

#include <boost/program_options.hpp>
27

28
#ifdef WITH_OPENMP
29
#include <omp.h>
30
#endif
31
32
33
34
35
36
37
38
39
40

#include <fftw3.h>
#include <math.h>
#include "cmodules/timer.h"

#include "param.h"
#include "bioem.h"
#include "model.h"
#include "map.h"

41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
// Optional NVTX instrumentation, enabled by defining BIOEM_USE_NVTX.
//  - cuda_custom_timeslot(name, cid) pushes an NVTX range whose ASCII message is
//    `name` and whose ARGB colour is colors[cid % num_colors].
//  - cuda_custom_timeslot_end pops the most recently pushed range.
// When BIOEM_USE_NVTX is not defined both macros expand to nothing.
#ifdef BIOEM_USE_NVTX
#include "nvToolsExt.h"

// Colour palette (used with NVTX_COLOR_ARGB) and its number of entries.
const uint32_t colors[] = { 0x0000ff00, 0x000000ff, 0x00ffff00, 0x00ff00ff, 0x0000ffff, 0x00ff0000, 0x00ffffff };
const int num_colors = sizeof(colors)/sizeof(colors[0]);

#define cuda_custom_timeslot(name,cid) { \
	int color_id = cid; \
	color_id = color_id%num_colors;\
	nvtxEventAttributes_t eventAttrib = {0}; \
	eventAttrib.version = NVTX_VERSION; \
	eventAttrib.size = NVTX_EVENT_ATTRIB_STRUCT_SIZE; \
	eventAttrib.colorType = NVTX_COLOR_ARGB; \
	eventAttrib.color = colors[color_id]; \
	eventAttrib.messageType = NVTX_MESSAGE_TYPE_ASCII; \
	eventAttrib.message.ascii = name; \
	nvtxRangePushEx(&eventAttrib); \
}
#define cuda_custom_timeslot_end nvtxRangePop();
#else
// Instrumentation disabled: the markers compile away.
#define cuda_custom_timeslot(name,cid)
#define cuda_custom_timeslot_end
#endif
64

65
66
67
68
69
70
71
72
73
74
75
#include "bioem_algorithm.h"

using namespace boost;
namespace po = boost::program_options;

using namespace std;

// Stream-insertion helper for vectors (in the style of the Boost
// program_options examples): writes every element followed by one space.
template<class T>
ostream& operator<<(ostream& os, const vector<T>& v)
{
	for (typename vector<T>::const_iterator elem = v.begin(); elem != v.end(); ++elem)
	{
		os << *elem << " ";
	}
	return os;
}

// Constructor: reads the run-time switches from the environment.
//  - FFTALGO            -> FFTAlgo     (1 when the variable is not set)
//  - BIOEM_DEBUG_OUTPUT -> DebugOutput (2 when the variable is not set)
// Values that are set are converted with atoi().
bioem::bioem()
{
	const char* const fftAlgoEnv = getenv("FFTALGO");
	if (fftAlgoEnv != NULL)
	{
		FFTAlgo = atoi(fftAlgoEnv);
	}
	else
	{
		FFTAlgo = 1;
	}

	const char* const debugOutputEnv = getenv("BIOEM_DEBUG_OUTPUT");
	if (debugOutputEnv != NULL)
	{
		DebugOutput = atoi(debugOutputEnv);
	}
	else
	{
		DebugOutput = 2;
	}
}

// Destructor: intentionally empty. Buffers are released explicitly through
// cleanup(), not here.
bioem::~bioem()
{
}

// Configures a BioEM run.
//
// On MPI rank 0 the command line is parsed with boost::program_options, the
// option flags are stored in Model / RefMap / param, and the parameter file,
// the model file and the particle (reference map) file are read. When built
// with WITH_MPI, param, Model (plus its points) and RefMap (plus its maps) are
// then broadcast byte-wise from rank 0 to all ranks. Afterwards every rank
// prepares the FFT plans, runs precalculate(), optionally truncates the
// orientation/CTF grids (BIOEM_DEBUG_BREAK), initialises the probability
// storage and calls deviceInit().
//
// ac, av: command-line argument count and vector as received by main().
// Returns 0 on success and 1 when the command line is incomplete, help was
// requested, or option parsing threw. An inconsistent --ReadMultipleMRC
// request terminates the process via exit(1).
//
// NOTE(review): the early `return 1` / `exit(1)` paths are taken on rank 0
// only, while the MPI_Bcast calls below are executed by every rank; in an MPI
// build the other ranks presumably block in MPI_Bcast - confirm and consider
// broadcasting a status flag first.
int bioem::configure(int ac, char* av[])
{
	// **************************************************************************************
	// **** Configuration Routine using boost for extracting parameters, models and maps ****
	// **************************************************************************************
	// ****** And Precalculating necessary grids, map crosscorrelations and kernels  ********
	// *************************************************************************************

	if (mpi_rank == 0)
	{
		// *** Initializing default variables ***
		std::string infile, modelfile, mapfile;
		Model.readPDB = false;
		param.param_device.writeAngles = false;
		param.dumpMap = false;
		param.loadMap = false;
		RefMap.readMRC = false;
		RefMap.readMultMRC = false;

		// *************************************************************************************
		cout << " ++++++++++++ FROM COMMAND LINE +++++++++++\n\n";
		// *************************************************************************************

		// ********************* Command line reading input with BOOST ************************

		try {
			po::options_description desc("Command line inputs");
			desc.add_options()
			("Inputfile", po::value<std::string>(), "(Mandatory) Name of input parameter file")
			("Modelfile", po::value< std::string>() , "(Mandatory) Name of model file")
			("Particlesfile", po::value< std::string>(), "(Mandatory) Name of paricles file")
			("ReadPDB", "(Optional) If reading model file in PDB format")
			("ReadMRC", "(Optional) If reading particle file in MRC format")
			("ReadMultipleMRC", "(Optional) If reading Multiple MRCs")
			("DumpMaps", "(Optional) Dump maps after they were red from maps file")
			("LoadMapDump", "(Optional) Read Maps from dump instead of maps file")
			("help", "(Optional) Produce help message")
			;


			// NOTE(review): every positional entry is registered with max_count -1
			// (unlimited); verify against the Boost.Program_options documentation
			// that more than one unlimited positional option is supported.
			po::positional_options_description p;
			p.add("Inputfile", -1);
			p.add("Modelfile", -1);
			p.add("Particlesfile", -1);
			p.add("ReadPDB", -1);
			p.add("ReadMRC", -1);
			p.add("ReadMultipleMRC", -1);
			p.add("DumpMaps", -1);
			p.add("LoadMapDump", -1);

			po::variables_map vm;
			po::store(po::command_line_parser(ac, av).
					  options(desc).positional(p).run(), vm);
			po::notify(vm);

			// Fewer than six argv entries: print the option summary and give up.
			if((ac < 6)) {
				std::cout << desc << std::endl;
				return 1;
			}
			if (vm.count("help")) {
				cout << "Usage: options_description [options]\n";
				cout << desc;
				return 1;
			}

			if (vm.count("Inputfile"))
			{
				cout << "Input file is: ";
				cout << vm["Inputfile"].as< std::string >() << "\n";
				infile = vm["Inputfile"].as< std::string >();
			}
			if (vm.count("Modelfile"))
			{
				cout << "Model file is: "
					 << vm["Modelfile"].as<  std::string  >() << "\n";
				modelfile = vm["Modelfile"].as<  std::string  >();
			}

			if (vm.count("ReadPDB"))
			{
				cout << "Reading model file in PDB format.\n";
				Model.readPDB = true;
			}

			if (vm.count("ReadMRC"))
			{
				cout << "Reading particle file in MRC format.\n";
				RefMap.readMRC=true;
			}

			if (vm.count("ReadMultipleMRC"))
			{
				cout << "Reading Multiple MRCs.\n";
				RefMap.readMultMRC=true;
			}

			if (vm.count("DumpMaps"))
			{
				cout << "Dumping Maps after reading from file.\n";
				param.dumpMap = true;
			}

			if (vm.count("LoadMapDump"))
			{
				cout << "Loading Map dump.\n";
				param.loadMap = true;
			}

			if (vm.count("Particlesfile"))
			{
				cout << "Paricle file is: "
					 << vm["Particlesfile"].as< std::string >() << "\n";
				mapfile = vm["Particlesfile"].as< std::string >();
			}
		}
		catch(std::exception& e)
		{
			// Any parsing/conversion error is reported and turned into a failure code.
			cout << e.what() << "\n";
			return 1;
		}
			// Check for consistency in multiple MRCs: --ReadMultipleMRC requires --ReadMRC
			if(  RefMap.readMultMRC && not(RefMap.readMRC) ){
			 cout << "For Multiple MRCs command --ReadMRC is necesary too";
			 exit(1);
			}
		// ********************* Reading Parameter Input ***************************
		param.readParameters(infile.c_str());

		// ********************* Reading Model Input ******************************
		Model.readModel(modelfile.c_str());

		// ********************* Reading Particle Maps Input **********************
		RefMap.readRefMaps(param, mapfile.c_str());
	}

#ifdef WITH_MPI
	// Distribute the data read on rank 0. The objects are sent as raw bytes, so
	// pointer members arrive holding rank-0 addresses; Model.points and
	// RefMap.maps are therefore re-allocated on the other ranks before their
	// contents are broadcast.
	MPI_Bcast(&param, sizeof(param), MPI_BYTE, 0, MPI_COMM_WORLD);
	// refCtf, CtfParam, angles are automatically filled by the precalculate function below

	MPI_Bcast(&Model, sizeof(Model), MPI_BYTE, 0, MPI_COMM_WORLD);
	if (mpi_rank != 0) Model.points = (bioem_model::bioem_model_point*) mallocchk(sizeof(bioem_model::bioem_model_point) * Model.nPointsModel);
	MPI_Bcast(Model.points, sizeof(bioem_model::bioem_model_point) * Model.nPointsModel, MPI_BYTE, 0, MPI_COMM_WORLD);

	MPI_Bcast(&RefMap, sizeof(RefMap), MPI_BYTE, 0, MPI_COMM_WORLD);
	if (mpi_rank != 0) RefMap.maps = (myfloat_t*) mallocchk(RefMap.refMapSize * sizeof(myfloat_t) * RefMap.ntotRefMap);
	MPI_Bcast(RefMap.maps, RefMap.refMapSize * sizeof(myfloat_t) * RefMap.ntotRefMap, MPI_BYTE, 0, MPI_COMM_WORLD);
#endif

	// ****************** Precalculating Necessary Stuff *********************
	param.PrepareFFTs();
	precalculate();

	// Debug aid: BIOEM_DEBUG_BREAK caps both the number of orientations and the
	// number of CTFs at the given value.
	if (getenv("BIOEM_DEBUG_BREAK"))
	{
		const int cut = atoi(getenv("BIOEM_DEBUG_BREAK"));
		if (param.nTotGridAngles > cut) param.nTotGridAngles = cut;
		if (param.nTotCTFs > cut) param.nTotCTFs = cut;
	}

	pProb.init(RefMap.ntotRefMap, param.nTotGridAngles, *this);

	deviceInit();

	return(0);
}

256
257
258
// Releases the buffers owned by this object: the probability storage
// (pProb.ptr, via free_device_host) and the pointers held by RefMap.
void bioem::cleanup()
{
	//Deleting allocated pointers
	free_device_host(pProb.ptr);
	RefMap.freePointers();
}

263
264
// Runs the precalculation steps in a fixed order: orientation grids, reference
// CTF kernels, then the reference-map precalculation (which receives param and
// this object). Always returns 0.
int bioem::precalculate()
{
	// **************************************************************************************
	// **Precalculating Routine of Orientation grids, Map crosscorrelations and CTF Kernels**
	// **************************************************************************************

	// Generating Grids of orientations
	param.CalculateGridsParam();

	// Precalculating CTF Kernels stored in class Param
	param.CalculateRefCTF();

	//Precalculate Maps
	RefMap.precalculate(param, *this);

	return(0);
}

int bioem::run()
{
David Rohr's avatar
David Rohr committed
283
284
285
	// **************************************************************************************
	// **** Main BioEM routine, projects, convolutes and compares with Map using OpenMP ****
	// **************************************************************************************
286

David Rohr's avatar
David Rohr committed
287
288
	// **** If we want to control the number of threads -> omp_set_num_threads(XX); ******
	// ****************** Declarying class of Probability Pointer  *************************
289

David Rohr's avatar
David Rohr committed
290
	if (mpi_rank == 0) printf("\tInitializing Probabilities\n");
291
292
293
	// Inizialzing Probabilites to zero and constant to -Infinity
	for (int iRefMap = 0; iRefMap < RefMap.ntotRefMap; iRefMap ++)
	{
294
295
296
297
		bioem_Probability_map& pProbMap = pProb.getProbMap(iRefMap);

		pProbMap.Total = 0.0;
		pProbMap.Constoadd = -9999999;
298
		if (param.param_device.writeAngles)
299
		{
300
301
302
			for (int iOrient = 0; iOrient < param.nTotGridAngles; iOrient ++)
			{
				bioem_Probability_angle& pProbAngle = pProb.getProbAngle(iRefMap, iOrient);
303

304
305
306
				pProbAngle.forAngles = 0.0;
				pProbAngle.ConstAngle = -99999999;
			}
307
308
		}
	}
David Rohr's avatar
David Rohr committed
309
	// **************************************************************************************
310
	deviceStartRun();
311
312
313
314
315
316
317
318
319
320
	{
		const int count = omp_get_max_threads();
		localCCT = new mycomplex_t*[count];
		lCC = new myfloat_t*[count];
		for (int i = 0;i < count;i++)
		{
			localCCT[i] = (mycomplex_t *) myfftw_malloc(sizeof(mycomplex_t) * param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D);
			lCC[i] = (myfloat_t *) myfftw_malloc(sizeof(myfloat_t) * param.param_device.NumberPixels * param.param_device.NumberPixels);
		}
	}
321

David Rohr's avatar
David Rohr committed
322
	// ******************************** MAIN CYCLE ******************************************
David Rohr's avatar
David Rohr committed
323

David Rohr's avatar
David Rohr committed
324
	// *** Declaring Private variables for each thread *****
325
	mycomplex_t* proj_mapFFT;
326
	myfloat_t* conv_map = new myfloat_t[param.param_device.NumberPixels * param.param_device.NumberPixels];
327
	mycomplex_t* conv_mapFFT;
328
	myfloat_t sumCONV, sumsquareCONV;
329
330

	//allocating fftw_complex vector
331
332
	proj_mapFFT = (mycomplex_t *) myfftw_malloc(sizeof(mycomplex_t) * param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D);
	conv_mapFFT = (mycomplex_t *) myfftw_malloc(sizeof(mycomplex_t) * param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D);
333
334
335

	HighResTimer timer;

David Rohr's avatar
David Rohr committed
336
337
338
339
340
341
342
	if (DebugOutput >= 1 && mpi_rank == 0) printf("\tMain Loop (GridAngles %d, CTFs %d, RefMaps %d, Shifts (%d/%d)²), Pixels %d²\n", param.nTotGridAngles, param.nTotCTFs, RefMap.ntotRefMap, 2 * param.param_device.maxDisplaceCenter + param.param_device.GridSpaceCenter, param.param_device.GridSpaceCenter, param.param_device.NumberPixels);

	const int iOrientStart = (int) ((long long int) mpi_rank * param.nTotGridAngles / mpi_size);
	int iOrientEnd = (int) ((long long int) (mpi_rank + 1) * param.nTotGridAngles / mpi_size);
	if (iOrientEnd > param.nTotGridAngles) iOrientEnd = param.nTotGridAngles;
	
	for (int iOrient = iOrientStart; iOrient < iOrientEnd; iOrient++)
343
	{
David Rohr's avatar
David Rohr committed
344
345
		// ***************************************************************************************
		// ***** Creating Projection for given orientation and transforming to Fourier space *****
346
		if (DebugOutput >= 1) timer.ResetStart();
347
		createProjection(iOrient, proj_mapFFT);
348
		if (DebugOutput >= 1) printf("Time Projection %d: %f\n", iOrient, timer.GetCurrentElapsedTime());
349

David Rohr's avatar
David Rohr committed
350
351
		// ***************************************************************************************
		// ***** **** Internal Loop over convolutions **** *****
352
353
		for (int iConv = 0; iConv < param.nTotCTFs; iConv++)
		{
David Rohr's avatar
David Rohr committed
354
			// *** Calculating convolutions of projection map and crosscorrelations ***
355

356
			if (DebugOutput >= 2) timer.ResetStart();
357
			createConvolutedProjectionMap(iOrient, iConv, proj_mapFFT, conv_map, conv_mapFFT, sumCONV, sumsquareCONV);
358
			if (DebugOutput >= 2) printf("Time Convolution %d %d: %f\n", iOrient, iConv, timer.GetCurrentElapsedTime());
359

David Rohr's avatar
David Rohr committed
360
361
			// ***************************************************************************************
			// *** Comparing each calculated convoluted map with all experimental maps ***
362
			if (DebugOutput >= 2) timer.ResetStart();
363
			compareRefMaps(iOrient, iConv, conv_map, conv_mapFFT, sumCONV, sumsquareCONV);
364

365
366
367
368
369
370
371
372
373
374
375
376
			if (DebugOutput >= 2)
			{
				const double compTime = timer.GetCurrentElapsedTime();
				const int nShifts = 2 * param.param_device.maxDisplaceCenter / param.param_device.GridSpaceCenter + 1;
				const double nFlops = (double) RefMap.ntotRefMap * (double) nShifts * (double) nShifts *
									  (((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * ((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * 5. + 25.) / compTime;
				const double nGBs = (double) RefMap.ntotRefMap * (double) nShifts * (double) nShifts *
									(((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * ((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * 2. + 8.) * (double) sizeof(myfloat_t) / compTime;
				const double nGBs2 = (double) RefMap.ntotRefMap * ((double) param.param_device.NumberPixels * (double) param.param_device.NumberPixels + 8.) * (double) sizeof(myfloat_t) / compTime;

				printf("Time Comparison %d %d: %f sec (%f GFlops, %f GB/s (cached), %f GB/s)\n", iOrient, iConv, compTime, nFlops / 1000000000., nGBs / 1000000000., nGBs2 / 1000000000.);
			}
377
378
379
380
381
		}
	}
	//deallocating fftw_complex vector
	myfftw_free(proj_mapFFT);
	myfftw_free(conv_mapFFT);
382
	delete[] conv_map;
David Rohr's avatar
David Rohr committed
383

384
	deviceFinishRun();
385
386
387
388
389
390
391
392
393
394
	{
		const int count = omp_get_max_threads();
		for (int i = 0;i < count;i++)
		{
			myfftw_free(localCCT[i]);
			myfftw_free(lCC[i]);
		}
		delete[] localCCT;
		delete[] lCC;
	}
395

David Rohr's avatar
David Rohr committed
396
	// ************* Writing Out Probabilities ***************
397

David Rohr's avatar
David Rohr committed
398
	// *** Angular Probability ***
David Rohr's avatar
David Rohr committed
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
	
#ifdef WITH_MPI
	if (DebugOutput >= 2 && mpi_rank == 0) timer.ResetStart();
	//Reduce Constant and summarize probabilities
	{
		myfloat_t* tmp1 = new myfloat_t[RefMap.ntotRefMap];
		myfloat_t* tmp2 = new myfloat_t[RefMap.ntotRefMap];
		myfloat_t* tmp3 = new myfloat_t[RefMap.ntotRefMap];
		for (int i = 0;i < RefMap.ntotRefMap;i++)
		{
				tmp1[i] = pProb.getProbMap(i).Constoadd;
		}
		MPI_Allreduce(tmp1, tmp2, RefMap.ntotRefMap, MY_MPI_FLOAT, MPI_MAX, MPI_COMM_WORLD);
		for (int i = 0;i < RefMap.ntotRefMap;i++)
		{
			bioem_Probability_map& pProbMap = pProb.getProbMap(i);
			tmp1[i] = pProbMap.Total * exp(pProbMap.Constoadd - tmp2[i]);
		}
		MPI_Reduce(tmp1, tmp3, RefMap.ntotRefMap, MY_MPI_FLOAT, MPI_SUM, 0, MPI_COMM_WORLD);
418

David Rohr's avatar
David Rohr committed
419
		//Find MaxProb
420
		MPI_Status mpistatus;
David Rohr's avatar
David Rohr committed
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
		{	
			int* tmpi1 = new int[RefMap.ntotRefMap];
			int* tmpi2 = new int[RefMap.ntotRefMap];
			for (int i = 0;i < RefMap.ntotRefMap;i++)
			{
				bioem_Probability_map& pProbMap = pProb.getProbMap(i);
				tmpi1[i] = tmp2[i] <= pProbMap.Constoadd ? mpi_rank : -1;
			}
			MPI_Allreduce(tmpi1, tmpi2, RefMap.ntotRefMap, MPI_INT, MPI_MAX, MPI_COMM_WORLD);
			for (int i = 0;i < RefMap.ntotRefMap;i++)
			{
				if (tmpi2[i] == -1)
				{
					if (mpi_rank == 0) printf("Error: Could not find highest probability\n");
				}
				else if (tmpi2[i] != 0) //Skip if rank 0 already has highest probability
				{
					if (mpi_rank == 0)
					{
440
						MPI_Recv(&pProb.getProbMap(i).max, sizeof(pProb.getProbMap(i).max), MPI_BYTE, tmpi2[i], i, MPI_COMM_WORLD, &mpistatus);
David Rohr's avatar
David Rohr committed
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
					}
					else if (mpi_rank == tmpi2[i])
					{
						MPI_Send(&pProb.getProbMap(i).max, sizeof(pProb.getProbMap(i).max), MPI_BYTE, 0, i, MPI_COMM_WORLD);
					}
				}
			}
			delete[] tmpi1;
			delete[] tmpi2;
		}
		
		if (mpi_rank == 0)
		{
			for (int i = 0;i < RefMap.ntotRefMap;i++)
			{
					bioem_Probability_map& pProbMap = pProb.getProbMap(i);
					pProbMap.Total = tmp3[i];
					pProbMap.Constoadd = tmp2[i];
			}
		}
		
		delete[] tmp1;
		delete[] tmp2;
		delete[] tmp3;
		if (DebugOutput >= 2 && mpi_rank == 0) printf("Time MPI Reduction: %f\n", timer.GetCurrentElapsedTime());
	}
	
	//Angle Reduction and Probability summation for individual angles
	if (param.param_device.writeAngles)
470
	{
David Rohr's avatar
David Rohr committed
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
		const int count = RefMap.ntotRefMap * param.nTotGridAngles;
		myfloat_t* tmp1 = new myfloat_t[count];
		myfloat_t* tmp2 = new myfloat_t[count];
		myfloat_t* tmp3 = new myfloat_t[count];
		for (int i = 0;i < RefMap.ntotRefMap;i++)
		{
				tmp1[i] = pProb.getProbMap(i).Constoadd;
		}
		MPI_Allreduce(tmp1, tmp2, count, MY_MPI_FLOAT, MPI_MAX, MPI_COMM_WORLD);
		for (int i = 0;i < RefMap.ntotRefMap;i++)
		{
			for (int j = 0;j < param.nTotGridAngles;j++)
			{
				bioem_Probability_angle& pProbAngle = pProb.getProbAngle(i, j);
				tmp1[i * param.nTotGridAngles + j] = pProbAngle.forAngles * exp(pProbAngle.ConstAngle - tmp2[i * param.nTotGridAngles + j]);
			}
		}
		MPI_Reduce(tmp1, tmp3, count, MY_MPI_FLOAT, MPI_SUM, 0, MPI_COMM_WORLD);
		if (mpi_rank == 0)
		{
			for (int i = 0;i < RefMap.ntotRefMap;i++)
			{
				for (int j = 0;j < param.nTotGridAngles;j++)
				{
					bioem_Probability_angle& pProbAngle = pProb.getProbAngle(i, j);
					pProbAngle.forAngles = tmp3[i * param.nTotGridAngles + j];
					pProbAngle.ConstAngle = tmp2[i * param.nTotGridAngles + j];
				}
			}
		}
		delete[] tmp1;
		delete[] tmp2;
		delete[] tmp3;	
504
	}
David Rohr's avatar
David Rohr committed
505
#endif
506

David Rohr's avatar
David Rohr committed
507
	if (mpi_rank == 0)
508
	{
David Rohr's avatar
David Rohr committed
509
510
511
512
513
514
515
516
517
518
519
520
		ofstream angProbfile;
		if(param.param_device.writeAngles)
		{
			angProbfile.open ("ANG_PROB");
		}

		ofstream outputProbFile;
		outputProbFile.open ("Output_Probabilities");
		for (int iRefMap = 0; iRefMap < RefMap.ntotRefMap; iRefMap ++)
		{
			// **** Total Probability ***
			bioem_Probability_map& pProbMap = pProb.getProbMap(iRefMap);
521

David Rohr's avatar
David Rohr committed
522
			outputProbFile << "RefMap " << iRefMap << " Probability  "  << log(pProbMap.Total) + pProbMap.Constoadd + 0.5 * log(M_PI) + (1 - param.param_device.Ntotpi * 0.5)*(log(2 * M_PI) + 1) + log(param.param_device.volu) << " Constant " << pProbMap.Constoadd  << "\n";
523

David Rohr's avatar
David Rohr committed
524
			outputProbFile << "RefMap " << iRefMap << " Maximizing Param: ";
525

David Rohr's avatar
David Rohr committed
526
527
528
529
530
531
532
533
534
535
536
			// *** Param that maximize probability****
			outputProbFile << (pProbMap.Constoadd + 0.5 * log(M_PI) + (1 - param.param_device.Ntotpi * 0.5) * (log(2 * M_PI) + 1) + log(param.param_device.volu)) << " ";
			outputProbFile << param.angles[pProbMap.max.max_prob_orient].pos[0] << " ";
			outputProbFile << param.angles[pProbMap.max.max_prob_orient].pos[1] << " ";
			outputProbFile << param.angles[pProbMap.max.max_prob_orient].pos[2] << " ";
			outputProbFile << param.CtfParam[pProbMap.max.max_prob_conv].pos[0] << " ";
			outputProbFile << param.CtfParam[pProbMap.max.max_prob_conv].pos[1] << " ";
			outputProbFile << param.CtfParam[pProbMap.max.max_prob_conv].pos[2] << " ";
			outputProbFile << pProbMap.max.max_prob_cent_x << " ";
			outputProbFile << pProbMap.max.max_prob_cent_y;
			outputProbFile << "\n";
537

David Rohr's avatar
David Rohr committed
538
			// *** For individual files*** //angProbfile.open ("ANG_PROB_"iRefMap);
539

David Rohr's avatar
David Rohr committed
540
			if(param.param_device.writeAngles)
541
			{
David Rohr's avatar
David Rohr committed
542
543
544
				for (int iOrient = 0; iOrient < param.nTotGridAngles; iOrient++)
				{
					bioem_Probability_angle& pProbAngle = pProb.getProbAngle(iRefMap, iOrient);
545

David Rohr's avatar
David Rohr committed
546
547
					angProbfile << " " << iRefMap << " " << param.angles[iOrient].pos[0] << " " << param.angles[iOrient].pos[1] << " " << param.angles[iOrient].pos[2] << " " << log(pProbAngle.forAngles) + pProbAngle.ConstAngle + 0.5 * log(M_PI) + (1 - param.param_device.Ntotpi * 0.5)*(log(2 * M_PI) + 1) + log(param.param_device.volu) << " " << log(param.param_device.volu) << "\n";
				}
548
549
			}
		}
550

David Rohr's avatar
David Rohr committed
551
552
553
554
555
		if(param.param_device.writeAngles)
		{
			angProbfile.close();
		}
		outputProbFile.close();
556
	}
557

558
	return(0);
559
560
}

561
int bioem::compareRefMaps(int iOrient, int iConv, const myfloat_t* conv_map, mycomplex_t* localmultFFT, myfloat_t sumC, myfloat_t sumsquareC, const int startMap)
562
{
David Rohr's avatar
David Rohr committed
563
564
	//***************************************************************************************
	//***** BioEM routine for comparing reference maps to convoluted maps *****
565
	if (FFTAlgo)
566
	{
David Rohr's avatar
David Rohr committed
567
		//With FFT Algorithm
568
569
		#pragma omp parallel for
		for (int iRefMap = startMap; iRefMap < RefMap.ntotRefMap; iRefMap ++)
570
		{
571
			const int num = omp_get_thread_num();
572
			calculateCCFFT(iRefMap, iOrient, iConv, sumC, sumsquareC, localmultFFT, localCCT[num], lCC[num]);
573
574
575
		}
	}
	else
576
	{
David Rohr's avatar
David Rohr committed
577
		//Without FFT Algorithm
578
		#pragma omp parallel for
579
		for (int iRefMap = startMap; iRefMap < RefMap.ntotRefMap; iRefMap ++)
580
		{
581
			compareRefMapShifted < -1 > (iRefMap, iOrient, iConv, conv_map, pProb, param.param_device, RefMap);
582
583
584
585
586
		}
	}
	return(0);
}

587
inline void bioem::calculateCCFFT(int iRefMap, int iOrient, int iConv, myfloat_t sumC, myfloat_t sumsquareC, mycomplex_t* localConvFFT, mycomplex_t* localCCT, myfloat_t* lCC)
588
{
David Rohr's avatar
David Rohr committed
589
590
	//***************************************************************************************
	//***** Calculating cross correlation in FFTALGOrithm *****
Pilar Cossio's avatar
Pilar Cossio committed
591

592
	const mycomplex_t* RefMapFFT = &RefMap.RefMapsFFT[iRefMap * param.FFTMapSize];
593
	for(int i = 0; i < param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D; i++)
594
	{
595
596
		localCCT[i][0] = localConvFFT[i][0] * RefMapFFT[i][0] + localConvFFT[i][1] * RefMapFFT[i][1];
		localCCT[i][1] = localConvFFT[i][1] * RefMapFFT[i][0] - localConvFFT[i][0] * RefMapFFT[i][1];
597
598
	}

599
	myfftw_execute_dft_c2r(param.fft_plan_c2r_backward, localCCT, lCC);
600

601
	doRefMapFFT(iRefMap, iOrient, iConv, lCC, sumC, sumsquareC, pProb, param.param_device, RefMap);
602
}
603

604
int bioem::createProjection(int iMap, mycomplex_t* mapFFT)
605
{
David Rohr's avatar
David Rohr committed
606
	// **************************************************************************************
David Rohr's avatar
David Rohr committed
607
608
	// ****  BioEM Create Projection routine in Euler angle predefined grid******************
	// ********************* and turns projection into Fourier space ************************
David Rohr's avatar
David Rohr committed
609
	// **************************************************************************************
610

611
612
	cuda_custom_timeslot("Projection", 0);

613
614
	myfloat3_t RotatedPointsModel[Model.nPointsModel];
	myfloat_t rotmat[3][3];
615
	myfloat_t alpha, gam, beta;
616
	myfloat_t* localproj;
617

618
	localproj = lCC[omp_get_thread_num()];
619
	memset(localproj, 0, param.param_device.NumberPixels * param.param_device.NumberPixels * sizeof(*localproj));
620

621
622
623
	alpha = param.angles[iMap].pos[0];
	beta = param.angles[iMap].pos[1];
	gam = param.angles[iMap].pos[2];
624

David Rohr's avatar
David Rohr committed
625
	// **** To see how things are going: cout << "Id " << omp_get_thread_num() <<  " Angs: " << alpha << " " << beta << " " << gam << "\n"; ***
626

David Rohr's avatar
David Rohr committed
627
	// ********** Creat Rotation with pre-defiend grid of orientations**********
628
629
630
631
632
633
634
635
636
637
638
	rotmat[0][0] = cos(gam) * cos(alpha) - cos(beta) * sin(alpha) * sin(gam);
	rotmat[0][1] = cos(gam) * sin(alpha) + cos(beta) * cos(alpha) * sin(gam);
	rotmat[0][2] = sin(gam) * sin(beta);
	rotmat[1][0] = -sin(gam) * cos(alpha) - cos(beta) * sin(alpha) * cos(gam);
	rotmat[1][1] = -sin(gam) * sin(alpha) + cos(beta) * cos(alpha) * cos(gam);
	rotmat[1][2] = cos(gam) * sin(beta);
	rotmat[2][0] = sin(beta) * sin(alpha);
	rotmat[2][1] = -sin(beta) * cos(alpha);
	rotmat[2][2] = cos(beta);

	for(int n = 0; n < Model.nPointsModel; n++)
639
	{
640
641
642
		RotatedPointsModel[n].pos[0] = 0.0;
		RotatedPointsModel[n].pos[1] = 0.0;
		RotatedPointsModel[n].pos[2] = 0.0;
643
	}
644
	for(int n = 0; n < Model.nPointsModel; n++)
645
	{
646
		for(int k = 0; k < 3; k++)
647
		{
648
			for(int j = 0; j < 3; j++)
649
			{
650
				RotatedPointsModel[n].pos[k] += rotmat[k][j] * Model.points[n].point.pos[j];
651
652
653
654
655
656
			}
		}
	}

	int i, j;

David Rohr's avatar
David Rohr committed
657
	// ************ Projection over the Z axis********************
658
	for(int n = 0; n < Model.nPointsModel; n++)
659
660
	{
		//Getting pixel that represents coordinates & shifting the start at to Numpix/2,Numpix/2 )
661
662
		i = floor(RotatedPointsModel[n].pos[0] / param.pixelSize + (myfloat_t) param.param_device.NumberPixels / 2.0f + 0.5f);
		j = floor(RotatedPointsModel[n].pos[1] / param.pixelSize + (myfloat_t) param.param_device.NumberPixels / 2.0f + 0.5f);
663

664
665
666
667
668
669
		if (i < 0 || j < 0 || i >= param.param_device.NumberPixels || j >= param.param_device.NumberPixels)
		{
			if (DebugOutput >= 3) cout << "Model Point out of map: " << i << ", " << j << "\n";
			continue;
		}

670
		localproj[i * param.param_device.NumberPixels + j] += Model.points[n].density / Model.NormDen;
671
672
	}

David Rohr's avatar
David Rohr committed
673
	// **** Output Just to check****
674
#ifdef PILAR_DEBUG
675
	if(iMap == 10)
676
677
678
679
680
681
	{
		ofstream myexamplemap;
		ofstream myexampleRot;
		myexamplemap.open ("MAP_i10");
		myexampleRot.open ("Rot_i10");
		myexamplemap << "ANGLES " << alpha << " " << beta << " " << gam << "\n";
682
		for(int k = 0; k < param.param_device.NumberPixels; k++)
683
		{
684
			for(int j = 0; j < param.param_device.NumberPixels; j++) myexamplemap << "\nMAP " << k << " " << j << " " << localproj[k * param.param_device.NumberPixels + j];
685
686
		}
		myexamplemap << " \n";
687
		for(int n = 0; n < Model.nPointsModel; n++)myexampleRot << "\nCOOR " << RotatedPointsModel[n].pos[0] << " " << RotatedPointsModel[n].pos[1] << " " << RotatedPointsModel[n].pos[2];
688
689
690
		myexamplemap.close();
		myexampleRot.close();
	}
691
#endif
692

David Rohr's avatar
David Rohr committed
693
694
	// ***** Converting projection to Fourier Space for Convolution later with kernel****
	// ********** Omp Critical is necessary with FFTW*******
695
	myfftw_execute_dft_r2c(param.fft_plan_r2c_forward, localproj, mapFFT);
696

697
698
	cuda_custom_timeslot_end;

699
700
701
	return(0);
}

702
int bioem::createConvolutedProjectionMap(int iMap, int iConv, mycomplex_t* lproj, myfloat_t* Mapconv, mycomplex_t* localmultFFT, myfloat_t& sumC, myfloat_t& sumsquareC)
703
{
David Rohr's avatar
David Rohr committed
704
705
	// **************************************************************************************
	// ****  BioEM Create Convoluted Projection Map routine, multiplies in Fourier **********
David Rohr's avatar
David Rohr committed
706
707
	// **************** calculated Projection with convoluted precalculated Kernel***********
	// *************** and Backtransforming it to real Space ********************************
David Rohr's avatar
David Rohr committed
708
	// **************************************************************************************
709

710
711
	cuda_custom_timeslot("Convolution", 1);

712
	mycomplex_t* tmp = localCCT[omp_get_thread_num()];
713

David Rohr's avatar
David Rohr committed
714
	// **** Multiplying FFTmap with corresponding kernel ****
715
	const mycomplex_t* refCTF = &param.refCTF[iConv * param.FFTMapSize];
716
	for(int i = 0; i < param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D; i++)
717
	{
718
719
720
		localmultFFT[i][0] = lproj[i][0] * refCTF[i][0] + lproj[i][1] * refCTF[i][1];
		localmultFFT[i][1] = lproj[i][1] * refCTF[i][0] - lproj[i][0] * refCTF[i][1];
		// cout << "GG " << i << " " << j << " " << refCTF[i][0] << " " << refCTF[i][1] <<" " <<lproj[i][0] <<" " <<lproj[i][1] << "\n";
721
722
	}

723
724
725
	//FFTW_C2R will destroy the input array, so we have to work on a copy here
	memcpy(tmp, localmultFFT, sizeof(mycomplex_t) * param.param_device.NumberPixels * param.param_device.NumberFFTPixels1D);

David Rohr's avatar
David Rohr committed
726
	// **** Bringing convoluted Map to real Space ****
David Rohr's avatar
David Rohr committed
727
	myfftw_execute_dft_c2r(param.fft_plan_c2r_backward, tmp, Mapconv);
728

David Rohr's avatar
David Rohr committed
729
	// *** Calculating Cross-correlations of cal-convoluted map with its self *****
730
731
	sumC = 0;
	sumsquareC = 0;
732
	for(int i = 0; i < param.param_device.NumberPixels * param.param_device.NumberPixels; i++)
733
	{
David Rohr's avatar
David Rohr committed
734
735
		sumC += Mapconv[i];
		sumsquareC += Mapconv[i] * Mapconv[i];
736
	}
David Rohr's avatar
David Rohr committed
737
	// *** The DTF gives an unnormalized value so have to divded by the total number of pixels in Fourier ***
738
	// Normalizing
739
740
741
742
	myfloat_t norm2 = (myfloat_t) (param.param_device.NumberPixels * param.param_device.NumberPixels);
	myfloat_t norm4 = norm2 * norm2;
	sumC = sumC / norm2;
	sumsquareC = sumsquareC / norm4;
743

744
745
	cuda_custom_timeslot_end;

746
	return(0);
747
748
}

749
// Computes the sum of all pixels (sum) and the sum of their squares
// (sumsquare) of a NumberPixels x NumberPixels map stored row by row in
// localmap. Always returns 0.
int bioem::calcross_cor(myfloat_t* localmap, myfloat_t& sum, myfloat_t& sumsquare)
{
	// *********************** Routine to calculate Cross correlations***********************

	sum = 0.0;
	sumsquare = 0.0;

	const int nPix = param.param_device.NumberPixels;
	for (int row = 0; row < nPix; row++)
	{
		const myfloat_t* const rowStart = localmap + row * nPix;
		for (int col = 0; col < nPix; col++)
		{
			// Accumulate the pixel value, then its square
			sum += rowStart[col];
			sumsquare += rowStart[col] * rowStart[col];
		}
	}
	return(0);
}

// Device initialisation hook, called at the end of configure().
// This implementation does nothing and returns 0.
// NOTE(review): presumably overridden by accelerator back-ends - confirm.
int bioem::deviceInit()
{
	return(0);
}

// Hook called by run() before the main loop.
// This implementation does nothing and returns 0.
int bioem::deviceStartRun()
{
	return(0);
}

// Hook called by run() after the main loop.
// This implementation does nothing and returns 0.
int bioem::deviceFinishRun()
{
	return(0);
}
782
783
784
785
786
787
788
789
790
791

// Allocates `size` bytes through mallocchk() and returns the pointer.
// Memory obtained here is released with free_device_host().
void* bioem::malloc_device_host(size_t size)
{
	return(mallocchk(size));
}

// Releases memory with free(); the counterpart of malloc_device_host().
void bioem::free_device_host(void* ptr)
{
	free(ptr);
}