Commit d8564df0 authored by Luka Stanisic

Nicer execution output (adds GPU workload values and the MPI rank to the log messages)

parent e4af4bce
...@@ -615,7 +615,7 @@ int bioem::run() ...@@ -615,7 +615,7 @@ int bioem::run()
(((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * ((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * 2. + 8.) * (double) sizeof(myfloat_t) / compTime; (((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * ((double) param.param_device.NumberPixels - (double) param.param_device.maxDisplaceCenter / 2.) * 2. + 8.) * (double) sizeof(myfloat_t) / compTime;
const double nGBs2 = (double) RefMap.ntotRefMap * ((double) param.param_device.NumberPixels * (double) param.param_device.NumberPixels + 8.) * (double) sizeof(myfloat_t) / compTime; const double nGBs2 = (double) RefMap.ntotRefMap * ((double) param.param_device.NumberPixels * (double) param.param_device.NumberPixels + 8.) * (double) sizeof(myfloat_t) / compTime;
printf("\t\tTime Comparison %d %d: %f sec (%f GFlops, %f GB/s (cached), %f GB/s) (rank %d)\n", iOrient, iConv, compTime, nFlops / 1000000000., nGBs / 1000000000., nGBs2 / 1000000000., mpi_rank); printf("\t\tTime Comparison %d %d: %f sec (%f GFlops, %f GB/s (cached), %f GB/s, with GPU workload %d%%) (rank %d)\n", iOrient, iConv, compTime, nFlops / 1000000000., nGBs / 1000000000., nGBs2 / 1000000000., workload, mpi_rank);
} }
if (Autotuning == 1 && !stopTuning && STABLE_ITERATION(iConv)) if (Autotuning == 1 && !stopTuning && STABLE_ITERATION(iConv))
{ {
...@@ -688,7 +688,14 @@ int bioem::run() ...@@ -688,7 +688,14 @@ int bioem::run()
x = (c-b > b-a) ? (int)(b+(c-b)/2) : (int)(a+(b-a+1)/2); x = (c-b > b-a) ? (int)(b+(c-b)/2) : (int)(a+(b-a+1)/2);
} }
if ( (c-b == limit) && ( b-a == limit) ) stopTuning=true; if ((c - b == limit) && (b - a == limit))
{
stopTuning=true;
if (DebugOutput >= 2)
{
printf("\t\tOptimal GPU workload %d%% (rank %d)\n", workload, mpi_rank);
}
}
workload=x; workload=x;
rebalance(x); rebalance(x);
......
...@@ -684,7 +684,7 @@ void bioem_cuda::rebalance(int workload) ...@@ -684,7 +684,7 @@ void bioem_cuda::rebalance(int workload)
if (DebugOutput >= 2) if (DebugOutput >= 2)
{ {
printf("\t\tSetting GPU workload to %d%%\n", workload); printf("\t\tSetting GPU workload to %d%% (rank %d)\n", workload, mpi_rank);
} }
GPUWorkload = workload; GPUWorkload = workload;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment