diff --git a/benchmarks/Benchmark_su3.cc b/benchmarks/Benchmark_su3.cc index c7ac5d3..18aa1e3 100644 --- a/benchmarks/Benchmark_su3.cc +++ b/benchmarks/Benchmark_su3.cc @@ -26,6 +26,9 @@ Author: Peter Boyle See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ + + *************************************************************************************/ + /* END LEGAL */ #include #include using namespace std; @@ -33,16 +36,21 @@ using namespace Grid; #ifdef OMPTARGET_UVM #pragma omp requires unified_shared_memory #endif + +//#define TILE_UNROLL +#define UNROLL_TILE +#define TILE_SIZE 64 +#define UNROLL_FACTOR 16 int main (int argc, char ** argv) { Grid_init(&argc,&argv); #define LMAX (48) -#define LMIN (8) -#define LADD (8) +#define LMIN (4) +#define LADD (4) int64_t Nwarm=50; int64_t Nloop=1000; - + Coordinate simd_layout = GridDefaultSimd(Nd,vComplex::Nsimd()); std::cout<= vol) { - std::cout<<"Spot check failed; index out of bound"< latt_size ({lat*mpi_layout[0],lat*mpi_layout[1],lat*mpi_layout[2],lat*mpi_layout[3]}); @@ -280,17 +328,16 @@ int64_t Nloop=1000; LatticeColourMatrix y(&Grid); random(pRNG,y); for(int mu=0;mu<4;mu++){ - double start=usecond(); - for(int64_t i=0;i