Loading Makefile +5 −5 Original line number Diff line number Diff line Loading @@ -63,11 +63,11 @@ OPT += -DPHASE_ON # SELECT THE GRIDDING KERNEL: GAUSS, GAUSS_HI_PRECISION, KAISERBESSEL OPT += -DGAUSS_HI_PRECISION #OPT += -DGAUSS_HI_PRECISION #OPT += -DGAUSS #OPT += -DKAISERBESSEL OPT += -DKAISERBESSEL # ======================================================== Loading @@ -77,16 +77,16 @@ OPT += -DGAUSS_HI_PRECISION #OPT += -DNVIDIA # use CUDA for GPUs OPT += -DCUDACC #OPT += -DCUDACC # use GPU acceleration via OMP #OPT += -DACCOMP # perform stacking on GPUs OPT += -DGPU_STACKING #OPT += -DGPU_STACKING # use NVIDIA GPU to perform the reduce OPT += -DNCCL_REDUCE #OPT += -DNCCL_REDUCE # use GPU to perform FFT #OPT += -DCUFFTMP Loading allvars.c +5 −9 Original line number Diff line number Diff line Loading @@ -18,12 +18,12 @@ char datapath[LONGNAME_LEN]; int xaxis, yaxis; int rank; int size; uint nsectors; uint startrow; myuint nsectors; myuint startrow; double resolution, dx, dw, w_supporth; uint **sectorarray = NULL; uint *histo_send = NULL; myuint **sectorarray = NULL; myuint *histo_send = NULL; int verbose_level = 0; timing_t timing_wt; Loading @@ -31,12 +31,8 @@ double reduce_mpi_time; double reduce_shmem_time; uint size_of_grid; myuint size_of_grid; double *grid_pointers = NULL, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; MPI_Comm MYMPI_COMM_WORLD; MPI_Win slabwin; allvars.h +17 −15 Original line number Diff line number Diff line Loading @@ -73,8 +73,8 @@ typedef double float_t; typedef float float_t; #endif typedef unsigned int uint; typedef unsigned long long ull; typedef unsigned int myuint; typedef unsigned long long myull; extern struct io Loading Loading @@ -104,6 +104,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -117,15 +119,15 @@ extern struct op extern struct meta { unsigned long Nmeasures; unsigned long Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myull Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -161,16 +163,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_t resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_t *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; extern MPI_Comm MYMPI_COMM_WORLD; Loading allvars_nccl.h +17 −15 Original line number Diff line number Diff line Loading @@ -71,8 +71,8 @@ typedef double float_t; typedef float float_t; #endif typedef unsigned int uint; typedef unsigned long long ull; typedef unsigned int myuint; typedef unsigned long long myull; extern struct io Loading Loading @@ -102,6 +102,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -115,15 +117,15 @@ extern struct op extern struct meta { unsigned long Nmeasures; unsigned long Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myull Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -159,16 +161,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_t resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_t *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; extern MPI_Comm MYMPI_COMM_WORLD; Loading allvars_rccl.h +16 −14 Original line number Diff line number Diff line Loading @@ -74,7 +74,7 @@ typedef double float_ty; typedef float float_ty; #endif typedef unsigned int uint; typedef unsigned int myuint; typedef unsigned long long ull; Loading Loading @@ -105,6 +105,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -118,15 +120,15 @@ extern struct op extern struct meta { uint Nmeasures; uint Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myuint Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -162,16 +164,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_ty resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_ty *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w; extern MPI_Comm MYMPI_COMM_WORLD; Loading Loading
Makefile +5 −5 Original line number Diff line number Diff line Loading @@ -63,11 +63,11 @@ OPT += -DPHASE_ON # SELECT THE GRIDDING KERNEL: GAUSS, GAUSS_HI_PRECISION, KAISERBESSEL OPT += -DGAUSS_HI_PRECISION #OPT += -DGAUSS_HI_PRECISION #OPT += -DGAUSS #OPT += -DKAISERBESSEL OPT += -DKAISERBESSEL # ======================================================== Loading @@ -77,16 +77,16 @@ OPT += -DGAUSS_HI_PRECISION #OPT += -DNVIDIA # use CUDA for GPUs OPT += -DCUDACC #OPT += -DCUDACC # use GPU acceleration via OMP #OPT += -DACCOMP # perform stacking on GPUs OPT += -DGPU_STACKING #OPT += -DGPU_STACKING # use NVIDIA GPU to perform the reduce OPT += -DNCCL_REDUCE #OPT += -DNCCL_REDUCE # use GPU to perform FFT #OPT += -DCUFFTMP Loading
allvars.c +5 −9 Original line number Diff line number Diff line Loading @@ -18,12 +18,12 @@ char datapath[LONGNAME_LEN]; int xaxis, yaxis; int rank; int size; uint nsectors; uint startrow; myuint nsectors; myuint startrow; double resolution, dx, dw, w_supporth; uint **sectorarray = NULL; uint *histo_send = NULL; myuint **sectorarray = NULL; myuint *histo_send = NULL; int verbose_level = 0; timing_t timing_wt; Loading @@ -31,12 +31,8 @@ double reduce_mpi_time; double reduce_shmem_time; uint size_of_grid; myuint size_of_grid; double *grid_pointers = NULL, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; MPI_Comm MYMPI_COMM_WORLD; MPI_Win slabwin;
allvars.h +17 −15 Original line number Diff line number Diff line Loading @@ -73,8 +73,8 @@ typedef double float_t; typedef float float_t; #endif typedef unsigned int uint; typedef unsigned long long ull; typedef unsigned int myuint; typedef unsigned long long myull; extern struct io Loading Loading @@ -104,6 +104,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -117,15 +119,15 @@ extern struct op extern struct meta { unsigned long Nmeasures; unsigned long Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myull Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -161,16 +163,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_t resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_t *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; extern MPI_Comm MYMPI_COMM_WORLD; Loading
allvars_nccl.h +17 −15 Original line number Diff line number Diff line Loading @@ -71,8 +71,8 @@ typedef double float_t; typedef float float_t; #endif typedef unsigned int uint; typedef unsigned long long ull; typedef unsigned int myuint; typedef unsigned long long myull; extern struct io Loading Loading @@ -102,6 +102,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -115,15 +117,15 @@ extern struct op extern struct meta { unsigned long Nmeasures; unsigned long Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myull Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -159,16 +161,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_t resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_t *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w, *grid_gpu, *gridss_gpu; extern MPI_Comm MYMPI_COMM_WORLD; Loading
allvars_rccl.h +16 −14 Original line number Diff line number Diff line Loading @@ -74,7 +74,7 @@ typedef double float_ty; typedef float float_ty; #endif typedef unsigned int uint; typedef unsigned int myuint; typedef unsigned long long ull; Loading Loading @@ -105,6 +105,8 @@ extern struct op char outfile2[NAME_LEN]; char outfile3[NAME_LEN]; char fftfile[NAME_LEN]; char gridded_writedata1[NAME_LEN]; char gridded_writedata2[NAME_LEN]; char fftfile_writedata1[NAME_LEN]; char fftfile_writedata2[NAME_LEN]; char fftfile2[NAME_LEN]; Loading @@ -118,15 +120,15 @@ extern struct op extern struct meta { uint Nmeasures; uint Nvis; uint Nweights; uint freq_per_chan; uint polarisations; uint Ntimes; myuint Nmeasures; myuint Nvis; myuint Nweights; myuint freq_per_chan; myuint polarisations; myuint Ntimes; double dt; double thours; uint baselines; myuint baselines; double uvmin; double uvmax; double wmin; Loading Loading @@ -162,16 +164,16 @@ extern char datapath[LONGNAME_LEN]; extern int xaxis, yaxis; extern int rank; extern int size; extern uint nsectors; extern uint startrow; extern myuint nsectors; extern myuint startrow; extern double_ty resolution, dx, dw, w_supporth; extern uint **sectorarray; extern uint *histo_send; extern myuint **sectorarray; extern myuint *histo_send; extern int verbose_level; extern uint size_of_grid; extern myuint size_of_grid; extern double_ty *grid_pointers, *grid, *gridss, *gridss_real, *gridss_img, *gridss_w; extern MPI_Comm MYMPI_COMM_WORLD; Loading