Commit 8bc86876 authored by Giovanni La Mura's avatar Giovanni La Mura
Browse files

Rebase loval prepare_magma on remote branch

parents ea91f54f d4c1387f
Loading
Loading
Loading
Loading
+18 −10
Original line number Diff line number Diff line
@@ -95,24 +95,28 @@ void cluster(const string& config_file, const string& data_file, const string& o
  cudaGetDeviceCount(&device_count);
  logger->log("DEBUG: Proc-" + to_string(mpidata->rank) + " found " + to_string(device_count) + " CUDA devices.\n", LOG_DEBG);
  logger->log("INFO: Process " + to_string(mpidata->rank) + " initializes MAGMA.\n");
  magma_device_t *devices = new magma_device_t[device_count];
  cudaSetValidDevices(devices, device_count);
  magma_device_t *magmadevices = new magma_device_t[device_count];
  int *cudadevices = new int[device_count];
  cudaSetValidDevices(cudadevices, device_count);
  for (int ci=0; ci<device_count; ci++) magmadevices[ci] = (magma_device_t) cudadevices[ci];
  magma_int_t num_devices;
  magma_getdevices(devices, device_count, &num_devices);
  magma_getdevices(magmadevices, device_count, &num_devices);
  logger->log("DEBUG: Proc-" + to_string(mpidata->rank) + " found " + to_string(num_devices) + " MAGMA devices.\n", LOG_DEBG);
  magma_int_t magma_result = magma_init();
  if (magma_result != MAGMA_SUCCESS) {
    logger->err("ERROR: Process " + to_string(mpidata->rank) + " failed to initilize MAGMA.\n");
    logger->err("PROC-" + to_string(mpidata->rank) + ": MAGMA error code " + to_string(magma_result) + "\n");
    fclose(timing_file);
    delete[] devices;
    delete[] magmadevices;
    delete[] cudadevices;
    delete time_logger;
    delete logger;
    return;
  }
#else
  int *devices = new int[1];
  devices[0] = -1;
  int *cudadevices = new int[1];
  int *magmadevices = new int[1];
  cudadevices[0] = magmadevices[0] = -1;
#endif
  // the following only happens on MPI process 0
  if (mpidata->rank == 0) {
@@ -125,7 +129,8 @@ void cluster(const string& config_file, const string& data_file, const string& o
      string message = "FILE: " + string(ex.what()) + "\n";
      logger->err(message);
      fclose(timing_file);
      delete[] devices;
      delete[] cudadevices;
      delete[] magmadevices;
      delete time_logger;
      delete logger;
      return;
@@ -142,7 +147,8 @@ void cluster(const string& config_file, const string& data_file, const string& o
      logger->err(message);
      if (sconf) delete sconf;
      fclose(timing_file);
      delete[] devices;
      delete[] cudadevices;
      delete[] magmadevices;
      delete time_logger;
      delete logger;
      return;
@@ -248,7 +254,8 @@ void cluster(const string& config_file, const string& data_file, const string& o
	  tppoan.close();
	  fclose(timing_file);
	  fclose(output);
	  delete[] devices;
	  delete[] magmadevices;
	  delete[] cudadevices;
	  delete p_scattering_angles;
	  delete cid;
	  delete logger;
@@ -558,7 +565,8 @@ void cluster(const string& config_file, const string& data_file, const string& o
      }
    }
    // Clean memory
    delete[] devices;
    delete[] magmadevices;
    delete[] cudadevices;
    delete cid;
    delete p_scattering_angles;
    delete sconf;
+10 −0
Original line number Diff line number Diff line
@@ -27,9 +27,15 @@ typedef __complex__ double dcomplex;

#ifdef USE_LAPACK
#ifdef USE_MKL
#ifdef USE_ILP64
#ifndef MKL_INT 
#define MKL_INT int64_t
#endif // MKL_INT
#else
#ifndef MKL_INT 
#define MKL_INT int32_t
#endif // MKL_INT
#endif
#include <mkl_lapacke.h>
#else
#include <lapacke.h>
@@ -44,7 +50,11 @@ typedef __complex__ double dcomplex;
#ifdef lapack_int
#define np_int lapack_int
#else
#ifdef USE_ILP64
#define np_int int64_t
#else
#define np_int int32_t
#endif // USE_ILP64
#endif // lapack_int
#endif // np_int

+54 −8
Original line number Diff line number Diff line
@@ -48,32 +48,47 @@ endif

# define (outside) USE_LAPACK for lapacke support, LAPACK_ILP64 for ilp64 interface, MKL_ILP64 the same if using MKL implementation
ifdef USE_LAPACK
# define (outside) USE_ILP64 for long long int support in lapack/mkl/magma interfaces
ifdef USE_ILP64
ifndef LAPACK_ILP64
override LAPACK_ILP64=1
endif #LAPACK_ILP64
endif
# define (outside) USE_MKL to use the MKL implementation of lapacke
ifdef USE_MKL
# define (outside) USE_ILP64 for long long int support in lapack/mkl/magma interfaces
ifdef USE_ILP64
ifndef MKL_ILP64
override MKL_ILP64=1
endif #MKL_ILP64
endif
ifndef LAPACK_INCLUDE
# this is for the MKL implementation
override LAPACK_INCLUDE=$(MKLROOT)/include
endif
endif #LAPACK_INCLUDE
ifndef LAPACK_LDFLAGS
# this is for the MKL implementation
# define (outside) USE_ILP64 for long long int support in lapack/mkl/magma interfaces
ifdef USE_ILP64
override LAPACK_LDFLAGS=-L$(MKLROOT)/lib -Wl,--no-as-needed -lmkl_intel_ilp64 -lmkl_gnu_thread -lmkl_core -lgomp -lpthread -lm -ldl
else
override LAPACK_LDFLAGS=-L$(MKLROOT)/lib -Wl,--no-as-needed -lmkl_intel_lp64 -lmkl_gnu_thread -lmkl_core -lgomp -lpthread -lm -ldl
endif
endif #LAPACK_LDFLAGS
# the next else refers to USE_MKL
else
else #this is for when USE_MKL is _not_ defined
ifndef LAPACK_INCLUDE
# this is for standard "vanilla" lapacke64
override LAPACK_INCLUDE=/usr/include
endif
endif # LAPACK_INCLUDE
ifndef LAPACK_LDFLAGS
ifdef USE_ILP64
# this is for standard "vanilla" lapacke64
override LAPACK_LDFLAGS=-llapacke64
else
override LAPACK_LDFLAGS=-llapacke
endif
endif #LAPACK_LDFLAGS
# the next endif is for USE_MKL
endif
#the next endif is for USE_LAPACK
@@ -81,7 +96,13 @@ endif

# define (outside) USE_MAGMA for magma support
ifdef USE_MAGMA
MAGMA_LDFLAGS= -lmagma -lcudart
ifdef MAGMA_LIB
override MAGMA_LDFLAGS= -L$(MAGMA_LIB)
endif
ifdef CUDA_HOME
override MAGMA_LDFLAGS+= -L$(CUDA_HOME)/lib64
endif
override MAGMA_LDFLAGS+= -lmagma -lcudart
#the next endif is for USE_MAGMA
endif

@@ -92,25 +113,50 @@ ifdef USE_OPENMP
override CXXFLAGS+= -fopenmp
# closes USE_OPENMP
endif

ifdef USE_ILP64
override CXXFLAGS+= -DUSE_ILP64
endif

ifdef USE_LAPACK
override CXXFLAGS+= -DUSE_LAPACK -DLAPACK_ILP64 
override CXXFLAGS+= -DUSE_LAPACK
ifdef USE_ILP64
override CXXFLAGS+= -DLAPACK_ILP64
endif
# closes USE_LAPACK
endif

ifdef USE_MKL
override CXXFLAGS+= -DMKL_ILP64 -DUSE_MKL -I$(MKLROOT)/include
override CXXFLAGS+= -DUSE_MKL -I$(MKLROOT)/include
ifdef USE_ILP64
override CXXFLAGS+= -DMKL_ILP64
endif
# closes USE_MKL
endif

ifdef USE_OPENMP
override CXXFLAGS+= -fopenmp
# closes USE_OPENMP
endif
# closes USE_LAPACK
endif

ifdef USE_MAGMA
override CXXFLAGS+= -DUSE_MAGMA
ifdef CUDA_HOME
override CXXFLAGS+= -I$(CUDA_HOME)/include
endif
ifdef MAGMA_INCLUDE
override CXXFLAGS+= -I$(MAGMA_INCLUDE)
endif
ifdef USE_ILP64
override CXXFLAGS+= -DMAGMA_ILP64
endif
# closes USE_MAGMA
endif

# closes CXXFLAGS
endif


# HDF5_LIB defines the default path to the HDF5 libraries to use
# CXXLDFLAGS defines the default linker flags to use for C++ codes
ifndef CXXLDFLAGS