2014-03-17 10:14:46 -04:00
|
|
|
// Basic CUDA functions callable from C/C++ code
|
|
|
|
|
#include <cuda.h>
|
2015-06-25 17:46:13 -04:00
|
|
|
#include <stdio.h>
|
2014-03-17 10:14:46 -04:00
|
|
|
|
2018-04-14 21:01:16 -04:00
|
|
|
// Select the CUDA device used by the calling process.
//
// The device index is chosen as rank modulo the number of devices reported
// by cudaGetDeviceCount.
//
// rank: caller-supplied integer used to pick a device (presumably the MPI
//       rank of the process -- confirm against callers).
// Returns the device index that was selected, or -1 if the device count
// could not be obtained, no device is available, or cudaSetDevice failed.
extern "C" int ScaLBL_SetDevice(int rank){
    // Initialise so a failed query can never leave an indeterminate divisor.
    int n_devices = 0;
    //int local_rank = atoi(getenv("MV2_COMM_WORLD_LOCAL_RANK"));
    cudaError_t err = cudaGetDeviceCount(&n_devices);
    if (cudaSuccess != err){
        printf("Error in cudaGetDeviceCount: %s \n",cudaGetErrorString(err));
        return -1;
    }
    if (n_devices <= 0){
        // Guard the modulo below against division by zero.
        printf("Error in ScaLBL_SetDevice: no CUDA devices available \n");
        return -1;
    }
    //int device = local_rank % n_devices;
    int device = rank % n_devices;
    err = cudaSetDevice(device);
    if (cudaSuccess != err){
        printf("Error in cudaSetDevice: %s \n",cudaGetErrorString(err));
        return -1;
    }
    return device;
}
|
|
|
|
|
|
2016-11-24 11:26:51 -05:00
|
|
|
// Allocate `size` bytes with cudaMalloc and store the resulting pointer in
// *address. If the CUDA runtime reports an error afterwards, a message is
// printed to stdout; the function itself returns nothing to the caller.
extern "C" void ScaLBL_AllocateDeviceMemory(void** address, size_t size){
    cudaMalloc(address, size);

    // cudaGetLastError reads and clears the runtime's last recorded error.
    const cudaError_t status = cudaGetLastError();
    if (status == cudaSuccess){
        return;
    }
    printf("Error in cudaMalloc: %s \n", cudaGetErrorString(status));
}
|
|
|
|
|
|
2018-01-24 10:08:43 -05:00
|
|
|
// Release memory through cudaFree.
//
// pointer: address to pass to cudaFree (presumably obtained from one of the
//          allocation wrappers in this file -- confirm against callers).
// A failure is reported on stdout, matching the other wrappers in this file,
// instead of being silently discarded.
extern "C" void ScaLBL_FreeDeviceMemory(void* pointer){
    cudaError_t err = cudaFree(pointer);
    if (cudaSuccess != err){
        printf("Error in cudaFree: %s \n",cudaGetErrorString(err));
    }
}
|
|
|
|
|
|
2016-11-24 11:26:51 -05:00
|
|
|
// Copy `size` bytes from `source` to `dest` using cudaMemcpy in the
// host-to-device direction. Any error recorded by the CUDA runtime is
// printed to stdout; nothing is returned to the caller.
extern "C" void ScaLBL_CopyToDevice(void* dest, const void* source, size_t size){
    cudaMemcpy(dest, source, size, cudaMemcpyHostToDevice);

    // cudaGetLastError reads and clears the runtime's last recorded error.
    const cudaError_t status = cudaGetLastError();
    if (status == cudaSuccess){
        return;
    }
    printf("Error in cudaMemcpy (host->device): %s \n", cudaGetErrorString(status));
}
|
|
|
|
|
|
2018-04-03 20:13:35 -04:00
|
|
|
// Allocate `size` bytes for a "zero copy" buffer and store the pointer in
// *address.
//
// NOTE: the cudaMallocHost call is commented out; the allocation is
// currently made with cudaMalloc, exactly as in ScaLBL_AllocateDeviceMemory.
// The error message therefore names cudaMalloc, the call that actually ran.
extern "C" void ScaLBL_AllocateZeroCopy(void** address, size_t size){
    //cudaMallocHost(address,size);
    cudaMalloc(address,size);
    cudaError_t err = cudaGetLastError();
    if (cudaSuccess != err){
        printf("Error in cudaMalloc (zero copy): %s \n",cudaGetErrorString(err));
    }
}
|
|
|
|
|
|
|
|
|
|
// Copy `size` bytes from `source` into a "zero copy" buffer at `dest`.
//
// The transfer is done with cudaMemcpy in the host-to-device direction (the
// plain memcpy alternative is commented out). Any error recorded by the CUDA
// runtime is printed to stdout, consistent with ScaLBL_CopyToDevice.
extern "C" void ScaLBL_CopyToZeroCopy(void* dest, const void* source, size_t size){
    cudaMemcpy(dest,source,size,cudaMemcpyHostToDevice);
    cudaError_t err = cudaGetLastError();
    // Previously the status was fetched but never inspected, hiding failures.
    if (cudaSuccess != err){
        printf("Error in cudaMemcpy (host->device, zero copy): %s \n",cudaGetErrorString(err));
    }
    //memcpy(dest, source, size);
}
|
2014-03-17 10:14:46 -04:00
|
|
|
|
2016-11-23 17:03:12 -05:00
|
|
|
// Copy `size` bytes from `source` to `dest` using cudaMemcpy in the
// device-to-host direction. Any error recorded by the CUDA runtime is
// printed to stdout; nothing is returned to the caller.
extern "C" void ScaLBL_CopyToHost(void* dest, const void* source, size_t size){
    cudaMemcpy(dest, source, size, cudaMemcpyDeviceToHost);

    // cudaGetLastError reads and clears the runtime's last recorded error.
    const cudaError_t status = cudaGetLastError();
    if (status == cudaSuccess){
        return;
    }
    printf("Error in cudaMemcpy (device->host): %s \n", cudaGetErrorString(status));
}
|
|
|
|
|
|
2016-11-23 17:03:12 -05:00
|
|
|
// Block the calling host thread until cudaDeviceSynchronize returns.
//
// Errors from earlier asynchronous work surface at a synchronizing call, so
// the returned status is checked and reported on stdout rather than dropped.
extern "C" void ScaLBL_DeviceBarrier(){
    cudaError_t err = cudaDeviceSynchronize();
    if (cudaSuccess != err){
        printf("Error in cudaDeviceSynchronize: %s \n",cudaGetErrorString(err));
    }
}
|