devices.h
833 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#ifndef RTS_CUDA_DEVICES
#define RTS_CUDA_DEVICES
#include <cuda.h>
#include <cuda_runtime.h>
namespace stim{
extern "C"
int maxThreadsPerBlock()
{
int device;
cudaGetDevice(&device); //get the id of the current device
cudaDeviceProp props; //device property structure
cudaGetDeviceProperties(&props, device);
return props.maxThreadsPerBlock;
}
extern "C"
size_t sharedMemPerBlock()
{
int device;
cudaGetDevice(&device); //get the id of the current device
cudaDeviceProp props; //device property structure
cudaGetDeviceProperties(&props, device);
return props.sharedMemPerBlock;
}
extern "C"
size_t constMem()
{
int device;
cudaGetDevice(&device); //get the id of the current device
cudaDeviceProp props; //device property structure
cudaGetDeviceProperties(&props, device);
return props.totalConstMem;
}
} //end namespace rts
#endif