Declare tb_sum properly using the HIP_DYNAMIC_SHARED macro
This commit is contained in:
parent
350a151c3b
commit
ceada6922f
@@ -188,9 +188,9 @@ template <class T>
|
|||||||
__global__ void dot_kernel(hipLaunchParm lp, const T * a, const T * b, T * sum, unsigned int array_size)
|
__global__ void dot_kernel(hipLaunchParm lp, const T * a, const T * b, T * sum, unsigned int array_size)
|
||||||
{
|
{
|
||||||
|
|
||||||
//extern __shared__ __align__(sizeof(T)) unsigned char smem[];
|
HIP_DYNAMIC_SHARED(T,tb_sum);
|
||||||
HIP_DYNAMIC_SHARED(unsigned char,smem);
|
// HIP_DYNAMIC_SHARED(unsigned char,smem);
|
||||||
T *tb_sum = reinterpret_cast<T*>(smem);
|
// T *tb_sum = reinterpret_cast<T*>(smem);
|
||||||
|
|
||||||
int i = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x;
|
int i = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x;
|
||||||
const size_t local_i = hipThreadIdx_x;
|
const size_t local_i = hipThreadIdx_x;
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user