[Bugfix][Kernel] Promote another index to int64_t (#6838)

This commit is contained in:
Tyler Michael Smith
2024-07-26 14:41:04 -04:00
committed by GitHub
parent 07278c37dd
commit 50704f52c4

View File

@ -48,7 +48,7 @@ __global__ void segmented_max_reduction(float* __restrict__ scale,
const scalar_t* __restrict__ input,
int64_t num_elems) {
__shared__ float cache[1024];
int i = blockDim.x * blockIdx.x + threadIdx.x;
int64_t i = blockDim.x * blockIdx.x + threadIdx.x;
// First store maximum for all values processed by
// the current thread in cache[threadIdx.x]