diff --git a/src/libtorchaudio/forced_align/gpu/compute.cu b/src/libtorchaudio/forced_align/gpu/compute.cu index ef7d9acaae..c7800d39e9 100644 --- a/src/libtorchaudio/forced_align/gpu/compute.cu +++ b/src/libtorchaudio/forced_align/gpu/compute.cu @@ -1,3 +1,4 @@ +#include #include #include #include @@ -94,7 +95,7 @@ __global__ void falign_cuda_step_kernel( alphas_a[curIdxOffset][i] = result + logProbs_a[batchIndex][t][labelIdx]; threadMax = max(threadMax, alphas_a[curIdxOffset][i]); } - scalar_t maxResult = BlockReduce(tempStorage).Reduce(threadMax, cub::Max()); + scalar_t maxResult = BlockReduce(tempStorage).Reduce(threadMax, cuda::maximum{}); if (threadIdx.x == 0) { maxValue = maxResult; }