Skip to content

Commit

Permalink
delete pragma unroll
Browse files Browse the repository at this point in the history
  • Loading branch information
EsdeathYZH committed Jun 17, 2022
1 parent e46ef54 commit 938cde3
Showing 1 changed file with 0 additions and 3 deletions.
3 changes: 0 additions & 3 deletions paddle/phi/kernels/gpu/batch_norm_kernel.cu
Original file line number Diff line number Diff line change
Expand Up @@ -229,7 +229,6 @@ static __global__ void BNForwardTraining2DChannelLastCompStat(

// vertical block sum
int tid = threadIdx.x + threadIdx.y * blockDim.x;
#pragma unroll
for (int offset = blockDim.y / 2; offset > 0; offset >>= 1) {
if (threadIdx.y < offset * 2) {
smem_sum[tid] = x_sum;
Expand Down Expand Up @@ -365,7 +364,6 @@ static __global__ void BNForwardTraining2DCompStat(

// horizontal block sum
int tid = threadIdx.x + threadIdx.y * blockDim.x;
#pragma unroll
for (int offset = blockDim.x / 2; offset > 0; offset >>= 1) {
if (threadIdx.x < offset * 2) {
smem_sum[tid] = x_sum;
Expand Down Expand Up @@ -413,7 +411,6 @@ static __global__ void BNForwardTraining2DCompStat(

// vertical block sum
int tid = threadIdx.x + threadIdx.y * blockDim.x;
#pragma unroll
for (int offset = blockDim.x / 2; offset > 0; offset >>= 1) {
if (threadIdx.x < offset * 2) {
smem_sum[tid] = x_sum;
Expand Down

0 comments on commit 938cde3

Please sign in to comment.