Commit 4ac817a

fix DataLayout in kernels/cpu (#76664)
1 parent 6fd4cb4 commit 4ac817a

12 files changed: +64 -64 lines

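The change itself is mechanical: every CPU kernel that branches on the tensor layout now spells the enum values as phi::DataLayout::NCHW / NHWC instead of the legacy kNCHW / kNHWC aliases; the surrounding logic is unchanged. For reference, a minimal standalone sketch of the layout-dependent channel lookup these kernels share follows (the enum and helper below are illustrative stand-ins, not the actual phi declarations):

    // Illustrative stand-in for phi::DataLayout, limited to the two values used here.
    #include <cstdint>
    #include <vector>

    enum class DataLayout { NCHW, NHWC };

    // Channel count C of a tensor shape: axis 1 for NCHW, the last axis for NHWC.
    inline int64_t ChannelCount(const std::vector<int64_t>& dims, DataLayout layout) {
      return layout == DataLayout::NCHW ? dims[1] : dims[dims.size() - 1];
    }
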
paddle/phi/kernels/cpu/affine_channel_grad_kernel.cc

Lines changed: 2 additions & 2 deletions
@@ -55,7 +55,7 @@ void AffineChannelGradKernel(const Context& dev_ctx,
   auto dims = x->dims();
   int N = static_cast<int>(dims[0]);
   int C = static_cast<int>(
-      layout == phi::DataLayout::kNCHW ? dims[1] : dims[dims.size() - 1]);
+      layout == phi::DataLayout::NCHW ? dims[1] : dims[dims.size() - 1]);
   int HxW = static_cast<int>(x->numel() / N / C);
 
   auto* dy_d = dy->data<T>();
@@ -68,7 +68,7 @@ void AffineChannelGradKernel(const Context& dev_ctx,
   EigenVectorArrayMap<T> dscale_e(dscale_d, C);
   EigenVectorArrayMap<T> dbias_e(dbias_d, C);
 
-  if (layout == phi::DataLayout::kNCHW) {
+  if (layout == phi::DataLayout::NCHW) {
     // compute dscale and dbias
     int stride = C * HxW;
     auto* original_dy_d = dy_d;

paddle/phi/kernels/cpu/affine_channel_kernel.cc

Lines changed: 2 additions & 2 deletions
@@ -51,7 +51,7 @@ void AffineChannelKernel(const Context& dev_ctx,
   auto dims = x->dims();
   int N = static_cast<int>(dims[0]);
   int C = static_cast<int>(
-      layout == phi::DataLayout::kNCHW ? dims[1] : dims[dims.size() - 1]);
+      layout == phi::DataLayout::NCHW ? dims[1] : dims[dims.size() - 1]);
   int HxW = static_cast<int>(x->numel() / N / C);
 
   auto* scale_d = scale->data<T>();
@@ -61,7 +61,7 @@ void AffineChannelKernel(const Context& dev_ctx,
 
   auto* x_d = x->data<T>();
   auto* y_d = y->data<T>();
-  if (layout == phi::DataLayout::kNCHW) {
+  if (layout == phi::DataLayout::NCHW) {
     int stride = C * HxW;
     for (int i = 0; i < N; i++) {
      ConstEigenArrayMap<T> x_e(x_d, HxW, C);

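In the NCHW branch of affine_channel_kernel.cc above, each batch occupies a contiguous block of C * HxW elements, so the kernel views it as an HxW-by-C matrix and applies scale/bias column-wise. A plain-loop sketch of the same computation, with hypothetical raw-pointer arguments standing in for the Eigen maps (assumes the same includes as the first sketch):

    // Sketch only: per-channel affine transform over NCHW data laid out as [N][C][HxW].
    void AffineChannelNCHW(const float* x, const float* scale, const float* bias,
                           float* y, int N, int C, int HxW) {
      for (int n = 0; n < N; ++n) {
        for (int c = 0; c < C; ++c) {
          const float* x_c = x + (static_cast<int64_t>(n) * C + c) * HxW;
          float* y_c = y + (static_cast<int64_t>(n) * C + c) * HxW;
          for (int i = 0; i < HxW; ++i) {
            y_c[i] = x_c[i] * scale[c] + bias[c];  // same scale/bias for the whole channel
          }
        }
      }
    }
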
paddle/phi/kernels/cpu/batch_norm_grad_kernel.cc

Lines changed: 9 additions & 9 deletions
@@ -107,13 +107,13 @@ void BatchNormGradFunctor(const Context& dev_ctx,
                         x_dims.size()));
   const int N = static_cast<int>(x_dims[0]);
   const int C = static_cast<int>(
-      data_layout == DataLayout::kNCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
+      data_layout == DataLayout::NCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
   const int sample_size = static_cast<int>(x.numel() / N / C);
 
   // input dimension is 2 and the format is NCHW. The input can be regarded as
   // NHWC format
-  if (x_dims.size() == 2 && data_layout == DataLayout::kNCHW) {
-    data_layout = DataLayout::kNHWC;
+  if (x_dims.size() == 2 && data_layout == DataLayout::NCHW) {
+    data_layout = DataLayout::NHWC;
   }
 
   // init output
@@ -207,7 +207,7 @@ void BatchNormGradFunctor(const Context& dev_ctx,
   // formula transform ====>
   // (y - bias) / (scale * inv_var) + est_mean
   switch (data_layout) {
-    case DataLayout::kNCHW: {
+    case DataLayout::NCHW: {
       if (is_inplace) {
         auto px = x;
         EigenArrayMap<T> x_data(
@@ -256,7 +256,7 @@ void BatchNormGradFunctor(const Context& dev_ctx,
       }
       break;
     }
-    case DataLayout::kNHWC: {
+    case DataLayout::NHWC: {
       if (is_inplace) {
         auto px = x;
         EigenArrayMap<T> x_data(
@@ -413,7 +413,7 @@ void BatchNormDoubleGradKernel(
 
   const auto& x_dims = X->dims();
   const int C = static_cast<int>(
-      data_layout == DataLayout::kNCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
+      data_layout == DataLayout::NCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
   const int sample_size = static_cast<int>(X->numel() / C);
   phi::funcs::SetConstant<Context, T> set_constant;
 
@@ -442,7 +442,7 @@ void BatchNormDoubleGradKernel(
 
   DenseTensor transformed_dx(dX->type());
   DenseTensor transformed_ddy(ddY->type());
-  if (data_layout == DataLayout::kNCHW && x_dims.size() > 2) {
+  if (data_layout == DataLayout::NCHW && x_dims.size() > 2) {
     VLOG(3) << "Transform batchnorm output from NCHW to NHWC";
     // Input Tensor
     ResizeToChannelLast<Context, T>(dev_ctx, X, &transformed_x);
@@ -585,7 +585,7 @@ void BatchNormDoubleGradKernel(
              ddscale_tile_data;
     }
   }
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     VLOG(3) << "Transform batchnorm output from NHWC to NCHW";
     TransToChannelFirst<Context, T>(dev_ctx, &transformed_dx, dX);
   }
@@ -674,7 +674,7 @@ void BatchNormDoubleGradKernel(
       ddy_arr += ddbias_tile_data;
     }
 
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     VLOG(3) << "Transform batchnorm output from NHWC to NCHW";
     TransToChannelFirst<Context, T>(dev_ctx, &transformed_ddy, ddY);
   }

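Both batch_norm kernels keep the comment that a 2-D input declared as NCHW can be regarded as NHWC: with no spatial axes the shape is simply (N, C), so axis 1 and the last axis coincide and the channel-last code path applies unchanged. A small check that makes the equivalence explicit, reusing the illustrative ChannelCount/DataLayout sketch from the top of this page (sizes are hypothetical):

    // For a 2-D shape {N, C} both layouts resolve to the same channel axis,
    // so relabeling NCHW as NHWC does not change C.
    #include <cassert>

    void Check2DRelabel() {
      const std::vector<int64_t> dims = {8, 32};  // {N, C}
      assert(ChannelCount(dims, DataLayout::NCHW) ==
             ChannelCount(dims, DataLayout::NHWC));
    }
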
paddle/phi/kernels/cpu/batch_norm_kernel.cc

Lines changed: 7 additions & 7 deletions
@@ -87,7 +87,7 @@ void BatchNormKernel(const Context& dev_ctx,
                         x_dims.size()));
   const int N = static_cast<int>(x_dims[0]);
   const int C = static_cast<int>(
-      data_layout == DataLayout::kNCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
+      data_layout == DataLayout::NCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
   const int sample_size = static_cast<int>(x.numel() / N / C);
 
   // alloc memory
@@ -103,8 +103,8 @@ void BatchNormKernel(const Context& dev_ctx,
 
   // input dimension is 2 and the format is NCHW. The input can be regarded
   // as NHWC format
-  if (x_dims.size() == 2 && data_layout == DataLayout::kNCHW) {
-    data_layout = DataLayout::kNHWC;
+  if (x_dims.size() == 2 && data_layout == DataLayout::NCHW) {
+    data_layout = DataLayout::NHWC;
   }
 
   if (!global_stats) {
@@ -132,7 +132,7 @@ void BatchNormKernel(const Context& dev_ctx,
     }
 
     switch (data_layout) {
-      case DataLayout::kNCHW: {
+      case DataLayout::NCHW: {
        ConstEigenArrayMap<T> x_arr(x.data<T>(), sample_size, N * C);
        for (int nc = 0; nc < N * C; ++nc) {
          saved_mean_e(nc % C) += x_arr.col(nc).sum();
@@ -145,7 +145,7 @@ void BatchNormKernel(const Context& dev_ctx,
        saved_variance_e /= N * sample_size;
        break;
      }
-      case DataLayout::kNHWC: {
+      case DataLayout::NHWC: {
        ConstEigenArrayMap<T> x_arr(x.data<T>(), C, N * sample_size);
        for (int i = 0; i < N * sample_size; ++i) {
          saved_mean_e += x_arr.col(i);
@@ -253,15 +253,15 @@ void BatchNormKernel(const Context& dev_ctx,
   }
 
   switch (data_layout) {
-    case DataLayout::kNCHW: {
+    case DataLayout::NCHW: {
      EigenArrayMap<T> y_arr(dev_ctx.template Alloc<T>(y), sample_size, N * C);
      ConstEigenArrayMap<T> x_arr(x.data<T>(), sample_size, N * C);
      for (int nc = 0; nc < N * C; ++nc) {
        y_arr.col(nc) = x_arr.col(nc) * new_scale(nc % C) + new_bias(nc % C);
      }
      break;
    }
-    case DataLayout::kNHWC: {
+    case DataLayout::NHWC: {
      EigenArrayMap<T>(dev_ctx.template Alloc<T>(y), C, N * sample_size) =
          (ConstEigenArrayMap<T>(x.data<T>(), C, N * sample_size).colwise() *
           new_scale)

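The NCHW statistics branch in batch_norm_kernel.cc above views the input as a (sample_size x N*C) column matrix and folds column nc back to channel nc % C. A plain-loop sketch of that per-channel mean reduction without the Eigen maps (function and parameter names are illustrative only):

    // Sketch only: per-channel mean over NCHW data of shape [N][C][sample_size];
    // column nc of the (sample_size x N*C) view belongs to channel nc % C.
    std::vector<double> ChannelMeanNCHW(const float* x, int N, int C, int sample_size) {
      std::vector<double> mean(C, 0.0);
      for (int nc = 0; nc < N * C; ++nc) {
        const float* col = x + static_cast<int64_t>(nc) * sample_size;
        for (int i = 0; i < sample_size; ++i) {
          mean[nc % C] += col[i];
        }
      }
      for (int c = 0; c < C; ++c) {
        mean[c] /= static_cast<double>(N) * sample_size;
      }
      return mean;
    }
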
paddle/phi/kernels/cpu/group_norm_grad_kernel.cc

Lines changed: 4 additions & 4 deletions
@@ -72,7 +72,7 @@ void GroupNormGradKernel(const Context& dev_ctx,
   const auto bias_ptr = bias.get_ptr();
   const auto& x_dims = y.dims();
   const int C = static_cast<int>(
-      data_layout == DataLayout::kNCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
+      data_layout == DataLayout::NCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
   const int group_size = C / groups;
 
   phi::funcs::SetConstant<CPUContext, T> set_zero;
@@ -107,7 +107,7 @@ void GroupNormGradKernel(const Context& dev_ctx,
   if (bias_ptr) bias_data = bias_ptr->data<T>();
 
   int imsize = 1;
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     for (int i = 2; i < x_dims.size(); ++i) {
       imsize *= static_cast<int>(x_dims[i]);
     }
@@ -135,7 +135,7 @@ void GroupNormGradKernel(const Context& dev_ctx,
       auto* iter_d_x_data_backup = iter_d_x_data;
       T dp_scale = 0, dp_bias = 0;
 
-      if (data_layout == DataLayout::kNCHW) {
+      if (data_layout == DataLayout::NCHW) {
        for (int cid = 0; cid < number; cid++) {
          for (int imid = 0; imid < imsize;
               imid++, iter_x_data++, iter_y_data++) {
@@ -221,7 +221,7 @@ void GroupNormGradKernel(const Context& dev_ctx,
          }
        }
      }
-      if (data_layout == DataLayout::kNHWC) {
+      if (data_layout == DataLayout::NHWC) {
        iter_x_data = x_data + (bid + 1) * C * imsize;
        if (d_x_data) {
          iter_d_x_data = d_x_data + (bid + 1) * C * imsize;

paddle/phi/kernels/cpu/group_norm_kernel.cc

Lines changed: 5 additions & 5 deletions
@@ -60,7 +60,7 @@ void GroupNormKernel(const Context& dev_ctx,
 
   const auto x_dims = x.dims();
   const int C = static_cast<int>(
-      data_layout == DataLayout::kNCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
+      data_layout == DataLayout::NCHW ? x_dims[1] : x_dims[x_dims.size() - 1]);
   const int group_size = C / groups;
 
   dev_ctx.template Alloc<T>(y);
@@ -78,7 +78,7 @@ void GroupNormKernel(const Context& dev_ctx,
   if (bias_ptr) bias_data = bias_ptr->data<T>();
 
   int imsize = 1;
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     for (int i = 2; i < x_dims.size(); ++i) {
       imsize *= static_cast<int>(x_dims[i]);
     }
@@ -103,7 +103,7 @@ void GroupNormKernel(const Context& dev_ctx,
       auto* tmp_y = iter_y_data;
       auto* y_src_data = iter_y_data;
 
-      if (data_layout == DataLayout::kNCHW) {
+      if (data_layout == DataLayout::NCHW) {
        for (int cid = 0; cid < number; cid++) {
          int imid = 0;
          for (imid = 0; imid < imsize - (imsize % M);
@@ -186,7 +186,7 @@ void GroupNormKernel(const Context& dev_ctx,
       mean_data[bid * groups + gid] = x_mean;
       var_data[bid * groups + gid] = x_var;
 
-      if (data_layout == DataLayout::kNCHW) {
+      if (data_layout == DataLayout::NCHW) {
        for (int cid = 0; cid < number; cid++) {
          for (int imid = 0; imid < imsize; imid++, tmp_x++, iter_y_data++) {
            T val = (tmp_x[0] - x_mean) * var_inv;
@@ -210,7 +210,7 @@ void GroupNormKernel(const Context& dev_ctx,
          iter_y_data = tmp_y + group_size;
        }
      }
-      if (data_layout == DataLayout::kNHWC) {
+      if (data_layout == DataLayout::NHWC) {
        iter_x_data = x_data + (bid + 1) * C * imsize;
        iter_y_data = y_data + (bid + 1) * C * imsize;
      }

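Both group_norm kernels above compute the per-sample spatial size imsize before iterating; in the NCHW branch shown it is the product of every axis after the channel axis. A small sketch of that computation (the NHWC counterpart, which runs over the middle axes, lies outside the hunks shown here):

    // Sketch only: spatial element count per (batch, channel) for an NCHW shape,
    // i.e. the product of all axes after axis 1.
    inline int64_t SpatialSizeNCHW(const std::vector<int64_t>& dims) {
      int64_t imsize = 1;
      for (size_t i = 2; i < dims.size(); ++i) {
        imsize *= dims[i];
      }
      return imsize;
    }
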
paddle/phi/kernels/cpu/interpolate_grad_kernel.cc

Lines changed: 9 additions & 9 deletions
@@ -56,7 +56,7 @@ static void LinearInterpolationGrad(const DenseTensor& output_grad,
     for (int i = 0; i < n; i++) {    // loop for batches
       for (int j = 0; j < c; j++) {  // loop for channels
         // linear interpolation grad
-        if (data_layout == DataLayout::kNCHW) {
+        if (data_layout == DataLayout::NCHW) {
           const MT grad = static_cast<MT>(output_grad_t(i, j, l));
           input_grad_t(i, j, x_w) += static_cast<T>(grad * d_e);
           input_grad_t(i, j, x_e) += static_cast<T>(grad * d_w);
@@ -118,7 +118,7 @@ static void BilinearInterpolationGrad(const DenseTensor& output_grad,
       for (int i = 0; i < n; i++) {    // loop for batches
         for (int j = 0; j < c; j++) {  // loop for channels
           // bilinear interpolation grad
-          if (data_layout == DataLayout::kNCHW) {
+          if (data_layout == DataLayout::NCHW) {
            const MT grad = static_cast<MT>(output_grad_t(i, j, k, l));
            input_grad_t(i, j, y_n, x_w) += static_cast<T>(grad * d_s * d_e);
            input_grad_t(i, j, y_s, x_w) += static_cast<T>(grad * d_n * d_e);
@@ -163,7 +163,7 @@ static void NearestNeighborInterpolateGrad(const DenseTensor& output_grad,
 
       for (int i = 0; i < n; i++) {    // loop for batches
         for (int j = 0; j < c; j++) {  // loop for channels
-          if (data_layout == DataLayout::kNCHW) {
+          if (data_layout == DataLayout::NCHW) {
            input_grad_t(i, j, in_k, in_l) += output_grad_t(i, j, k, l);
          } else {
            input_grad_t(i, in_k, in_l, j) += output_grad_t(i, k, l, j);
@@ -218,7 +218,7 @@ static void BicubicInterpolationGrad(const DenseTensor& output_grad,
                                      static_cast<int64_t>(0));
             int access_y = std::max(std::min(input_y - 1 + jj, in_h - 1),
                                     static_cast<int64_t>(0));
-            if (data_layout == DataLayout::kNCHW) {
+            if (data_layout == DataLayout::NCHW) {
              MT grad = static_cast<MT>(output_grad_t(i, j, k, l));
              input_grad_t(i, j, access_y, access_x) +=
                  static_cast<T>(grad * y_coeffs[jj] * x_coeffs[ii]);
@@ -298,7 +298,7 @@ static void TrilinearInterpolationGrad(const DenseTensor& output_grad,
         for (int b = 0; b < n; b++) {    // loop for batches
           for (int i = 0; i < c; i++) {  // loop for channels
             // trilinear interpolation grad
-            if (data_layout == DataLayout::kNCHW) {
+            if (data_layout == DataLayout::NCHW) {
              const MT grad = static_cast<MT>(output_grad_t(b, i, j, k, l));
              input_grad_t(b, i, t_f, y_n, x_w) +=
                  static_cast<T>(grad * d_b * d_s * d_e);
@@ -377,7 +377,7 @@ static void NearestNeighbor3DInterpolateGrad(const DenseTensor& output_grad,
 
         for (int i = 0; i < n; i++) {    // loop for batches
           for (int j = 0; j < c; j++) {  // loop for channels
-            if (data_layout == DataLayout::kNCHW) {
+            if (data_layout == DataLayout::NCHW) {
              input_grad_t(i, j, in_d, in_k, in_l) +=
                  output_grad_t(i, j, d, k, l);
            } else {
@@ -449,7 +449,7 @@ static void Interpolate1DCPUBwd(
   }
 
   phi::DDim dim_grad;
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     dim_grad = {n, c, in_w};
   } else {
     dim_grad = {n, in_w, c};
@@ -575,7 +575,7 @@ static void Interpolate2DCPUBwd(
   }
 
   phi::DDim dim_grad;
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     dim_grad = {n, c, in_h, in_w};
   } else {
     dim_grad = {n, in_h, in_w, c};
@@ -753,7 +753,7 @@ static void Interpolate3DCPUBwd(
   }
 
   phi::DDim dim_grad;
-  if (data_layout == DataLayout::kNCHW) {
+  if (data_layout == DataLayout::NCHW) {
     dim_grad = {n, c, in_d, in_h, in_w};
   } else {
     dim_grad = {n, in_d, in_h, in_w, c};

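The interpolate backward hunks all follow the same pattern: the accumulation is identical in both branches, only the index order changes with the layout (for example output_grad_t(i, j, k, l) under NCHW versus output_grad_t(i, k, l, j) under NHWC). A minimal sketch of the corresponding flat-offset computation for a dense 4-D tensor, reusing the illustrative DataLayout enum from the top of this page (the helper name and signature are assumptions, not phi API):

    // Sketch only: flat offset of logical element (n, c, h, w) in a dense 4-D
    // tensor, depending on whether it is stored as NCHW or NHWC.
    inline int64_t Offset4D(DataLayout layout, int64_t n, int64_t c, int64_t h,
                            int64_t w, int64_t C, int64_t H, int64_t W) {
      if (layout == DataLayout::NCHW) {
        return ((n * C + c) * H + h) * W + w;
      }
      return ((n * H + h) * W + w) * C + c;  // NHWC
    }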