PaddlePaddle
diff --git a/paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/multiary_infer_sym.cc b/paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/multiary_infer_sym.cc
Lines changed: 6 additions & 0 deletions
diff --git a/paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/multiary_infer_sym.h b/paddle/fluid/pir/dialect/operator/interface/infer_symbolic_shape/multiary_infer_sym.h
Lines changed: 1 addition & 0 deletions
diff --git a/paddle/phi/kernels/cpu/interpolate_grad_kernel.cc b/paddle/phi/kernels/cpu/interpolate_grad_kernel.cc
Lines changed: 20 additions & 54 deletions
diff --git a/paddle/phi/kernels/cpu/interpolate_kernel.cc b/paddle/phi/kernels/cpu/interpolate_kernel.cc
Lines changed: 17 additions & 49 deletions
diff --git a/paddle/phi/kernels/funcs/interpolate_function.h b/paddle/phi/kernels/funcs/interpolate_function.h
Lines changed: 79 additions & 8 deletions
@@ -772,6 +772,12 @@ bool BilinearInterpOpInferSymbolicShape(
   return BicubicInterpOpInferSymbolicShape(op, infer_context);
 }
 
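+// TODO(zrr1999): add a unit test, then enable the definition below. Until then
+// the OP_DECLARE_INFER_SYMBOLIC_SHAPE(InterpAntialias) declaration added to
+// multiary_infer_sym.h has no matching definition here.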
+// bool InterpAntialiasOpInferSymbolicShape(
+//     pir::Operation *op, pir::InferSymbolicShapeContext *infer_context) {
+//   return BicubicInterpOpInferSymbolicShape(op, infer_context);
+// }
+
 bool BoxCoderOpInferSymbolicShape(
     pir::Operation *op, pir::InferSymbolicShapeContext *infer_context) {
   const symbol::ShapeOrDataDimExprs &prior_box_shape_or_data =
 
@@ -33,6 +33,7 @@ OP_DECLARE_INFER_SYMBOLIC_SHAPE(BatchNorm_)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(BicubicInterp)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(Bilinear)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(BilinearInterp)
+OP_DECLARE_INFER_SYMBOLIC_SHAPE(InterpAntialias)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(BoxCoder)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(CheckFiniteAndUnscale)
 OP_DECLARE_INFER_SYMBOLIC_SHAPE(CheckFiniteAndUnscale_)
 
@@ -206,8 +206,8 @@ static void BicubicInterpolationGrad(const DenseTensor& output_grad,
       std::array<MT, 4> x_coeffs;
       std::array<MT, 4> y_coeffs;
 
-      funcs::get_cubic_upsample_coefficients<MT>(x_coeffs.data(), x_t);
-      funcs::get_cubic_upsample_coefficients<MT>(y_coeffs.data(), y_t);
+      funcs::GetCubicUpsampleCoefficients<MT>(x_coeffs.data(), x_t);
+      funcs::GetCubicUpsampleCoefficients<MT>(y_coeffs.data(), y_t);
 
       for (int i = 0; i < n; i++) {    // loop for batches
         for (int j = 0; j < c; j++) {  // loop for channels
@@ -592,27 +592,18 @@ static void Interpolate2DCPUBwd(
     return;
   }
 
-  float ratio_h = 0.f;
-  float ratio_w = 0.f;
-  if (out_h > 1) {
-    float new_scale_h = 0.f;
-    new_scale_h = static_cast<float>(
-        (scale_h > 0) ? (1.f / scale_h)
-                      : static_cast<float>(in_h) / static_cast<float>(out_h));
-    ratio_h =
-        static_cast<float>(align_corners ? (static_cast<float>(in_h) - 1.f) /
-                                               (static_cast<float>(out_h) - 1.f)
-                                         : new_scale_h);
+  using MT = typename phi::dtype::MPTypeTrait<T>::Type;
+  double ratio_h =
+      funcs::AreaPixelComputeScale<float>(in_h, out_h, align_corners, scale_h);
+  double ratio_w =
+      funcs::AreaPixelComputeScale<float>(in_w, out_w, align_corners, scale_w);
+
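+  // TODO(zrr1999): align with the XPU kernel. For now the ratio is forced to 0
+  // when the output extent is <= 1, as it was before AreaPixelComputeScale was
+  // introduced.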
+  if (out_h <= 1) {
+    ratio_h = 0;
   }
-  if (out_w > 1) {
-    float new_scale_w = 0.f;
-    new_scale_w = static_cast<float>(
-        (scale_w > 0) ? (1.f / scale_w)
-                      : static_cast<float>(in_w) / static_cast<float>(out_w));
-    ratio_w =
-        static_cast<float>(align_corners ? (static_cast<float>(in_w) - 1.f) /
-                                               (static_cast<float>(out_w) - 1.f)
-                                         : new_scale_w);
+  if (out_w <= 1) {
+    ratio_w = 0;
   }
 
   if ("bilinear" == interp_method) {
@@ -778,38 +769,13 @@ static void Interpolate3DCPUBwd(
     return;
   }
 
-  float ratio_d = 0.f;
-  float ratio_h = 0.f;
-  float ratio_w = 0.f;
-  if (out_d > 1) {
-    float new_scale_d = 0.f;
-    new_scale_d = static_cast<float>(
-        (scale_d > 0) ? (1.f / scale_d)
-                      : static_cast<float>(in_d) / static_cast<float>(out_d));
-    ratio_d =
-        static_cast<float>(align_corners ? (static_cast<float>(in_d) - 1.f) /
-                                               (static_cast<float>(out_d) - 1.f)
-                                         : new_scale_d);
-  }
-  if (out_h > 1) {
-    float new_scale_h = 0.f;
-    new_scale_h = static_cast<float>(
-        (scale_h > 0) ? (1.f / scale_h)
-                      : static_cast<float>(in_h) / static_cast<float>(out_h));
-    ratio_h = (align_corners) ? static_cast<float>(in_h - 1) /
-                                    (static_cast<float>(out_h) - 1)
-                              : static_cast<float>(new_scale_h);
-  }
-  if (out_w > 1) {
-    float new_scale_w = 0.f;
-    new_scale_w = static_cast<float>(
-        (scale_w > 0) ? (1.f / scale_w)
-                      : static_cast<float>(in_w) / static_cast<float>(out_w));
-    ratio_w =
-        static_cast<float>(align_corners ? (static_cast<float>(in_w) - 1.f) /
-                                               (static_cast<float>(out_w) - 1.f)
-                                         : new_scale_w);
-  }
+  using MT = typename phi::dtype::MPTypeTrait<T>::Type;
+  double ratio_d =
+      funcs::AreaPixelComputeScale<float>(in_d, out_d, align_corners, scale_d);
+  double ratio_h =
+      funcs::AreaPixelComputeScale<float>(in_h, out_h, align_corners, scale_h);
+  double ratio_w =
+      funcs::AreaPixelComputeScale<float>(in_w, out_w, align_corners, scale_w);
 
   if ("trilinear" == interp_method) {
     TrilinearInterpolationGrad<T>(output_grad,
 
@@ -26,7 +26,7 @@ namespace phi {
+// Returns the weighted sum x0*c0 + x1*c1 + x2*c2 + x3*c3, where the four
+// weights c0..c3 are produced by funcs::GetCubicUpsampleCoefficients for the
+// fractional offset t.
 template <typename T>
 static inline T cubic_interp(T x0, T x1, T x2, T x3, T t) {
   std::array<T, 4> coeffs;
-  funcs::get_cubic_upsample_coefficients<T>(coeffs.data(), t);
+  funcs::GetCubicUpsampleCoefficients<T>(coeffs.data(), t);
 
   return x0 * coeffs[0] + x1 * coeffs[1] + x2 * coeffs[2] + x3 * coeffs[3];
 }
@@ -754,25 +754,17 @@ static void Interpolate2DCPUFwd(
     return;
   }
 
-  float ratio_h = 0.f;
-  float ratio_w = 0.f;
-  if (out_h > 1) {
-    float new_scale_h = 0.f;
-    new_scale_h = (scale_h > 0)
-                      ? static_cast<float>(1. / scale_h)
-                      : static_cast<float>(in_h) / static_cast<float>(out_h);
-    ratio_h = (align_corners)
-                  ? static_cast<float>(in_h - 1) / static_cast<float>(out_h - 1)
-                  : static_cast<float>(new_scale_h);
+  float ratio_h =
+      funcs::AreaPixelComputeScale<float>(in_h, out_h, align_corners, scale_h);
+  float ratio_w =
+      funcs::AreaPixelComputeScale<float>(in_w, out_w, align_corners, scale_w);
+
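+  // TODO(zrr1999): align with the XPU kernel. For now the ratio is forced to 0
+  // when the output extent is <= 1, as it was before AreaPixelComputeScale was
+  // introduced.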
+  if (out_h <= 1) {
+    ratio_h = 0;
   }
-  if (out_w > 1) {
-    float new_scale_w = 0.f;
-    new_scale_w = (scale_w > 0)
-                      ? static_cast<float>(1. / scale_w)
-                      : static_cast<float>(in_w) / static_cast<float>(out_w);
-    ratio_w = (align_corners)
-                  ? static_cast<float>(in_w - 1) / static_cast<float>(out_w - 1)
-                  : static_cast<float>(new_scale_w);
+  if (out_w <= 1) {
+    ratio_w = 0;
   }
 
   if ("bilinear" == interp_method) {
@@ -953,36 +945,12 @@ static void Interpolate3DCPUFwd(
     return;
   }
 
-  float ratio_d = 0.f;
-  float ratio_h = 0.f;
-  float ratio_w = 0.f;
-  if (out_d > 1) {
-    float new_scale_d = 0.f;
-    new_scale_d = (scale_d > 0)
-                      ? static_cast<float>(1. / scale_d)
-                      : static_cast<float>(in_d) / static_cast<float>(out_d);
-    ratio_d = (align_corners)
-                  ? static_cast<float>(in_d - 1) / static_cast<float>(out_d - 1)
-                  : static_cast<float>(new_scale_d);
-  }
-  if (out_h > 1) {
-    float new_scale_h = 0.f;
-    new_scale_h = (scale_h > 0)
-                      ? static_cast<float>(1. / scale_h)
-                      : static_cast<float>(in_h) / static_cast<float>(out_h);
-    ratio_h = (align_corners)
-                  ? static_cast<float>(in_h - 1) / static_cast<float>(out_h - 1)
-                  : static_cast<float>(new_scale_h);
-  }
-  if (out_w > 1) {
-    float new_scale_w = 0.f;
-    new_scale_w = (scale_w > 0)
-                      ? static_cast<float>(1. / scale_w)
-                      : static_cast<float>(in_w) / static_cast<float>(out_w);
-    ratio_w = (align_corners)
-                  ? static_cast<float>(in_w - 1) / static_cast<float>(out_w - 1)
-                  : static_cast<float>(new_scale_w);
-  }
+  float ratio_d =
+      funcs::AreaPixelComputeScale<float>(in_d, out_d, align_corners, scale_d);
+  float ratio_h =
+      funcs::AreaPixelComputeScale<float>(in_h, out_h, align_corners, scale_h);
+  float ratio_w =
+      funcs::AreaPixelComputeScale<float>(in_w, out_w, align_corners, scale_w);
 
   if ("trilinear" == interp_method) {
     TrilinearInterpolation<T>(x,
 
@@ -26,30 +26,60 @@
 namespace phi {
 namespace funcs {
 
+// Computes the input/output coordinate ratio for one spatial axis.
+//
+//   align_corners == true : (input_size - 1) / (output_size - 1) when
+//                           output_size > 1, otherwise 0.
+//   align_corners == false: 1 / scale when scale > 0; otherwise
+//                           input_size / output_size when output_size > 0,
+//                           otherwise 0.
+template <typename T>
+inline T AreaPixelComputeScale(int64_t input_size,
+                               int64_t output_size,
+                               bool align_corners,
+                               const T scale) {
+  const T zero = static_cast<T>(0);
+  if (align_corners) {
+    return output_size > 1
+               ? static_cast<T>(input_size - 1) / (output_size - 1)
+               : zero;
+  }
+  // An explicit positive scale takes precedence over the size ratio.
+  if (scale > 0.) {
+    return static_cast<T>(1.0) / scale;
+  }
+  return output_size > 0 ? static_cast<T>(input_size) / output_size : zero;
+}
+
+// Maps the output index dst_index to a (possibly fractional) source
+// coordinate.
+//
+//   align_corners == true : scale * dst_index
+//   align_corners == false: scale * (dst_index + align_type_value)
+//                           - align_type_value
+//
+// The result is returned as computed; no clamping is applied here.
+template <typename T>
+HOSTDEVICE inline T AreaPixelComputeSourceIndex(T scale,
+                                                int64_t dst_index,
+                                                bool align_corners,
+                                                T align_type_value = 0.5) {
+  if (!align_corners) {
+    return scale * (dst_index + align_type_value) - align_type_value;
+  }
+  return scale * dst_index;
+}
+
+// Evaluates the cubic polynomial ((A + 2) * x - (A + 3)) * x^2 + 1.
+// GetCubicUpsampleCoefficients calls it for the two inner taps, passing t and
+// 1 - t as x.
 template <typename T>
 HOSTDEVICE inline T CubicConvolution1(T x, T A) {
-  return ((A + static_cast<T>(2)) * x - (A + static_cast<T>(3))) * x * x +
-         static_cast<T>(1);
+  return ((A + 2) * x - (A + 3)) * x * x + 1;
 }
 
+// Evaluates the cubic polynomial ((A * x - 5 * A) * x + 8 * A) * x - 4 * A.
+// GetCubicUpsampleCoefficients calls it for the two outer taps, passing t + 1
+// and (1 - t) + 1 as x.
 template <typename T>
 HOSTDEVICE inline T CubicConvolution2(T x, T A) {
-  return ((A * x - static_cast<T>(5) * A) * x + static_cast<T>(8) * A) * x -
-         static_cast<T>(4) * A;
+  return ((A * x - 5 * A) * x + 8 * A) * x - 4 * A;
 }
 
 template <typename T>
-HOSTDEVICE inline void get_cubic_upsample_coefficients(T coeffs[4], T t) {
+HOSTDEVICE inline void GetCubicUpsampleCoefficients(T coeffs[4], T t) {
   T A = static_cast<T>(-0.75);
 
   T x1 = t;
-  coeffs[0] = CubicConvolution2<T>(x1 + static_cast<T>(1.0), A);
+  coeffs[0] = CubicConvolution2<T>(x1 + 1.0, A);
   coeffs[1] = CubicConvolution1<T>(x1, A);
 
   // opposite coefficients
-  T x2 = static_cast<T>(1.0) - t;
+  T x2 = 1.0 - t;
   coeffs[2] = CubicConvolution1<T>(x2, A);
-  coeffs[3] = CubicConvolution2<T>(x2 + static_cast<T>(1.0), A);
+  coeffs[3] = CubicConvolution2<T>(x2 + 1.0, A);
 }
 
 inline void ExtractNCDWH(const DDim& dims,
@@ -197,5 +227,46 @@ struct FastDivModForInterpolate {
 
 #endif
 
+namespace antialias {
+
+// taken from
+// https://github.com/pytorch/pytorch/blob/a527e816935957a164d74dd7c5069310b2857695/
+// aten/src/ATen/native/cuda/UpSample.cuh#L207-L305
+// Triangle-shaped filter weight: 1 - |x| while |x| < 1, and 0 otherwise.
+struct BilinearFilterFunctor {
+  template <typename T>
+  HOSTDEVICE T operator()(T x) const {
+    const T distance = (x < 0) ? -x : x;
+    // Written as !(distance < 1) so every input that fails the "< 1" test
+    // takes the zero branch.
+    if (!(distance < 1)) {
+      return 0;
+    }
+    return 1 - distance;
+  }
+
+  // Equals the width of the interval (-1, 1) outside which operator() returns
+  // 0; presumably the filter support used by the antialias kernels.
+  static constexpr int size = 2;
+};
+// Piecewise-cubic filter weight with a = -0.5, evaluated on |x|:
+//   |x| < 1      : ((a + 2) * |x| - (a + 3)) * |x|^2 + 1
+//   1 <= |x| < 2 : (((|x| - 5) * |x| + 8) * |x| - 4) * a
+//   otherwise    : 0
+struct BicubicFilterFunctor {
+  template <typename T>
+  HOSTDEVICE T operator()(T x) const {
+    // https://en.wikipedia.org/wiki/Bicubic_interpolation#Bicubic_convolution_algorithm
+    const T a = -0.5;
+    const T r = (x < 0) ? -x : x;
+    // Anything that is not strictly below 2 lies outside the support.
+    if (!(r < 2)) {
+      return 0;
+    }
+    if (r < 1) {
+      return ((a + 2) * r - (a + 3)) * r * r + 1;
+    }
+    return (((r - 5) * r + 8) * r - 4) * a;
+  }
+
+  // Equals the width of the interval (-2, 2) outside which operator() returns
+  // 0; presumably the filter support used by the antialias kernels.
+  static constexpr int size = 4;
+};
+
+}  // namespace antialias
+
 }  // namespace funcs
 }  // namespace phi