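Fix clip_tensor kernels: replace manual CastInferMeta/CastKernel (and ElementwiseInferMeta/MaximumKernel) calls with the phi::Cast and phi::Maximum helpers, and include clip_tensor_kernel.h instead of clip_kernel.h in the GPU kernel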

a162837 · a162837 · commit cf17e35e0147 · 2025-01-01T16:15:38.000+08:00
diff --git a/paddle/phi/kernels/cpu/clip_tensor_grad_kernel.cc b/paddle/phi/kernels/cpu/clip_tensor_grad_kernel.cc
@@ -27,14 +27,8 @@ void ClipTensorGradKernel(const Context& dev_ctx,
                           const DenseTensor& max,
                           const DenseTensor& out_grad,
                           DenseTensor* x_grad) {
-  DenseTensor tem_min;
-  MetaTensor meta_tem_min(&tem_min);
-  CastInferMeta(min, x.dtype(), &meta_tem_min);
-  CastKernel<T, Context>(dev_ctx, min, x.dtype(), &tem_min);
-  DenseTensor tem_max;
-  MetaTensor meta_tem_max(&tem_max);
-  CastInferMeta(max, x.dtype(), &meta_tem_max);
-  CastKernel<T, Context>(dev_ctx, max, x.dtype(), &tem_max);
+  DenseTensor tem_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor tem_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
   const T* x_data = x.data<T>();
   const T* min_data = tem_min.data<T>();
diff --git a/paddle/phi/kernels/cpu/clip_tensor_kernel.cc b/paddle/phi/kernels/cpu/clip_tensor_kernel.cc
@@ -27,14 +27,8 @@ void ClipTensorKernel(const Context& dev_ctx,
                       const DenseTensor& min,
                       const DenseTensor& max,
                       DenseTensor* out) {
-  DenseTensor tem_min;
-  MetaTensor meta_tem_min(&tem_min);
-  CastInferMeta(min, x.dtype(), &meta_tem_min);
-  CastKernel<T, Context>(dev_ctx, min, x.dtype(), &tem_min);
-  DenseTensor tem_max;
-  MetaTensor meta_tem_max(&tem_max);
-  CastInferMeta(max, x.dtype(), &meta_tem_max);
-  CastKernel<T, Context>(dev_ctx, max, x.dtype(), &tem_max);
+  DenseTensor tem_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor tem_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
   const T* x_data = x.data<T>();
   const T* min_data = tem_min.data<T>();
diff --git a/paddle/phi/kernels/gpu/clip_tensor_grad_kernel.cu b/paddle/phi/kernels/gpu/clip_tensor_grad_kernel.cu
@@ -44,14 +44,8 @@ void ClipTensorGradKernel(const Context& dev_ctx,
                           const DenseTensor& max,
                           const DenseTensor& out_grad,
                           DenseTensor* x_grad) {
-  DenseTensor tem_min;
-  MetaTensor meta_tem_min(&tem_min);
-  CastInferMeta(min, x.dtype(), &meta_tem_min);
-  CastKernel<T, Context>(dev_ctx, min, x.dtype(), &tem_min);
-  DenseTensor tem_max;
-  MetaTensor meta_tem_max(&tem_max);
-  CastInferMeta(max, x.dtype(), &meta_tem_max);
-  CastKernel<T, Context>(dev_ctx, max, x.dtype(), &tem_max);
+  DenseTensor tem_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor tem_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
   const T* x_data = x.data<T>();
   auto numel = x.numel();
diff --git a/paddle/phi/kernels/gpu/clip_tensor_kernel.cu b/paddle/phi/kernels/gpu/clip_tensor_kernel.cu
@@ -12,7 +12,7 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
-#include "paddle/phi/kernels/clip_kernel.h"
+#include "paddle/phi/kernels/clip_tensor_kernel.h"
 
 #include "paddle/phi/backends/gpu/gpu_context.h"
 #include "paddle/phi/backends/gpu/gpu_launch_config.h"
@@ -39,14 +39,8 @@ void ClipTensorKernel(const Context& dev_ctx,
                       const DenseTensor& min,
                       const DenseTensor& max,
                       DenseTensor* out) {
-  DenseTensor tem_min;
-  MetaTensor meta_tem_min(&tem_min);
-  CastInferMeta(min, x.dtype(), &meta_tem_min);
-  CastKernel<T, Context>(dev_ctx, min, x.dtype(), &tem_min);
-  DenseTensor tem_max;
-  MetaTensor meta_tem_max(&tem_max);
-  CastInferMeta(max, x.dtype(), &meta_tem_max);
-  CastKernel<T, Context>(dev_ctx, max, x.dtype(), &tem_max);
+  DenseTensor tem_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor tem_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
   std::vector<const DenseTensor*> ins = {&x, &tem_min, &tem_max};
   std::vector<DenseTensor*> outs = {out};
diff --git a/paddle/phi/kernels/onednn/clip_tensor_grad_kernel.cc b/paddle/phi/kernels/onednn/clip_tensor_grad_kernel.cc
@@ -13,11 +13,12 @@
 // limitations under the License.
 
 #include "paddle/phi/kernels/clip_tensor_grad_kernel.h"
-#include "paddle/phi/kernels/cast_kernel.h"
-#include "paddle/phi/kernels/elementwise_kernel.h"
 
 #include "paddle/phi/backends/onednn/onednn_reuse.h"
 #include "paddle/phi/core/kernel_registry.h"
+#include "paddle/phi/infermeta/unary.h"
+#include "paddle/phi/kernels/cast_kernel.h"
+#include "paddle/phi/kernels/elementwise_kernel.h"
 
 namespace phi {
 template <typename T, typename Context>
@@ -27,14 +28,6 @@ void ClipTensorGradKernel(const Context& dev_ctx,
                           const DenseTensor& max,
                           const DenseTensor& out_grad,
                           DenseTensor* x_grad) {
-  DenseTensor ex_min;
-  MetaTensor meta_min(&ex_min);
-  CastInferMeta(min, x.dtype(), &meta_min);
-  DenseTensor ex_max;
-  MetaTensor meta_max(&ex_max);
-  CastInferMeta(max, x.dtype(), &meta_max);
-  phi::CastKernel<T, Context>(dev_ctx, min, x.dtype(), &ex_min);
-  phi::CastKernel<T, Context>(dev_ctx, max, x.dtype(), &ex_max);
 
   const auto& onednn_engine = dev_ctx.GetEngine();
   auto& astream = OneDNNContext::tls().get_stream();
@@ -53,8 +46,8 @@ void ClipTensorGradKernel(const Context& dev_ctx,
   auto* tem_max_mask = &t_max_mask;
   auto* tem_zero_mask = &t_zero_mask;
   auto* non_const_x = &x;
-  auto* non_const_min = &ex_min;
-  auto* non_const_max = &ex_max;
+  auto* non_const_min = &min;
+  auto* non_const_max = &max;
   auto* non_const_out_grad = &out_grad;
 
   funcs::BinaryOneDNNHandler<T> Lesshandler(dnnl::algorithm::binary_lt,
diff --git a/paddle/phi/kernels/onednn/clip_tensor_kernel.cc b/paddle/phi/kernels/onednn/clip_tensor_kernel.cc
@@ -13,11 +13,12 @@
 // limitations under the License.
 
 #include "paddle/phi/kernels/clip_tensor_kernel.h"
-#include "paddle/phi/kernels/cast_kernel.h"
-#include "paddle/phi/kernels/elementwise_kernel.h"
 
 #include "paddle/phi/backends/onednn/onednn_reuse.h"
 #include "paddle/phi/core/kernel_registry.h"
+#include "paddle/phi/infermeta/unary.h"
+#include "paddle/phi/kernels/cast_kernel.h"
+#include "paddle/phi/kernels/elementwise_kernel.h"
 
 namespace phi {
 template <typename T, typename Context>
@@ -26,14 +27,6 @@ void ClipTensorKernel(const Context& dev_ctx,
                       const DenseTensor& min,
                       const DenseTensor& max,
                       DenseTensor* out) {
-  DenseTensor ex_min;
-  MetaTensor meta_min(&ex_min);
-  CastInferMeta(min, x.dtype(), &meta_min);
-  DenseTensor ex_max;
-  MetaTensor meta_max(&ex_max);
-  CastInferMeta(max, x.dtype(), &meta_max);
-  phi::CastKernel<T, Context>(dev_ctx, min, x.dtype(), &ex_min);
-  phi::CastKernel<T, Context>(dev_ctx, max, x.dtype(), &ex_max);
 
   const auto& onednn_engine = dev_ctx.GetEngine();
   auto& astream = OneDNNContext::tls().get_stream();
@@ -43,8 +36,8 @@ void ClipTensorKernel(const Context& dev_ctx,
   UnchangedInferMeta(x, &meta_out);
   auto* tem_out = &t_out;
   auto* non_const_x = &x;
-  auto* non_const_min = &ex_min;
-  auto* non_const_max = &ex_max;
+  auto* non_const_min = &min;
+  auto* non_const_max = &max;
 
   funcs::BinaryOneDNNHandler<T> MAXhandler(dnnl::algorithm::binary_max,
                                            -1,
diff --git a/paddle/phi/kernels/xpu/clip_tensor_grad_kernel.cc b/paddle/phi/kernels/xpu/clip_tensor_grad_kernel.cc
@@ -16,6 +16,7 @@
 
 #include "paddle/phi/backends/xpu/enforce_xpu.h"
 #include "paddle/phi/core/kernel_registry.h"
+#include "paddle/phi/infermeta/unary.h"
 #include "paddle/phi/kernels/cast_kernel.h"
 #include "paddle/phi/kernels/compare_kernel.h"
 #include "paddle/phi/kernels/full_kernel.h"
@@ -31,14 +32,8 @@ void ClipTensorGradKernel(const Context& dev_ctx,
                           const DenseTensor& max,
                           const DenseTensor& out_grad,
                           DenseTensor* x_grad) {
-  DenseTensor ex_min;
-  MetaTensor meta_min(&ex_min);
-  CastInferMeta(min, x.dtype(), &meta_min);
-  DenseTensor ex_max;
-  MetaTensor meta_max(&ex_max);
-  CastInferMeta(max, x.dtype(), &meta_max);
-  phi::CastKernel<T, Context>(dev_ctx, min, x.dtype(), &ex_min);
-  phi::CastKernel<T, Context>(dev_ctx, max, x.dtype(), &ex_max);
+  DenseTensor ex_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor ex_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
   phi::DenseTensor x_ls_min;
   MetaTensor meta_x_ls_min(&x_ls_min);
@@ -56,12 +51,12 @@ void ClipTensorGradKernel(const Context& dev_ctx,
   MetaTensor meta_out(&out);
   UnchangedExceptDtypeInferMeta(x, &meta_out);
   meta_out.set_dtype(phi::DataType::BOOL);
-  LogicalAndKernel<bool, Context>(dev_ctx, x_ls_min, x_ls_max, &out);
+  phi::LogicalAndKernel<bool, Context>(dev_ctx, x_ls_min, x_ls_max, &out);
 
   phi::DenseTensor zero_tensor;
   MetaTensor meta_zero(&zero_tensor);
   UnchangedInferMeta(x_grad, &meta_zero);
-  FullKernel<T, Context>(dev_ctx,
+  phi::FullKernel<T, Context>(dev_ctx,
                          common::vectorize(x_grad->dims()),
                          0.0f,
                          zero_tensor.dtype(),
diff --git a/paddle/phi/kernels/xpu/clip_tensor_kernel.cc b/paddle/phi/kernels/xpu/clip_tensor_kernel.cc
@@ -29,19 +29,10 @@ void ClipTensorKernel(const Context& dev_ctx,
                       const DenseTensor& min,
                       const DenseTensor& max,
                       DenseTensor* out) {
-  DenseTensor tem_min;
-  MetaTensor meta_tem_min(&tem_min);
-  CastInferMeta(min, x.dtype(), &meta_tem_min);
-  CastKernel<T, Context>(dev_ctx, min, x.dtype(), &tem_min);
-  DenseTensor tem_max;
-  MetaTensor meta_tem_max(&tem_max);
-  CastInferMeta(max, x.dtype(), &meta_tem_max);
-  CastKernel<T, Context>(dev_ctx, max, x.dtype(), &tem_max);
+  DenseTensor tem_min = phi::Cast<T, Context>(dev_ctx, min, x.dtype());
+  DenseTensor tem_max = phi::Cast<T, Context>(dev_ctx, max, x.dtype());
 
-  DenseTensor tem_max_out;
-  MetaTensor meta_tem_max_out(&tem_max_out);
-  ElementwiseInferMeta(min, x, &meta_tem_max_out);
-  MaximumKernel<T, Context>(dev_ctx, min, x, &tem_max_out);
+  DenseTensor tem_max_out = phi::Maximum<T, Context>(dev_ctx, min, x);
   MinimumKernel<T, Context>(dev_ctx, tem_max_out, max, out);
 }
 
@@ -54,5 +45,5 @@ PD_REGISTER_KERNEL(clip_tensor,
                    float,
                    phi::dtype::float16,
                    phi::dtype::bfloat16,
-                   int64_t,
-                   int) {}
+                   int,
+                   int64_t) {}