PaddlePaddle · luotao1 · Nov 24, 2022 · Nov 19, 2022 · Nov 19, 2022 · Nov 19, 2022
diff --git a/paddle/fluid/distributed/ps/service/brpc_utils.cc b/paddle/fluid/distributed/ps/service/brpc_utils.cc
@@ -111,14 +111,13 @@ void SerializeLodTensor(framework::Variable* var,
   }
   // IO Buffer
   if (platform::is_cpu_place(tensor->place())) {
-    auto data_len = tensor->numel() * framework::DataTypeSize(tensor->dtype());
+    auto data_len = tensor->numel() * phi::SizeOf(tensor->dtype());
     iobuf->append(reinterpret_cast<const char*>(&data_len), 8);
     iobuf->append(reinterpret_cast<const char*>(tensor->data()), data_len);
   } else {
 #ifdef PADDLE_WITH_CUDA
     char* temp_ptr =
-        new char[tensor->numel() *
-                 framework::DataTypeSize(tensor->dtype())];  // NOLINT
+        new char[tensor->numel() * phi::SizeOf(tensor->dtype())];  // NOLINT
     auto stream = reinterpret_cast<const phi::GPUContext&>(ctx).stream();
     memory::Copy(
         platform::CPUPlace(),
@@ -128,7 +127,7 @@ void SerializeLodTensor(framework::Variable* var,
         tensor->numel() * framework::SizeOfType(
                               framework::TransToProtoVarType(tensor->dtype())),
         stream);
-    auto data_len = tensor->numel() * framework::DataTypeSize(tensor->dtype());
+    auto data_len = tensor->numel() * phi::SizeOf(tensor->dtype());
     iobuf->append(reinterpret_cast<const char*>(&data_len), 8);
     iobuf->append(reinterpret_cast<const char*>(temp_ptr), data_len);
     delete[] temp_ptr;
@@ -159,14 +158,13 @@ void SerializeSelectedRows(framework::Variable* var,
   }
   // IO Buffer
   if (platform::is_cpu_place(tensor->place())) {
-    auto data_len = tensor->numel() * framework::DataTypeSize(tensor->dtype());
+    auto data_len = tensor->numel() * phi::SizeOf(tensor->dtype());
     iobuf->append(reinterpret_cast<const char*>(&data_len), 8);
     iobuf->append(reinterpret_cast<const char*>(tensor->data()), data_len);
   } else {
 #ifdef PADDLE_WITH_CUDA
     char* temp_ptr =
-        new char[tensor->numel() *
-                 framework::DataTypeSize(tensor->dtype())];  // NOLINT
+        new char[tensor->numel() * phi::SizeOf(tensor->dtype())];  // NOLINT
     auto stream = reinterpret_cast<const phi::GPUContext&>(ctx).stream();
     memory::Copy(
         platform::CPUPlace(),
@@ -176,7 +174,7 @@ void SerializeSelectedRows(framework::Variable* var,
         tensor->numel() * framework::SizeOfType(
                               framework::TransToProtoVarType(tensor->dtype())),
         stream);
-    auto data_len = tensor->numel() * framework::DataTypeSize(tensor->dtype());
+    auto data_len = tensor->numel() * phi::SizeOf(tensor->dtype());
     iobuf->append(reinterpret_cast<const char*>(&data_len), 8);
     iobuf->append(reinterpret_cast<const char*>(temp_ptr), data_len);
     delete[] temp_ptr;
@@ -259,16 +257,15 @@ void DeserializeLodTensor(framework::Variable* var,
 #ifdef PADDLE_WITH_CUDA
     unsigned long data_len;  // NOLINT
     char* temp_ptr =
-        new char[tensor->numel() *
-                 framework::DataTypeSize(tensor->dtype())];     // NOLINT
-    io_buffer_itr.copy_and_forward((void*)(&data_len), 8);      // NOLINT
-    io_buffer_itr.copy_and_forward((void*)temp_ptr, data_len);  // NOLINT
+        new char[tensor->numel() * phi::SizeOf(tensor->dtype())];  // NOLINT
+    io_buffer_itr.copy_and_forward((void*)(&data_len), 8);         // NOLINT
+    io_buffer_itr.copy_and_forward((void*)temp_ptr, data_len);     // NOLINT
     auto stream = reinterpret_cast<const phi::GPUContext&>(ctx).stream();
     memory::Copy(place,
                  tensor_data,
                  platform::CPUPlace(),
                  (void*)temp_ptr,  // NOLINT
-                 tensor->numel() * framework::DataTypeSize(tensor->dtype()),
+                 tensor->numel() * phi::SizeOf(tensor->dtype()),
                  stream);
     delete[] temp_ptr;
 #endif
@@ -303,17 +300,16 @@ void DeserializeSelectedRows(
   } else if (platform::is_gpu_place(place)) {
 #ifdef PADDLE_WITH_CUDA
     char* temp_ptr =
-        new char[tensor->numel() *
-                 framework::DataTypeSize(tensor->dtype())];  // NOLINT
-    unsigned long data_len;                                  // NOLINT
-    io_buffer_itr.copy_and_forward((void*)(&data_len), 8);   // NOLINT
+        new char[tensor->numel() * phi::SizeOf(tensor->dtype())];  // NOLINT
+    unsigned long data_len;                                        // NOLINT
+    io_buffer_itr.copy_and_forward((void*)(&data_len), 8);         // NOLINT
     io_buffer_itr.copy_and_forward(temp_ptr, data_len);
     auto stream = reinterpret_cast<const phi::GPUContext&>(ctx).stream();
     memory::Copy(place,
                  tensor_data,
                  platform::CPUPlace(),
                  temp_ptr,
-                 tensor->numel() * framework::DataTypeSize(tensor->dtype()),
+                 tensor->numel() * phi::SizeOf(tensor->dtype()),
                  stream);
     delete[] temp_ptr;
 #endif

diff --git a/paddle/fluid/distributed/ps/service/heter_client.cc b/paddle/fluid/distributed/ps/service/heter_client.cc
@@ -41,14 +41,14 @@ int GetMicroId(const platform::DeviceContext& ctx,
   } else {
 #ifdef PADDLE_WITH_CUDA
     std::vector<char> temp;
-    temp.resize(tensor->numel() * framework::DataTypeSize(tensor->dtype()));
+    temp.resize(tensor->numel() * phi::SizeOf(tensor->dtype()));
     char* temp_ptr = temp.data();
     auto stream = reinterpret_cast<const phi::GPUContext&>(ctx).stream();
     memory::Copy(platform::CPUPlace(),
                  temp_ptr,
                  tensor->place(),
                  tensor->data(),
-                 tensor->numel() * framework::DataTypeSize(tensor->dtype()),
+                 tensor->numel() * phi::SizeOf(tensor->dtype()),
                  stream);
     float* temp_ptr_float = reinterpret_cast<float*>(temp_ptr);
     micro_id = static_cast<int>(temp_ptr_float[0]);

diff --git a/paddle/fluid/eager/amp_auto_cast.h b/paddle/fluid/eager/amp_auto_cast.h
@@ -48,7 +48,7 @@ inline std::vector<paddle::experimental::Tensor> AmpAutoCasts(
     std::string op_name) {
   VLOG(6) << "AMP AmpAutoCasts:"
           << " inputs(" << inputs_name << ") dst_dtype("
-          << paddle::framework::DataType2String(dst_dtype) << ").";
+          << phi::DataTypeToString(dst_dtype) << ").";
   std::vector<paddle::experimental::Tensor> inputs_casted;
   for (auto& input : inputs) {
     if (NeedCast(input, dst_dtype)) {
@@ -71,7 +71,7 @@ inline paddle::experimental::Tensor AmpAutoCast(
     std::string op_name) {
   VLOG(6) << "AMP AmpAutoCasts:"
           << " input(" << input_name << ") dst_dtype("
-          << paddle::framework::DataType2String(dst_dtype) << ").";
+          << phi::DataTypeToString(dst_dtype) << ").";
   if (dst_dtype == paddle::experimental::DataType::FLOAT16) {
     if (op_name == "run_program") {
       return input;

diff --git a/paddle/fluid/eager/eager_amp_auto_cast.h b/paddle/fluid/eager/eager_amp_auto_cast.h
@@ -68,7 +68,7 @@ inline std::vector<paddle::experimental::Tensor> EagerAmpAutoCasts(
     bool trace_backward = true) {
   VLOG(6) << "AMP AmpAutoCasts:"
           << " inputs(" << inputs_name << ") dst_dtype("
-          << paddle::framework::DataType2String(dst_dtype) << ").";
+          << phi::DataTypeToString(dst_dtype) << ").";
   std::vector<paddle::experimental::Tensor> inputs_casted;
   for (auto& input : inputs) {
     if (NeedCast(input, dst_dtype)) {
@@ -88,7 +88,7 @@ inline paddle::experimental::Tensor EagerAmpAutoCast(
     bool trace_backward = true) {
   VLOG(6) << "AMP AmpAutoCasts:"
           << " input(" << egr::EagerUtils::TensorStr(input) << " to dst_dtype("
-          << paddle::framework::DataType2String(dst_dtype) << ").";
+          << phi::DataTypeToString(dst_dtype) << ").";
   if (dst_dtype == paddle::experimental::DataType::FLOAT16) {
     if (op_name == "run_program") {
       return input;

@@ -41,16 +41,16 @@ static void CheckTensor(const paddle::experimental::Tensor& pre,
         "The tensor in before and after hook are not consistent"));
   }
   if (pre.initialized() && post.initialized()) {
-    VLOG(7) << paddle::framework::DataType2String(pre.dtype()) << " "
-            << paddle::framework::DataType2String(post.dtype());
+    VLOG(7) << phi::DataTypeToString(pre.dtype()) << " "
+            << phi::DataTypeToString(post.dtype());
     PADDLE_ENFORCE_EQ(
         pre.dtype(),
         post.dtype(),
         paddle::platform::errors::PermissionDenied(
             "The dtype of tensor before(%s) and after(%s) hook are not "
             "consistent",
-            paddle::framework::DataType2String(pre.dtype()),
-            paddle::framework::DataType2String(post.dtype())));
+            phi::DataTypeToString(pre.dtype()),
+            phi::DataTypeToString(post.dtype())));
     PADDLE_ENFORCE_EQ(pre.place(),
                       post.place(),
                       paddle::platform::errors::PermissionDenied(

diff --git a/paddle/fluid/framework/CMakeLists.txt b/paddle/fluid/framework/CMakeLists.txt
@@ -1246,23 +1246,7 @@ cc_test(
   SRCS phi_utils_test.cc
   DEPS phi_utils)
 
-if(WITH_GPU OR WITH_ROCM)
-  cc_library(
-    fluid_convert_utils
-    SRCS convert_utils.cc
-    DEPS data_type place gpu_info)
-else()
-  cc_library(
-    fluid_convert_utils
-    SRCS convert_utils.cc
-    DEPS data_type place)
-endif()
-
-# every source file that includes "dnnl.h" must depends on mkldnn
-# or, the first one should depends on mkldnn
-if(WITH_MKLDNN)
-  add_dependencies(fluid_convert_utils mkldnn)
-endif()
+cc_library(fluid_convert_utils DEPS data_type)
 
 cc_test(
   convert_utils_test

diff --git a/paddle/fluid/framework/convert_utils.cc b/paddle/fluid/framework/convert_utils.cc