diff --git a/paddle/pten/api/include/tensor.h b/paddle/pten/api/include/tensor.h index 476dddb4e2cbd00a1ae9cff50dc97816f45a4e6c..58a851ffb5c787f2397dbf9308439090b95f4a71 100644 --- a/paddle/pten/api/include/tensor.h +++ b/paddle/pten/api/include/tensor.h @@ -86,16 +86,13 @@ class AbstractAutogradMeta { class PD_DLL_DECL Tensor final { public: + /* Part 1: Construction and destruction methods */ + /** * @brief Construct a new Tensor object */ Tensor() = default; - /** - * @brief Construct a new Tensor object with name - * */ - explicit Tensor(const std::string& name) { name_ = name; } - /** * @brief Construct a new Tensor object by copy */ @@ -132,18 +129,14 @@ class PD_DLL_DECL Tensor final { Tensor(const PlaceType& place, const std::vector& shape); /** - * @brief Return the name of Tensor. + * @brief Construct a new Tensor object with name * - * @return const std::string& - */ - const std::string& name() const { return name_; } + * @note Used to adapt original execution mechanism and debug analysis + * in the development of new dygraph. It may be removed in the future. + * */ + explicit Tensor(const std::string& name) : name_(name) {} - /** - * @brief Set name of Tensor. - * - * @param const std::string& name - */ - void set_name(const std::string& name) { name_ = name; } + /* Part 2: Dimension, DataType and DataLayout methods */ /** * @brief Return the number of elements of Tensor. @@ -179,7 +172,7 @@ class PD_DLL_DECL Tensor final { /** * @brief Reset the shape of the tensor. - * Note: This method means Reset the shape of the tensor, + * @note: This method means Reset the shape of the tensor, * and must be called before calling mutable_data() or * copy_to(const PlaceType& place), this is not a standard definition of * reshape behavior, so we will deprecated this feature in the future. @@ -329,14 +322,33 @@ class PD_DLL_DECL Tensor final { gpuStream_t stream() const; #endif + /** + * @brief Return the name of Tensor. + * @note Used to adapt original execution mechanism and debug analysis + * in the development of new dygraph. It may be removed in the future. + * + * @return const std::string& + */ + const std::string& name() const { return name_; } + + /** + * @brief Set name of Tensor. + * @note Used to adapt original execution mechanism and debug analysis + * in the development of new dygraph. It may be removed in the future. + * + * @param const std::string& name + */ + void set_name(const std::string& name) { name_ = name; } + /* Part 5: Data Transform methods */ /** * @brief Copy the current Tensor data to the specified device * and return the new Tensor. It's usually used to set the input tensor data. - * Note: The Tensor's `copy_to` method is deprecated since version 2.3, and - * will be removed in version 2.4, please use `to` method instead. reason: - * copying a Tensor to another device does not need to specify the + * @note The Tensor's `copy_to` method is deprecated since version 2.3, and + * will be removed in version 2.4, please use `copy_to` method without + * template argument instead. + * reason: copying a Tensor to another device does not need to specify the * data type template argument * * @tparam T @@ -352,9 +364,8 @@ class PD_DLL_DECL Tensor final { * @param place, the target place of which the tensor will copy to. * @return Tensor */ - // TODO(chenweihang): replace Backend by new Place, may be append dtype and - // layout arguments in the future - Tensor to(Backend backend, bool blocking) const; + // TODO(chenweihang): replace Backend by new Place + Tensor copy_to(Backend backend, bool blocking) const; /** * @brief Cast datatype from one to another @@ -362,7 +373,7 @@ class PD_DLL_DECL Tensor final { * @param target_type * @return Tensor */ - Tensor cast(const DataType& target_type) const; + Tensor cast(DataType target_type) const; /* Part 6: Status utils methods */ @@ -470,7 +481,7 @@ class PD_DLL_DECL Tensor final { std::shared_ptr autograd_meta_{nullptr}; /** - * Tensor name: used for adapt original execution mechanism and debug analysis + * Tensor name: used to adapt original execution mechanism and debug analysis * in the development of new dygraph. It may be removed in the future. */ std::string name_; diff --git a/paddle/pten/api/include/utils.h b/paddle/pten/api/include/utils.h index 1a73e2ac96f72b5421c81fc4f9fe860cec004bcd..c038e503d47bb71295c13140949adc7100ae0adc 100644 --- a/paddle/pten/api/include/utils.h +++ b/paddle/pten/api/include/utils.h @@ -21,8 +21,7 @@ namespace paddle { namespace experimental { // TODO(chenweihang): Replace backend by place when place is ready -// TODO(chenweihang): Add layout and dtype argument if needed -PD_DLL_DECL Tensor to(const Tensor& x, Backend backend, bool blocking); +PD_DLL_DECL Tensor copy_to(const Tensor& x, Backend backend, bool blocking); } // namespace experimental } // namespace paddle diff --git a/paddle/pten/api/lib/tensor.cc b/paddle/pten/api/lib/tensor.cc index 6eae7dc370813052d75c50036e68ce52bdac3306..2ec66803d17625c58173a595689b46aceab893cb 100644 --- a/paddle/pten/api/lib/tensor.cc +++ b/paddle/pten/api/lib/tensor.cc @@ -19,6 +19,7 @@ limitations under the License. */ #include #include "glog/logging.h" +#include "paddle/pten/api/include/manipulation.h" #include "paddle/pten/api/include/utils.h" #include "paddle/pten/api/lib/ext_compat_utils.h" #include "paddle/pten/api/lib/utils/allocator.h" @@ -281,11 +282,11 @@ gpuStream_t Tensor::stream() const { template Tensor Tensor::copy_to(const PlaceType &target_place) const { LOG(WARNING) << "The Tensor's `copy_to` method is deprecated since version " - "2.3, and will be removed in version 2.4, please use `to` " - "method instead. " + "2.3, and will be removed in version 2.4, please use " + "`copy_to` method without template argumentinstead. " "reason: copying a Tensor to another device does not need " "to specify the data type template argument."; - return to(ConvertExtPlaceToBackend(target_place), /*blocking=*/false); + return copy_to(ConvertExtPlaceToBackend(target_place), /*blocking=*/false); } template PD_DLL_DECL Tensor @@ -311,15 +312,12 @@ template PD_DLL_DECL Tensor Tensor::copy_to>( template PD_DLL_DECL Tensor Tensor::copy_to(const PlaceType &target_place) const; -Tensor Tensor::to(Backend backend, bool blocking) const { - return experimental::to(*this, backend, blocking); +Tensor Tensor::copy_to(Backend backend, bool blocking) const { + return experimental::copy_to(*this, backend, blocking); } -Tensor Tensor::cast(const DataType &target_type) const { - PADDLE_THROW(platform::errors::Unimplemented( - "The cast operation is not supported now, " - "and it will be implemented by calling the cast kernel later.")); - return Tensor(); +Tensor Tensor::cast(DataType target_type) const { + return experimental::cast(*this, target_type); } /* Part 6: Status utils methods */ diff --git a/paddle/pten/api/lib/utils.cc b/paddle/pten/api/lib/utils.cc index 603699b26c15cff3ed19ed1a733dfa67c333602e..90ea1c357ffcdf8fc24c45f8a91c306b56809286 100644 --- a/paddle/pten/api/lib/utils.cc +++ b/paddle/pten/api/lib/utils.cc @@ -34,7 +34,7 @@ PT_DECLARE_MODULE(UtilsCUDA); namespace paddle { namespace experimental { -PD_DLL_DECL Tensor to(const Tensor& x, Backend backend, bool blocking) { +PD_DLL_DECL Tensor copy_to(const Tensor& x, Backend backend, bool blocking) { // 1. Get kernel signature and kernel auto kernel_key_set = ParseKernelKeyByInputArgs(x); kernel_key_set.backend_set = kernel_key_set.backend_set | BackendSet(backend); diff --git a/paddle/pten/tests/api/CMakeLists.txt b/paddle/pten/tests/api/CMakeLists.txt index a5f6aa73cade5a1972d5e253621aa55f6ea606d2..432532d433896f6e42e0e7f229a42ed4a50f26f1 100644 --- a/paddle/pten/tests/api/CMakeLists.txt +++ b/paddle/pten/tests/api/CMakeLists.txt @@ -1,7 +1,7 @@ if(WITH_ROCM) - hip_test(test_pten_tensor SRCS test_pten_tensor.cc DEPS pten_tensor utils_api glog) + hip_test(test_pten_tensor SRCS test_pten_tensor.cc DEPS pten_tensor utils_api manipulation_api glog) else() - cc_test(test_pten_tensor SRCS test_pten_tensor.cc DEPS pten_tensor utils_api glog) + cc_test(test_pten_tensor SRCS test_pten_tensor.cc DEPS pten_tensor utils_api manipulation_api glog) endif() cc_test(test_pten_exception SRCS test_pten_exception.cc DEPS gtest) diff --git a/paddle/pten/tests/api/test_cast_api.cc b/paddle/pten/tests/api/test_cast_api.cc index 46265d8568ceb15381a5272851143c6752a73608..1f7c238817e9894093071df827ac8899f786409c 100644 --- a/paddle/pten/tests/api/test_cast_api.cc +++ b/paddle/pten/tests/api/test_cast_api.cc @@ -15,17 +15,15 @@ limitations under the License. */ #include #include +#include "paddle/pten/api/include/creation.h" #include "paddle/pten/api/include/manipulation.h" #include "paddle/pten/api/lib/utils/allocator.h" #include "paddle/pten/core/dense_tensor.h" #include "paddle/pten/core/kernel_registry.h" -PT_DECLARE_MODULE(ManipulationCPU); - -#if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP) -PT_DECLARE_MODULE(ManipulationCUDA); -#endif +namespace pten { +namespace tests { namespace framework = paddle::framework; using DDim = paddle::framework::DDim; @@ -67,3 +65,24 @@ TEST(API, cast) { ASSERT_NEAR(dense_out_data[i], static_cast(dense_x_data[i]), 1e-6f); } } + +TEST(Tensor, cast) { + auto x = paddle::experimental::full({3, 4}, 1.0, pten::DataType::FLOAT32); + auto y = x.cast(pten::DataType::INT32); + + // check slice result + ASSERT_EQ(y.dims().size(), 2); + ASSERT_EQ(y.dims()[0], 3); + ASSERT_EQ(y.dims()[1], 4); + ASSERT_EQ(y.numel(), 12); + ASSERT_EQ(y.is_cpu(), true); + ASSERT_EQ(y.type(), pten::DataType::INT32); + ASSERT_EQ(y.layout(), pten::DataLayout::NCHW); + ASSERT_EQ(y.initialized(), true); + for (int64_t i = 0; i < y.numel(); ++i) { + ASSERT_EQ(y.mutable_data()[i], 1); + } +} + +} // namespace tests +} // namespace pten diff --git a/paddle/pten/tests/api/test_to_api.cc b/paddle/pten/tests/api/test_to_api.cc index 5374903cbb7ff91eb8e4503babe64f7b575e2782..d08a78cf4cf823a1807c816dc928204ef5760bc8 100644 --- a/paddle/pten/tests/api/test_to_api.cc +++ b/paddle/pten/tests/api/test_to_api.cc @@ -58,39 +58,39 @@ void CheckOutputResult(const paddle::experimental::Tensor& out) { } } -TEST(API, to) { +TEST(API, copy_to) { // 1. create tensor auto x = CreateInputTensor(); // 2. test API #if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP) - auto tmp = paddle::experimental::to(x, pten::Backend::CUDA, false); - auto out = paddle::experimental::to(tmp, pten::Backend::CPU, true); + auto tmp = paddle::experimental::copy_to(x, pten::Backend::CUDA, false); + auto out = paddle::experimental::copy_to(tmp, pten::Backend::CPU, true); #else - auto out = paddle::experimental::to(x, pten::Backend::CPU, false); + auto out = paddle::experimental::copy_to(x, pten::Backend::CPU, false); #endif // 3. check result CheckOutputResult(out); } -TEST(Tensor, to) { +TEST(Tensor, copy_to) { // 1. create tensor auto x = CreateInputTensor(); // 2. test API #if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP) - auto tmp = x.to(pten::Backend::CUDA, false); - auto out = tmp.to(pten::Backend::CPU, true); + auto tmp = x.copy_to(pten::Backend::CUDA, false); + auto out = tmp.copy_to(pten::Backend::CPU, true); #else - auto out = x.to(pten::Backend::CPU, false); + auto out = x.copy_to(pten::Backend::CPU, false); #endif // 3. check result CheckOutputResult(out); } -TEST(Tensor, copy_to) { +TEST(Tensor, old_copy_to) { // 1. create tensor auto x = CreateInputTensor(); diff --git a/paddle/pten/tests/kernels/test_cast_dev_api.cc b/paddle/pten/tests/kernels/test_cast_dev_api.cc index 2471529ba9b506ef4eba763c73e8ad98ac49576d..64b60a540f7ebcdd1a311cdcaa4aa367186bed28 100644 --- a/paddle/pten/tests/kernels/test_cast_dev_api.cc +++ b/paddle/pten/tests/kernels/test_cast_dev_api.cc @@ -23,12 +23,6 @@ limitations under the License. */ #include "paddle/pten/core/dense_tensor.h" #include "paddle/pten/core/kernel_registry.h" -PT_DECLARE_MODULE(ManipulationCPU); - -#if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP) -PT_DECLARE_MODULE(ManipulationCUDA); -#endif - namespace framework = paddle::framework; using DDim = paddle::framework::DDim;