// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "paddle/fluid/jit/layer.h" #include #include #include #include #include #include "gtest/gtest.h" #include "paddle/fluid/framework/op_registry.h" #include "paddle/fluid/framework/variable.h" #include "paddle/fluid/imperative/tracer.h" #include "paddle/fluid/jit/serializer.h" #include "paddle/fluid/memory/allocation/allocator_facade.h" #include "paddle/phi/api/include/tensor.h" #include "paddle/phi/core/dense_tensor.h" #include "paddle/phi/core/kernel_registry.h" #include "paddle/phi/kernels/copy_kernel.h" #include "paddle/phi/kernels/funcs/math_function.h" USE_OP_ITSELF(elementwise_add); USE_OP_ITSELF(matmul_v2); USE_OP_ITSELF(relu); USE_OP_ITSELF(reduce_mean); USE_OP_ITSELF(feed); USE_OP_ITSELF(fetch); USE_OP_ITSELF(scale); PD_DECLARE_KERNEL(add, CPU, ALL_LAYOUT); PD_DECLARE_KERNEL(matmul, CPU, ALL_LAYOUT); PD_DECLARE_KERNEL(relu, CPU, ALL_LAYOUT); PD_DECLARE_KERNEL(mean, CPU, ALL_LAYOUT); PD_DECLARE_KERNEL(scale, CPU, ALL_LAYOUT); #if defined(PADDLE_WITH_CUDA) PD_DECLARE_KERNEL(add, KPS, ALL_LAYOUT); PD_DECLARE_KERNEL(matmul, GPU, ALL_LAYOUT); PD_DECLARE_KERNEL(relu, GPU, ALL_LAYOUT); PD_DECLARE_KERNEL(mean, GPU, ALL_LAYOUT); PD_DECLARE_KERNEL(scale, GPU, ALL_LAYOUT); #endif namespace paddle { namespace jit { std::vector PrepareInputs() { auto default_place = imperative::GetCurrentTracer()->ExpectedPlace(); platform::DeviceContextPool& pool = platform::DeviceContextPool::Instance(); auto& dev_ctx = *pool.Get(default_place); Variable v; auto* dense_tensor = v.GetMutable(); dense_tensor->Resize(phi::make_ddim({2, 4})); dense_tensor->mutable_data(default_place); phi::funcs::set_constant(dev_ctx, dense_tensor, 2.); return {v}; } TEST(CpuLayerTest, Construct) { auto tracer = std::make_shared(); paddle::imperative::SetCurrentTracer(tracer); imperative::GetCurrentTracer()->SetExpectedPlace(phi::CPUPlace()); std::string path = "./"; auto layer = jit::Load(path); auto inputs = PrepareInputs(); auto outs = layer.forward(inputs); auto out_vars = outs[0]; auto out_dense_tensor = out_vars.Get(); auto out_data = out_dense_tensor.data(); EXPECT_NEAR(out_data[0], 0.02194316, 1e-6); auto func = layer.GetFunction("infer"); outs = (*func)(inputs); out_vars = outs[0]; out_dense_tensor = out_vars.Get(); out_data = out_dense_tensor.data(); EXPECT_NEAR(out_data[0], 1.41562390, 1e-6); } #if defined(PADDLE_WITH_CUDA) TEST(GpuLayerTest, Construct) { auto tracer = std::make_shared(); paddle::imperative::SetCurrentTracer(tracer); imperative::GetCurrentTracer()->SetExpectedPlace(phi::GPUPlace(0)); platform::DeviceContextPool& pool = platform::DeviceContextPool::Instance(); auto& dev_ctx = *pool.Get(imperative::GetCurrentTracer()->ExpectedPlace()); const auto* dev_ctx_gpu = static_cast(&dev_ctx); DenseTensor cpu_dense_tensor; std::string path = "./"; auto layer = jit::Load(path); auto inputs = PrepareInputs(); auto outs = layer.forward(inputs); auto out_vars = outs[0]; auto out_dense_tensor = out_vars.Get(); phi::Copy( *dev_ctx_gpu, out_dense_tensor, phi::CPUPlace(), true, &cpu_dense_tensor); auto out_data = cpu_dense_tensor.data(); EXPECT_NEAR(out_data[0], 0.02194316, 1e-6); auto func = layer.GetFunction("infer"); outs = (*func)(inputs); out_vars = outs[0]; out_dense_tensor = out_vars.Get(); phi::Copy( *dev_ctx_gpu, out_dense_tensor, phi::CPUPlace(), true, &cpu_dense_tensor); out_data = cpu_dense_tensor.data(); EXPECT_NEAR(out_data[0], 1.41562390, 1e-6); } #endif } // namespace jit } // namespace paddle