未验证 提交 5fe3d596 编写于 作者: L Leo Chen 提交者: GitHub

Fix pow, use fillD instead of broadcast (#31433)

上级 ecc6e213
...@@ -12,7 +12,6 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. ...@@ -12,7 +12,6 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and See the License for the specific language governing permissions and
limitations under the Licnse. */ limitations under the Licnse. */
#ifdef PADDLE_WITH_ASCEND_CL
#include <memory> #include <memory>
#include <string> #include <string>
...@@ -90,8 +89,8 @@ class PowGradNPUKernel : public framework::OpKernel<T> { ...@@ -90,8 +89,8 @@ class PowGradNPUKernel : public framework::OpKernel<T> {
// factor. // factor.
Tensor factor_bc_tensor(framework::proto::VarType::FP32); Tensor factor_bc_tensor(framework::proto::VarType::FP32);
factor_bc_tensor.mutable_data<float>(x_dims, place); factor_bc_tensor.mutable_data<float>(x_dims, place);
auto runner_bc = NpuOpRunner("BroadcastTo", {factor_tensor, x_shape}, auto runner_bc = NpuOpRunner("FillD", {factor_tensor}, {factor_bc_tensor},
{factor_bc_tensor}, {}); {{"dims", x_dims}});
runner_bc.Run(stream); runner_bc.Run(stream);
// Step 3: Compute x_power_mul_factor = factor * x.pow(factor-1) // Step 3: Compute x_power_mul_factor = factor * x.pow(factor-1)
...@@ -123,5 +122,3 @@ REGISTER_OP_NPU_KERNEL( ...@@ -123,5 +122,3 @@ REGISTER_OP_NPU_KERNEL(
pow_grad, ops::PowGradNPUKernel<paddle::platform::NPUDeviceContext, float>, pow_grad, ops::PowGradNPUKernel<paddle::platform::NPUDeviceContext, float>,
ops::PowGradNPUKernel<paddle::platform::NPUDeviceContext, ops::PowGradNPUKernel<paddle::platform::NPUDeviceContext,
paddle::platform::float16>); paddle::platform::float16>);
#endif
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册