未验证 提交 05c2b9ba 编写于 作者: zhouweiwei2014's avatar zhouweiwei2014 提交者: GitHub

[Zero-Dim] support input 0D Tensor for some unary api (#45992)

* [Zero-Dim] support input 0D Tensor for unary api

* fix CI
上级 95768115
...@@ -164,24 +164,32 @@ void FetchAsyncOpHandle::FetchMergedLodTensor( ...@@ -164,24 +164,32 @@ void FetchAsyncOpHandle::FetchMergedLodTensor(
} }
} }
bool find_first_dims = false;
for (auto *t : src_lodtensors) {
if (t->numel() && t->IsInitialized()) {
if (!find_first_dims) {
new_dim = t->dims();
find_first_dims = true;
} else {
new_dim[0] += t->dims()[0];
}
}
}
// check src type,layout,dim,lod consistence // check src type,layout,dim,lod consistence
for (size_t i = 1; i < src_lodtensors.size(); ++i) { for (size_t i = 1; i < src_lodtensors.size(); ++i) {
CheckTensorAttrs( CheckTensorAttrs(
src_lodtensors[i], new_type, new_layout, check_dim, new_lod, offset_); src_lodtensors[i], new_type, new_layout, check_dim, new_lod, offset_);
} }
auto rank = src_lodtensors[0]->dims().size();
// for 0D tensor, can't concat eath tensor. So stack 0D and concat 1+D tensor
if (rank == 0) {
int src_lodtensor_size = src_lodtensors.size();
new_dim = phi::make_ddim(std::vector<int>({src_lodtensor_size}));
} else {
bool find_first_dims = false;
for (auto *t : src_lodtensors) {
if (t->numel() && t->IsInitialized()) {
if (!find_first_dims) {
new_dim = t->dims();
find_first_dims = true;
} else {
new_dim[0] += t->dims()[0];
}
}
}
}
// set dst tensor // set dst tensor
dst_lodtensor->Resize(new_dim); dst_lodtensor->Resize(new_dim);
dst_lodtensor->set_layout(src_lodtensors[0]->layout()); dst_lodtensor->set_layout(src_lodtensors[0]->layout());
...@@ -195,9 +203,17 @@ void FetchAsyncOpHandle::FetchMergedLodTensor( ...@@ -195,9 +203,17 @@ void FetchAsyncOpHandle::FetchMergedLodTensor(
} }
// slice and memcpy // slice and memcpy
// for 0D tensor, can't concat eath tensor, stack them. for 1+D tensor, concat
// them
int begin = 0; int begin = 0;
int end = 0;
for (auto *src : src_lodtensors) { for (auto *src : src_lodtensors) {
int end = begin + src->dims()[0]; if (rank == 0) {
end = begin + 1;
} else {
end = begin + src->dims()[0];
}
if (end == begin) { if (end == begin) {
continue; continue;
} }
......
...@@ -16,6 +16,7 @@ ...@@ -16,6 +16,7 @@
#include <string> #include <string>
#include "paddle/fluid/framework/operator.h"
#include "paddle/fluid/platform/profiler/event_tracing.h" #include "paddle/fluid/platform/profiler/event_tracing.h"
namespace phi { namespace phi {
...@@ -101,6 +102,7 @@ std::string ScaleLossGradOpHandle::LossGradName() const { ...@@ -101,6 +102,7 @@ std::string ScaleLossGradOpHandle::LossGradName() const {
void ScaleLossGradOpHandle::RunImpl() { void ScaleLossGradOpHandle::RunImpl() {
platform::RecordEvent record_event( platform::RecordEvent record_event(
Name(), platform::TracerEventType::UserDefined, 2); Name(), platform::TracerEventType::UserDefined, 2);
RunOnVar(local_exec_scopes_[0]->FindVar(LossGradName()), true); RunOnVar(local_exec_scopes_[0]->FindVar(LossGradName()), true);
} }
......
...@@ -213,8 +213,9 @@ DDim CompatMetaTensor::dims() const { ...@@ -213,8 +213,9 @@ DDim CompatMetaTensor::dims() const {
} else { } else {
auto* var = PADDLE_GET_CONST(VarDesc*, var_); auto* var = PADDLE_GET_CONST(VarDesc*, var_);
return var->GetShape().empty() ? phi::make_ddim({0UL}) return phi::make_ddim(var->GetShape());
: phi::make_ddim(var->GetShape()); // return var->GetShape().empty() ? phi::make_ddim({0UL}) :
// phi::make_ddim(var->GetShape());
} }
} }
......
...@@ -262,6 +262,16 @@ std::vector<LoDTensor> SplitLoDTensor( ...@@ -262,6 +262,16 @@ std::vector<LoDTensor> SplitLoDTensor(
platform::errors::InvalidArgument( platform::errors::InvalidArgument(
"Place number cannot be empty when splitting.")); "Place number cannot be empty when splitting."));
src.check_memory_size(); src.check_memory_size();
auto rank = src.dims().size();
// if rank is 0, just return #places.size() copys of src
if (rank == 0) {
LoDTensor dst;
framework::TensorCopy(src, src.place(), &dst);
std::vector<LoDTensor> ret;
ret.emplace_back(std::move(dst));
return ret;
}
size_t batch_size = src.lod().empty() ? static_cast<size_t>(src.dims()[0]) size_t batch_size = src.lod().empty() ? static_cast<size_t>(src.dims()[0])
: src.lod()[0].size() - 1; : src.lod()[0].size() - 1;
...@@ -349,6 +359,7 @@ void MergeLoDTensor(LoDTensor *target, ...@@ -349,6 +359,7 @@ void MergeLoDTensor(LoDTensor *target,
} }
LoD new_lod = lod_tensors[0]->lod(); LoD new_lod = lod_tensors[0]->lod();
auto rank = lod_tensors[0]->dims().size();
for (size_t i = 1; i < lod_tensors.size(); ++i) { for (size_t i = 1; i < lod_tensors.size(); ++i) {
auto *t = lod_tensors[i]; auto *t = lod_tensors[i];
...@@ -369,16 +380,24 @@ void MergeLoDTensor(LoDTensor *target, ...@@ -369,16 +380,24 @@ void MergeLoDTensor(LoDTensor *target,
"actual layout is %s.", "actual layout is %s.",
DataLayoutToString(new_layout), DataLayoutToString(new_layout),
DataLayoutToString(t->layout()))); DataLayoutToString(t->layout())));
PADDLE_ENFORCE_EQ( auto tensor_dims = t->dims();
phi::product(new_dim) / new_dim[0], PADDLE_ENFORCE_EQ(tensor_dims.size(),
phi::product(t->dims()) / t->dims()[0], new_dim.size(),
platform::errors::InvalidArgument( platform::errors::InvalidArgument(
"LoDTensor dimension does not match, all dimensions except the " "dimensions of LoDTensor does not match"));
"first dimension need to be equal," for (int j = 1; j < t->dims().size(); j++) {
"but expected dimension is %s, actual dimension is %s.", PADDLE_ENFORCE_EQ(
new_dim, tensor_dims[j],
t->dims())); new_dim[j],
new_dim[0] += t->dims()[0]; platform::errors::InvalidArgument(
"LoDTensor.ddim[%d] should eaqual to %d, but is %d",
j,
new_dim[j],
tensor_dims[j]));
}
if (rank > 0) {
new_dim[0] += t->dims()[0];
}
} }
auto &lod = t->lod(); auto &lod = t->lod();
......
...@@ -362,7 +362,7 @@ class CompileTimeInferShapeContext : public InferShapeContext { ...@@ -362,7 +362,7 @@ class CompileTimeInferShapeContext : public InferShapeContext {
DDim res; DDim res;
try { try {
auto shape = var->GetShape(); auto shape = var->GetShape();
res = shape.empty() ? phi::make_ddim({0UL}) : phi::make_ddim(shape); res = phi::make_ddim(shape);
} catch (...) { } catch (...) {
VLOG(5) << "GetDim of variable " << name << " error"; VLOG(5) << "GetDim of variable " << name << " error";
std::rethrow_exception(std::current_exception()); std::rethrow_exception(std::current_exception());
...@@ -1258,7 +1258,7 @@ std::vector<DDim> CompileTimeInferShapeContext::GetRepeatedDims( ...@@ -1258,7 +1258,7 @@ std::vector<DDim> CompileTimeInferShapeContext::GetRepeatedDims(
try { try {
auto shapes = var->GetShapes(); auto shapes = var->GetShapes();
for (const auto &s : shapes) { for (const auto &s : shapes) {
res.push_back(s.empty() ? phi::make_ddim({0UL}) : phi::make_ddim(s)); res.push_back(phi::make_ddim(s));
} }
} catch (...) { } catch (...) {
VLOG(5) << "GetRepeatedDim of variable " << name << " error."; VLOG(5) << "GetRepeatedDim of variable " << name << " error.";
......
...@@ -72,10 +72,15 @@ HOSTDEVICE inline Dim<sizeof...(Args)> make_dim(Args... idxes) { ...@@ -72,10 +72,15 @@ HOSTDEVICE inline Dim<sizeof...(Args)> make_dim(Args... idxes) {
// Allows us to output a Dim // Allows us to output a Dim
template <int D> template <int D>
inline std::ostream& operator<<(std::ostream& os, const Dim<D>& d) { inline std::ostream& operator<<(std::ostream& os, const Dim<D>& d) {
os << d[0]; if (D > 0) {
for (int i = 1; i < D; ++i) { os << d[0];
os << ", " << d[i]; for (int i = 1; i < D; ++i) {
os << ", " << d[i];
}
} else {
os << "";
} }
return os; return os;
} }
......
...@@ -305,9 +305,14 @@ void AddNInferMeta(const std::vector<const MetaTensor*>& x, ...@@ -305,9 +305,14 @@ void AddNInferMeta(const std::vector<const MetaTensor*>& x,
if (x[i]->is_selected_rows() && x_dim.size() == 1) { if (x[i]->is_selected_rows() && x_dim.size() == 1) {
continue; continue;
} }
// for zero-sized tensor
if (phi::product(x_dim) == 0) { if (phi::product(x_dim) == 0) {
continue; continue;
} }
// for 0D tensor
if (x_dim.size() == 0) {
continue;
}
if (phi::product(in_dim) == 0) { if (phi::product(in_dim) == 0) {
in_dim = x_dim; in_dim = x_dim;
} else { } else {
...@@ -2547,8 +2552,8 @@ void WarpctcInferMeta(const MetaTensor& logits, ...@@ -2547,8 +2552,8 @@ void WarpctcInferMeta(const MetaTensor& logits,
const MetaTensor& labels_length, const MetaTensor& labels_length,
int blank, int blank,
bool norm_by_times, bool norm_by_times,
MetaTensor* warpctcgrad, MetaTensor* loss,
MetaTensor* loss) { MetaTensor* warpctcgrad) {
auto logits_dims = logits.dims(); auto logits_dims = logits.dims();
int sequence_width = 0; int sequence_width = 0;
......
...@@ -483,8 +483,8 @@ void WarpctcInferMeta(const MetaTensor& logits, ...@@ -483,8 +483,8 @@ void WarpctcInferMeta(const MetaTensor& logits,
const MetaTensor& labels_length, const MetaTensor& labels_length,
int blank, int blank,
bool norm_by_times, bool norm_by_times,
MetaTensor* warpctcgrad, MetaTensor* loss,
MetaTensor* loss); MetaTensor* warpctcgrad);
void WhereInferMeta(const MetaTensor& condition, void WhereInferMeta(const MetaTensor& condition,
const MetaTensor& x, const MetaTensor& x,
......
...@@ -2668,7 +2668,7 @@ DDim ReduceInferDim(const MetaTensor& x, ...@@ -2668,7 +2668,7 @@ DDim ReduceInferDim(const MetaTensor& x,
x_rank, x_rank,
errors::InvalidArgument( errors::InvalidArgument(
"The reduce dim index %d should be in the " "The reduce dim index %d should be in the "
"range [-dimension(X), dimension(X)] " "range [ -dimension(X), dimension(X) ) "
"which dimesion = %d. But received dim index = %d.", "which dimesion = %d. But received dim index = %d.",
i, i,
x_rank, x_rank,
...@@ -2677,7 +2677,7 @@ DDim ReduceInferDim(const MetaTensor& x, ...@@ -2677,7 +2677,7 @@ DDim ReduceInferDim(const MetaTensor& x,
-x_rank, -x_rank,
errors::InvalidArgument( errors::InvalidArgument(
"The reduce dim index %d should be in the " "The reduce dim index %d should be in the "
"range [-dimension(X), dimension(X)] " "range [ -dimension(X), dimension(X) ) "
"which dimesion = %d. But received dim index = %d.", "which dimesion = %d. But received dim index = %d.",
i, i,
x_rank, x_rank,
......
...@@ -36,6 +36,24 @@ inline DDim GetOutputSqueezeShape(const std::vector<int> squeeze_dims, ...@@ -36,6 +36,24 @@ inline DDim GetOutputSqueezeShape(const std::vector<int> squeeze_dims,
} }
} else { } else {
for (size_t i = 0; i < num_squeeze_dims; ++i) { for (size_t i = 0; i < num_squeeze_dims; ++i) {
if (in_dims.size() == 0) {
PADDLE_ENFORCE_GE(
squeeze_dims[i],
-1,
phi::errors::InvalidArgument(
"For 0D Tensor, Each axis in Attr(axes) should be in the range "
"of [-1, 0]"
"But current axis is:%d, input tensor's shape = [%s]."));
PADDLE_ENFORCE_LE(
squeeze_dims[i],
0,
phi::errors::InvalidArgument(
"For 0D Tensor, Each axis in Attr(axes) should be in the range "
"of [-1, 0]"
"But current axis is:%d, input tensor's shape = [%s]."));
continue;
}
int current = squeeze_dims[i] < 0 ? squeeze_dims[i] + in_dims.size() int current = squeeze_dims[i] < 0 ? squeeze_dims[i] + in_dims.size()
: squeeze_dims[i]; : squeeze_dims[i];
......
...@@ -25,8 +25,7 @@ inline std::vector<int64_t> CalculateReducedDims( ...@@ -25,8 +25,7 @@ inline std::vector<int64_t> CalculateReducedDims(
bool keep_dim) { bool keep_dim) {
if (keep_dim) return vectorize(output->dims()); if (keep_dim) return vectorize(output->dims());
if (reduce_all && reduce_dims.size() > 0) if (reduce_all) return std::vector<int64_t>(input->dims().size(), 1);
return std::vector<int64_t>(input->dims().size(), 1);
std::vector<int64_t> output_dims(vectorize(input->dims())); std::vector<int64_t> output_dims(vectorize(input->dims()));
for (size_t i = 0; i < reduce_dims.size(); ++i) { for (size_t i = 0; i < reduce_dims.size(); ++i) {
......
...@@ -21,18 +21,43 @@ namespace phi { ...@@ -21,18 +21,43 @@ namespace phi {
namespace tests { namespace tests {
TEST(DDim, Equality) { TEST(DDim, Equality) {
// default construct ddim
phi::DDim default_ddim;
EXPECT_EQ(arity(default_ddim), 1);
EXPECT_EQ(default_ddim[0], 0);
// construct a zero-DDim
phi::DDim zero_ddim = phi::make_ddim({});
EXPECT_EQ(arity(zero_ddim), 0);
EXPECT_EQ(zero_ddim.size(), 0);
EXPECT_EQ(phi::product(zero_ddim), 1);
std::vector<int64_t> zero_vec;
phi::DDim zero_ddim1 = phi::make_ddim(zero_vec);
EXPECT_EQ(arity(zero_ddim1), 0);
EXPECT_EQ(zero_ddim1.size(), 0);
EXPECT_EQ(phi::product(zero_ddim1), 1);
// zero-DDim to vector
std::vector<int64_t> zero_ddim_vec = phi::vectorize(zero_ddim);
EXPECT_EQ(zero_ddim_vec.size(), size_t(0));
// reshape zero-DDim
std::vector<int> reshape_vec = {1};
phi::DDim reshape_ddim = zero_ddim.reshape(reshape_vec);
EXPECT_EQ(arity(reshape_ddim), 1);
EXPECT_EQ(reshape_ddim.size(), 1);
EXPECT_EQ(phi::product(reshape_ddim), 1);
// construct a DDim from an initialization list // construct a DDim from an initialization list
phi::DDim ddim = phi::make_ddim({9, 1, 5}); phi::DDim ddim = phi::make_ddim({9, 1, 5});
EXPECT_EQ(ddim[0], 9); EXPECT_EQ(ddim[0], 9);
EXPECT_EQ(ddim[1], 1); EXPECT_EQ(ddim[1], 1);
EXPECT_EQ(ddim[2], 5); EXPECT_EQ(ddim[2], 5);
// construct a DDim from a vector // arity of a DDim
std::vector<int64_t> vec({9, 1, 5}); EXPECT_EQ(phi::arity(ddim), 3);
phi::DDim vddim = phi::make_ddim(vec); EXPECT_EQ(ddim.size(), 3);
EXPECT_EQ(ddim[0], 9);
EXPECT_EQ(ddim[1], 1);
EXPECT_EQ(ddim[2], 5);
// mutate a DDim // mutate a DDim
ddim[1] = 2; ddim[1] = 2;
...@@ -40,6 +65,13 @@ TEST(DDim, Equality) { ...@@ -40,6 +65,13 @@ TEST(DDim, Equality) {
ddim[0] = 6; ddim[0] = 6;
EXPECT_EQ(ddim[0], 6); EXPECT_EQ(ddim[0], 6);
// construct a DDim from a vector
std::vector<int64_t> vec({9, 1, 5});
phi::DDim vddim = phi::make_ddim(vec);
EXPECT_EQ(vddim[0], 9);
EXPECT_EQ(vddim[1], 1);
EXPECT_EQ(vddim[2], 5);
// vectorize a DDim // vectorize a DDim
std::vector<int64_t> res_vec = phi::vectorize(vddim); std::vector<int64_t> res_vec = phi::vectorize(vddim);
EXPECT_EQ(res_vec[0], 9); EXPECT_EQ(res_vec[0], 9);
...@@ -51,37 +83,45 @@ TEST(DDim, Equality) { ...@@ -51,37 +83,45 @@ TEST(DDim, Equality) {
EXPECT_EQ(res_vec[1], 2); EXPECT_EQ(res_vec[1], 2);
EXPECT_EQ(res_vec[2], 1); EXPECT_EQ(res_vec[2], 1);
// arity of a DDim
EXPECT_EQ(phi::arity(ddim), 3);
EXPECT_EQ(ddim.size(), 3);
// product of a DDim // product of a DDim
EXPECT_EQ(phi::product(vddim), 45); EXPECT_EQ(phi::product(vddim), 45);
EXPECT_EQ(phi::product(phi::make_ddim({3, 2, 5, 3})), 90); EXPECT_EQ(phi::product(phi::make_ddim({3, 2, 5, 3})), 90);
// slice a DDim // slice a DDim
phi::DDim ddim2 = phi::make_ddim({1, 2, 3, 4, 5, 6}); phi::DDim ddim2 = phi::make_ddim({1, 2, 3, 4, 5, 6});
phi::DDim ss = phi::slice_ddim(ddim2, 2, 5); phi::DDim slice_dim1 = phi::slice_ddim(ddim2, 2, 5);
EXPECT_EQ(arity(ss), 3); EXPECT_EQ(arity(slice_dim1), 3);
EXPECT_EQ(ss[0], 3); EXPECT_EQ(slice_dim1[0], 3);
EXPECT_EQ(ss[1], 4); EXPECT_EQ(slice_dim1[1], 4);
EXPECT_EQ(ss[2], 5); EXPECT_EQ(slice_dim1[2], 5);
phi::DDim ss2 = phi::slice_ddim(ddim2, 0, 6);
EXPECT_EQ(arity(ss2), 6); phi::DDim slice_dim2 = phi::slice_ddim(ddim2, 0, 6);
EXPECT_EQ(ss2[0], 1); EXPECT_EQ(arity(slice_dim2), 6);
EXPECT_EQ(ss2[1], 2); EXPECT_EQ(slice_dim2[0], 1);
EXPECT_EQ(ss2[2], 3); EXPECT_EQ(slice_dim2[1], 2);
EXPECT_EQ(ss2[3], 4); EXPECT_EQ(slice_dim2[2], 3);
EXPECT_EQ(ss2[4], 5); EXPECT_EQ(slice_dim2[3], 4);
EXPECT_EQ(ss2[5], 6); EXPECT_EQ(slice_dim2[4], 5);
EXPECT_EQ(slice_dim2[5], 6);
phi::DDim slice_dim3 = phi::slice_ddim(ddim2, 1, 1);
EXPECT_EQ(arity(slice_dim3), 0);
EXPECT_EQ(slice_dim3.size(), 0);
EXPECT_EQ(phi::product(slice_dim3), 1);
} }
TEST(DDim, Print) { TEST(DDim, Print) {
// print a DDim // print a DDim
std::stringstream ss; std::stringstream ss1;
phi::DDim ddim = phi::make_ddim({2, 3, 4}); phi::DDim ddim = phi::make_ddim({2, 3, 4});
ss << ddim; ss1 << ddim;
EXPECT_EQ("2, 3, 4", ss.str()); EXPECT_EQ("2, 3, 4", ss1.str());
// print a zero-DDim
std::stringstream ss2;
phi::DDim zero_ddim = phi::make_ddim({});
ss2 << zero_ddim;
EXPECT_EQ("", ss2.str());
} }
} // namespace tests } // namespace tests
......
...@@ -688,8 +688,10 @@ class HybridParallelInferenceHelper(object): ...@@ -688,8 +688,10 @@ class HybridParallelInferenceHelper(object):
}) })
else: else:
var_shape = list(var.shape) var_shape = list(var.shape)
var_shape[0] = self.micro_batch_size if var_shape[ print(var_name)
0] < 0 else var_shape[0] if len(var.shape) > 0:
var_shape[0] = self.micro_batch_size if var_shape[
0] < 0 else var_shape[0]
block._insert_op_without_sync( block._insert_op_without_sync(
index=index, index=index,
type='recv_v2', type='recv_v2',
......
...@@ -462,6 +462,7 @@ def convert_len(var): ...@@ -462,6 +462,7 @@ def convert_len(var):
`shape_op` in var.block. `shape_op` in var.block.
""" """
if isinstance(var, Variable): if isinstance(var, Variable):
assert var.ndim > 0, "len() of a 0D tensor is wrong"
if var.type in [ if var.type in [
core.VarDesc.VarType.LOD_TENSOR, core.VarDesc.VarType.LOD_TENSOR,
core.VarDesc.VarType.SELECTED_ROWS core.VarDesc.VarType.SELECTED_ROWS
......
...@@ -144,6 +144,7 @@ def monkey_patch_math_varbase(): ...@@ -144,6 +144,7 @@ def monkey_patch_math_varbase():
return int(var.numpy().flatten()[0]) return int(var.numpy().flatten()[0])
def _len_(var): def _len_(var):
assert var.ndim > 0, "len() of a 0D tensor is wrong"
if var.type == core.VarDesc.VarType.VOCAB: if var.type == core.VarDesc.VarType.VOCAB:
return len(var.value().get_map_tensor()) return len(var.value().get_map_tensor())
elif var.type == core.VarDesc.VarType.STRINGS: elif var.type == core.VarDesc.VarType.STRINGS:
......
...@@ -208,6 +208,30 @@ OP_NAMEMAPPING = { ...@@ -208,6 +208,30 @@ OP_NAMEMAPPING = {
} }
def _get_reduce_dim(dim, input):
"""
Internal function for reduce_sum, reduce_mean, reduce_max, reduce_min, reduce_prod.
It computes the attribute reduce_all value based on axis.
"""
if dim is not None and not isinstance(dim, list):
if isinstance(dim, (tuple, range)):
dim = list(dim)
elif isinstance(dim, int):
dim = [dim]
else:
raise TypeError(
"The type of dim must be int, list, tuple or range, but received {}"
.format(type(axis)))
if dim is None:
dim = []
if dim == [] or len(dim) == len(input.shape):
reduce_all = True
else:
reduce_all = False
return reduce_all, dim
@dygraph_only @dygraph_only
def _elementwise_op_in_dygraph(x, def _elementwise_op_in_dygraph(x,
y, y,
...@@ -4689,29 +4713,14 @@ def reduce_sum(input, dim=None, keep_dim=False, name=None): ...@@ -4689,29 +4713,14 @@ def reduce_sum(input, dim=None, keep_dim=False, name=None):
if dim is not None and not isinstance(dim, list): if dim is not None and not isinstance(dim, list):
dim = [dim] dim = [dim]
reduce_all, dim = _get_reduce_dim(dim, input)
if in_dygraph_mode(): if in_dygraph_mode():
reduce_all = True if dim == None or dim == [] or len(dim) == len( return _C_ops.sum(input, dim, None, keep_dim)
input.shape) else False
dim = dim if dim != None and dim != [] else [0]
if reduce_all:
return _C_ops.sum(input, [], None, keep_dim)
else:
return _C_ops.sum(input, dim, None, keep_dim)
elif _in_legacy_dygraph(): elif _in_legacy_dygraph():
reduce_all = True if dim == None or dim == [] or len(dim) == len(
input.shape) else False
dim = dim if dim != None and dim != [] else [0]
return _legacy_C_ops.reduce_sum(input, 'dim', dim, 'keep_dim', keep_dim, return _legacy_C_ops.reduce_sum(input, 'dim', dim, 'keep_dim', keep_dim,
'reduce_all', reduce_all) 'reduce_all', reduce_all)
attrs = { attrs = {'dim': dim, 'keep_dim': keep_dim, 'reduce_all': reduce_all}
'dim':
dim if dim != None and dim != [] else [0],
'keep_dim':
keep_dim,
'reduce_all':
True
if dim == None or dim == [] or len(dim) == len(input.shape) else False
}
check_variable_and_dtype( check_variable_and_dtype(
input, 'input', ['float16', 'float32', 'float64', 'int32', 'int64'], input, 'input', ['float16', 'float32', 'float64', 'int32', 'int64'],
'reduce_sum') 'reduce_sum')
......
...@@ -363,9 +363,6 @@ def get_shape_tensor_inputs(inputs, attrs, shape, op_type): ...@@ -363,9 +363,6 @@ def get_shape_tensor_inputs(inputs, attrs, shape, op_type):
shape = cast(shape, 'int32') shape = cast(shape, 'int32')
inputs["ShapeTensor"] = shape inputs["ShapeTensor"] = shape
elif isinstance(shape, (list, tuple)): elif isinstance(shape, (list, tuple)):
assert len(shape) > 0, ("The size of 'shape' in" + op_type +
" can't be zero, "
"but received %s." % len(shape))
attrs["shape"] = _get_attr_shape(shape) attrs["shape"] = _get_attr_shape(shape)
if _contain_var(shape): if _contain_var(shape):
inputs['ShapeTensorList'] = _get_shape_tensor(shape) inputs['ShapeTensorList'] = _get_shape_tensor(shape)
......
...@@ -82,6 +82,7 @@ class TestHybridParallelInferenceHelperClass(unittest.TestCase): ...@@ -82,6 +82,7 @@ class TestHybridParallelInferenceHelperClass(unittest.TestCase):
value=0, value=0,
force_cpu=False, force_cpu=False,
name="cond_int") name="cond_int")
print(cond_int.shape)
cond = layers.less_than(x=step_idx, y=max_len) cond = layers.less_than(x=step_idx, y=max_len)
while_op = layers.While(cond, is_test=True) while_op = layers.While(cond, is_test=True)
......
...@@ -82,6 +82,7 @@ def len_with_selected_rows(place): ...@@ -82,6 +82,7 @@ def len_with_selected_rows(place):
# create selected_rows variable # create selected_rows variable
var = block.create_var(name="X", var = block.create_var(name="X",
dtype="float32", dtype="float32",
shape=[-1],
persistable=True, persistable=True,
type=fluid.core.VarDesc.VarType.SELECTED_ROWS) type=fluid.core.VarDesc.VarType.SELECTED_ROWS)
# y is Variable(SelectedRows) # y is Variable(SelectedRows)
......
...@@ -505,6 +505,7 @@ class OpTest(unittest.TestCase): ...@@ -505,6 +505,7 @@ class OpTest(unittest.TestCase):
else: else:
tensor.set(self.inputs[var_name], place) tensor.set(self.inputs[var_name], place)
feed_map[var_name] = tensor feed_map[var_name] = tensor
return feed_map return feed_map
def _append_ops(self, block): def _append_ops(self, block):
...@@ -1136,6 +1137,7 @@ class OpTest(unittest.TestCase): ...@@ -1136,6 +1137,7 @@ class OpTest(unittest.TestCase):
continue continue
else: else:
grad_feed_map[arg] = fwd_outs[i]._copy(p) grad_feed_map[arg] = fwd_outs[i]._copy(p)
return grad_feed_map return grad_feed_map
def _get_need_run_ops(self, op_desc, fwd_op_desc=None): def _get_need_run_ops(self, op_desc, fwd_op_desc=None):
...@@ -1254,6 +1256,7 @@ class OpTest(unittest.TestCase): ...@@ -1254,6 +1256,7 @@ class OpTest(unittest.TestCase):
build_strategy=build_strategy, build_strategy=build_strategy,
places=place) places=place)
program = compiled_program program = compiled_program
outs = exe.run(program, outs = exe.run(program,
feed=grad_feed_map, feed=grad_feed_map,
fetch_list=grad_fetch_list, fetch_list=grad_fetch_list,
...@@ -1290,6 +1293,7 @@ class OpTest(unittest.TestCase): ...@@ -1290,6 +1293,7 @@ class OpTest(unittest.TestCase):
fwd_res, fwd_res,
grad_op_desc, grad_op_desc,
enable_inplace=True) enable_inplace=True)
self._compare_expect_and_actual_outputs(place, self._compare_expect_and_actual_outputs(place,
expect_res[1], expect_res[1],
expect_res[0], expect_res[0],
...@@ -1457,7 +1461,7 @@ class OpTest(unittest.TestCase): ...@@ -1457,7 +1461,7 @@ class OpTest(unittest.TestCase):
# NOTE(zhiqiu): np.allclose([], [1.]) returns True # NOTE(zhiqiu): np.allclose([], [1.]) returns True
# see details: https://stackoverflow.com/questions/38331703/why-does-numpys-broadcasting-sometimes-allow-comparing-arrays-of-different-leng # see details: https://stackoverflow.com/questions/38331703/why-does-numpys-broadcasting-sometimes-allow-comparing-arrays-of-different-leng
if expect_np.size == 0: if expect_np.size == 0:
self.op_test.assertTrue(actual_np.size == 0) # }}} self.op_test.assertTrue(actual_np.size == 0)
self._compare_numpy(name, actual_np, expect_np) self._compare_numpy(name, actual_np, expect_np)
if isinstance(expect, tuple): if isinstance(expect, tuple):
self._compare_list(name, actual, expect) self._compare_list(name, actual, expect)
...@@ -1663,7 +1667,6 @@ class OpTest(unittest.TestCase): ...@@ -1663,7 +1667,6 @@ class OpTest(unittest.TestCase):
if check_dygraph: if check_dygraph:
# always enable legacy dygraph # always enable legacy dygraph
g_enable_legacy_dygraph() g_enable_legacy_dygraph()
dygraph_checker = DygraphChecker(self, self.outputs) dygraph_checker = DygraphChecker(self, self.outputs)
dygraph_checker.check() dygraph_checker.check()
dygraph_outs = dygraph_checker.outputs dygraph_outs = dygraph_checker.outputs
...@@ -1830,15 +1833,29 @@ class OpTest(unittest.TestCase): ...@@ -1830,15 +1833,29 @@ class OpTest(unittest.TestCase):
# Therefore, it asserts np.abs(a - b) / (np.abs(a)*1e4) < max_relative_error, # Therefore, it asserts np.abs(a - b) / (np.abs(a)*1e4) < max_relative_error,
# which is the same as np.abs(a - b) / np.abs(a) < max_relative_error*1e4. # which is the same as np.abs(a - b) / np.abs(a) < max_relative_error*1e4.
abs_a = np.abs(a) abs_a = np.abs(a)
if self.dtype == np.float64 and \ if abs_a.ndim > 0:
self.op_type not in op_threshold_white_list.NEED_FIX_FP64_CHECK_GRAD_THRESHOLD_OP_LIST: if self.dtype == np.float64 and \
abs_a[abs_a < 1e-10] = 1e-3 self.op_type not in op_threshold_white_list.NEED_FIX_FP64_CHECK_GRAD_THRESHOLD_OP_LIST:
abs_a[np.logical_and(abs_a > 1e-10, abs_a <= 1e-8)] *= 1e4 abs_a[abs_a < 1e-10] = 1e-3
abs_a[np.logical_and(abs_a > 1e-8, abs_a <= 1e-6)] *= 1e2 abs_a[np.logical_and(abs_a > 1e-10, abs_a <= 1e-8)] *= 1e4
elif self.is_bfloat16_op(): abs_a[np.logical_and(abs_a > 1e-8, abs_a <= 1e-6)] *= 1e2
abs_a[abs_a < 1e-2] = 1 elif self.is_bfloat16_op():
else: abs_a[abs_a < 1e-2] = 1
abs_a[abs_a < 1e-3] = 1 else:
abs_a[abs_a < 1e-3] = 1
elif abs_a.ndim == 0:
if self.dtype == np.float64 and \
self.op_type not in op_threshold_white_list.NEED_FIX_FP64_CHECK_GRAD_THRESHOLD_OP_LIST:
if abs_a < 1e-10:
abs_a = 1e-3
elif abs_a > 1e-10 and abs_a <= 1e-8:
abs_a = abs_a * 1e4
elif abs_a > 1e-8 and abs_a <= 1e-6:
abs_a = abs_a * 1e2
elif self.is_bfloat16_op():
abs_a = 1 if abs_a < 1e-2 else abs_a
else:
abs_a = 1 if abs_a < 1e-3 else abs_a
diff_mat = np.abs(a - b) / abs_a diff_mat = np.abs(a - b) / abs_a
max_diff = np.max(diff_mat) max_diff = np.max(diff_mat)
...@@ -1958,7 +1975,9 @@ class OpTest(unittest.TestCase): ...@@ -1958,7 +1975,9 @@ class OpTest(unittest.TestCase):
tensor_to_check = self.scope.find_var(input_to_check).get_tensor() tensor_to_check = self.scope.find_var(input_to_check).get_tensor()
tensor_size = six.moves.reduce(lambda a, b: a * b, tensor_size = six.moves.reduce(lambda a, b: a * b,
tensor_to_check.shape(), 1) tensor_to_check.shape(), 1)
if tensor_size < 100: tensor_ndim = len(tensor_to_check.shape())
# for 0D Tensor, it's additional case for OP, so not raise error
if tensor_ndim > 0 and tensor_size < 100:
self.__class__.input_shape_is_large = False self.__class__.input_shape_is_large = False
if not type(output_names) is list: if not type(output_names) is list:
......
...@@ -437,12 +437,6 @@ class TestFillConstantOpError(unittest.TestCase): ...@@ -437,12 +437,6 @@ class TestFillConstantOpError(unittest.TestCase):
self.assertRaises(TypeError, test_shape_type) self.assertRaises(TypeError, test_shape_type)
# The argument shape's size of fill_constant_op must not be 0.
def test_shape_size():
fluid.layers.fill_constant(shape=[], dtype="float32", value=1)
self.assertRaises(AssertionError, test_shape_size)
# The shape dtype of fill_constant_op must be int32 or int64. # The shape dtype of fill_constant_op must be int32 or int64.
def test_shape_tensor_dtype(): def test_shape_tensor_dtype():
shape = fluid.data(name="shape_tensor", shape = fluid.data(name="shape_tensor",
......
...@@ -175,12 +175,6 @@ class TestFullOpError(unittest.TestCase): ...@@ -175,12 +175,6 @@ class TestFullOpError(unittest.TestCase):
self.assertRaises(TypeError, test_shape_type) self.assertRaises(TypeError, test_shape_type)
# The argument shape's size of full_op must not be 0.
def test_shape_size():
paddle.full(shape=[], dtype="float32", fill_value=1)
self.assertRaises(AssertionError, test_shape_size)
# The shape dtype of full op must be int32 or int64. # The shape dtype of full op must be int32 or int64.
def test_shape_tensor_dtype(): def test_shape_tensor_dtype():
shape = fluid.data(name="shape_tensor", shape = fluid.data(name="shape_tensor",
......
...@@ -30,8 +30,8 @@ class TestMseLoss(unittest.TestCase): ...@@ -30,8 +30,8 @@ class TestMseLoss(unittest.TestCase):
sub = input_val - label_val sub = input_val - label_val
np_result = np.mean(sub * sub) np_result = np.mean(sub * sub)
input_var = layers.create_tensor(dtype="float32", name="input") input_var = fluid.data(name="input", shape=[-1, 3], dtype="float32")
label_var = layers.create_tensor(dtype="float32", name="label") label_var = fluid.data(name="label", shape=[-1, 3], dtype="float32")
output = layers.mse_loss(input=input_var, label=label_var) output = layers.mse_loss(input=input_var, label=label_var)
for use_cuda in ([False, True] for use_cuda in ([False, True]
...@@ -54,7 +54,7 @@ class TestMseInvalidInput(unittest.TestCase): ...@@ -54,7 +54,7 @@ class TestMseInvalidInput(unittest.TestCase):
def test_invalid_input(): def test_invalid_input():
input = [256, 3] input = [256, 3]
label = fluid.data(name='label', shape=[None, 3], dtype='float32') label = fluid.data(name='label1', shape=[None, 3], dtype='float32')
loss = fluid.layers.mse_loss(input, label) loss = fluid.layers.mse_loss(input, label)
self.assertRaises(TypeError, test_invalid_input) self.assertRaises(TypeError, test_invalid_input)
......
...@@ -75,9 +75,6 @@ class TestRandnOpError(unittest.TestCase): ...@@ -75,9 +75,6 @@ class TestRandnOpError(unittest.TestCase):
def test_error(self): def test_error(self):
with program_guard(Program(), Program()): with program_guard(Program(), Program()):
# The argument shape's size of randn_op should not be 0.
self.assertRaises(AssertionError, paddle.randn, [])
# The argument shape's type of randn_op should be list or tuple. # The argument shape's type of randn_op should be list or tuple.
self.assertRaises(TypeError, paddle.randn, 1) self.assertRaises(TypeError, paddle.randn, 1)
......
...@@ -23,6 +23,8 @@ from paddle.fluid.executor import Executor ...@@ -23,6 +23,8 @@ from paddle.fluid.executor import Executor
from paddle.fluid.framework import Program, program_guard from paddle.fluid.framework import Program, program_guard
from paddle.fluid.layers.control_flow import select_input, select_output from paddle.fluid.layers.control_flow import select_input, select_output
paddle.enable_static()
class TestSplitMergeSelectedVarOps(unittest.TestCase): class TestSplitMergeSelectedVarOps(unittest.TestCase):
...@@ -37,7 +39,9 @@ class TestSplitMergeSelectedVarOps(unittest.TestCase): ...@@ -37,7 +39,9 @@ class TestSplitMergeSelectedVarOps(unittest.TestCase):
outputs = [] outputs = []
for i in range(branch_num): for i in range(branch_num):
out = program.current_block().create_var( out = program.current_block().create_var(
dtype='float32', type=core.VarDesc.VarType.LOD_TENSOR) dtype='float32',
shape=[2],
type=core.VarDesc.VarType.LOD_TENSOR)
outputs.append(out) outputs.append(out)
select_output(x, outputs, mask) select_output(x, outputs, mask)
......
...@@ -23,7 +23,6 @@ from paddle.fluid.layer_helper import LayerHelper ...@@ -23,7 +23,6 @@ from paddle.fluid.layer_helper import LayerHelper
from functools import reduce from functools import reduce
from paddle.fluid.framework import _test_eager_guard from paddle.fluid.framework import _test_eager_guard
class TestSetValueBase(unittest.TestCase): class TestSetValueBase(unittest.TestCase):
def setUp(self): def setUp(self):
...@@ -1442,7 +1441,6 @@ class TestGradientTruncated(unittest.TestCase): ...@@ -1442,7 +1441,6 @@ class TestGradientTruncated(unittest.TestCase):
# When `input.stop_gradient = True` and `value.stop_gradient = False`, # When `input.stop_gradient = True` and `value.stop_gradient = False`,
# set_value_grad_op will not be run during backward. # set_value_grad_op will not be run during backward.
y, value = op(x) y, value = op(x)
y2 = y + 1 y2 = y + 1
loss = paddle.fluid.layers.reduce_sum(y2) loss = paddle.fluid.layers.reduce_sum(y2)
sgd = paddle.optimizer.Adam() sgd = paddle.optimizer.Adam()
......
# Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import paddle
import paddle.fluid as fluid
import numpy as np
import unittest
unary_api_list = [
paddle.nn.functional.elu,
paddle.nn.functional.gelu,
paddle.nn.functional.hardsigmoid,
paddle.nn.functional.hardswish,
paddle.nn.functional.leaky_relu,
paddle.nn.functional.log_sigmoid,
paddle.nn.functional.relu,
paddle.nn.functional.relu6,
paddle.nn.functional.sigmoid,
paddle.nn.functional.softplus,
paddle.nn.functional.softshrink,
paddle.nn.functional.softsign,
paddle.nn.functional.swish,
paddle.nn.functional.tanhshrink,
paddle.nn.functional.thresholded_relu,
paddle.stanh,
paddle.nn.functional.celu,
paddle.nn.functional.mish,
paddle.nn.functional.silu,
paddle.nn.functional.tanh,
paddle.cosh,
paddle.sinh,
paddle.abs,
paddle.acos,
paddle.asin,
paddle.atan,
paddle.ceil,
paddle.cos,
paddle.exp,
paddle.floor,
paddle.log,
paddle.log1p,
paddle.reciprocal,
paddle.round,
paddle.sin,
paddle.sqrt,
paddle.square,
paddle.tanh,
paddle.acosh,
paddle.asinh,
paddle.atanh,
paddle.expm1,
paddle.log10,
paddle.log2,
paddle.tan,
]
# Use to test zero-dim in the whole API
class TestUnaryAPI(unittest.TestCase):
def test_dygraph_unary(self):
paddle.disable_static()
fluid.set_flags({"FLAGS_retain_grad_for_all_tensor": True})
for api in unary_api_list:
x = paddle.rand([])
x.stop_gradient = False
out = api(x)
out.backward()
self.assertEqual(x.shape, [])
self.assertEqual(out.shape, [])
self.assertEqual(x.grad.shape, [])
self.assertEqual(out.grad.shape, [])
paddle.enable_static()
def test_static_unary(self):
paddle.enable_static()
for api in unary_api_list:
main_prog = fluid.Program()
with fluid.program_guard(main_prog, fluid.Program()):
x = paddle.rand([])
x.stop_gradient = False
out = api(x)
fluid.backward.append_backward(out)
# ScaleLossGradOp / append_backward always set grad shape to [1]
prog = paddle.static.default_main_program()
block = prog.global_block()
x_grad = block.var(fluid.framework.grad_var_name(x.name))
out_grad = block.var(fluid.framework.grad_var_name(out.name))
# Test compile shape, grad is always [1]
self.assertEqual(x.shape, ())
self.assertEqual(out.shape, ())
exe = fluid.Executor()
result = exe.run(main_prog,
fetch_list=[x, out, x_grad, out_grad])
# Test runtime shape
self.assertEqual(result[0].shape, ())
self.assertEqual(result[1].shape, ())
self.assertEqual(result[3].shape, (1, ))
# 0D will be stacked when 1+ place, due to it cannot be concated
# for 1 place: [ x-place1 ]
# for 1+ place: [ paddle.stack([x-place1, x_place2...]) ]
if paddle.device.is_compiled_with_cuda():
places = [paddle.CUDAPlace(0)]
device_num = 1
expect_shape = ()
else:
places = [paddle.CPUPlace()] * 4
device_num = 4
expect_shape = (device_num, )
compiled_program = fluid.CompiledProgram(
main_prog).with_data_parallel(out.name, places=places)
result = exe.run(compiled_program,
fetch_list=[x, out, x_grad, out_grad],
return_merged=True)
# Test runtime parallel shape
self.assertEqual(result[0].shape, expect_shape)
self.assertEqual(result[1].shape, expect_shape)
self.assertEqual(result[3].shape, (device_num, ))
compiled_program = fluid.CompiledProgram(
main_prog).with_data_parallel(out.name, places=places)
result = exe.run(compiled_program,
fetch_list=[x, out, x_grad, out_grad],
return_merged=False)
# [[x-place1, x-place2, ...], [], [], ...]
self.assertEqual(np.array(result[0]).shape, (device_num, ))
self.assertEqual(np.array(result[1]).shape, (device_num, ))
self.assertEqual(np.array(result[3]).shape, (device_num, 1))
paddle.disable_static()
if __name__ == "__main__":
unittest.main()
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册