提交 259858b4 编写于 作者: C chengduoZH

modify doc

上级 578d60bf
...@@ -49,6 +49,7 @@ class MatMulFunctor { ...@@ -49,6 +49,7 @@ class MatMulFunctor {
"The dimensions of X and Y must be the same, and both of " "The dimensions of X and Y must be the same, and both of "
"them should be %d-dimensional.", "them should be %d-dimensional.",
dim_b.size()); dim_b.size());
// The previous Rank-2 dimensions are accumulated on the batch_count.
for (int j = 0; j < dim_a.size() - 2; ++j) { for (int j = 0; j < dim_a.size() - 2; ++j) {
PADDLE_ENFORCE(dim_b[j] == dim_a[j], PADDLE_ENFORCE(dim_b[j] == dim_a[j],
"The dimensions of X[%d] and Y[%d] must be the same.", j, "The dimensions of X[%d] and Y[%d] must be the same.", j,
......
...@@ -49,6 +49,8 @@ class MatMulOp : public framework::OperatorWithKernel { ...@@ -49,6 +49,8 @@ class MatMulOp : public framework::OperatorWithKernel {
"The dimensions of X and Y must be the same, and both of " "The dimensions of X and Y must be the same, and both of "
"them should be %d-dimensional.", "them should be %d-dimensional.",
dim_x.size()); dim_x.size());
// The previous Rank-2 dimensions are accumulated on the batch_count.
for (int j = 0; j < dim_x.size() - 2; ++j) { for (int j = 0; j < dim_x.size() - 2; ++j) {
PADDLE_ENFORCE(dim_y[j] == dim_x[j], PADDLE_ENFORCE(dim_y[j] == dim_x[j],
"The dimensions of X[%d] and Y[%d] must be the same.", j, "The dimensions of X[%d] and Y[%d] must be the same.", j,
...@@ -185,10 +187,14 @@ Examples without transpose: ...@@ -185,10 +187,14 @@ Examples without transpose:
- X: [B, M, K], Y: [K] => Out: [B, M] - X: [B, M, K], Y: [K] => Out: [B, M]
- X: [M, K], Y: [B, K, N] => Out: [B, M, N] - X: [M, K], Y: [B, K, N] => Out: [B, M, N]
- X: [B, M, K], Y: [B, K, N] => Out: [B, M, N] - X: [B, M, K], Y: [B, K, N] => Out: [B, M, N]
- X: [B, ..., M, K], Y: [B, ..., K, N] => Out: [B, ..., M, N]
The behavior is designed to be similar to the `numpy.matmul` function. The behavior is designed to be similar to the `numpy.matmul` function.
The differences are: The differences are:
- Currently only rank 1 to rank 3 input tensors are supported. - When the rank of the input is greater than 3, the rank of X and
Y must be equal, and the former rank-2 dimensions are equal.
- When the rank of the input data is less than or equal to 3, it
is similar to the `numpy.matmul` function.
- We add `transpose_X` and `transpose_Y` flags. - We add `transpose_X` and `transpose_Y` flags.
Both the input `X` and `Y` can carry the LoD (Level of Details) information, Both the input `X` and `Y` can carry the LoD (Level of Details) information,
......
...@@ -138,7 +138,7 @@ class MatMulGradKernel : public framework::OpKernel<T> { ...@@ -138,7 +138,7 @@ class MatMulGradKernel : public framework::OpKernel<T> {
} }
int batch_count = 0; int batch_count = 0;
// // The previous Rank-2 dimensions are accumulated on the batch_count.
if (x_dims.size() > 3) { if (x_dims.size() > 3) {
batch_count = accumulate(x_dims.begin(), x_dims.end() - 2, 1, batch_count = accumulate(x_dims.begin(), x_dims.end() - 2, 1,
std::multiplies<int>()); std::multiplies<int>());
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册