未验证 提交 700bc8cd 编写于 作者: 小飞猪 提交者: GitHub

[xdoctest][task 144-149] reformat example code with google style in `text/datasets/*` (#56579)

* [Doctest] fix No.144-149, test=docs_preview

* fix timeout
上级 e43f93d0
...@@ -67,28 +67,39 @@ class Conll05st(Dataset): ...@@ -67,28 +67,39 @@ class Conll05st(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> import paddle
from paddle.text.datasets import Conll05st >>> from paddle.text.datasets import Conll05st
class SimpleNet(paddle.nn.Layer): >>> class SimpleNet(paddle.nn.Layer):
def __init__(self): ... def __init__(self):
super().__init__() ... super().__init__()
...
def forward(self, pred_idx, mark, label): ... def forward(self, pred_idx, mark, label):
return paddle.sum(pred_idx), paddle.sum(mark), paddle.sum(label) ... return paddle.sum(pred_idx), paddle.sum(mark), paddle.sum(label)
conll05st = Conll05st() >>> conll05st = Conll05st()
for i in range(10): >>> for i in range(10):
pred_idx, mark, label= conll05st[i][-3:] ... pred_idx, mark, label= conll05st[i][-3:]
pred_idx = paddle.to_tensor(pred_idx) ... pred_idx = paddle.to_tensor(pred_idx)
mark = paddle.to_tensor(mark) ... mark = paddle.to_tensor(mark)
label = paddle.to_tensor(label) ... label = paddle.to_tensor(label)
...
model = SimpleNet() ... model = SimpleNet()
pred_idx, mark, label= model(pred_idx, mark, label) ... pred_idx, mark, label= model(pred_idx, mark, label)
print(pred_idx, mark, label) ... print(pred_idx.item(), mark.item(), label.item())
>>> # doctest: +SKIP('label will change')
65840 5 1991
92560 5 3686
99120 5 457
121960 5 3945
4774 5 2378
14973 5 1938
36921 5 1090
26908 5 2329
62965 5 2968
97755 5 2674
""" """
...@@ -334,10 +345,11 @@ class Conll05st(Dataset): ...@@ -334,10 +345,11 @@ class Conll05st(Dataset):
.. code-block:: python .. code-block:: python
from paddle.text.datasets import Conll05st >>> from paddle.text.datasets import Conll05st
>>> conll05st = Conll05st()
>>> word_dict, predicate_dict, label_dict = conll05st.get_dict()
conll05st = Conll05st()
word_dict, predicate_dict, label_dict = conll05st.get_dict()
""" """
return self.word_dict, self.predicate_dict, self.label_dict return self.word_dict, self.predicate_dict, self.label_dict
...@@ -349,9 +361,10 @@ class Conll05st(Dataset): ...@@ -349,9 +361,10 @@ class Conll05st(Dataset):
.. code-block:: python .. code-block:: python
from paddle.text.datasets import Conll05st >>> from paddle.text.datasets import Conll05st
>>> conll05st = Conll05st()
>>> emb_file = conll05st.get_embedding()
conll05st = Conll05st()
emb_file = conll05st.get_embedding()
""" """
return self.emb_file return self.emb_file
...@@ -47,27 +47,38 @@ class Imdb(Dataset): ...@@ -47,27 +47,38 @@ class Imdb(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> # doctest: +TIMEOUT(75)
from paddle.text.datasets import Imdb >>> import paddle
>>> from paddle.text.datasets import Imdb
class SimpleNet(paddle.nn.Layer):
def __init__(self): >>> class SimpleNet(paddle.nn.Layer):
super().__init__() ... def __init__(self):
... super().__init__()
def forward(self, doc, label): ...
return paddle.sum(doc), label ... def forward(self, doc, label):
... return paddle.sum(doc), label
imdb = Imdb(mode='train')
>>> imdb = Imdb(mode='train')
for i in range(10):
doc, label = imdb[i] >>> for i in range(10):
doc = paddle.to_tensor(doc) ... doc, label = imdb[i]
label = paddle.to_tensor(label) ... doc = paddle.to_tensor(doc)
... label = paddle.to_tensor(label)
model = SimpleNet() ...
image, label = model(doc, label) ... model = SimpleNet()
print(doc.shape, label.shape) ... image, label = model(doc, label)
... print(doc.shape, label.shape)
[121] [1]
[115] [1]
[386] [1]
[471] [1]
[585] [1]
[206] [1]
[221] [1]
[324] [1]
[166] [1]
[598] [1]
""" """
......
...@@ -47,27 +47,37 @@ class Imikolov(Dataset): ...@@ -47,27 +47,37 @@ class Imikolov(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> import paddle
from paddle.text.datasets import Imikolov >>> from paddle.text.datasets import Imikolov
class SimpleNet(paddle.nn.Layer): >>> class SimpleNet(paddle.nn.Layer):
def __init__(self): ... def __init__(self):
super().__init__() ... super().__init__()
...
def forward(self, src, trg): ... def forward(self, src, trg):
return paddle.sum(src), paddle.sum(trg) ... return paddle.sum(src), paddle.sum(trg)
imikolov = Imikolov(mode='train', data_type='SEQ', window_size=2) >>> imikolov = Imikolov(mode='train', data_type='SEQ', window_size=2)
for i in range(10): >>> for i in range(10):
src, trg = imikolov[i] ... src, trg = imikolov[i]
src = paddle.to_tensor(src) ... src = paddle.to_tensor(src)
trg = paddle.to_tensor(trg) ... trg = paddle.to_tensor(trg)
...
model = SimpleNet() ... model = SimpleNet()
src, trg = model(src, trg) ... src, trg = model(src, trg)
print(src.shape, trg.shape) ... print(src.item(), trg.item())
2076 2075
2076 2075
675 674
4 3
464 463
2076 2075
865 864
2076 2075
2076 2075
1793 1792
""" """
......
...@@ -113,28 +113,39 @@ class Movielens(Dataset): ...@@ -113,28 +113,39 @@ class Movielens(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> # doctest: +TIMEOUT(75)
from paddle.text.datasets import Movielens >>> import paddle
>>> from paddle.text.datasets import Movielens
class SimpleNet(paddle.nn.Layer):
def __init__(self): >>> class SimpleNet(paddle.nn.Layer):
super().__init__() ... def __init__(self):
... super().__init__()
def forward(self, category, title, rating): ...
return paddle.sum(category), paddle.sum(title), paddle.sum(rating) ... def forward(self, category, title, rating):
... return paddle.sum(category), paddle.sum(title), paddle.sum(rating)
movielens = Movielens(mode='train')
>>> movielens = Movielens(mode='train')
for i in range(10):
category, title, rating = movielens[i][-3:] >>> for i in range(10):
category = paddle.to_tensor(category) ... category, title, rating = movielens[i][-3:]
title = paddle.to_tensor(title) ... category = paddle.to_tensor(category)
rating = paddle.to_tensor(rating) ... title = paddle.to_tensor(title)
... rating = paddle.to_tensor(rating)
model = SimpleNet() ...
category, title, rating = model(category, title, rating) ... model = SimpleNet()
print(category.shape, title.shape, rating.shape) ... category, title, rating = model(category, title, rating)
... print(category.shape, title.shape, rating.shape)
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
[] [] []
""" """
......
...@@ -58,28 +58,38 @@ class UCIHousing(Dataset): ...@@ -58,28 +58,38 @@ class UCIHousing(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> import paddle
from paddle.text.datasets import UCIHousing >>> from paddle.text.datasets import UCIHousing
class SimpleNet(paddle.nn.Layer): >>> class SimpleNet(paddle.nn.Layer):
def __init__(self): ... def __init__(self):
super().__init__() ... super().__init__()
...
def forward(self, feature, target): ... def forward(self, feature, target):
return paddle.sum(feature), target ... return paddle.sum(feature), target
paddle.disable_static() >>> paddle.disable_static()
uci_housing = UCIHousing(mode='train') >>> uci_housing = UCIHousing(mode='train')
for i in range(10): >>> for i in range(10):
feature, target = uci_housing[i] ... feature, target = uci_housing[i]
feature = paddle.to_tensor(feature) ... feature = paddle.to_tensor(feature)
target = paddle.to_tensor(target) ... target = paddle.to_tensor(target)
...
model = SimpleNet() ... model = SimpleNet()
feature, target = model(feature, target) ... feature, target = model(feature, target)
print(feature.numpy().shape, target.numpy()) ... print(feature.shape, target.numpy())
[] [24.]
[] [21.6]
[] [34.7]
[] [33.4]
[] [36.2]
[] [28.7]
[] [22.9]
[] [27.1]
[] [16.5]
[] [18.9]
""" """
......
...@@ -61,27 +61,37 @@ class WMT14(Dataset): ...@@ -61,27 +61,37 @@ class WMT14(Dataset):
.. code-block:: python .. code-block:: python
import paddle >>> import paddle
from paddle.text.datasets import WMT14 >>> from paddle.text.datasets import WMT14
class SimpleNet(paddle.nn.Layer): >>> class SimpleNet(paddle.nn.Layer):
def __init__(self): ... def __init__(self):
super().__init__() ... super().__init__()
...
def forward(self, src_ids, trg_ids, trg_ids_next): ... def forward(self, src_ids, trg_ids, trg_ids_next):
return paddle.sum(src_ids), paddle.sum(trg_ids), paddle.sum(trg_ids_next) ... return paddle.sum(src_ids), paddle.sum(trg_ids), paddle.sum(trg_ids_next)
wmt14 = WMT14(mode='train', dict_size=50) >>> wmt14 = WMT14(mode='train', dict_size=50)
for i in range(10): >>> for i in range(10):
src_ids, trg_ids, trg_ids_next = wmt14[i] ... src_ids, trg_ids, trg_ids_next = wmt14[i]
src_ids = paddle.to_tensor(src_ids) ... src_ids = paddle.to_tensor(src_ids)
trg_ids = paddle.to_tensor(trg_ids) ... trg_ids = paddle.to_tensor(trg_ids)
trg_ids_next = paddle.to_tensor(trg_ids_next) ... trg_ids_next = paddle.to_tensor(trg_ids_next)
...
model = SimpleNet() ... model = SimpleNet()
src_ids, trg_ids, trg_ids_next = model(src_ids, trg_ids, trg_ids_next) ... src_ids, trg_ids, trg_ids_next = model(src_ids, trg_ids, trg_ids_next)
print(src_ids.numpy(), trg_ids.numpy(), trg_ids_next.numpy()) ... print(src_ids.item(), trg_ids.item(), trg_ids_next.item())
91 38 39
123 81 82
556 229 230
182 26 27
447 242 243
116 110 111
403 288 289
258 221 222
136 34 35
281 136 137
""" """
...@@ -196,9 +206,10 @@ class WMT14(Dataset): ...@@ -196,9 +206,10 @@ class WMT14(Dataset):
.. code-block:: python .. code-block:: python
from paddle.text.datasets import WMT14 >>> from paddle.text.datasets import WMT14
wmt14 = WMT14(mode='train', dict_size=50) >>> wmt14 = WMT14(mode='train', dict_size=50)
src_dict, trg_dict = wmt14.get_dict() >>> src_dict, trg_dict = wmt14.get_dict()
""" """
src_dict, trg_dict = self.src_dict, self.trg_dict src_dict, trg_dict = self.src_dict, self.trg_dict
if reverse: if reverse:
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册