From 6a68dc07dce365abba2d1e43912119016be964eb Mon Sep 17 00:00:00 2001
From: liaogang <liaogang@baidu.com>
Date: Mon, 17 Apr 2017 14:47:48 +0800
Subject: [PATCH] add infer and save models

---
 02.recognize_digits/README.en.md      |  33 ++++++++++++++++++++++++-
 02.recognize_digits/README.md         |  34 +++++++++++++++++++++++++-
 02.recognize_digits/image/infer_3.png | Bin 0 -> 7346 bytes
 02.recognize_digits/index.en.html     |  33 ++++++++++++++++++++++++-
 02.recognize_digits/index.html        |  34 +++++++++++++++++++++++++-
 02.recognize_digits/train.py          |  26 +++++++++++++++++++-
 6 files changed, 155 insertions(+), 5 deletions(-)
 create mode 100644 02.recognize_digits/image/infer_3.png

diff --git a/02.recognize_digits/README.en.md b/02.recognize_digits/README.en.md
index 0dc9354..b01790a 100644
--- a/02.recognize_digits/README.en.md
+++ b/02.recognize_digits/README.en.md
@@ -131,6 +131,7 @@ PaddlePaddle provides a Python module, `paddle.dataset.mnist`, which downloads a
 A PaddlePaddle program starts from importing the API package:
 
 ```python
+import gzip
 import paddle.v2 as paddle
 ```
 
@@ -249,6 +250,10 @@ def event_handler_plot(event):
             cost_ploter.plot()
         step += 1
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         cost_ploter.append(test_title, step, result.cost)
@@ -265,6 +270,10 @@ def event_handler(event):
             print "Pass %d, Batch %d, Cost %f, %s" % (
                 event.pass_id, event.batch_id, event.cost, event.metrics)
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         print "Test with Pass %d, Cost %f, %s\n" % (
@@ -280,7 +289,7 @@ trainer.train(
             paddle.dataset.mnist.train(), buf_size=8192),
         batch_size=128),
     event_handler=event_handler_plot,
-    num_passes=100)
+    num_passes=5)
 ```
 
 During training, `trainer.train` invokes `event_handler` for certain events. This gives us a chance to print the training progress.
@@ -305,8 +314,30 @@ print 'The classification accuracy is %.2f%%' % (100 - float(best[2]) * 100)
 
 Usually, with MNIST data, the softmax regression model can get accuracy around 92.34%, MLP can get about 97.66%, and convolution network can get up to around 99.20%.  Convolution layers have been widely considered a great invention for image processsing.
 
+## Application
+
+After training is done, user can use the trained model to classify images. The following code shows how to inference MNIST images through `paddle.infer` interface.
+
+```python
+from PIL import Image
+import numpy as np
+def load_image(file):
+    im = Image.open(file).convert('L')
+    im = im.resize((28, 28), Image.ANTIALIAS)
+    im = np.array(im).astype(np.float32).flatten()
+    im = im / 255.0
+    return im
+test_data = []
+test_data.append((load_image('image/infer_3.png'),))
+
+probs = paddle.infer(
+    output_layer=predict, parameters=parameters, input=test_data)
+lab = np.argsort(-probs) # probs and lab are the results of one batch data
+print "Label of image/infer_3.png is: %d" % lab[0][0]
+```
 
 ## Conclusion
+
 This tutorial describes a few basic Deep Learning models viz. Softmax regression, Multilayer Perceptron Network and Convolutional Neural Network. The subsequent tutorials will derive more sophisticated models from these. So it is crucial to understand these models for future learning. When our model evolved from a simple softmax regression to slightly complex Convolutional Neural Network, the recognition accuracy on the MNIST data set achieved large improvement in accuracy. This is due to the Convolutional layers' local connections and parameter sharing. While learning new models in the future, we encourage the readers to understand the key ideas that lead a new model to improve results of an old one. Moreover, this tutorial introduced the basic flow of PaddlePaddle model design, starting with a dataprovider, model layer construction, to final training and prediction. Readers can leverage the flow used in this MNIST handwritten digit classification example and experiment with different data and network architectures to train models for classification tasks of their choice.
 
 ## References
diff --git a/02.recognize_digits/README.md b/02.recognize_digits/README.md
index b9cac63..dada65b 100644
--- a/02.recognize_digits/README.md
+++ b/02.recognize_digits/README.md
@@ -132,6 +132,7 @@ PaddlePaddle在API中提供了自动加载[MNIST](http://yann.lecun.com/exdb/mni
 首先，加载PaddlePaddle的V2 api包。
 
 ```python
+import gzip
 import paddle.v2 as paddle
 ```
 其次，定义三个不同的分类器：
@@ -254,6 +255,10 @@ def event_handler_plot(event):
             cost_ploter.plot()
         step += 1
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         cost_ploter.append(test_title, step, result.cost)
@@ -269,6 +274,10 @@ def event_handler(event):
             print "Pass %d, Batch %d, Cost %f, %s" % (
                 event.pass_id, event.batch_id, event.cost, event.metrics)
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         print "Test with Pass %d, Cost %f, %s\n" % (
@@ -284,7 +293,7 @@ trainer.train(
             paddle.dataset.mnist.train(), buf_size=8192),
         batch_size=128),
     event_handler=event_handler_plot,
-    num_passes=100)
+    num_passes=5)
 ```
 
 训练过程是完全自动的，event_handler里打印的日志类似如下所示：
@@ -300,6 +309,29 @@ trainer.train(
 
 训练之后，检查模型的预测准确度。用 MNIST 训练的时候，一般 softmax回归模型的分类准确率为约为 92.34%，多层感知器为97.66%，卷积神经网络可以达到 99.20%。
 
+
+## 应用模型
+
+可以使用训练好的模型对手写体数字图片进行分类，下面程序展示了如何使用paddle.infer接口进行推断。
+
+```python
+from PIL import Image
+import numpy as np
+def load_image(file):
+    im = Image.open(file).convert('L')
+    im = im.resize((28, 28), Image.ANTIALIAS)
+    im = np.array(im).astype(np.float32).flatten()
+    im = im / 255.0
+    return im
+test_data = []
+test_data.append((load_image('image/infer_3.png'),))
+
+probs = paddle.infer(
+    output_layer=predict, parameters=parameters, input=test_data)
+lab = np.argsort(-probs) # probs and lab are the results of one batch data
+print "Label of image/infer_3.png is: %d" % lab[0][0]
+```
+
 ## 总结
 
 本教程的softmax回归、多层感知器和卷积神经网络是最基础的深度学习模型，后续章节中复杂的神经网络都是从它们衍生出来的，因此这几个模型对之后的学习大有裨益。同时，我们也观察到从最简单的softmax回归变换到稍复杂的卷积神经网络的时候，MNIST数据集上的识别准确率有了大幅度的提升，原因是卷积层具有局部连接和共享权重的特性。在之后学习新模型的时候，希望大家也要深入到新模型相比原模型带来效果提升的关键之处。此外，本教程还介绍了PaddlePaddle模型搭建的基本流程，从dataprovider的编写、网络层的构建，到最后的训练和预测。对这个流程熟悉以后，大家就可以用自己的数据，定义自己的网络模型，并完成自己的训练和预测任务了。
diff --git a/02.recognize_digits/image/infer_3.png b/02.recognize_digits/image/infer_3.png
new file mode 100644
index 0000000000000000000000000000000000000000..030cd60d3b4af9aecd4941204da4ad15f6e1189f
GIT binary patch
literal 7346
zcmb_g2{={V*Wc%!JDBIWxP*w5A!Bh3nTZslLDxJF*N|jtB2tEW)k{TEl;M^+$q><?
zGD}5<iln;AREGQQOX_{z=X;*-|9#K5So{2}z4qGcx6VHM?1TQ2J_xwXj7*IHf&h>L
ze*k?5gcyc<xdUKn3FH6(OaP0B031Zn1?V7aeq$p<7NE;^3;^+70Q<{l2fQ)_Mq3`U
za>Zn0etTTZMt|e;3|IPRpkeJ95E2mV84xJ0vPltW=$l$%84;l@W9enc)g_wLmkdg<
zA7hy>PR!{?(}y{AO$`j3tZl4}Of3wTiEt{C0|R|ATmbm_hfr*c^~Lu%IEoX7;G7(Q
z9c%)C>=GQPXKii4h`D-Qj{m!v=~>PlbSf}n{Wkw+fZNqA*aecehVIU;!7hFfmjQqk
zatWk_0Dx<ScF98_fecK8n2!Pz1OU(A%jdCzg&5d*1#evT*==J0eRSb1VIz|%9sqDK
z@)r+t@qlqS7&$8XyL$OUd<kM57f-S)#BU(p=;s#zF((tmvd;gA<M9tnCOiL*NhW*z
z#w%RlNI3C!ui!vm^5Nw_{y!T(-%wbuWmyMXHcyI)4ZQNfy5;)>m@_aN#5MlTJFFn)
zf%uUZWb_Na@(eYxg_z+#;Sy{BYY7AZzyMeBc5{f=LM#yKW2^TIE0ZY@E&F43c!ikm
z{)L?>0XDzlW5WD>cQES9h;z!*&2$xCaSJxw1??~gOqjcuktxJ*rD4h<Ja^ke4D-Y^
zg?ZUAo&pYt+k$;|F>+wU8Hn&SVAz*^D4{ltoTZ?B%AI1w;0S$CA-`aVmgA$FT*%9F
z!L@+uhIsBafp$0+-QyO#hmp^64z6z74Izd(pssHIw!d;i;p)<7#AJ+(3-n!H>(C#)
z;^u42u){i|w}ZoWt&Z&oq3mYZVGYq?Z?YL<?K0+?2@J7j)CcB<#Q+On0JZ~h5DL{9
z1ORW~^?ago0{*qqV+6>60z7~lQ21q89bv!R;}6?iAOd^_{?I4*_c;CKUN;a1?Tf#y
zD`ORa`*LsC@(3UB0nXru6~XFYw_+_|s|!^btAW*A9VgDYnkU{6za4LaH^OgNwE!2G
zwJ%f(@cM6T=CIEVvZKJ(f0e_Zc(@O^cHA(o8#jpS19srua+F_8oxF}wRx|h=*%A!G
zXe(85gBAM+JM4OxwJKI0s}1vqxnl*eB0vGV1v1gYk{~x#XkD!yBkR!Lx&5i-YTZ};
z7+H(|gX1qdha89MuPmHbS;0HGT8V#0`P1VCT%niwzdg}YXeru)HlUBu8nhCKqjhK%
z+KS$1;9of#Emz0m_iQ%H74?A}yjFb_3lu*pF8uOeWk80#jQJUNAUMP=JOr*iU=R>^
znBwK(86vI+cVjnkQ-7CD8^x6smDB-X?ClI60KN+>@7ajJlRvhgdH^&N;l9AwR>c`!
zaQBx4;O++icxV3DB)`Gso&v!AHkVLJ*oq&Palru=zzLrUVIT%1fh^>s4Aj6@pbHFv
z8L$Gofde=IEA9#WV9tj?BsdD<z-jpQ`wL`%EN~6vgCbA@DnSis0L|bjXan8gHCz|(
z!6!fiGhiM;5CX!E@FKzp5s^mZ5oJUJ(LoFm3&aL-Kn@}vh(8jFL?XwL(?}YUfm}sy
zB6pCxNCWa1X-E2yA><?S4f%;dF>Dw<j3{P3W-~?uqlYoa?8fZJcwmAs5ttL0vzUvR
z984jm0@Hwbis{A-Vm@J}QGl|d0;mM4fNG!ys1@pnx}y{{8cjsg(HyiGt%mox6CFe+
z&>vVlmKQ6IRe)>L1Z#_R!3JTYu}RnrY(BOE+l1}J4q<87B^*0$ElwV%g)_zN!Fk{g
z;o@-VxEr`~+(Y=>yvNPp@pu8e3|<{RmkxMu{1JQ-{xY75ugACJNAS}G0zsG{PtYb<
z5y*rPLLA|5LLs4!&_Q@lm}6pPA~Gp688JCB`7<43N@u#oRLj)CG|Dv3%*8Ctti^1_
z?8<zYIhi?^xtjR}^Lyrb7H$?97HyW@EZ!_fSuU~^vpi&Z!}6V#m31AfChJaCFV<Mr
zi>$X<AF&Rx{$S%_lVdYr+s78lc9t!Vt)8uq?K?X=`+9a=c1QLQ_Ot9a*&Eph*ylKS
zIW}>aa=3EDaAa~+aCC5d;bi8N=G5anz!|}r&RNR&f^&k4nQJ|l0T-Donk$p*E>|zt
zG&e7|61Nq%A9oV>E$+wMV>|?&^*n|=t~@7ruJJVTjPRnolDr1IF1*Kib9o=~zURa9
z$?%!-dGnp-E8=_3N8{(=-@<RlAI_i2f1iI)02Np-U@G7%kStIl&?E3uP*hM)&`mHw
zuvoA|a8_uIkgkxMP@)i3s9Wf#u(+_Hu#a%6aHVj+2v$T+WT(g>kt-q(MJCqpt=YQ9
zWliFmk~Oc^V%Ey7wOM;)?X|V7Yo|rUM2$rQMgJCU6rB(g5YrX&7CSFiEB2AdOVlBH
z5ziCrh~wh?;(Fq~;upo6#Ay<1B}^njC9X<5mzZBCv(9$iv31mS{gNz_8j|jk=OrIV
z(xiw|mQs;Y1yZl1nWZ(PJ*6*5w@A;fmsxMWK7M`W`Y{<H8B>`EnF5(Nvh1=X*&x{*
z*{%)v4H_GKHeBA&CWnzzmGhL#lzSnMkyn%VlD{n9z7e-kbEE&poQ=H-Yzle`VG0Eb
zLz@IPS!_DCsdCeo%~G2kH>YlH*}SBvs_3hjtN2=pN6Ad-m{PUUH)T0x7v)UlE){ka
zBb6AHDwWAC@>|@tT-owcl~>hLHD2|B>Y|#u8bz&G?W4Ms`a$(e>b)9#8rB*~8jmz_
zn);eCnl+j~wA8dhv`VzTZdKUov-Q^2v28Nj+_vRz8_`~;P1e4uJ*XqDb5JK+XOJX8
zB9n4R!@82XuDUmLNA))7dFvJGebHCcr|6gK&l+eML>bg?N4FbqPu%|8kjK#0FvD=b
zXq}OVQGpT7Sk?H5alHx7#M~s+q}No`)W!6sDa}mXEXu6OoXvcfd4~D0g`5S&qS_K;
zX=ZuO^34wE9sWBit$>xO)j6wvYZ>bx>w7!#JFRzS?)+e*WD{xAvWs_@)2>^)W_IiE
zPTu|6R@OGu_JJLz-9EdUcC+@|?bGZB_iWx1wdbjWh=Z3yl_SB?&hduh^j^cgf9-w0
zPjz41zMlOu`@{D?J|J?y_rQH8PA9Tc=|S8<`-8U*E|9IrIpk?)Q|C+0G#3Mx3of5r
zbzRT9est4zOLH4_*LF{HAM?=mIOp-vljNE1IpJmCmEkq%ZQ`BfJ?mrTljlSCwfCj^
zG5H<zyX(*6@8jPTAQliF&>kos7#BDgq!sj65RGC^xe<&6?+>mD;e*GV)==5dlc7Ul
zI$@b%bBF8>m4<VN`-it4mOGqqcr?N&;`$Nn5tkzmA|)b^Mh->kMO}?XqMf53#7M@R
zh<P7t9GicX<*3imXU7zer5&3(ZhyS`gy@Ob6C)>$PZq>+#8KjU<G03Vox+~-I`uq3
zCE@Rcr9{`nC#Mxpr=MO(a!Gn}M(NDOGxW3WXP+mlC0|Lwr}(Gzq>@te)40<j(nii%
zo~t-7em?R1)L%}2Jx<?}o^^rcLg<CTixwBF{+9YX<?n?I&y4O&{Y>hmwU-hu&0coB
z+;K(sN^zEG*6FOD*<RT%uNq&i$XTD0ehq&u?AnK1yWE!R8rN^$5V>*s#$uj--eA5>
ze$!3$n>TN*y_H;mDF`k2Sh%mSt!R5uRk1?xRjL5>^lflE^!E6jgLisL%u61WYLph2
zNtazJ=PggHKq?Mb&?-GE2df;a+V7g(eNer%y8PazdwDeyHJSJM?<d!?)SjrN*G1G#
z*9X>5G<Y<OJaBsOx^YiqSJTd>=MT*vK58~<ZfwzOse7dTsOGWO<GW8Zo>V?nds@+|
z+FJfh^;!9IwdWNt)L&G!X|`3jZ)>mZAayi!ZtraFGVOZWy`#Im$F}EX@4nu_m##0z
z`h5E)UxmGze;xY<_a?EQt3Q2U?Lf}k4R5J~YJ>NOwhy%q?;3tR;xh8-UGTew_a{EE
ze@GuCj@}$o9;^9i^s#Mx@A&&qfuH6l;y!bKzVt=*OW9Z5udTE_wD*&gN&2^>@50~n
zrnXEyn6{oCnDLvLpG}+-p3DEC@uTIZ{m;?)Lkon3i;Ei;tC!4|-q8K%^guF&ynGfw
zVT*BxU&Y_@0AP23XNNWbSU6U`y_P+YmG4D}kzdL%{|m2tpD{Y%83N?#0$>{pfJHq3
zSD;Em%m%NFqxWuIfKgHTt<b`dV0RVeWq`0z;L&7`PX8_n0HGRyMGBohf0<5S%!Oz6
zJ^<>2R=)Wd-gqtmvV|F_wHLyF3B4Y0GlBEqB8sd77;XgRM(9m|2y@55g9(&Xe*}YK
zad-j~GYczpDCYtg1Vu4e6o+Gcs3TFZA7Ht0JQ7NJc;204!nz<n<)f)rnI!e^H1ONB
z)1*|KDaV*u1O$bIMWolu$Zn9^qN=8@p{ZrC-O$L`#MErpZd*HhcqDUib#wRd^zsf4
z2@N|GemLUziIZ{hrxFs=&Yk}&{ldk+GjguwUcZr-fAdyJX<2ziW!2s42aQb+n_C_|
ze$vs|)!ozkvhUT<@W{LOA4bPMj!%C3J~cfvJNM%!gBJqO6<WWU{fiej<b}avQ7nPM
z3&9+MigIId5=wX;y`2Pd5brwWqfC7IsaNkbFiWb~(D<Dx?JNRPTZW`38Pt}U{b$6E
z{hyfqCiaKdYj|YFEDMUkpg0soad;dQJQF-^;qgo?Ov}RZOW2l$gCU&1g${!tFa{Qj
zCBR=UR%TYN|FzKj;Xhee=&t}9ionH$asv`riW$pE1hW5u(%V*j%gUbe#so?nm_jmb
z8hI_n&uC@L8xOvnXbhT^Xy+IDGDWS}rcMXg-n&;mXgbOawh`X(iLrDSuj9#~McrzR
z20gifiI=jxmrhP4&&kBbHAs4L7?=C*jcFiB9&=00-X;PT*gNRJgAPQ-+Y|h9q=+v2
zL$f9_C)dx4?Z%ESo^$HBaJ<g#2s^%8BCUHz`&q*y(I;shW}S)YB}pUQh9G8RYIIYU
z!1dG5_PQj`vb)nk<C+DV?-nGFt?|T=-Wg_}AqAFKt@S-zQ%hsTN;SBl_6T>ilyAXp
z)`V{%G0xP)A@jvcgKUe92M!He^}T4(5lVR9wN8$g`ou8C&849l+g29Tr%zFuHH=K2
zd@&PtXA+-qXro%<T|#y?=R2D(ugtf`S6uii(QvDKX7)2Wzpd^l^=l~mNxh9e!|N1H
zrn0d)iLwAHN^f5&t9%uWcW-e?+`HIIp~Yf1;tngkjWou`lCqOuK5Y_X>2$4BKcpmM
z@h)+3U-?|Y;F|S|{R;+S!*wZ}<KObDzF;$9v)@>yQ~sGSb8b?YG&%QnwjGuaEEV>S
zP>-c5EnXEA8?H*`j_$a^+WDMRmP4dTIJI&w=GK@dMct|UdhLMQ@Yk~k6uMq34pfi^
zwjhf;TIP3$Z%Ed<<TTq>++w_#8_9c^4wQtF7ntlP$Fc;rd7j{o9Gz4h6I(MkI{aEd
z%<ogoTccRgt*^pM9S68?m!w|pl6-@VJ*bthTP!wwUMgLFdFFlp(KzZu;+*3Fl}W$x
zJq<yUhcAU{f0}SQPArW%yI>l`aZ|~;B<0PASW<uvZo%yC<gu&iHa~<vIc*Q`33s8r
z`DRfsODKwbHcyI_?^@vYjawM;?sc0SZ5H@RI!X;vw71n>%tt3L%nWo-`J860D!Oi$
zf`7z67e@zCwKr-@=jJDsM-NPH%5(2Xx1J#AOn-BD_aT-iQ8pU`m6P7Fy2ulOwaHk}
zj_<^-PT6e2kK}Q$+;d$Y(yqs;Y$*^LZ{Y)mZ0FQoHd}`NR6n|4T<}7~VQ=Xd$!ygx
zS<KPk(-p;<W1j0gj3u+FuQ~f(%;=SOHVKOK#|FhlyJd4G(}9~)pV_Fxyw0`4y~?-6
zzsb)Y8LDjbBQ{i9)>!i7pE2I~asP!AwQD@Zgv!s#v$~%46vgeC{Pfi8dSzdN4c}BY
z2XUD5A&E15$CIc|DMP-I6nR?9%(cbBFJFrN%l690wmq&2^eJ4t6KOD_@vQz%b*jD0
zRn@tB!=J5e?{+!O8`&M!obN&shS|+5?d|W@rMzox>QUXGshPW6hm~4%{;7q$u~~`w
zY`bIr<KV>S#q&c~OT`pBpG`LD9PFQZ2BNZPRx@Uq!y9S2>7%|E-<{Q@wiWR%F}wJR
zuvVPW1ikQKE;YJGi!rBlC#CjhS0fY+YISlmC+gsM)2E)_xClh{(oWBqch-s;v(yA7
z%Zptu_-v{C!lL7|P5*%{ue1x^lZ2PLvN%K9rM&X<gR+LHX*F*1<gq)4v&eOXVjXX=
z7^sz=eo3{<WeF?K>tMOrA+~<gHQ%JDA*UCc&&2rckCwk7Ab5gWYMT|8RdM59(5;;D
z3nz@LJQQ?^x9WJ|4e2Mf<XHUht5f|kIvKpgd_TbF#v7m8O(&X}hwF5s1tNpXCr<=L
zrH{6{qxYl8(&u%gXbb7RB;`l4=-i{ZEZUXP2FH`#rS*?)r>P{H(Rh36u2Nsm4>rdS
zQ91T`_uM%ub*goT{ExA7@#HU_$oZXyfDdX6z3Wev<sKF_rI!}Aix%dIcSp#gAG6|#
zYgE6oJ<t65_UXQ$>e{$&I`DpGH2&hr*{S1|#E3c#Wy4KYMc@b_X-RI5>d+<TIlTd+
zB!ip@v<bi06dY4nn_4>VlX-KfGA)c%=<yaLbUMmrsP=GQ!YtKp&S8keGuL8oF3&8=
zstA%JDrrxL)>jS}c@OYc97=ff;%TZ=T}-Lqgh#Gtg`MM@nXB#+d)^(&W_eqpULV6B
z?ky|RHJYYZM$A<G*>L^Ami_XxqhHQW<Bt!0vSRN$vE7!Nns+^%*ur^6#Oh?EW>^6w
zK^Z-ongQlImss?M@2k;41J7Q4`-rB-<m)j?$}xp8H>q`XUZhuBcTRRM&Yb^#A;DaB
zv^+ZI&SROLe>|k!ze;wE%D*{vle(WqHdB61u8C{P5MP=nMk~-x2Jr6Bi{G}UaC}yN
ztzBXLy!`+j;OM~h$Xj8ifp0HwOoTduImrhD9JP}Q@50jCOI1>|?E8uABo|Kp@vpc}
zM<pZiDQaiHN#gCOxcDgCR6fT8PI;%i11xhMIdk648Wybcx3@-E6CRRE<0p#p!kwFi
zRee->inWTOj~nAJ4~c5qs^y4}l)HuJJsc3BRb)yP1*Vjs&AK0*{;De@d``<Cz4F_b
zH^3`S&POMxr%7eK@ih`2!E1Zvipq{Yi_v*o_V%;Pt?+A3SG2W0X7oQEROf$32SOyz
zBB$o>W;yOi!dEAmx8s6>ox<*vrk`z?ajm4;S>=6Zl;;#5t(BL{$_u84QLXc#e8}r?
zp9ZbUQ~u6ppD_;@>p9s!oZm3l@wG7_hP~i&V{zwx!HEVpkD&ZM=G48?5yN%4U*n>2
zZPNkqGj|r#1e~wko`UbTEbGO~3!!BBjTIA$L9><-ZyW3S?3-WR@8Y>%TIQOxkas=C
zR7ZL-V`|aS$g}X;yU~;UpNO1GTwY>AWhU+=$&|C>vgmi#L92-v58s35?C*>wz4w{s
zZHU1~stoN7uYK&z>nU2$PJRCO(7ctZ<XP=HJtyMA{>9?5x_Egh8;j!ywa3s;@}C0?
zY42R0U`|pwC#jz|3>IN}LeoR+SYl3vQXhRyB+;y&vhT4Bz&*m1Xi%TkB{~tOiGnq8
zucqrM5lY#dr6eEDSF?NWci*U>b<c=v66Nhb$edb|@>!BTbmT|h)9DXYr~CE4{4`4Y
zV3%^P`>gjFp!xEifJ>TJ*-l*?-ybE?dsi0Y%;tC^&oq(6dnOJqcdIeQXZFI(;l;un
zOM#B3)^*?N0i}DPzxnf;c!Oi|cRFjLhW!-u`}+CNJou_j4|kb~qp7|L%Dj9)+(h^(
z%iCTZ?FF4<54<FLBsOM`u*uI2#E&F5nFnGW&m|qn$Z$#~@<`hx-@HqB(?<A8{LDY^
z#IE*ySX*qqwK=G~VA6c}&}Uq6`1p8G_?P-SYcnR#>}si%>Oll&jVz`gtG1|=rakLw
g!=1i&EmR`4y4!K(?Z?>l|EZjRj(q>~5s}{aUjy@`qyPW_

literal 0
HcmV?d00001

diff --git a/02.recognize_digits/index.en.html b/02.recognize_digits/index.en.html
index 6298165..924810d 100644
--- a/02.recognize_digits/index.en.html
+++ b/02.recognize_digits/index.en.html
@@ -173,6 +173,7 @@ PaddlePaddle provides a Python module, `paddle.dataset.mnist`, which downloads a
 A PaddlePaddle program starts from importing the API package:
 
 ```python
+import gzip
 import paddle.v2 as paddle
 ```
 
@@ -291,6 +292,10 @@ def event_handler_plot(event):
             cost_ploter.plot()
         step += 1
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         cost_ploter.append(test_title, step, result.cost)
@@ -307,6 +312,10 @@ def event_handler(event):
             print "Pass %d, Batch %d, Cost %f, %s" % (
                 event.pass_id, event.batch_id, event.cost, event.metrics)
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         print "Test with Pass %d, Cost %f, %s\n" % (
@@ -322,7 +331,7 @@ trainer.train(
             paddle.dataset.mnist.train(), buf_size=8192),
         batch_size=128),
     event_handler=event_handler_plot,
-    num_passes=100)
+    num_passes=5)
 ```
 
 During training, `trainer.train` invokes `event_handler` for certain events. This gives us a chance to print the training progress.
@@ -347,8 +356,30 @@ print 'The classification accuracy is %.2f%%' % (100 - float(best[2]) * 100)
 
 Usually, with MNIST data, the softmax regression model can get accuracy around 92.34%, MLP can get about 97.66%, and convolution network can get up to around 99.20%.  Convolution layers have been widely considered a great invention for image processsing.
 
+## Application
+
+After training is done, user can use the trained model to classify images. The following code shows how to inference MNIST images through `paddle.infer` interface.
+
+```python
+from PIL import Image
+import numpy as np
+def load_image(file):
+    im = Image.open(file).convert('L')
+    im = im.resize((28, 28), Image.ANTIALIAS)
+    im = np.array(im).astype(np.float32).flatten()
+    im = im / 255.0
+    return im
+test_data = []
+test_data.append((load_image('image/infer_3.png'),))
+
+probs = paddle.infer(
+    output_layer=predict, parameters=parameters, input=test_data)
+lab = np.argsort(-probs) # probs and lab are the results of one batch data
+print "Label of image/infer_3.png is: %d" % lab[0][0]
+```
 
 ## Conclusion
+
 This tutorial describes a few basic Deep Learning models viz. Softmax regression, Multilayer Perceptron Network and Convolutional Neural Network. The subsequent tutorials will derive more sophisticated models from these. So it is crucial to understand these models for future learning. When our model evolved from a simple softmax regression to slightly complex Convolutional Neural Network, the recognition accuracy on the MNIST data set achieved large improvement in accuracy. This is due to the Convolutional layers' local connections and parameter sharing. While learning new models in the future, we encourage the readers to understand the key ideas that lead a new model to improve results of an old one. Moreover, this tutorial introduced the basic flow of PaddlePaddle model design, starting with a dataprovider, model layer construction, to final training and prediction. Readers can leverage the flow used in this MNIST handwritten digit classification example and experiment with different data and network architectures to train models for classification tasks of their choice.
 
 ## References
diff --git a/02.recognize_digits/index.html b/02.recognize_digits/index.html
index 2568393..2717d93 100644
--- a/02.recognize_digits/index.html
+++ b/02.recognize_digits/index.html
@@ -174,6 +174,7 @@ PaddlePaddle在API中提供了自动加载[MNIST](http://yann.lecun.com/exdb/mni
 首先，加载PaddlePaddle的V2 api包。
 
 ```python
+import gzip
 import paddle.v2 as paddle
 ```
 其次，定义三个不同的分类器：
@@ -296,6 +297,10 @@ def event_handler_plot(event):
             cost_ploter.plot()
         step += 1
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         cost_ploter.append(test_title, step, result.cost)
@@ -311,6 +316,10 @@ def event_handler(event):
             print "Pass %d, Batch %d, Cost %f, %s" % (
                 event.pass_id, event.batch_id, event.cost, event.metrics)
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         print "Test with Pass %d, Cost %f, %s\n" % (
@@ -326,7 +335,7 @@ trainer.train(
             paddle.dataset.mnist.train(), buf_size=8192),
         batch_size=128),
     event_handler=event_handler_plot,
-    num_passes=100)
+    num_passes=5)
 ```
 
 训练过程是完全自动的，event_handler里打印的日志类似如下所示：
@@ -342,6 +351,29 @@ trainer.train(
 
 训练之后，检查模型的预测准确度。用 MNIST 训练的时候，一般 softmax回归模型的分类准确率为约为 92.34%，多层感知器为97.66%，卷积神经网络可以达到 99.20%。
 
+
+## 应用模型
+
+可以使用训练好的模型对手写体数字图片进行分类，下面程序展示了如何使用paddle.infer接口进行推断。
+
+```python
+from PIL import Image
+import numpy as np
+def load_image(file):
+    im = Image.open(file).convert('L')
+    im = im.resize((28, 28), Image.ANTIALIAS)
+    im = np.array(im).astype(np.float32).flatten()
+    im = im / 255.0
+    return im
+test_data = []
+test_data.append((load_image('image/infer_3.png'),))
+
+probs = paddle.infer(
+    output_layer=predict, parameters=parameters, input=test_data)
+lab = np.argsort(-probs) # probs and lab are the results of one batch data
+print "Label of image/infer_3.png is: %d" % lab[0][0]
+```
+
 ## 总结
 
 本教程的softmax回归、多层感知器和卷积神经网络是最基础的深度学习模型，后续章节中复杂的神经网络都是从它们衍生出来的，因此这几个模型对之后的学习大有裨益。同时，我们也观察到从最简单的softmax回归变换到稍复杂的卷积神经网络的时候，MNIST数据集上的识别准确率有了大幅度的提升，原因是卷积层具有局部连接和共享权重的特性。在之后学习新模型的时候，希望大家也要深入到新模型相比原模型带来效果提升的关键之处。此外，本教程还介绍了PaddlePaddle模型搭建的基本流程，从dataprovider的编写、网络层的构建，到最后的训练和预测。对这个流程熟悉以后，大家就可以用自己的数据，定义自己的网络模型，并完成自己的训练和预测任务了。
diff --git a/02.recognize_digits/train.py b/02.recognize_digits/train.py
index 6a11839..7dfd9f3 100644
--- a/02.recognize_digits/train.py
+++ b/02.recognize_digits/train.py
@@ -1,3 +1,6 @@
+import gzip
+from PIL import Image
+import numpy as np
 import paddle.v2 as paddle
 
 
@@ -79,6 +82,10 @@ def event_handler(event):
             print "Pass %d, Batch %d, Cost %f, %s" % (
                 event.pass_id, event.batch_id, event.cost, event.metrics)
     if isinstance(event, paddle.event.EndPass):
+        # save parameters
+        with gzip.open('params_pass_%d.tar.gz' % event.pass_id, 'w') as f:
+            parameters.to_tar(f)
+
         result = trainer.test(reader=paddle.batch(
             paddle.dataset.mnist.test(), batch_size=128))
         print "Test with Pass %d, Cost %f, %s\n" % (event.pass_id, result.cost,
@@ -92,9 +99,26 @@ trainer.train(
         paddle.reader.shuffle(paddle.dataset.mnist.train(), buf_size=8192),
         batch_size=128),
     event_handler=event_handler,
-    num_passes=100)
+    num_passes=1)
 
 # find the best pass
 best = sorted(lists, key=lambda list: float(list[1]))[0]
 print 'Best pass is %s, testing Avgcost is %s' % (best[0], best[1])
 print 'The classification accuracy is %.2f%%' % (100 - float(best[2]) * 100)
+
+
+def load_image(file):
+    im = Image.open(file).convert('L')
+    im = im.resize((28, 28), Image.ANTIALIAS)
+    im = np.array(im).astype(np.float32).flatten()
+    im = im / 255.0
+    return im
+
+
+test_data = []
+test_data.append((load_image('image/infer_3.png'), ))
+
+probs = paddle.infer(
+    output_layer=predict, parameters=parameters, input=test_data)
+lab = np.argsort(-probs)  # probs and lab are the results of one batch data
+print "Label of image/infer_3.png is: %d" % lab[0][0]
-- 
GitLab