From 0ec8775b68512ad96564c80603207995c2681874 Mon Sep 17 00:00:00 2001 From: tangwei12 Date: Wed, 5 Dec 2018 19:33:38 +0800 Subject: [PATCH] add cloud --- fluid/PaddleRec/ctr/README.cn.md | 3 +++ fluid/PaddleRec/ctr/README.md | 5 ++++- fluid/PaddleRec/ctr/cloud.py | 3 ++- 3 files changed, 9 insertions(+), 2 deletions(-) diff --git a/fluid/PaddleRec/ctr/README.cn.md b/fluid/PaddleRec/ctr/README.cn.md index 04c5eb9c..05d1653e 100644 --- a/fluid/PaddleRec/ctr/README.cn.md +++ b/fluid/PaddleRec/ctr/README.cn.md @@ -74,3 +74,6 @@ python infer.py \ 1. 用preprocess.py处理训练数据生成train.txt。 1. 将train.txt切分成集群机器份,放到每台机器上。 1. 用上面的 `分布式训练` 中的命令行启动分布式训练任务. + +## 在PaddleCloud上运行集群训练 +如果你正在使用PaddleCloud做集群训练,你可以使用```cloud.py```这个文件来帮助你提交任务,```train.py```中所需要的参数可以通过PaddleCloud的环境变量来提交。 \ No newline at end of file diff --git a/fluid/PaddleRec/ctr/README.md b/fluid/PaddleRec/ctr/README.md index 13e71190..e29e2e1e 100644 --- a/fluid/PaddleRec/ctr/README.md +++ b/fluid/PaddleRec/ctr/README.md @@ -90,4 +90,7 @@ Note: The AUC value in the last log info is the total AUC for all test dataset. 1. Please prepare some CPU machines on Baidu Cloud following the steps in [train_on_baidu_cloud](https://github.com/PaddlePaddle/FluidDoc/blob/develop/doc/fluid/user_guides/howto/training/train_on_baidu_cloud_cn.rst) 1. Prepare dataset using preprocess.py. 1. Split the train.txt to trainer_num parts and put them on the machines. -1. Run training with the cluster train using the command in `Distributed Train` above. \ No newline at end of file +1. Run training with the cluster train using the command in `Distributed Train` above. + +## Train on Paddle Cloud +If you want to run this training on PaddleCloud, you can use the script ```cloud.py``` to submit the job; the arguments required by ```train.py``` can be set through environment variables in PaddleCloud. 
\ No newline at end of file diff --git a/fluid/PaddleRec/ctr/cloud.py b/fluid/PaddleRec/ctr/cloud.py index eaf18e2b..c5388c6a 100644 --- a/fluid/PaddleRec/ctr/cloud.py +++ b/fluid/PaddleRec/ctr/cloud.py @@ -5,12 +5,13 @@ # Copyright (c) 2017 Baidu.com, Inc. All Rights Reserved # # ====================================================================== +"""this file is only for PaddleCloud""" import os import logging -import hdfs_utils +import paddle.fluid.contrib.utils.hdfs_utils as hdfs_utils logging.basicConfig( format='%(asctime)s - %(levelname)s - %(message)s') -- GitLab