提交 654ba717 编写于 作者: X xjqbest

fix

上级 421c293f
...@@ -132,7 +132,7 @@ class SingleTrainer(TranspileTrainer): ...@@ -132,7 +132,7 @@ class SingleTrainer(TranspileTrainer):
padding = 0 padding = 0
if type_name == "DataLoader": if type_name == "DataLoader":
return None#self._get_dataloader(dataset_name) return None
else: else:
return self._get_dataset(dataset_name) return self._get_dataset(dataset_name)
...@@ -243,7 +243,6 @@ class SingleTrainer(TranspileTrainer): ...@@ -243,7 +243,6 @@ class SingleTrainer(TranspileTrainer):
metrics_varnames = [] metrics_varnames = []
metrics_format = [] metrics_format = []
fetch_period = 20 fetch_period = 20
#metrics_format.append("{}: {{}}".format("epoch"))
metrics_format.append("{}: {{}}".format("batch")) metrics_format.append("{}: {{}}".format("batch"))
for name, var in model_class.get_metrics().items(): for name, var in model_class.get_metrics().items():
metrics_varnames.append(var.name) metrics_varnames.append(var.name)
...@@ -259,7 +258,7 @@ class SingleTrainer(TranspileTrainer): ...@@ -259,7 +258,7 @@ class SingleTrainer(TranspileTrainer):
while True: while True:
metrics_rets = self._exe.run(program=program, metrics_rets = self._exe.run(program=program,
fetch_list=metrics_varnames) fetch_list=metrics_varnames)
metrics = [batch_id]#[epoch, batch_id] metrics = [batch_id]
metrics.extend(metrics_rets) metrics.extend(metrics_rets)
if batch_id % fetch_period == 0 and batch_id != 0: if batch_id % fetch_period == 0 and batch_id != 0:
...@@ -275,7 +274,6 @@ class SingleTrainer(TranspileTrainer): ...@@ -275,7 +274,6 @@ class SingleTrainer(TranspileTrainer):
dirname = envs.get_global_env("epoch.init_model_path", None) dirname = envs.get_global_env("epoch.init_model_path", None)
if dirname is None: if dirname is None:
return return
dirname = os.path.join(dirname, str(epoch_id))
if is_fleet: if is_fleet:
fleet.load_persistables(self._exe, dirname) fleet.load_persistables(self._exe, dirname)
else: else:
......
...@@ -12,43 +12,52 @@ ...@@ -12,43 +12,52 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
debug: false # 轮数
cold_start: true
epochs: 10 epochs: 10
# 设备
device: cpu device: cpu
# 工作目录
workspace: "paddlerec.models.rank.dnn" workspace: "paddlerec.models.rank.dnn"
# dataset列表
dataset: dataset:
- name: dataset_2 - name: dataset_2 # 名字,用来区分不同的dataset
batch_size: 2 batch_size: 2
#type: QueueDataset type: DataLoader # 或者QueueDataset
type: DataLoader data_path: "{workspace}/data/sample_data/train" # 数据路径
data_path: "{workspace}/data/sample_data/train"
sparse_slots: "click 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26" sparse_slots: "click 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26"
dense_slots: "dense_var:13" dense_slots: "dense_var:13"
# 超参数
hyper_parameters: hyper_parameters:
#优化器
optimizer: optimizer:
class: Adam class: Adam
learning_rate: 0.001 learning_rate: 0.001
strategy: async strategy: async
# 用户自定义
sparse_inputs_slots: 27 sparse_inputs_slots: 27
sparse_feature_number: 1000001 sparse_feature_number: 1000001
sparse_feature_dim: 9 sparse_feature_dim: 9
dense_input_dim: 13 dense_input_dim: 13
fc_sizes: [512, 256, 128, 32] fc_sizes: [512, 256, 128, 32]
# executor配置
epoch: epoch:
name: name:
trainer_class: single trainer_class: single
save_checkpoint_interval: 2 save_checkpoint_interval: 2 # 保存模型的间隔(单位应为轮数)
save_inference_interval: 4 save_inference_interval: 4 # 保存预测模型的间隔(单位应为轮数)
save_checkpoint_path: "increment" save_checkpoint_path: "increment" # 保存模型路径
save_inference_path: "inference" save_inference_path: "inference" # 保存预测模型路径
#save_inference_feed_varnames: [] # 预测模型feed vars
#save_inference_fetch_varnames: [] # 预测模型 fetch vars
#init_model_path: "xxxx" # 加载模型
# 执行器,每轮要跑的所有模型
executor: executor:
- name: train - name: train # 名字,用来区分不同的阶段
model: "{workspace}/model.py" model: "{workspace}/model.py" # 模型路径
dataset_name: dataset_2 dataset_name: dataset_2 # 使用的dataset名字,对应dataset列表中的name
thread_num: 1 thread_num: 1 # 线程数
is_infer: False is_infer: False # 是否是infer
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册