config.yaml 2.4 KB
Newer Older
M
malin10 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

M
malin10 已提交
15

C
Chengmo 已提交
16
# Root directory of this model. The paths below refer to it through the
# {workspace} placeholder.
workspace: "models/match/dssm"
M
malin10 已提交
17

M
malin10 已提交
18
# Dataset definitions. A phase selects one of these entries by name through
# its dataset_name field.
dataset:
M
malin10 已提交
19
# Dataset selected by phase1 (see its dataset_name).
- name: dataset_train
Y
yinhaofeng 已提交
20 21
  batch_size: 8
  type: DataLoader # reader type; the alternative value is QueueDataset
M
malin10 已提交
22
  # Training data location under the workspace.
  data_path: "{workspace}/data/train"
M
malin10 已提交
23
  # Python script used as the data converter (reader) for the training data.
  data_converter: "{workspace}/synthetic_reader.py"
M
malin10 已提交
24 25
# Dataset selected by phase2 (see its dataset_name).
- name: dataset_infer
  batch_size: 1
Y
yinhaofeng 已提交
26 27
  type: DataLoader # reader type; the alternative value is QueueDataset
  # Test data location under the workspace.
  data_path: "{workspace}/data/test"
M
malin10 已提交
28
  # Python script used as the data converter (reader) for the test data.
  data_converter: "{workspace}/synthetic_evaluate_reader.py"
M
malin10 已提交
29

M
malin10 已提交
30 31 32
# Hyper-parameters: optimizer settings plus model-specific values.
# NOTE(review): presumably read by the user-defined model.py — confirm.
hyper_parameters:
  optimizer:
    class: sgd
Y
change  
yinhaofeng 已提交
33
    # Learning rate of the optimizer configured in this mapping.
    learning_rate: 0.001
M
malin10 已提交
34
    # NOTE(review): presumably selects asynchronous parameter updates —
    # confirm against the framework documentation.
    strategy: async
Y
yinhaofeng 已提交
35 36
  # NOTE(review): presumably the size of the letter-trigram input vector —
  # confirm against model.py.
  trigram_d: 1439
  # NOTE(review): presumably the number of negative documents sampled per
  # query — confirm against model.py.
  neg_num: 1
M
malin10 已提交
37 38
  # NOTE(review): presumably the per-layer widths and activations of the
  # fully connected stack — confirm against model.py. Both lists have three
  # entries; keep their lengths equal.
  fc_sizes: [300, 300, 128]
  fc_acts: ['tanh', 'tanh', 'tanh']
M
malin10 已提交
39

Y
yinhaofeng 已提交
40
# Names of the runner entries (defined under runner) selected by this config.
mode: [train_runner, infer_runner]
M
malin10 已提交
41 42 43
# Configuration of each runner.
# A runner is a kind of Paddle training class that wraps the train/infer process.
runner:
M
malin10 已提交
44
# Training runner; its name is listed in mode.
- name: train_runner
J
Jinhua Liang 已提交
45
  # Runner type; the infer_runner entry uses infer instead.
  class: train
M
malin10 已提交
46
  # number of training epochs
Y
change  
yinhaofeng 已提交
47
  # NOTE(review): infer_runner loads "increment/2" — presumably the checkpoint
  # of the last of these 3 epochs (0-based); keep the two in sync.
  epochs: 3
M
malin10 已提交
48 49
  # device used to run training or inference
  device: cpu
Y
yinhaofeng 已提交
50 51
  save_checkpoint_interval: 1 # save a checkpoint every N epochs
  save_inference_interval: 1 # interval for saving the inference model (presumably also in epochs)
M
malin10 已提交
52 53 54 55 56
  # path where checkpoints are saved
  save_checkpoint_path: "increment"
  # path where the inference model is saved
  save_inference_path: "inference"
  # feed variables of the saved inference model
  save_inference_feed_varnames: ["query", "doc_pos"]
  # fetch variables of the saved inference model
  save_inference_fetch_varnames: ["cos_sim_0.tmp_0"]
  # path of a model to load before training; empty here
  # NOTE(review): presumably an empty value means no model is loaded — confirm.
  init_model_path: ""
C
Chengmo 已提交
57
  # NOTE(review): presumably the logging interval in batches — confirm the unit.
  print_interval: 2
Y
yinhaofeng 已提交
58
  # Phase run by this runner; refers to an entry defined under phase.
  phases: phase1
M
malin10 已提交
59
# Inference runner; its name is listed in mode.
- name: infer_runner
C
Chengmo 已提交
60
  # Runner type; the train_runner entry uses train instead.
  class: infer
M
malin10 已提交
61 62
  # device used to run training or inference
  device: cpu
C
Chengmo 已提交
63
  # NOTE(review): presumably the logging interval in batches — confirm the unit.
  print_interval: 1
Y
change  
yinhaofeng 已提交
64
  # Path of the model to load for inference. "increment" is the train runner's
  # save_checkpoint_path. NOTE(review): "2" is presumably the 0-based index of
  # the last of its 3 epochs — update this path if epochs changes.
  init_model_path: "increment/2"
Y
yinhaofeng 已提交
65
  # Phase run by this runner; refers to an entry defined under phase.
  phases: phase2
M
malin10 已提交
66

M
malin10 已提交
67 68 69 70 71 72
# A runner runs all of its phases in each epoch.
phase:
- name: phase1
  model: "{workspace}/model.py" # user-defined model
  dataset_name: dataset_train # name of the dataset entry to use
  thread_num: 1
Y
yinhaofeng 已提交
73 74 75 76
# Phase referenced by infer_runner (see its phases field).
- name: phase2
  model: "{workspace}/model.py" # user-defined model
  dataset_name: dataset_infer # name of the dataset entry to use
  thread_num: 1